{"step": 0, "train_loss": 11.9334135055542, "lr": 0.0, "tps": 12837, "wall": 5.1} {"step": 1, "train_loss": 11.929274559020996, "lr": 4.0000000000000003e-07, "tps": 12994, "wall": 10.1} {"step": 2, "train_loss": 11.910177230834961, "lr": 8.000000000000001e-07, "tps": 13073, "wall": 15.0} {"step": 3, "train_loss": 11.912367820739746, "lr": 1.2000000000000002e-06, "tps": 13105, "wall": 20.0} {"step": 4, "train_loss": 11.895181655883789, "lr": 1.6000000000000001e-06, "tps": 13094, "wall": 25.0} {"step": 5, "train_loss": 11.896822929382324, "lr": 2e-06, "tps": 13117, "wall": 30.0} {"step": 6, "train_loss": 11.853190422058105, "lr": 2.4000000000000003e-06, "tps": 13117, "wall": 35.0} {"step": 7, "train_loss": 11.814668655395508, "lr": 2.8e-06, "tps": 13134, "wall": 39.9} {"step": 8, "train_loss": 11.732216835021973, "lr": 3.2000000000000003e-06, "tps": 13147, "wall": 44.9} {"step": 9, "train_loss": 11.687389373779297, "lr": 3.6000000000000003e-06, "tps": 13152, "wall": 49.8} {"step": 10, "train_loss": 11.624338150024414, "lr": 4e-06, "tps": 13146, "wall": 54.8} {"step": 11, "train_loss": 11.551264762878418, "lr": 4.4e-06, "tps": 13153, "wall": 59.8} {"step": 12, "train_loss": 11.447733879089355, "lr": 4.800000000000001e-06, "tps": 13158, "wall": 64.7} {"step": 13, "train_loss": 11.409244537353516, "lr": 5.200000000000001e-06, "tps": 13161, "wall": 69.7} {"step": 14, "train_loss": 11.291666984558105, "lr": 5.6e-06, "tps": 13165, "wall": 74.7} {"step": 15, "train_loss": 11.17678165435791, "lr": 6e-06, "tps": 13169, "wall": 79.6} {"step": 16, "train_loss": 11.124483108520508, "lr": 6.4000000000000006e-06, "tps": 13160, "wall": 84.7} {"step": 17, "train_loss": 11.0346040725708, "lr": 6.8e-06, "tps": 13161, "wall": 89.6} {"step": 18, "train_loss": 10.884632110595703, "lr": 7.2000000000000005e-06, "tps": 13163, "wall": 94.6} {"step": 19, "train_loss": 10.879730224609375, "lr": 7.6e-06, "tps": 13162, "wall": 99.6} {"step": 20, "train_loss": 10.818342208862305, "lr": 8e-06, "tps": 13165, "wall": 104.5} {"step": 21, "train_loss": 10.74754524230957, "lr": 8.400000000000001e-06, "tps": 13167, "wall": 109.5} {"step": 22, "train_loss": 10.648005485534668, "lr": 8.8e-06, "tps": 13168, "wall": 114.5} {"step": 23, "train_loss": 10.600135803222656, "lr": 9.2e-06, "tps": 13168, "wall": 119.4} {"step": 24, "train_loss": 10.599162101745605, "lr": 9.600000000000001e-06, "tps": 13170, "wall": 124.4} {"step": 25, "train_loss": 10.549919128417969, "lr": 1e-05, "tps": 13170, "wall": 129.4} {"step": 26, "train_loss": 10.471877098083496, "lr": 1.0400000000000002e-05, "tps": 13170, "wall": 134.3} {"step": 27, "train_loss": 10.426097869873047, "lr": 1.08e-05, "tps": 13171, "wall": 139.3} {"step": 28, "train_loss": 10.31871509552002, "lr": 1.12e-05, "tps": 13164, "wall": 144.4} {"step": 29, "train_loss": 10.26041316986084, "lr": 1.16e-05, "tps": 13166, "wall": 149.3} {"step": 30, "train_loss": 10.1779146194458, "lr": 1.2e-05, "tps": 13164, "wall": 154.3} {"step": 31, "train_loss": 10.240498542785645, "lr": 1.2400000000000002e-05, "tps": 13164, "wall": 159.3} {"step": 32, "train_loss": 10.15683364868164, "lr": 1.2800000000000001e-05, "tps": 13164, "wall": 164.3} {"step": 33, "train_loss": 10.097679138183594, "lr": 1.32e-05, "tps": 13163, "wall": 169.3} {"step": 34, "train_loss": 10.050121307373047, "lr": 1.36e-05, "tps": 13162, "wall": 174.3} {"step": 35, "train_loss": 10.051180839538574, "lr": 1.4e-05, "tps": 13161, "wall": 179.3} {"step": 36, "train_loss": 10.023061752319336, "lr": 1.4400000000000001e-05, "tps": 13162, "wall": 184.2} {"step": 37, "train_loss": 9.987103462219238, "lr": 1.48e-05, "tps": 13162, "wall": 189.2} {"step": 38, "train_loss": 9.971962928771973, "lr": 1.52e-05, "tps": 13161, "wall": 194.2} {"step": 39, "train_loss": 9.945789337158203, "lr": 1.56e-05, "tps": 13162, "wall": 199.2} {"step": 40, "train_loss": 9.898653030395508, "lr": 1.6e-05, "tps": 13158, "wall": 204.2} {"step": 41, "train_loss": 9.879378318786621, "lr": 1.6400000000000002e-05, "tps": 13158, "wall": 209.2} {"step": 42, "train_loss": 9.87710952758789, "lr": 1.6800000000000002e-05, "tps": 13157, "wall": 214.2} {"step": 43, "train_loss": 9.911809921264648, "lr": 1.72e-05, "tps": 13155, "wall": 219.2} {"step": 44, "train_loss": 9.830896377563477, "lr": 1.76e-05, "tps": 13155, "wall": 224.2} {"step": 45, "train_loss": 9.806295394897461, "lr": 1.8e-05, "tps": 13153, "wall": 229.2} {"step": 46, "train_loss": 9.789108276367188, "lr": 1.84e-05, "tps": 13153, "wall": 234.2} {"step": 47, "train_loss": 9.850732803344727, "lr": 1.88e-05, "tps": 13151, "wall": 239.2} {"step": 48, "train_loss": 9.767753601074219, "lr": 1.9200000000000003e-05, "tps": 13149, "wall": 244.2} {"step": 49, "train_loss": 9.727646827697754, "lr": 1.96e-05, "tps": 13147, "wall": 249.2} {"step": 50, "train_loss": 9.735565185546875, "lr": 2e-05, "tps": 13146, "wall": 254.2} {"step": 51, "train_loss": 9.744932174682617, "lr": 2.04e-05, "tps": 13146, "wall": 259.2} {"step": 52, "train_loss": 9.756589889526367, "lr": 2.0800000000000004e-05, "tps": 13141, "wall": 264.3} {"step": 53, "train_loss": 9.713404655456543, "lr": 2.12e-05, "tps": 13142, "wall": 269.3} {"step": 54, "train_loss": 9.652036666870117, "lr": 2.16e-05, "tps": 13142, "wall": 274.3} {"step": 55, "train_loss": 9.617311477661133, "lr": 2.2000000000000003e-05, "tps": 13140, "wall": 279.3} {"step": 56, "train_loss": 9.612953186035156, "lr": 2.24e-05, "tps": 13139, "wall": 284.3} {"step": 57, "train_loss": 9.613097190856934, "lr": 2.2800000000000002e-05, "tps": 13138, "wall": 289.3} {"step": 58, "train_loss": 9.609621047973633, "lr": 2.32e-05, "tps": 13137, "wall": 294.3} {"step": 59, "train_loss": 9.578662872314453, "lr": 2.36e-05, "tps": 13137, "wall": 299.3} {"step": 60, "train_loss": 9.544733047485352, "lr": 2.4e-05, "tps": 13136, "wall": 304.3} {"step": 61, "train_loss": 9.503551483154297, "lr": 2.44e-05, "tps": 13135, "wall": 309.3} {"step": 62, "train_loss": 9.552177429199219, "lr": 2.4800000000000003e-05, "tps": 13134, "wall": 314.4} {"step": 63, "train_loss": 9.46776008605957, "lr": 2.52e-05, "tps": 13133, "wall": 319.4} {"step": 64, "train_loss": 9.393982887268066, "lr": 2.5600000000000002e-05, "tps": 13129, "wall": 324.4} {"step": 65, "train_loss": 9.498525619506836, "lr": 2.6000000000000002e-05, "tps": 13129, "wall": 329.4} {"step": 66, "train_loss": 9.44943618774414, "lr": 2.64e-05, "tps": 13128, "wall": 334.4} {"step": 67, "train_loss": 9.359128952026367, "lr": 2.68e-05, "tps": 13127, "wall": 339.5} {"step": 68, "train_loss": 9.35368824005127, "lr": 2.72e-05, "tps": 13127, "wall": 344.5} {"step": 69, "train_loss": 9.321499824523926, "lr": 2.7600000000000003e-05, "tps": 13125, "wall": 349.5} {"step": 70, "train_loss": 9.345465660095215, "lr": 2.8e-05, "tps": 13122, "wall": 354.6} {"step": 71, "train_loss": 9.249122619628906, "lr": 2.8400000000000003e-05, "tps": 13121, "wall": 359.6} {"step": 72, "train_loss": 9.262167930603027, "lr": 2.8800000000000002e-05, "tps": 13118, "wall": 364.7} {"step": 73, "train_loss": 9.214588165283203, "lr": 2.92e-05, "tps": 13117, "wall": 369.7} {"step": 74, "train_loss": 9.265022277832031, "lr": 2.96e-05, "tps": 13115, "wall": 374.8} {"step": 75, "train_loss": 9.202199935913086, "lr": 3e-05, "tps": 13113, "wall": 379.8} {"step": 76, "train_loss": 9.133041381835938, "lr": 3.04e-05, "tps": 13108, "wall": 385.0} {"step": 77, "train_loss": 9.183025360107422, "lr": 3.08e-05, "tps": 13107, "wall": 390.0} {"step": 78, "train_loss": 9.15333080291748, "lr": 3.12e-05, "tps": 13106, "wall": 395.0} {"step": 79, "train_loss": 9.059078216552734, "lr": 3.16e-05, "tps": 13104, "wall": 400.1} {"step": 80, "train_loss": 9.081132888793945, "lr": 3.2e-05, "tps": 13103, "wall": 405.1} {"step": 81, "train_loss": 9.058558464050293, "lr": 3.24e-05, "tps": 13101, "wall": 410.2} {"step": 82, "train_loss": 8.988733291625977, "lr": 3.2800000000000004e-05, "tps": 13100, "wall": 415.2} {"step": 83, "train_loss": 9.032718658447266, "lr": 3.32e-05, "tps": 13098, "wall": 420.3} {"step": 84, "train_loss": 8.970378875732422, "lr": 3.3600000000000004e-05, "tps": 13096, "wall": 425.3} {"step": 85, "train_loss": 8.914607048034668, "lr": 3.4e-05, "tps": 13094, "wall": 430.4} {"step": 86, "train_loss": 8.905592918395996, "lr": 3.44e-05, "tps": 13092, "wall": 435.5} {"step": 87, "train_loss": 8.932666778564453, "lr": 3.4800000000000006e-05, "tps": 13091, "wall": 440.5} {"step": 88, "train_loss": 8.892816543579102, "lr": 3.52e-05, "tps": 13088, "wall": 445.6} {"step": 89, "train_loss": 8.82591438293457, "lr": 3.56e-05, "tps": 13087, "wall": 450.7} {"step": 90, "train_loss": 8.843690872192383, "lr": 3.6e-05, "tps": 13086, "wall": 455.7} {"step": 91, "train_loss": 8.799975395202637, "lr": 3.6400000000000004e-05, "tps": 13085, "wall": 460.8} {"step": 92, "train_loss": 8.773869514465332, "lr": 3.68e-05, "tps": 13084, "wall": 465.8} {"step": 93, "train_loss": 8.712754249572754, "lr": 3.72e-05, "tps": 13082, "wall": 470.9} {"step": 94, "train_loss": 8.767532348632812, "lr": 3.76e-05, "tps": 13081, "wall": 475.9} {"step": 95, "train_loss": 8.655813217163086, "lr": 3.8e-05, "tps": 13079, "wall": 481.0} {"step": 96, "train_loss": 8.64760971069336, "lr": 3.8400000000000005e-05, "tps": 13077, "wall": 486.1} {"step": 97, "train_loss": 8.67121696472168, "lr": 3.88e-05, "tps": 13076, "wall": 491.1} {"step": 98, "train_loss": 8.63354778289795, "lr": 3.92e-05, "tps": 13075, "wall": 496.2} {"step": 99, "train_loss": 8.612131118774414, "lr": 3.96e-05, "tps": 13074, "wall": 501.3} {"step": 100, "train_loss": 8.515628814697266, "lr": 4e-05, "tps": 13071, "wall": 506.4} {"step": 101, "train_loss": 8.542848587036133, "lr": 4.0400000000000006e-05, "tps": 13070, "wall": 511.4} {"step": 102, "train_loss": 8.54018497467041, "lr": 4.08e-05, "tps": 13068, "wall": 516.5} {"step": 103, "train_loss": 8.598257064819336, "lr": 4.12e-05, "tps": 13066, "wall": 521.6} {"step": 104, "train_loss": 8.537947654724121, "lr": 4.160000000000001e-05, "tps": 13064, "wall": 526.7} {"step": 105, "train_loss": 8.470306396484375, "lr": 4.2000000000000004e-05, "tps": 13063, "wall": 531.8} {"step": 106, "train_loss": 8.41865348815918, "lr": 4.24e-05, "tps": 13061, "wall": 536.9} {"step": 107, "train_loss": 8.456347465515137, "lr": 4.2800000000000004e-05, "tps": 13061, "wall": 541.9} {"step": 108, "train_loss": 8.339012145996094, "lr": 4.32e-05, "tps": 13059, "wall": 547.0} {"step": 109, "train_loss": 8.368863105773926, "lr": 4.36e-05, "tps": 13058, "wall": 552.1} {"step": 110, "train_loss": 8.38071346282959, "lr": 4.4000000000000006e-05, "tps": 13057, "wall": 557.1} {"step": 111, "train_loss": 8.305474281311035, "lr": 4.44e-05, "tps": 13056, "wall": 562.2} {"step": 112, "train_loss": 8.291518211364746, "lr": 4.48e-05, "tps": 13054, "wall": 567.3} {"step": 113, "train_loss": 8.242180824279785, "lr": 4.52e-05, "tps": 13052, "wall": 572.4} {"step": 114, "train_loss": 8.27255916595459, "lr": 4.5600000000000004e-05, "tps": 13051, "wall": 577.5} {"step": 115, "train_loss": 8.236261367797852, "lr": 4.6e-05, "tps": 13049, "wall": 582.6} {"step": 116, "train_loss": 8.200572967529297, "lr": 4.64e-05, "tps": 13048, "wall": 587.6} {"step": 117, "train_loss": 8.157893180847168, "lr": 4.68e-05, "tps": 13047, "wall": 592.7} {"step": 118, "train_loss": 8.228896141052246, "lr": 4.72e-05, "tps": 13046, "wall": 597.8} {"step": 119, "train_loss": 8.188470840454102, "lr": 4.7600000000000005e-05, "tps": 13045, "wall": 602.8} {"step": 120, "train_loss": 8.172041893005371, "lr": 4.8e-05, "tps": 13044, "wall": 607.9} {"step": 121, "train_loss": 8.056663513183594, "lr": 4.8400000000000004e-05, "tps": 13042, "wall": 613.0} {"step": 122, "train_loss": 8.204581260681152, "lr": 4.88e-05, "tps": 13041, "wall": 618.1} {"step": 123, "train_loss": 8.083930969238281, "lr": 4.92e-05, "tps": 13038, "wall": 623.3} {"step": 124, "train_loss": 8.029297828674316, "lr": 4.9600000000000006e-05, "tps": 13036, "wall": 628.4} {"step": 125, "train_loss": 8.056273460388184, "lr": 5e-05, "tps": 13035, "wall": 633.5} {"step": 126, "train_loss": 7.996861934661865, "lr": 5.04e-05, "tps": 13033, "wall": 638.6} {"step": 127, "train_loss": 7.909967422485352, "lr": 5.08e-05, "tps": 13032, "wall": 643.7} {"step": 128, "train_loss": 8.002439498901367, "lr": 5.1200000000000004e-05, "tps": 13029, "wall": 648.8} {"step": 129, "train_loss": 7.970865249633789, "lr": 5.16e-05, "tps": 13028, "wall": 653.9} {"step": 130, "train_loss": 7.999822616577148, "lr": 5.2000000000000004e-05, "tps": 13027, "wall": 659.0} {"step": 131, "train_loss": 8.008867263793945, "lr": 5.24e-05, "tps": 13025, "wall": 664.1} {"step": 132, "train_loss": 8.023078918457031, "lr": 5.28e-05, "tps": 13024, "wall": 669.2} {"step": 133, "train_loss": 7.960579872131348, "lr": 5.3200000000000006e-05, "tps": 13022, "wall": 674.3} {"step": 134, "train_loss": 7.802445411682129, "lr": 5.36e-05, "tps": 13021, "wall": 679.5} {"step": 135, "train_loss": 7.910876274108887, "lr": 5.4e-05, "tps": 13017, "wall": 684.7} {"step": 136, "train_loss": 7.800398826599121, "lr": 5.44e-05, "tps": 13016, "wall": 689.8} {"step": 137, "train_loss": 7.836018085479736, "lr": 5.4800000000000004e-05, "tps": 13014, "wall": 694.9} {"step": 138, "train_loss": 7.768095970153809, "lr": 5.520000000000001e-05, "tps": 13012, "wall": 700.0} {"step": 139, "train_loss": 7.86049222946167, "lr": 5.56e-05, "tps": 13010, "wall": 705.2} {"step": 140, "train_loss": 7.71937370300293, "lr": 5.6e-05, "tps": 13009, "wall": 710.3} {"step": 141, "train_loss": 7.792503833770752, "lr": 5.640000000000001e-05, "tps": 13006, "wall": 715.5} {"step": 142, "train_loss": 7.803567409515381, "lr": 5.6800000000000005e-05, "tps": 13005, "wall": 720.6} {"step": 143, "train_loss": 7.685601234436035, "lr": 5.72e-05, "tps": 13003, "wall": 725.8} {"step": 144, "train_loss": 7.766866683959961, "lr": 5.7600000000000004e-05, "tps": 13001, "wall": 730.9} {"step": 145, "train_loss": 7.70136833190918, "lr": 5.8e-05, "tps": 12999, "wall": 736.1} {"step": 146, "train_loss": 7.647207736968994, "lr": 5.84e-05, "tps": 12997, "wall": 741.2} {"step": 147, "train_loss": 7.603613376617432, "lr": 5.8800000000000006e-05, "tps": 12994, "wall": 746.4} {"step": 148, "train_loss": 7.579229354858398, "lr": 5.92e-05, "tps": 12992, "wall": 751.6} {"step": 149, "train_loss": 7.562046051025391, "lr": 5.96e-05, "tps": 12990, "wall": 756.7} {"step": 150, "train_loss": 7.6346211433410645, "lr": 6e-05, "tps": 12988, "wall": 761.9} {"step": 151, "train_loss": 7.61287260055542, "lr": 6.0400000000000004e-05, "tps": 12986, "wall": 767.1} {"step": 152, "train_loss": 7.623250961303711, "lr": 6.08e-05, "tps": 12984, "wall": 772.2} {"step": 153, "train_loss": 7.61068868637085, "lr": 6.120000000000001e-05, "tps": 12982, "wall": 777.4} {"step": 154, "train_loss": 7.551749229431152, "lr": 6.16e-05, "tps": 12981, "wall": 782.5} {"step": 155, "train_loss": 7.545273780822754, "lr": 6.2e-05, "tps": 12979, "wall": 787.7} {"step": 156, "train_loss": 7.617772102355957, "lr": 6.24e-05, "tps": 12977, "wall": 792.9} {"step": 157, "train_loss": 7.596831321716309, "lr": 6.280000000000001e-05, "tps": 12975, "wall": 798.0} {"step": 158, "train_loss": 7.539711952209473, "lr": 6.32e-05, "tps": 12974, "wall": 803.2} {"step": 159, "train_loss": 7.51534366607666, "lr": 6.36e-05, "tps": 12971, "wall": 808.4} {"step": 160, "train_loss": 7.577149391174316, "lr": 6.4e-05, "tps": 12970, "wall": 813.5} {"step": 161, "train_loss": 7.522848606109619, "lr": 6.44e-05, "tps": 12968, "wall": 818.6} {"step": 162, "train_loss": 7.439415454864502, "lr": 6.48e-05, "tps": 12967, "wall": 823.8} {"step": 163, "train_loss": 7.500565528869629, "lr": 6.520000000000001e-05, "tps": 12965, "wall": 829.0} {"step": 164, "train_loss": 7.426812171936035, "lr": 6.560000000000001e-05, "tps": 12963, "wall": 834.1} {"step": 165, "train_loss": 7.547463417053223, "lr": 6.6e-05, "tps": 12962, "wall": 839.3} {"step": 166, "train_loss": 7.450392723083496, "lr": 6.64e-05, "tps": 12960, "wall": 844.4} {"step": 167, "train_loss": 7.477350234985352, "lr": 6.68e-05, "tps": 12959, "wall": 849.6} {"step": 168, "train_loss": 7.5270609855651855, "lr": 6.720000000000001e-05, "tps": 12957, "wall": 854.8} {"step": 169, "train_loss": 7.509194374084473, "lr": 6.76e-05, "tps": 12955, "wall": 859.9} {"step": 170, "train_loss": 7.49745512008667, "lr": 6.8e-05, "tps": 12953, "wall": 865.1} {"step": 171, "train_loss": 7.478893280029297, "lr": 6.840000000000001e-05, "tps": 12952, "wall": 870.3} {"step": 172, "train_loss": 7.366469383239746, "lr": 6.88e-05, "tps": 12951, "wall": 875.4} {"step": 173, "train_loss": 7.37886381149292, "lr": 6.92e-05, "tps": 12949, "wall": 880.6} {"step": 174, "train_loss": 7.402528285980225, "lr": 6.960000000000001e-05, "tps": 12948, "wall": 885.8} {"step": 175, "train_loss": 7.411224365234375, "lr": 7.000000000000001e-05, "tps": 12946, "wall": 890.9} {"step": 176, "train_loss": 7.415987014770508, "lr": 7.04e-05, "tps": 12945, "wall": 896.1} {"step": 177, "train_loss": 7.37291145324707, "lr": 7.08e-05, "tps": 12943, "wall": 901.2} {"step": 178, "train_loss": 7.424803733825684, "lr": 7.12e-05, "tps": 12942, "wall": 906.4} {"step": 179, "train_loss": 7.365806579589844, "lr": 7.159999999999999e-05, "tps": 12941, "wall": 911.5} {"step": 180, "train_loss": 7.410187244415283, "lr": 7.2e-05, "tps": 12940, "wall": 916.7} {"step": 181, "train_loss": 7.355527400970459, "lr": 7.240000000000001e-05, "tps": 12939, "wall": 921.8} {"step": 182, "train_loss": 7.326568603515625, "lr": 7.280000000000001e-05, "tps": 12936, "wall": 927.1} {"step": 183, "train_loss": 7.332854270935059, "lr": 7.32e-05, "tps": 12935, "wall": 932.2} {"step": 184, "train_loss": 7.319502830505371, "lr": 7.36e-05, "tps": 12934, "wall": 937.4} {"step": 185, "train_loss": 7.435181617736816, "lr": 7.400000000000001e-05, "tps": 12932, "wall": 942.5} {"step": 186, "train_loss": 7.33798885345459, "lr": 7.44e-05, "tps": 12931, "wall": 947.7} {"step": 187, "train_loss": 7.397373676300049, "lr": 7.48e-05, "tps": 12930, "wall": 952.9} {"step": 188, "train_loss": 7.363593101501465, "lr": 7.52e-05, "tps": 12928, "wall": 958.1} {"step": 189, "train_loss": 7.3236541748046875, "lr": 7.56e-05, "tps": 12927, "wall": 963.2} {"step": 190, "train_loss": 7.340499401092529, "lr": 7.6e-05, "tps": 12926, "wall": 968.4} {"step": 191, "train_loss": 7.195595741271973, "lr": 7.640000000000001e-05, "tps": 12925, "wall": 973.5} {"step": 192, "train_loss": 7.194782257080078, "lr": 7.680000000000001e-05, "tps": 12924, "wall": 978.7} {"step": 193, "train_loss": 7.278714656829834, "lr": 7.72e-05, "tps": 12922, "wall": 983.9} {"step": 194, "train_loss": 7.167997360229492, "lr": 7.76e-05, "tps": 12921, "wall": 989.0} {"step": 195, "train_loss": 7.225996971130371, "lr": 7.8e-05, "tps": 12920, "wall": 994.2} {"step": 196, "train_loss": 7.2295942306518555, "lr": 7.84e-05, "tps": 12919, "wall": 999.3} {"step": 197, "train_loss": 7.264776706695557, "lr": 7.88e-05, "tps": 12918, "wall": 1004.5} {"step": 198, "train_loss": 7.302220821380615, "lr": 7.92e-05, "tps": 12916, "wall": 1009.7} {"step": 199, "train_loss": 7.2558274269104, "lr": 7.960000000000001e-05, "tps": 12916, "wall": 1014.8} {"step": 200, "train_loss": 7.2578959465026855, "lr": 8e-05, "tps": 12915, "wall": 1019.9} {"step": 201, "train_loss": 7.222497940063477, "lr": 8.04e-05, "tps": 12914, "wall": 1025.1} {"step": 202, "train_loss": 7.17840576171875, "lr": 8.080000000000001e-05, "tps": 12912, "wall": 1030.3} {"step": 203, "train_loss": 7.093888282775879, "lr": 8.120000000000001e-05, "tps": 12912, "wall": 1035.4} {"step": 204, "train_loss": 7.216327667236328, "lr": 8.16e-05, "tps": 12910, "wall": 1040.6} {"step": 205, "train_loss": 7.206729888916016, "lr": 8.2e-05, "tps": 12909, "wall": 1045.8} {"step": 206, "train_loss": 7.1880974769592285, "lr": 8.24e-05, "tps": 12908, "wall": 1051.0} {"step": 207, "train_loss": 7.130190372467041, "lr": 8.28e-05, "tps": 12907, "wall": 1056.1} {"step": 208, "train_loss": 7.137142658233643, "lr": 8.320000000000002e-05, "tps": 12905, "wall": 1061.3} {"step": 209, "train_loss": 7.094500541687012, "lr": 8.360000000000001e-05, "tps": 12904, "wall": 1066.5} {"step": 210, "train_loss": 7.135332107543945, "lr": 8.400000000000001e-05, "tps": 12903, "wall": 1071.6} {"step": 211, "train_loss": 7.077711582183838, "lr": 8.44e-05, "tps": 12902, "wall": 1076.8} {"step": 212, "train_loss": 7.1299896240234375, "lr": 8.48e-05, "tps": 12901, "wall": 1082.0} {"step": 213, "train_loss": 7.030309677124023, "lr": 8.52e-05, "tps": 12901, "wall": 1087.1} {"step": 214, "train_loss": 7.116090297698975, "lr": 8.560000000000001e-05, "tps": 12900, "wall": 1092.3} {"step": 215, "train_loss": 7.165168762207031, "lr": 8.6e-05, "tps": 12899, "wall": 1097.4} {"step": 216, "train_loss": 7.179386138916016, "lr": 8.64e-05, "tps": 12898, "wall": 1102.6} {"step": 217, "train_loss": 7.142568111419678, "lr": 8.68e-05, "tps": 12896, "wall": 1107.8} {"step": 218, "train_loss": 7.049089431762695, "lr": 8.72e-05, "tps": 12895, "wall": 1113.0} {"step": 219, "train_loss": 7.11231803894043, "lr": 8.76e-05, "tps": 12894, "wall": 1118.1} {"step": 220, "train_loss": 7.051003456115723, "lr": 8.800000000000001e-05, "tps": 12893, "wall": 1123.3} {"step": 221, "train_loss": 7.13132905960083, "lr": 8.840000000000001e-05, "tps": 12892, "wall": 1128.5} {"step": 222, "train_loss": 7.086899757385254, "lr": 8.88e-05, "tps": 12891, "wall": 1133.6} {"step": 223, "train_loss": 7.179282188415527, "lr": 8.92e-05, "tps": 12890, "wall": 1138.8} {"step": 224, "train_loss": 7.093719005584717, "lr": 8.96e-05, "tps": 12890, "wall": 1143.9} {"step": 225, "train_loss": 7.029384613037109, "lr": 9e-05, "tps": 12889, "wall": 1149.1} {"step": 226, "train_loss": 7.096097469329834, "lr": 9.04e-05, "tps": 12888, "wall": 1154.3} {"step": 227, "train_loss": 7.002593994140625, "lr": 9.080000000000001e-05, "tps": 12887, "wall": 1159.4} {"step": 228, "train_loss": 7.070346832275391, "lr": 9.120000000000001e-05, "tps": 12886, "wall": 1164.6} {"step": 229, "train_loss": 6.986166477203369, "lr": 9.16e-05, "tps": 12885, "wall": 1169.8} {"step": 230, "train_loss": 6.981106758117676, "lr": 9.2e-05, "tps": 12884, "wall": 1175.0} {"step": 231, "train_loss": 7.032906532287598, "lr": 9.240000000000001e-05, "tps": 12883, "wall": 1180.1} {"step": 232, "train_loss": 6.978477954864502, "lr": 9.28e-05, "tps": 12883, "wall": 1185.2} {"step": 233, "train_loss": 6.997651100158691, "lr": 9.32e-05, "tps": 12882, "wall": 1190.4} {"step": 234, "train_loss": 6.963988304138184, "lr": 9.36e-05, "tps": 12881, "wall": 1195.5} {"step": 235, "train_loss": 7.056290626525879, "lr": 9.4e-05, "tps": 12881, "wall": 1200.7} {"step": 236, "train_loss": 6.948718070983887, "lr": 9.44e-05, "tps": 12880, "wall": 1205.9} {"step": 237, "train_loss": 6.96592903137207, "lr": 9.480000000000001e-05, "tps": 12879, "wall": 1211.0} {"step": 238, "train_loss": 6.889782428741455, "lr": 9.520000000000001e-05, "tps": 12879, "wall": 1216.2} {"step": 239, "train_loss": 6.952486038208008, "lr": 9.56e-05, "tps": 12878, "wall": 1221.3} {"step": 240, "train_loss": 7.0038347244262695, "lr": 9.6e-05, "tps": 12877, "wall": 1226.5} {"step": 241, "train_loss": 6.9355974197387695, "lr": 9.64e-05, "tps": 12876, "wall": 1231.7} {"step": 242, "train_loss": 6.983513832092285, "lr": 9.680000000000001e-05, "tps": 12875, "wall": 1236.8} {"step": 243, "train_loss": 6.8895344734191895, "lr": 9.72e-05, "tps": 12874, "wall": 1242.0} {"step": 244, "train_loss": 6.929286003112793, "lr": 9.76e-05, "tps": 12873, "wall": 1247.2} {"step": 245, "train_loss": 7.033448219299316, "lr": 9.800000000000001e-05, "tps": 12872, "wall": 1252.4} {"step": 246, "train_loss": 6.864964485168457, "lr": 9.84e-05, "tps": 12872, "wall": 1257.5} {"step": 247, "train_loss": 6.9052510261535645, "lr": 9.88e-05, "tps": 12871, "wall": 1262.7} {"step": 248, "train_loss": 6.876766204833984, "lr": 9.920000000000001e-05, "tps": 12871, "wall": 1267.8} {"step": 249, "train_loss": 6.899509906768799, "lr": 9.960000000000001e-05, "tps": 12870, "wall": 1273.0} {"step": 250, "train_loss": 6.861688613891602, "lr": 0.0001, "tps": 12869, "wall": 1278.2} {"step": 251, "train_loss": 6.886258125305176, "lr": 0.0001004, "tps": 12868, "wall": 1283.4} {"step": 252, "train_loss": 6.823886871337891, "lr": 0.0001008, "tps": 12867, "wall": 1288.5} {"step": 253, "train_loss": 6.96673583984375, "lr": 0.0001012, "tps": 12866, "wall": 1293.7} {"step": 254, "train_loss": 6.8819732666015625, "lr": 0.0001016, "tps": 12866, "wall": 1298.9} {"step": 255, "train_loss": 6.833759784698486, "lr": 0.00010200000000000001, "tps": 12865, "wall": 1304.0} {"step": 256, "train_loss": 6.800100803375244, "lr": 0.00010240000000000001, "tps": 12864, "wall": 1309.2} {"step": 257, "train_loss": 6.953839302062988, "lr": 0.0001028, "tps": 12864, "wall": 1314.4} {"step": 258, "train_loss": 6.912923812866211, "lr": 0.0001032, "tps": 12863, "wall": 1319.6} {"step": 259, "train_loss": 6.843024730682373, "lr": 0.00010360000000000001, "tps": 12862, "wall": 1324.7} {"step": 260, "train_loss": 6.8170599937438965, "lr": 0.00010400000000000001, "tps": 12861, "wall": 1329.9} {"step": 261, "train_loss": 6.900547504425049, "lr": 0.0001044, "tps": 12861, "wall": 1335.0} {"step": 262, "train_loss": 6.810604572296143, "lr": 0.0001048, "tps": 12860, "wall": 1340.2} {"step": 263, "train_loss": 6.879966735839844, "lr": 0.0001052, "tps": 12859, "wall": 1345.4} {"step": 264, "train_loss": 6.8279852867126465, "lr": 0.0001056, "tps": 12859, "wall": 1350.6} {"step": 265, "train_loss": 6.856398582458496, "lr": 0.00010600000000000002, "tps": 12858, "wall": 1355.7} {"step": 266, "train_loss": 6.82148551940918, "lr": 0.00010640000000000001, "tps": 12857, "wall": 1360.9} {"step": 267, "train_loss": 6.777699947357178, "lr": 0.00010680000000000001, "tps": 12857, "wall": 1366.0} {"step": 268, "train_loss": 6.744632244110107, "lr": 0.0001072, "tps": 12856, "wall": 1371.2} {"step": 269, "train_loss": 6.722272872924805, "lr": 0.0001076, "tps": 12856, "wall": 1376.4} {"step": 270, "train_loss": 6.821207046508789, "lr": 0.000108, "tps": 12855, "wall": 1381.5} {"step": 271, "train_loss": 6.7534332275390625, "lr": 0.0001084, "tps": 12855, "wall": 1386.7} {"step": 272, "train_loss": 6.767140865325928, "lr": 0.0001088, "tps": 12854, "wall": 1391.8} {"step": 273, "train_loss": 6.797300338745117, "lr": 0.00010920000000000001, "tps": 12854, "wall": 1397.0} {"step": 274, "train_loss": 6.7273688316345215, "lr": 0.00010960000000000001, "tps": 12853, "wall": 1402.1} {"step": 275, "train_loss": 6.808360576629639, "lr": 0.00011, "tps": 12852, "wall": 1407.4} {"step": 276, "train_loss": 6.859362602233887, "lr": 0.00011040000000000001, "tps": 12851, "wall": 1412.6} {"step": 277, "train_loss": 6.795162200927734, "lr": 0.00011080000000000001, "tps": 12850, "wall": 1417.8} {"step": 278, "train_loss": 6.805563449859619, "lr": 0.0001112, "tps": 12850, "wall": 1422.9} {"step": 279, "train_loss": 6.908613204956055, "lr": 0.0001116, "tps": 12849, "wall": 1428.1} {"step": 280, "train_loss": 6.711430549621582, "lr": 0.000112, "tps": 12849, "wall": 1433.2} {"step": 281, "train_loss": 6.733260154724121, "lr": 0.0001124, "tps": 12848, "wall": 1438.4} {"step": 282, "train_loss": 6.683751583099365, "lr": 0.00011280000000000002, "tps": 12847, "wall": 1443.5} {"step": 283, "train_loss": 6.720704078674316, "lr": 0.00011320000000000001, "tps": 12847, "wall": 1448.7} {"step": 284, "train_loss": 6.743560314178467, "lr": 0.00011360000000000001, "tps": 12847, "wall": 1453.9} {"step": 285, "train_loss": 6.710814952850342, "lr": 0.000114, "tps": 12846, "wall": 1459.0} {"step": 286, "train_loss": 6.761664390563965, "lr": 0.0001144, "tps": 12845, "wall": 1464.3} {"step": 287, "train_loss": 6.6646881103515625, "lr": 0.0001148, "tps": 12845, "wall": 1469.4} {"step": 288, "train_loss": 6.763951301574707, "lr": 0.00011520000000000001, "tps": 12844, "wall": 1474.6} {"step": 289, "train_loss": 6.691097259521484, "lr": 0.0001156, "tps": 12843, "wall": 1479.7} {"step": 290, "train_loss": 6.724844455718994, "lr": 0.000116, "tps": 12843, "wall": 1484.9} {"step": 291, "train_loss": 6.688225269317627, "lr": 0.0001164, "tps": 12842, "wall": 1490.1} {"step": 292, "train_loss": 6.704649448394775, "lr": 0.0001168, "tps": 12842, "wall": 1495.2} {"step": 293, "train_loss": 6.719408988952637, "lr": 0.00011720000000000002, "tps": 12842, "wall": 1500.4} {"step": 294, "train_loss": 6.676101207733154, "lr": 0.00011760000000000001, "tps": 12841, "wall": 1505.5} {"step": 295, "train_loss": 6.615402698516846, "lr": 0.00011800000000000001, "tps": 12841, "wall": 1510.7} {"step": 296, "train_loss": 6.677227973937988, "lr": 0.0001184, "tps": 12840, "wall": 1515.8} {"step": 297, "train_loss": 6.6828436851501465, "lr": 0.0001188, "tps": 12840, "wall": 1521.0} {"step": 298, "train_loss": 6.643111228942871, "lr": 0.0001192, "tps": 12839, "wall": 1526.2} {"step": 299, "train_loss": 6.635785102844238, "lr": 0.00011960000000000001, "tps": 12838, "wall": 1531.4} {"step": 300, "train_loss": 6.635772228240967, "lr": 0.00012, "tps": 12838, "wall": 1536.5} {"step": 301, "train_loss": 6.68242073059082, "lr": 0.00012040000000000001, "tps": 12837, "wall": 1541.7} {"step": 302, "train_loss": 6.545066833496094, "lr": 0.00012080000000000001, "tps": 12837, "wall": 1546.8} {"step": 303, "train_loss": 6.591639518737793, "lr": 0.0001212, "tps": 12837, "wall": 1552.0} {"step": 304, "train_loss": 6.629812717437744, "lr": 0.0001216, "tps": 12836, "wall": 1557.1} {"step": 305, "train_loss": 6.571229934692383, "lr": 0.00012200000000000001, "tps": 12836, "wall": 1562.3} {"step": 306, "train_loss": 6.536562442779541, "lr": 0.00012240000000000002, "tps": 12835, "wall": 1567.4} {"step": 307, "train_loss": 6.614675045013428, "lr": 0.0001228, "tps": 12835, "wall": 1572.6} {"step": 308, "train_loss": 6.724498748779297, "lr": 0.0001232, "tps": 12834, "wall": 1577.8} {"step": 309, "train_loss": 6.523313999176025, "lr": 0.0001236, "tps": 12834, "wall": 1582.9} {"step": 310, "train_loss": 6.596161842346191, "lr": 0.000124, "tps": 12833, "wall": 1588.2} {"step": 311, "train_loss": 6.574120998382568, "lr": 0.00012440000000000002, "tps": 12832, "wall": 1593.3} {"step": 312, "train_loss": 6.620580673217773, "lr": 0.0001248, "tps": 12832, "wall": 1598.5} {"step": 313, "train_loss": 6.672554016113281, "lr": 0.0001252, "tps": 12832, "wall": 1603.7} {"step": 314, "train_loss": 6.569782733917236, "lr": 0.00012560000000000002, "tps": 12831, "wall": 1608.8} {"step": 315, "train_loss": 6.56313419342041, "lr": 0.000126, "tps": 12831, "wall": 1614.0} {"step": 316, "train_loss": 6.594146728515625, "lr": 0.0001264, "tps": 12830, "wall": 1619.2} {"step": 317, "train_loss": 6.499449253082275, "lr": 0.0001268, "tps": 12829, "wall": 1624.4} {"step": 318, "train_loss": 6.62069034576416, "lr": 0.0001272, "tps": 12829, "wall": 1629.5} {"step": 319, "train_loss": 6.464576721191406, "lr": 0.0001276, "tps": 12829, "wall": 1634.7} {"step": 320, "train_loss": 6.520885467529297, "lr": 0.000128, "tps": 12828, "wall": 1639.9} {"step": 321, "train_loss": 6.476810455322266, "lr": 0.0001284, "tps": 12827, "wall": 1645.1} {"step": 322, "train_loss": 6.488509654998779, "lr": 0.0001288, "tps": 12827, "wall": 1650.3} {"step": 323, "train_loss": 6.472236633300781, "lr": 0.0001292, "tps": 12826, "wall": 1655.4} {"step": 324, "train_loss": 6.536436557769775, "lr": 0.0001296, "tps": 12826, "wall": 1660.6} {"step": 325, "train_loss": 6.62058162689209, "lr": 0.00013000000000000002, "tps": 12826, "wall": 1665.7} {"step": 326, "train_loss": 6.530721664428711, "lr": 0.00013040000000000003, "tps": 12825, "wall": 1670.9} {"step": 327, "train_loss": 6.485265731811523, "lr": 0.0001308, "tps": 12825, "wall": 1676.0} {"step": 328, "train_loss": 6.520178318023682, "lr": 0.00013120000000000002, "tps": 12824, "wall": 1681.2} {"step": 329, "train_loss": 6.477439880371094, "lr": 0.0001316, "tps": 12824, "wall": 1686.4} {"step": 330, "train_loss": 6.538295745849609, "lr": 0.000132, "tps": 12824, "wall": 1691.5} {"step": 331, "train_loss": 6.488994121551514, "lr": 0.00013240000000000002, "tps": 12823, "wall": 1696.7} {"step": 332, "train_loss": 6.464236259460449, "lr": 0.0001328, "tps": 12823, "wall": 1701.9} {"step": 333, "train_loss": 6.39910888671875, "lr": 0.0001332, "tps": 12822, "wall": 1707.1} {"step": 334, "train_loss": 6.5091023445129395, "lr": 0.0001336, "tps": 12822, "wall": 1712.2} {"step": 335, "train_loss": 6.4847893714904785, "lr": 0.000134, "tps": 12821, "wall": 1717.4} {"step": 336, "train_loss": 6.4910430908203125, "lr": 0.00013440000000000001, "tps": 12821, "wall": 1722.6} {"step": 337, "train_loss": 6.48661470413208, "lr": 0.0001348, "tps": 12820, "wall": 1727.7} {"step": 338, "train_loss": 6.379571914672852, "lr": 0.0001352, "tps": 12820, "wall": 1732.9} {"step": 339, "train_loss": 6.437082290649414, "lr": 0.0001356, "tps": 12819, "wall": 1738.1} {"step": 340, "train_loss": 6.496612548828125, "lr": 0.000136, "tps": 12819, "wall": 1743.3} {"step": 341, "train_loss": 6.560155868530273, "lr": 0.00013639999999999998, "tps": 12819, "wall": 1748.4} {"step": 342, "train_loss": 6.492593765258789, "lr": 0.00013680000000000002, "tps": 12818, "wall": 1753.6} {"step": 343, "train_loss": 6.404050350189209, "lr": 0.00013720000000000003, "tps": 12818, "wall": 1758.8} {"step": 344, "train_loss": 6.490845680236816, "lr": 0.0001376, "tps": 12817, "wall": 1764.0} {"step": 345, "train_loss": 6.411348342895508, "lr": 0.00013800000000000002, "tps": 12817, "wall": 1769.1} {"step": 346, "train_loss": 6.374441146850586, "lr": 0.0001384, "tps": 12816, "wall": 1774.3} {"step": 347, "train_loss": 6.405170440673828, "lr": 0.0001388, "tps": 12816, "wall": 1779.5} {"step": 348, "train_loss": 6.326912879943848, "lr": 0.00013920000000000002, "tps": 12815, "wall": 1784.7} {"step": 349, "train_loss": 6.409815311431885, "lr": 0.0001396, "tps": 12815, "wall": 1789.9} {"step": 350, "train_loss": 6.425168991088867, "lr": 0.00014000000000000001, "tps": 12814, "wall": 1795.0} {"step": 351, "train_loss": 6.369142532348633, "lr": 0.0001404, "tps": 12814, "wall": 1800.2} {"step": 352, "train_loss": 6.5238518714904785, "lr": 0.0001408, "tps": 12814, "wall": 1805.4} {"step": 353, "train_loss": 6.375903129577637, "lr": 0.00014120000000000002, "tps": 12813, "wall": 1810.5} {"step": 354, "train_loss": 6.497627258300781, "lr": 0.0001416, "tps": 12813, "wall": 1815.7} {"step": 355, "train_loss": 6.350468158721924, "lr": 0.000142, "tps": 12813, "wall": 1820.8} {"step": 356, "train_loss": 6.392157554626465, "lr": 0.0001424, "tps": 12812, "wall": 1826.0} {"step": 357, "train_loss": 6.322015285491943, "lr": 0.0001428, "tps": 12812, "wall": 1831.2} {"step": 358, "train_loss": 6.411557197570801, "lr": 0.00014319999999999998, "tps": 12811, "wall": 1836.4} {"step": 359, "train_loss": 6.451173782348633, "lr": 0.0001436, "tps": 12811, "wall": 1841.6} {"step": 360, "train_loss": 6.390156269073486, "lr": 0.000144, "tps": 12811, "wall": 1846.7} {"step": 361, "train_loss": 6.431653022766113, "lr": 0.0001444, "tps": 12810, "wall": 1851.9} {"step": 362, "train_loss": 6.34612512588501, "lr": 0.00014480000000000002, "tps": 12810, "wall": 1857.1} {"step": 363, "train_loss": 6.372271537780762, "lr": 0.0001452, "tps": 12810, "wall": 1862.2} {"step": 364, "train_loss": 6.416375637054443, "lr": 0.00014560000000000002, "tps": 12809, "wall": 1867.3} {"step": 365, "train_loss": 6.304420471191406, "lr": 0.00014600000000000003, "tps": 12809, "wall": 1872.5} {"step": 366, "train_loss": 6.4383063316345215, "lr": 0.0001464, "tps": 12809, "wall": 1877.6} {"step": 367, "train_loss": 6.408089637756348, "lr": 0.00014680000000000002, "tps": 12809, "wall": 1882.7} {"step": 368, "train_loss": 6.3286566734313965, "lr": 0.0001472, "tps": 12809, "wall": 1887.9} {"step": 369, "train_loss": 6.3616108894348145, "lr": 0.0001476, "tps": 12809, "wall": 1893.0} {"step": 370, "train_loss": 6.314431667327881, "lr": 0.00014800000000000002, "tps": 12809, "wall": 1898.1} {"step": 371, "train_loss": 6.313862323760986, "lr": 0.0001484, "tps": 12809, "wall": 1903.2} {"step": 372, "train_loss": 6.298117637634277, "lr": 0.0001488, "tps": 12809, "wall": 1908.4} {"step": 373, "train_loss": 6.279856204986572, "lr": 0.0001492, "tps": 12809, "wall": 1913.5} {"step": 374, "train_loss": 6.263341903686523, "lr": 0.0001496, "tps": 12809, "wall": 1918.6} {"step": 375, "train_loss": 6.428635597229004, "lr": 0.00015, "tps": 12809, "wall": 1923.7} {"step": 376, "train_loss": 6.360032558441162, "lr": 0.0001504, "tps": 12809, "wall": 1928.9} {"step": 377, "train_loss": 6.306872844696045, "lr": 0.0001508, "tps": 12809, "wall": 1934.0} {"step": 378, "train_loss": 6.463536262512207, "lr": 0.0001512, "tps": 12809, "wall": 1939.1} {"step": 379, "train_loss": 6.360688209533691, "lr": 0.00015160000000000003, "tps": 12808, "wall": 1944.3} {"step": 380, "train_loss": 6.314515113830566, "lr": 0.000152, "tps": 12809, "wall": 1949.3} {"step": 381, "train_loss": 6.311466217041016, "lr": 0.00015240000000000002, "tps": 12809, "wall": 1954.4} {"step": 382, "train_loss": 6.369007110595703, "lr": 0.00015280000000000003, "tps": 12809, "wall": 1959.5} {"step": 383, "train_loss": 6.3837175369262695, "lr": 0.0001532, "tps": 12809, "wall": 1964.6} {"step": 384, "train_loss": 6.260622501373291, "lr": 0.00015360000000000002, "tps": 12809, "wall": 1969.7} {"step": 385, "train_loss": 6.315306663513184, "lr": 0.000154, "tps": 12809, "wall": 1974.8} {"step": 386, "train_loss": 6.3641791343688965, "lr": 0.0001544, "tps": 12810, "wall": 1979.9} {"step": 387, "train_loss": 6.287482261657715, "lr": 0.00015480000000000002, "tps": 12810, "wall": 1984.9} {"step": 388, "train_loss": 6.23002815246582, "lr": 0.0001552, "tps": 12810, "wall": 1990.0} {"step": 389, "train_loss": 6.358461856842041, "lr": 0.00015560000000000001, "tps": 12811, "wall": 1995.1} {"step": 390, "train_loss": 6.2769927978515625, "lr": 0.000156, "tps": 12811, "wall": 2000.1} {"step": 391, "train_loss": 6.2806549072265625, "lr": 0.0001564, "tps": 12811, "wall": 2005.3} {"step": 392, "train_loss": 6.164433479309082, "lr": 0.0001568, "tps": 12811, "wall": 2010.4} {"step": 393, "train_loss": 6.267524242401123, "lr": 0.0001572, "tps": 12811, "wall": 2015.4} {"step": 394, "train_loss": 6.2877631187438965, "lr": 0.0001576, "tps": 12811, "wall": 2020.5} {"step": 395, "train_loss": 6.271782398223877, "lr": 0.000158, "tps": 12812, "wall": 2025.6} {"step": 396, "train_loss": 6.239223957061768, "lr": 0.0001584, "tps": 12812, "wall": 2030.7} {"step": 397, "train_loss": 6.253592491149902, "lr": 0.00015879999999999998, "tps": 12812, "wall": 2035.7} {"step": 398, "train_loss": 6.261213302612305, "lr": 0.00015920000000000002, "tps": 12813, "wall": 2040.8} {"step": 399, "train_loss": 6.2076263427734375, "lr": 0.00015960000000000003, "tps": 12813, "wall": 2045.9} {"step": 400, "train_loss": 6.244935035705566, "lr": 0.00016, "tps": 12813, "wall": 2050.9} {"step": 401, "train_loss": 6.218770503997803, "lr": 0.00016040000000000002, "tps": 12814, "wall": 2056.0} {"step": 402, "train_loss": 6.261422157287598, "lr": 0.0001608, "tps": 12814, "wall": 2061.0} {"step": 403, "train_loss": 6.313381195068359, "lr": 0.00016120000000000002, "tps": 12814, "wall": 2066.1} {"step": 404, "train_loss": 6.2017388343811035, "lr": 0.00016160000000000002, "tps": 12815, "wall": 2071.2} {"step": 405, "train_loss": 6.193002700805664, "lr": 0.000162, "tps": 12815, "wall": 2076.2} {"step": 406, "train_loss": 6.238607406616211, "lr": 0.00016240000000000002, "tps": 12815, "wall": 2081.3} {"step": 407, "train_loss": 6.3622002601623535, "lr": 0.0001628, "tps": 12816, "wall": 2086.3} {"step": 408, "train_loss": 6.386172294616699, "lr": 0.0001632, "tps": 12816, "wall": 2091.4} {"step": 409, "train_loss": 6.216442108154297, "lr": 0.0001636, "tps": 12817, "wall": 2096.4} {"step": 410, "train_loss": 6.319633960723877, "lr": 0.000164, "tps": 12817, "wall": 2101.5} {"step": 411, "train_loss": 6.14587926864624, "lr": 0.0001644, "tps": 12817, "wall": 2106.5} {"step": 412, "train_loss": 6.170947074890137, "lr": 0.0001648, "tps": 12818, "wall": 2111.6} {"step": 413, "train_loss": 6.24901008605957, "lr": 0.0001652, "tps": 12818, "wall": 2116.6} {"step": 414, "train_loss": 6.289575576782227, "lr": 0.0001656, "tps": 12818, "wall": 2121.7} {"step": 415, "train_loss": 6.283885478973389, "lr": 0.000166, "tps": 12818, "wall": 2126.8} {"step": 416, "train_loss": 6.268581867218018, "lr": 0.00016640000000000003, "tps": 12819, "wall": 2131.9} {"step": 417, "train_loss": 6.209212303161621, "lr": 0.00016680000000000002, "tps": 12819, "wall": 2136.9} {"step": 418, "train_loss": 6.249321937561035, "lr": 0.00016720000000000003, "tps": 12819, "wall": 2141.9} {"step": 419, "train_loss": 6.09821081161499, "lr": 0.0001676, "tps": 12820, "wall": 2147.0} {"step": 420, "train_loss": 6.196371555328369, "lr": 0.00016800000000000002, "tps": 12820, "wall": 2152.1} {"step": 421, "train_loss": 6.126687049865723, "lr": 0.00016840000000000003, "tps": 12821, "wall": 2157.1} {"step": 422, "train_loss": 6.118746757507324, "lr": 0.0001688, "tps": 12821, "wall": 2162.1} {"step": 423, "train_loss": 6.181883811950684, "lr": 0.00016920000000000002, "tps": 12821, "wall": 2167.2} {"step": 424, "train_loss": 6.149712562561035, "lr": 0.0001696, "tps": 12821, "wall": 2172.3} {"step": 425, "train_loss": 6.243256568908691, "lr": 0.00017, "tps": 12822, "wall": 2177.3} {"step": 426, "train_loss": 6.246029853820801, "lr": 0.0001704, "tps": 12822, "wall": 2182.3} {"step": 427, "train_loss": 6.242412567138672, "lr": 0.0001708, "tps": 12822, "wall": 2187.5} {"step": 428, "train_loss": 6.155479907989502, "lr": 0.00017120000000000001, "tps": 12823, "wall": 2192.5} {"step": 429, "train_loss": 6.191985130310059, "lr": 0.0001716, "tps": 12823, "wall": 2197.5} {"step": 430, "train_loss": 6.15164852142334, "lr": 0.000172, "tps": 12824, "wall": 2202.6} {"step": 431, "train_loss": 6.1369781494140625, "lr": 0.0001724, "tps": 12824, "wall": 2207.6} {"step": 432, "train_loss": 6.233741760253906, "lr": 0.0001728, "tps": 12824, "wall": 2212.7} {"step": 433, "train_loss": 6.251614570617676, "lr": 0.0001732, "tps": 12825, "wall": 2217.7} {"step": 434, "train_loss": 6.131402969360352, "lr": 0.0001736, "tps": 12825, "wall": 2222.8} {"step": 435, "train_loss": 6.13899564743042, "lr": 0.00017400000000000003, "tps": 12825, "wall": 2227.8} {"step": 436, "train_loss": 6.082230567932129, "lr": 0.0001744, "tps": 12826, "wall": 2232.9} {"step": 437, "train_loss": 6.133360385894775, "lr": 0.00017480000000000002, "tps": 12826, "wall": 2237.9} {"step": 438, "train_loss": 6.098720550537109, "lr": 0.0001752, "tps": 12827, "wall": 2242.9} {"step": 439, "train_loss": 6.139976501464844, "lr": 0.0001756, "tps": 12827, "wall": 2248.0} {"step": 440, "train_loss": 6.1720194816589355, "lr": 0.00017600000000000002, "tps": 12827, "wall": 2253.1} {"step": 441, "train_loss": 6.062950611114502, "lr": 0.0001764, "tps": 12828, "wall": 2258.1} {"step": 442, "train_loss": 6.083674430847168, "lr": 0.00017680000000000001, "tps": 12828, "wall": 2263.1} {"step": 443, "train_loss": 6.143088340759277, "lr": 0.0001772, "tps": 12828, "wall": 2268.2} {"step": 444, "train_loss": 6.023529052734375, "lr": 0.0001776, "tps": 12829, "wall": 2273.2} {"step": 445, "train_loss": 6.175748825073242, "lr": 0.00017800000000000002, "tps": 12829, "wall": 2278.2} {"step": 446, "train_loss": 6.059772968292236, "lr": 0.0001784, "tps": 12830, "wall": 2283.3} {"step": 447, "train_loss": 6.139204978942871, "lr": 0.0001788, "tps": 12830, "wall": 2288.3} {"step": 448, "train_loss": 6.053457260131836, "lr": 0.0001792, "tps": 12831, "wall": 2293.3} {"step": 449, "train_loss": 6.0684356689453125, "lr": 0.0001796, "tps": 12831, "wall": 2298.3} {"step": 450, "train_loss": 6.162984371185303, "lr": 0.00018, "tps": 12832, "wall": 2303.3} {"step": 451, "train_loss": 6.161435604095459, "lr": 0.0001804, "tps": 12832, "wall": 2308.4} {"step": 452, "train_loss": 6.121722221374512, "lr": 0.0001808, "tps": 12833, "wall": 2313.4} {"step": 453, "train_loss": 6.1175336837768555, "lr": 0.0001812, "tps": 12833, "wall": 2318.4} {"step": 454, "train_loss": 6.106119632720947, "lr": 0.00018160000000000002, "tps": 12834, "wall": 2323.4} {"step": 455, "train_loss": 6.042308807373047, "lr": 0.000182, "tps": 12834, "wall": 2328.4} {"step": 456, "train_loss": 6.144205093383789, "lr": 0.00018240000000000002, "tps": 12835, "wall": 2333.4} {"step": 457, "train_loss": 6.084390163421631, "lr": 0.00018280000000000003, "tps": 12835, "wall": 2338.5} {"step": 458, "train_loss": 6.004528999328613, "lr": 0.0001832, "tps": 12835, "wall": 2343.5} {"step": 459, "train_loss": 5.993685722351074, "lr": 0.00018360000000000002, "tps": 12836, "wall": 2348.5} {"step": 460, "train_loss": 6.115257263183594, "lr": 0.000184, "tps": 12836, "wall": 2353.5} {"step": 461, "train_loss": 5.96043586730957, "lr": 0.0001844, "tps": 12837, "wall": 2358.5} {"step": 462, "train_loss": 6.0621538162231445, "lr": 0.00018480000000000002, "tps": 12838, "wall": 2363.5} {"step": 463, "train_loss": 6.021843910217285, "lr": 0.0001852, "tps": 12838, "wall": 2368.6} {"step": 464, "train_loss": 6.169068336486816, "lr": 0.0001856, "tps": 12839, "wall": 2373.6} {"step": 465, "train_loss": 6.093168258666992, "lr": 0.000186, "tps": 12839, "wall": 2378.5} {"step": 466, "train_loss": 6.090127468109131, "lr": 0.0001864, "tps": 12840, "wall": 2383.5} {"step": 467, "train_loss": 6.082448959350586, "lr": 0.00018680000000000001, "tps": 12840, "wall": 2388.5} {"step": 468, "train_loss": 6.200514793395996, "lr": 0.0001872, "tps": 12841, "wall": 2393.5} {"step": 469, "train_loss": 6.065539360046387, "lr": 0.0001876, "tps": 12842, "wall": 2398.5} {"step": 470, "train_loss": 6.028040409088135, "lr": 0.000188, "tps": 12842, "wall": 2403.5} {"step": 471, "train_loss": 6.111598968505859, "lr": 0.0001884, "tps": 12843, "wall": 2408.5} {"step": 472, "train_loss": 6.041073322296143, "lr": 0.0001888, "tps": 12843, "wall": 2413.5} {"step": 473, "train_loss": 6.0326128005981445, "lr": 0.00018920000000000002, "tps": 12844, "wall": 2418.5} {"step": 474, "train_loss": 5.928859710693359, "lr": 0.00018960000000000003, "tps": 12844, "wall": 2423.5} {"step": 475, "train_loss": 6.08843994140625, "lr": 0.00019, "tps": 12845, "wall": 2428.5} {"step": 476, "train_loss": 5.979431629180908, "lr": 0.00019040000000000002, "tps": 12846, "wall": 2433.5} {"step": 477, "train_loss": 6.024507999420166, "lr": 0.0001908, "tps": 12846, "wall": 2438.4} {"step": 478, "train_loss": 6.083595275878906, "lr": 0.0001912, "tps": 12847, "wall": 2443.4} {"step": 479, "train_loss": 5.927206993103027, "lr": 0.00019160000000000002, "tps": 12848, "wall": 2448.4} {"step": 480, "train_loss": 6.007574558258057, "lr": 0.000192, "tps": 12848, "wall": 2453.4} {"step": 481, "train_loss": 6.030559539794922, "lr": 0.00019240000000000001, "tps": 12849, "wall": 2458.4} {"step": 482, "train_loss": 6.035654067993164, "lr": 0.0001928, "tps": 12850, "wall": 2463.3} {"step": 483, "train_loss": 6.154646873474121, "lr": 0.0001932, "tps": 12850, "wall": 2468.3} {"step": 484, "train_loss": 6.031426429748535, "lr": 0.00019360000000000002, "tps": 12851, "wall": 2473.3} {"step": 485, "train_loss": 6.082369804382324, "lr": 0.000194, "tps": 12852, "wall": 2478.2} {"step": 486, "train_loss": 6.0629072189331055, "lr": 0.0001944, "tps": 12852, "wall": 2483.2} {"step": 487, "train_loss": 6.096935272216797, "lr": 0.0001948, "tps": 12853, "wall": 2488.2} {"step": 488, "train_loss": 6.06242036819458, "lr": 0.0001952, "tps": 12853, "wall": 2493.2} {"step": 489, "train_loss": 5.9375386238098145, "lr": 0.00019559999999999998, "tps": 12854, "wall": 2498.3} {"step": 490, "train_loss": 5.9888916015625, "lr": 0.00019600000000000002, "tps": 12854, "wall": 2503.2} {"step": 491, "train_loss": 6.003706455230713, "lr": 0.00019640000000000003, "tps": 12855, "wall": 2508.2} {"step": 492, "train_loss": 5.974316596984863, "lr": 0.0001968, "tps": 12855, "wall": 2513.2} {"step": 493, "train_loss": 6.040033340454102, "lr": 0.00019720000000000002, "tps": 12856, "wall": 2518.2} {"step": 494, "train_loss": 5.940321445465088, "lr": 0.0001976, "tps": 12857, "wall": 2523.2} {"step": 495, "train_loss": 5.930732727050781, "lr": 0.00019800000000000002, "tps": 12857, "wall": 2528.1} {"step": 496, "train_loss": 6.010073184967041, "lr": 0.00019840000000000002, "tps": 12858, "wall": 2533.1} {"step": 497, "train_loss": 5.964547157287598, "lr": 0.0001988, "tps": 12858, "wall": 2538.1} {"step": 498, "train_loss": 5.923205852508545, "lr": 0.00019920000000000002, "tps": 12859, "wall": 2543.0} {"step": 499, "train_loss": 5.9147772789001465, "lr": 0.0001996, "tps": 12860, "wall": 2548.1} {"step": 500, "train_loss": 5.996562480926514, "lr": 0.0002, "tps": 12860, "wall": 2553.0} {"step": 501, "train_loss": 5.958456993103027, "lr": 0.00020040000000000002, "tps": 12860, "wall": 2558.1} {"step": 502, "train_loss": 5.8637919425964355, "lr": 0.0002008, "tps": 12861, "wall": 2563.1} {"step": 503, "train_loss": 5.967641830444336, "lr": 0.0002012, "tps": 12861, "wall": 2568.1} {"step": 504, "train_loss": 5.955610752105713, "lr": 0.0002016, "tps": 12862, "wall": 2573.1} {"step": 505, "train_loss": 5.957830429077148, "lr": 0.000202, "tps": 12863, "wall": 2578.0} {"step": 506, "train_loss": 5.907709121704102, "lr": 0.0002024, "tps": 12863, "wall": 2583.0} {"step": 507, "train_loss": 5.872612476348877, "lr": 0.0002028, "tps": 12864, "wall": 2587.9} {"step": 508, "train_loss": 5.991995334625244, "lr": 0.0002032, "tps": 12865, "wall": 2592.9} {"step": 509, "train_loss": 5.947447776794434, "lr": 0.00020360000000000002, "tps": 12865, "wall": 2597.8} {"step": 510, "train_loss": 5.925743103027344, "lr": 0.00020400000000000003, "tps": 12866, "wall": 2602.8} {"step": 511, "train_loss": 5.960272789001465, "lr": 0.0002044, "tps": 12866, "wall": 2607.8} {"step": 512, "train_loss": 5.992669105529785, "lr": 0.00020480000000000002, "tps": 12867, "wall": 2612.8} {"step": 513, "train_loss": 5.964126110076904, "lr": 0.00020520000000000003, "tps": 12868, "wall": 2617.7} {"step": 514, "train_loss": 5.889413833618164, "lr": 0.0002056, "tps": 12868, "wall": 2622.7} {"step": 515, "train_loss": 5.96971321105957, "lr": 0.00020600000000000002, "tps": 12869, "wall": 2627.6} {"step": 516, "train_loss": 5.791154384613037, "lr": 0.0002064, "tps": 12870, "wall": 2632.6} {"step": 517, "train_loss": 5.954029560089111, "lr": 0.0002068, "tps": 12871, "wall": 2637.5} {"step": 518, "train_loss": 5.879824638366699, "lr": 0.00020720000000000002, "tps": 12872, "wall": 2642.4} {"step": 519, "train_loss": 5.925008296966553, "lr": 0.0002076, "tps": 12872, "wall": 2647.3} {"step": 520, "train_loss": 5.853214740753174, "lr": 0.00020800000000000001, "tps": 12873, "wall": 2652.3} {"step": 521, "train_loss": 5.837308406829834, "lr": 0.0002084, "tps": 12874, "wall": 2657.2} {"step": 522, "train_loss": 5.908632755279541, "lr": 0.0002088, "tps": 12875, "wall": 2662.1} {"step": 523, "train_loss": 5.883017539978027, "lr": 0.0002092, "tps": 12875, "wall": 2667.1} {"step": 524, "train_loss": 5.961799144744873, "lr": 0.0002096, "tps": 12876, "wall": 2672.1} {"step": 525, "train_loss": 5.817046165466309, "lr": 0.00021, "tps": 12877, "wall": 2677.0} {"step": 526, "train_loss": 5.835506439208984, "lr": 0.0002104, "tps": 12877, "wall": 2681.9} {"step": 527, "train_loss": 5.748818397521973, "lr": 0.00021080000000000003, "tps": 12878, "wall": 2686.8} {"step": 528, "train_loss": 5.821694850921631, "lr": 0.0002112, "tps": 12879, "wall": 2691.8} {"step": 529, "train_loss": 5.891044616699219, "lr": 0.00021160000000000002, "tps": 12882, "wall": 2696.2} {"step": 530, "train_loss": 5.926685810089111, "lr": 0.00021200000000000003, "tps": 12884, "wall": 2701.0} {"step": 531, "train_loss": 5.949342727661133, "lr": 0.0002124, "tps": 12885, "wall": 2705.7} {"step": 532, "train_loss": 5.908756256103516, "lr": 0.00021280000000000002, "tps": 12886, "wall": 2710.5} {"step": 533, "train_loss": 5.9019246101379395, "lr": 0.0002132, "tps": 12888, "wall": 2715.4} {"step": 534, "train_loss": 5.916233062744141, "lr": 0.00021360000000000001, "tps": 12889, "wall": 2720.2} {"step": 535, "train_loss": 5.805663585662842, "lr": 0.00021400000000000002, "tps": 12890, "wall": 2725.2} {"step": 536, "train_loss": 5.899423122406006, "lr": 0.0002144, "tps": 12890, "wall": 2730.0} {"step": 537, "train_loss": 5.834723949432373, "lr": 0.00021480000000000002, "tps": 12891, "wall": 2735.0} {"step": 538, "train_loss": 5.769102096557617, "lr": 0.0002152, "tps": 12892, "wall": 2739.9} {"step": 539, "train_loss": 5.85974645614624, "lr": 0.0002156, "tps": 12893, "wall": 2744.8} {"step": 540, "train_loss": 5.813241481781006, "lr": 0.000216, "tps": 12893, "wall": 2749.8} {"step": 541, "train_loss": 5.810332298278809, "lr": 0.0002164, "tps": 12894, "wall": 2754.8} {"step": 542, "train_loss": 5.937317848205566, "lr": 0.0002168, "tps": 12894, "wall": 2759.7} {"step": 543, "train_loss": 5.846417427062988, "lr": 0.0002172, "tps": 12895, "wall": 2764.7} {"step": 544, "train_loss": 5.8366780281066895, "lr": 0.0002176, "tps": 12896, "wall": 2769.6} {"step": 545, "train_loss": 5.778996467590332, "lr": 0.00021799999999999999, "tps": 12896, "wall": 2774.5} {"step": 546, "train_loss": 5.8378705978393555, "lr": 0.00021840000000000002, "tps": 12897, "wall": 2779.5} {"step": 547, "train_loss": 5.863823413848877, "lr": 0.00021880000000000003, "tps": 12898, "wall": 2784.3} {"step": 548, "train_loss": 5.847461700439453, "lr": 0.00021920000000000002, "tps": 12901, "wall": 2788.8} {"step": 549, "train_loss": 5.971471786499023, "lr": 0.00021960000000000003, "tps": 12902, "wall": 2793.6} {"step": 550, "train_loss": 5.711641311645508, "lr": 0.00022, "tps": 12903, "wall": 2798.4} {"step": 551, "train_loss": 5.859531402587891, "lr": 0.00022040000000000002, "tps": 12904, "wall": 2803.2} {"step": 552, "train_loss": 5.753543376922607, "lr": 0.00022080000000000003, "tps": 12906, "wall": 2808.1} {"step": 553, "train_loss": 5.872531890869141, "lr": 0.0002212, "tps": 12906, "wall": 2813.0} {"step": 554, "train_loss": 5.794254302978516, "lr": 0.00022160000000000002, "tps": 12907, "wall": 2817.9} {"step": 555, "train_loss": 5.850761890411377, "lr": 0.000222, "tps": 12908, "wall": 2822.8} {"step": 556, "train_loss": 5.684512615203857, "lr": 0.0002224, "tps": 12909, "wall": 2827.7} {"step": 557, "train_loss": 5.712203502655029, "lr": 0.0002228, "tps": 12909, "wall": 2832.6} {"step": 558, "train_loss": 5.8260698318481445, "lr": 0.0002232, "tps": 12910, "wall": 2837.6} {"step": 559, "train_loss": 5.773526668548584, "lr": 0.00022360000000000001, "tps": 12911, "wall": 2842.5} {"step": 560, "train_loss": 5.774186134338379, "lr": 0.000224, "tps": 12911, "wall": 2847.5} {"step": 561, "train_loss": 5.751910209655762, "lr": 0.0002244, "tps": 12912, "wall": 2852.5} {"step": 562, "train_loss": 5.795129776000977, "lr": 0.0002248, "tps": 12912, "wall": 2857.4} {"step": 563, "train_loss": 5.819757461547852, "lr": 0.0002252, "tps": 12914, "wall": 2862.0} {"step": 564, "train_loss": 5.727734565734863, "lr": 0.00022560000000000004, "tps": 12916, "wall": 2866.7} {"step": 565, "train_loss": 5.759158611297607, "lr": 0.00022600000000000002, "tps": 12917, "wall": 2871.5} {"step": 566, "train_loss": 5.82168436050415, "lr": 0.00022640000000000003, "tps": 12918, "wall": 2876.3} {"step": 567, "train_loss": 5.827311992645264, "lr": 0.0002268, "tps": 12919, "wall": 2881.2} {"step": 568, "train_loss": 5.67936372756958, "lr": 0.00022720000000000002, "tps": 12920, "wall": 2886.1} {"step": 569, "train_loss": 5.752442359924316, "lr": 0.00022760000000000003, "tps": 12921, "wall": 2891.0} {"step": 570, "train_loss": 5.635977745056152, "lr": 0.000228, "tps": 12922, "wall": 2895.9} {"step": 571, "train_loss": 5.7560224533081055, "lr": 0.00022840000000000002, "tps": 12922, "wall": 2900.8} {"step": 572, "train_loss": 5.678360939025879, "lr": 0.0002288, "tps": 12923, "wall": 2905.8} {"step": 573, "train_loss": 5.825821876525879, "lr": 0.00022920000000000001, "tps": 12923, "wall": 2910.7} {"step": 574, "train_loss": 5.7595534324646, "lr": 0.0002296, "tps": 12924, "wall": 2915.7} {"step": 575, "train_loss": 5.714634895324707, "lr": 0.00023, "tps": 12924, "wall": 2920.6} {"step": 576, "train_loss": 5.815689563751221, "lr": 0.00023040000000000002, "tps": 12925, "wall": 2925.6} {"step": 577, "train_loss": 5.689175128936768, "lr": 0.0002308, "tps": 12925, "wall": 2930.5} {"step": 578, "train_loss": 5.701148986816406, "lr": 0.0002312, "tps": 12926, "wall": 2935.5} {"step": 579, "train_loss": 5.733248233795166, "lr": 0.0002316, "tps": 12926, "wall": 2940.4} {"step": 580, "train_loss": 5.748325347900391, "lr": 0.000232, "tps": 12927, "wall": 2945.4} {"step": 581, "train_loss": 5.806573390960693, "lr": 0.0002324, "tps": 12927, "wall": 2950.4} {"step": 582, "train_loss": 5.746426582336426, "lr": 0.0002328, "tps": 12928, "wall": 2955.3} {"step": 583, "train_loss": 5.75889778137207, "lr": 0.00023320000000000003, "tps": 12929, "wall": 2960.2} {"step": 584, "train_loss": 5.7984418869018555, "lr": 0.0002336, "tps": 12929, "wall": 2965.1} {"step": 585, "train_loss": 5.66950798034668, "lr": 0.00023400000000000002, "tps": 12930, "wall": 2970.0} {"step": 586, "train_loss": 5.785399436950684, "lr": 0.00023440000000000003, "tps": 12931, "wall": 2974.9} {"step": 587, "train_loss": 5.6552019119262695, "lr": 0.00023480000000000002, "tps": 12931, "wall": 2979.9} {"step": 588, "train_loss": 5.678261756896973, "lr": 0.00023520000000000002, "tps": 12932, "wall": 2984.9} {"step": 589, "train_loss": 5.702921390533447, "lr": 0.0002356, "tps": 12932, "wall": 2989.8} {"step": 590, "train_loss": 5.707201957702637, "lr": 0.00023600000000000002, "tps": 12933, "wall": 2994.7} {"step": 591, "train_loss": 5.819362163543701, "lr": 0.0002364, "tps": 12933, "wall": 2999.7} {"step": 592, "train_loss": 5.743590831756592, "lr": 0.0002368, "tps": 12934, "wall": 3004.7} {"step": 593, "train_loss": 5.791676998138428, "lr": 0.00023720000000000002, "tps": 12934, "wall": 3009.6} {"step": 594, "train_loss": 5.776898384094238, "lr": 0.0002376, "tps": 12935, "wall": 3014.6} {"step": 595, "train_loss": 5.68189811706543, "lr": 0.000238, "tps": 12935, "wall": 3019.5} {"step": 596, "train_loss": 5.629362106323242, "lr": 0.0002384, "tps": 12935, "wall": 3024.5} {"step": 597, "train_loss": 5.748600006103516, "lr": 0.0002388, "tps": 12936, "wall": 3029.5} {"step": 598, "train_loss": 5.839866638183594, "lr": 0.00023920000000000001, "tps": 12936, "wall": 3034.4} {"step": 599, "train_loss": 5.703601837158203, "lr": 0.0002396, "tps": 12937, "wall": 3039.4} {"step": 600, "train_loss": 5.73879861831665, "lr": 0.00024, "tps": 12937, "wall": 3044.4} {"step": 601, "train_loss": 5.640645503997803, "lr": 0.00024040000000000002, "tps": 12937, "wall": 3049.4} {"step": 602, "train_loss": 5.802707195281982, "lr": 0.00024080000000000003, "tps": 12938, "wall": 3054.4} {"step": 603, "train_loss": 5.694733142852783, "lr": 0.0002412, "tps": 12938, "wall": 3059.4} {"step": 604, "train_loss": 5.678302764892578, "lr": 0.00024160000000000002, "tps": 12938, "wall": 3064.3} {"step": 605, "train_loss": 5.678246974945068, "lr": 0.00024200000000000003, "tps": 12939, "wall": 3069.3} {"step": 606, "train_loss": 5.648252487182617, "lr": 0.0002424, "tps": 12939, "wall": 3074.3} {"step": 607, "train_loss": 5.6632771492004395, "lr": 0.00024280000000000002, "tps": 12939, "wall": 3079.3} {"step": 608, "train_loss": 5.683871269226074, "lr": 0.0002432, "tps": 12939, "wall": 3084.4} {"step": 609, "train_loss": 5.5546464920043945, "lr": 0.0002436, "tps": 12940, "wall": 3089.4} {"step": 610, "train_loss": 5.747114181518555, "lr": 0.00024400000000000002, "tps": 12940, "wall": 3094.4} {"step": 611, "train_loss": 5.613054275512695, "lr": 0.00024440000000000003, "tps": 12940, "wall": 3099.4} {"step": 612, "train_loss": 5.612577438354492, "lr": 0.00024480000000000004, "tps": 12940, "wall": 3104.4} {"step": 613, "train_loss": 5.704916000366211, "lr": 0.0002452, "tps": 12941, "wall": 3109.4} {"step": 614, "train_loss": 5.631939888000488, "lr": 0.0002456, "tps": 12941, "wall": 3114.4} {"step": 615, "train_loss": 5.7205705642700195, "lr": 0.000246, "tps": 12941, "wall": 3119.4} {"step": 616, "train_loss": 5.748003005981445, "lr": 0.0002464, "tps": 12941, "wall": 3124.4} {"step": 617, "train_loss": 5.782521724700928, "lr": 0.00024680000000000004, "tps": 12942, "wall": 3129.4} {"step": 618, "train_loss": 5.589323997497559, "lr": 0.0002472, "tps": 12942, "wall": 3134.4} {"step": 619, "train_loss": 5.691083908081055, "lr": 0.0002476, "tps": 12942, "wall": 3139.4} {"step": 620, "train_loss": 5.7374420166015625, "lr": 0.000248, "tps": 12942, "wall": 3144.5} {"step": 621, "train_loss": 5.676213264465332, "lr": 0.0002484, "tps": 12942, "wall": 3149.5} {"step": 622, "train_loss": 5.6023736000061035, "lr": 0.00024880000000000003, "tps": 12943, "wall": 3154.5} {"step": 623, "train_loss": 5.742042064666748, "lr": 0.0002492, "tps": 12943, "wall": 3159.5} {"step": 624, "train_loss": 5.6953535079956055, "lr": 0.0002496, "tps": 12943, "wall": 3164.5} {"step": 625, "train_loss": 5.582660675048828, "lr": 0.00025, "tps": 12943, "wall": 3169.5} {"step": 626, "train_loss": 5.646921634674072, "lr": 0.0002504, "tps": 12944, "wall": 3174.5} {"step": 627, "train_loss": 5.683225154876709, "lr": 0.0002508, "tps": 12944, "wall": 3179.5} {"step": 628, "train_loss": 5.6818952560424805, "lr": 0.00025120000000000003, "tps": 12944, "wall": 3184.5} {"step": 629, "train_loss": 5.637875556945801, "lr": 0.0002516, "tps": 12944, "wall": 3189.5} {"step": 630, "train_loss": 5.710309982299805, "lr": 0.000252, "tps": 12945, "wall": 3194.5} {"step": 631, "train_loss": 5.575571060180664, "lr": 0.0002524, "tps": 12945, "wall": 3199.5} {"step": 632, "train_loss": 5.69234037399292, "lr": 0.0002528, "tps": 12945, "wall": 3204.5} {"step": 633, "train_loss": 5.620065212249756, "lr": 0.00025320000000000003, "tps": 12945, "wall": 3209.5} {"step": 634, "train_loss": 5.572121620178223, "lr": 0.0002536, "tps": 12945, "wall": 3214.5} {"step": 635, "train_loss": 5.682713508605957, "lr": 0.000254, "tps": 12946, "wall": 3219.6} {"step": 636, "train_loss": 5.630777835845947, "lr": 0.0002544, "tps": 12946, "wall": 3224.6} {"step": 637, "train_loss": 5.605785846710205, "lr": 0.0002548, "tps": 12946, "wall": 3229.6} {"step": 638, "train_loss": 5.545088768005371, "lr": 0.0002552, "tps": 12946, "wall": 3234.5} {"step": 639, "train_loss": 5.665183067321777, "lr": 0.0002556, "tps": 12947, "wall": 3239.5} {"step": 640, "train_loss": 5.581580638885498, "lr": 0.000256, "tps": 12947, "wall": 3244.5} {"step": 641, "train_loss": 5.513541221618652, "lr": 0.0002564, "tps": 12947, "wall": 3249.6} {"step": 642, "train_loss": 5.533535480499268, "lr": 0.0002568, "tps": 12947, "wall": 3254.6} {"step": 643, "train_loss": 5.614610195159912, "lr": 0.0002572, "tps": 12948, "wall": 3259.6} {"step": 644, "train_loss": 5.6726908683776855, "lr": 0.0002576, "tps": 12947, "wall": 3264.7} {"step": 645, "train_loss": 5.604567527770996, "lr": 0.000258, "tps": 12948, "wall": 3269.6} {"step": 646, "train_loss": 5.493133068084717, "lr": 0.0002584, "tps": 12948, "wall": 3274.6} {"step": 647, "train_loss": 5.62930154800415, "lr": 0.00025880000000000006, "tps": 12948, "wall": 3279.6} {"step": 648, "train_loss": 5.702630519866943, "lr": 0.0002592, "tps": 12949, "wall": 3284.6} {"step": 649, "train_loss": 5.536123275756836, "lr": 0.0002596, "tps": 12949, "wall": 3289.6} {"step": 650, "train_loss": 5.625580310821533, "lr": 0.00026000000000000003, "tps": 12949, "wall": 3294.6} {"step": 651, "train_loss": 5.671883583068848, "lr": 0.00026040000000000004, "tps": 12949, "wall": 3299.6} {"step": 652, "train_loss": 5.656143665313721, "lr": 0.00026080000000000005, "tps": 12949, "wall": 3304.7} {"step": 653, "train_loss": 5.713288307189941, "lr": 0.0002612, "tps": 12950, "wall": 3309.7} {"step": 654, "train_loss": 5.628629207611084, "lr": 0.0002616, "tps": 12950, "wall": 3314.7} {"step": 655, "train_loss": 5.604288101196289, "lr": 0.000262, "tps": 12950, "wall": 3319.7} {"step": 656, "train_loss": 5.587828159332275, "lr": 0.00026240000000000004, "tps": 12950, "wall": 3324.8} {"step": 657, "train_loss": 5.633610725402832, "lr": 0.00026280000000000005, "tps": 12950, "wall": 3329.8} {"step": 658, "train_loss": 5.548878192901611, "lr": 0.0002632, "tps": 12950, "wall": 3334.8} {"step": 659, "train_loss": 5.520743370056152, "lr": 0.0002636, "tps": 12951, "wall": 3339.8} {"step": 660, "train_loss": 5.568305492401123, "lr": 0.000264, "tps": 12951, "wall": 3344.8} {"step": 661, "train_loss": 5.54009485244751, "lr": 0.00026440000000000003, "tps": 12951, "wall": 3349.8} {"step": 662, "train_loss": 5.560774803161621, "lr": 0.00026480000000000004, "tps": 12951, "wall": 3354.8} {"step": 663, "train_loss": 5.602258205413818, "lr": 0.0002652, "tps": 12951, "wall": 3359.9} {"step": 664, "train_loss": 5.567882537841797, "lr": 0.0002656, "tps": 12951, "wall": 3364.9} {"step": 665, "train_loss": 5.483578205108643, "lr": 0.000266, "tps": 12951, "wall": 3369.9} {"step": 666, "train_loss": 5.591720104217529, "lr": 0.0002664, "tps": 12952, "wall": 3374.9} {"step": 667, "train_loss": 5.627083778381348, "lr": 0.00026680000000000003, "tps": 12952, "wall": 3379.9} {"step": 668, "train_loss": 5.501709461212158, "lr": 0.0002672, "tps": 12952, "wall": 3385.0} {"step": 669, "train_loss": 5.589934349060059, "lr": 0.0002676, "tps": 12952, "wall": 3390.0} {"step": 670, "train_loss": 5.58474063873291, "lr": 0.000268, "tps": 12952, "wall": 3395.0} {"step": 671, "train_loss": 5.532108783721924, "lr": 0.0002684, "tps": 12953, "wall": 3400.0} {"step": 672, "train_loss": 5.52168083190918, "lr": 0.00026880000000000003, "tps": 12953, "wall": 3405.0} {"step": 673, "train_loss": 5.606819152832031, "lr": 0.0002692, "tps": 12953, "wall": 3410.0} {"step": 674, "train_loss": 5.500093460083008, "lr": 0.0002696, "tps": 12953, "wall": 3415.0} {"step": 675, "train_loss": 5.549217700958252, "lr": 0.00027, "tps": 12953, "wall": 3420.0} {"step": 676, "train_loss": 5.523038864135742, "lr": 0.0002704, "tps": 12954, "wall": 3425.0} {"step": 677, "train_loss": 5.528746604919434, "lr": 0.0002708, "tps": 12954, "wall": 3430.0} {"step": 678, "train_loss": 5.57552433013916, "lr": 0.0002712, "tps": 12954, "wall": 3435.0} {"step": 679, "train_loss": 5.616130828857422, "lr": 0.0002716, "tps": 12954, "wall": 3440.0} {"step": 680, "train_loss": 5.568203926086426, "lr": 0.000272, "tps": 12954, "wall": 3445.1} {"step": 681, "train_loss": 5.514626502990723, "lr": 0.0002724, "tps": 12954, "wall": 3450.1} {"step": 682, "train_loss": 5.483175277709961, "lr": 0.00027279999999999996, "tps": 12955, "wall": 3455.1} {"step": 683, "train_loss": 5.492404937744141, "lr": 0.00027319999999999997, "tps": 12955, "wall": 3460.1} {"step": 684, "train_loss": 5.434774875640869, "lr": 0.00027360000000000004, "tps": 12955, "wall": 3465.1} {"step": 685, "train_loss": 5.510507583618164, "lr": 0.00027400000000000005, "tps": 12955, "wall": 3470.2} {"step": 686, "train_loss": 5.654592990875244, "lr": 0.00027440000000000006, "tps": 12955, "wall": 3475.2} {"step": 687, "train_loss": 5.59937858581543, "lr": 0.0002748, "tps": 12955, "wall": 3480.2} {"step": 688, "train_loss": 5.459660530090332, "lr": 0.0002752, "tps": 12956, "wall": 3485.2} {"step": 689, "train_loss": 5.568676948547363, "lr": 0.00027560000000000003, "tps": 12956, "wall": 3490.2} {"step": 690, "train_loss": 5.484584808349609, "lr": 0.00027600000000000004, "tps": 12956, "wall": 3495.2} {"step": 691, "train_loss": 5.594359874725342, "lr": 0.00027640000000000005, "tps": 12956, "wall": 3500.2} {"step": 692, "train_loss": 5.543590068817139, "lr": 0.0002768, "tps": 12956, "wall": 3505.2} {"step": 693, "train_loss": 5.5158185958862305, "lr": 0.0002772, "tps": 12956, "wall": 3510.2} {"step": 694, "train_loss": 5.579851150512695, "lr": 0.0002776, "tps": 12957, "wall": 3515.2} {"step": 695, "train_loss": 5.5614471435546875, "lr": 0.00027800000000000004, "tps": 12957, "wall": 3520.3} {"step": 696, "train_loss": 5.527743339538574, "lr": 0.00027840000000000005, "tps": 12957, "wall": 3525.3} {"step": 697, "train_loss": 5.508007526397705, "lr": 0.0002788, "tps": 12957, "wall": 3530.3} {"step": 698, "train_loss": 5.510560035705566, "lr": 0.0002792, "tps": 12957, "wall": 3535.2} {"step": 699, "train_loss": 5.519960403442383, "lr": 0.0002796, "tps": 12958, "wall": 3540.3} {"step": 700, "train_loss": 5.49217414855957, "lr": 0.00028000000000000003, "tps": 12958, "wall": 3545.3} {"step": 701, "train_loss": 5.429018497467041, "lr": 0.00028040000000000004, "tps": 12958, "wall": 3550.3} {"step": 702, "train_loss": 5.463597297668457, "lr": 0.0002808, "tps": 12958, "wall": 3555.3} {"step": 703, "train_loss": 5.420702934265137, "lr": 0.0002812, "tps": 12958, "wall": 3560.3} {"step": 704, "train_loss": 5.543501377105713, "lr": 0.0002816, "tps": 12958, "wall": 3565.4} {"step": 705, "train_loss": 5.509710788726807, "lr": 0.000282, "tps": 12958, "wall": 3570.4} {"step": 706, "train_loss": 5.419300556182861, "lr": 0.00028240000000000003, "tps": 12958, "wall": 3575.4} {"step": 707, "train_loss": 5.536778450012207, "lr": 0.0002828, "tps": 12958, "wall": 3580.5} {"step": 708, "train_loss": 5.467130661010742, "lr": 0.0002832, "tps": 12958, "wall": 3585.6} {"step": 709, "train_loss": 5.539925575256348, "lr": 0.0002836, "tps": 12958, "wall": 3590.6} {"step": 710, "train_loss": 5.477188587188721, "lr": 0.000284, "tps": 12958, "wall": 3595.7} {"step": 711, "train_loss": 5.507214069366455, "lr": 0.0002844, "tps": 12958, "wall": 3600.8} {"step": 712, "train_loss": 5.367311477661133, "lr": 0.0002848, "tps": 12958, "wall": 3605.9} {"step": 713, "train_loss": 5.377236366271973, "lr": 0.0002852, "tps": 12958, "wall": 3611.0} {"step": 714, "train_loss": 5.462746620178223, "lr": 0.0002856, "tps": 12958, "wall": 3616.1} {"step": 715, "train_loss": 5.487159252166748, "lr": 0.000286, "tps": 12958, "wall": 3621.2} {"step": 716, "train_loss": 5.448348045349121, "lr": 0.00028639999999999997, "tps": 12957, "wall": 3626.3} {"step": 717, "train_loss": 5.460391521453857, "lr": 0.0002868, "tps": 12957, "wall": 3631.4} {"step": 718, "train_loss": 5.42954158782959, "lr": 0.0002872, "tps": 12957, "wall": 3636.5} {"step": 719, "train_loss": 5.477403163909912, "lr": 0.0002876, "tps": 12957, "wall": 3641.7} {"step": 720, "train_loss": 5.5542755126953125, "lr": 0.000288, "tps": 12957, "wall": 3646.8} {"step": 721, "train_loss": 5.460492134094238, "lr": 0.00028839999999999996, "tps": 12956, "wall": 3651.9} {"step": 722, "train_loss": 5.3784379959106445, "lr": 0.0002888, "tps": 12956, "wall": 3657.1} {"step": 723, "train_loss": 5.50382137298584, "lr": 0.00028920000000000004, "tps": 12956, "wall": 3662.2} {"step": 724, "train_loss": 5.4511518478393555, "lr": 0.00028960000000000005, "tps": 12955, "wall": 3667.4} {"step": 725, "train_loss": 5.5294880867004395, "lr": 0.00029000000000000006, "tps": 12955, "wall": 3672.5} {"step": 726, "train_loss": 5.5343852043151855, "lr": 0.0002904, "tps": 12955, "wall": 3677.6} {"step": 727, "train_loss": 5.40963077545166, "lr": 0.0002908, "tps": 12955, "wall": 3682.7} {"step": 728, "train_loss": 5.43172550201416, "lr": 0.00029120000000000003, "tps": 12954, "wall": 3687.9} {"step": 729, "train_loss": 5.402311325073242, "lr": 0.00029160000000000004, "tps": 12954, "wall": 3693.0} {"step": 730, "train_loss": 5.422787666320801, "lr": 0.00029200000000000005, "tps": 12954, "wall": 3698.2} {"step": 731, "train_loss": 5.444425582885742, "lr": 0.0002924, "tps": 12953, "wall": 3703.3} {"step": 732, "train_loss": 5.400594711303711, "lr": 0.0002928, "tps": 12953, "wall": 3708.5} {"step": 733, "train_loss": 5.397210597991943, "lr": 0.0002932, "tps": 12953, "wall": 3713.6} {"step": 734, "train_loss": 5.478955268859863, "lr": 0.00029360000000000003, "tps": 12952, "wall": 3718.8} {"step": 735, "train_loss": 5.533449649810791, "lr": 0.00029400000000000004, "tps": 12952, "wall": 3723.9} {"step": 736, "train_loss": 5.400540828704834, "lr": 0.0002944, "tps": 12952, "wall": 3729.0} {"step": 737, "train_loss": 5.3377580642700195, "lr": 0.0002948, "tps": 12952, "wall": 3734.1} {"step": 738, "train_loss": 5.479832172393799, "lr": 0.0002952, "tps": 12952, "wall": 3739.3} {"step": 739, "train_loss": 5.453027725219727, "lr": 0.00029560000000000003, "tps": 12951, "wall": 3744.5} {"step": 740, "train_loss": 5.385915279388428, "lr": 0.00029600000000000004, "tps": 12951, "wall": 3749.6} {"step": 741, "train_loss": 5.461893081665039, "lr": 0.0002964, "tps": 12951, "wall": 3754.7} {"step": 742, "train_loss": 5.42415714263916, "lr": 0.0002968, "tps": 12950, "wall": 3759.8} {"step": 743, "train_loss": 5.410772800445557, "lr": 0.0002972, "tps": 12950, "wall": 3764.9} {"step": 744, "train_loss": 5.548166751861572, "lr": 0.0002976, "tps": 12950, "wall": 3770.1} {"step": 745, "train_loss": 5.344998359680176, "lr": 0.000298, "tps": 12950, "wall": 3775.2} {"step": 746, "train_loss": 5.469427108764648, "lr": 0.0002984, "tps": 12950, "wall": 3780.3} {"step": 747, "train_loss": 5.484825611114502, "lr": 0.0002988, "tps": 12949, "wall": 3785.4} {"step": 748, "train_loss": 5.3822479248046875, "lr": 0.0002992, "tps": 12949, "wall": 3790.5} {"step": 749, "train_loss": 5.371377468109131, "lr": 0.0002996, "tps": 12949, "wall": 3795.6} {"step": 750, "train_loss": 5.438387870788574, "lr": 0.0003, "tps": 12949, "wall": 3800.8} {"step": 751, "train_loss": 5.463041305541992, "lr": 0.0003004, "tps": 12949, "wall": 3805.9} {"step": 752, "train_loss": 5.348359107971191, "lr": 0.0003008, "tps": 12948, "wall": 3811.1} {"step": 753, "train_loss": 5.353653907775879, "lr": 0.0003012, "tps": 12948, "wall": 3816.2} {"step": 754, "train_loss": 5.345923900604248, "lr": 0.0003016, "tps": 12948, "wall": 3821.3} {"step": 755, "train_loss": 5.460442066192627, "lr": 0.00030199999999999997, "tps": 12948, "wall": 3826.4} {"step": 756, "train_loss": 5.418931484222412, "lr": 0.0003024, "tps": 12947, "wall": 3831.6} {"step": 757, "train_loss": 5.3339691162109375, "lr": 0.0003028, "tps": 12947, "wall": 3836.7} {"step": 758, "train_loss": 5.42163610458374, "lr": 0.00030320000000000005, "tps": 12947, "wall": 3841.8} {"step": 759, "train_loss": 5.3358564376831055, "lr": 0.00030360000000000006, "tps": 12947, "wall": 3846.9} {"step": 760, "train_loss": 5.4040045738220215, "lr": 0.000304, "tps": 12947, "wall": 3852.0} {"step": 761, "train_loss": 5.325562953948975, "lr": 0.0003044, "tps": 12947, "wall": 3857.1} {"step": 762, "train_loss": 5.408895492553711, "lr": 0.00030480000000000004, "tps": 12946, "wall": 3862.3} {"step": 763, "train_loss": 5.331888198852539, "lr": 0.00030520000000000005, "tps": 12946, "wall": 3867.5} {"step": 764, "train_loss": 5.4797868728637695, "lr": 0.00030560000000000006, "tps": 12946, "wall": 3872.6} {"step": 765, "train_loss": 5.401251316070557, "lr": 0.000306, "tps": 12945, "wall": 3877.7} {"step": 766, "train_loss": 5.382944583892822, "lr": 0.0003064, "tps": 12945, "wall": 3882.8} {"step": 767, "train_loss": 5.407533645629883, "lr": 0.00030680000000000003, "tps": 12945, "wall": 3888.0} {"step": 768, "train_loss": 5.454697608947754, "lr": 0.00030720000000000004, "tps": 12945, "wall": 3893.1} {"step": 769, "train_loss": 5.382604598999023, "lr": 0.00030760000000000005, "tps": 12945, "wall": 3898.2} {"step": 770, "train_loss": 5.329397678375244, "lr": 0.000308, "tps": 12945, "wall": 3903.3} {"step": 771, "train_loss": 5.3831987380981445, "lr": 0.0003084, "tps": 12944, "wall": 3908.4} {"step": 772, "train_loss": 5.317332744598389, "lr": 0.0003088, "tps": 12944, "wall": 3913.6} {"step": 773, "train_loss": 5.322814464569092, "lr": 0.00030920000000000003, "tps": 12944, "wall": 3918.7} {"step": 774, "train_loss": 5.455862045288086, "lr": 0.00030960000000000004, "tps": 12943, "wall": 3923.9} {"step": 775, "train_loss": 5.4454264640808105, "lr": 0.00031, "tps": 12943, "wall": 3929.0} {"step": 776, "train_loss": 5.389196872711182, "lr": 0.0003104, "tps": 12943, "wall": 3934.1} {"step": 777, "train_loss": 5.459235191345215, "lr": 0.0003108, "tps": 12943, "wall": 3939.2} {"step": 778, "train_loss": 5.356931686401367, "lr": 0.00031120000000000003, "tps": 12943, "wall": 3944.4} {"step": 779, "train_loss": 5.340535640716553, "lr": 0.0003116, "tps": 12942, "wall": 3949.5} {"step": 780, "train_loss": 5.325107097625732, "lr": 0.000312, "tps": 12942, "wall": 3954.6} {"step": 781, "train_loss": 5.414668083190918, "lr": 0.0003124, "tps": 12942, "wall": 3959.8} {"step": 782, "train_loss": 5.30817985534668, "lr": 0.0003128, "tps": 12942, "wall": 3964.9} {"step": 783, "train_loss": 5.4657087326049805, "lr": 0.0003132, "tps": 12941, "wall": 3970.1} {"step": 784, "train_loss": 5.279942512512207, "lr": 0.0003136, "tps": 12941, "wall": 3975.2} {"step": 785, "train_loss": 5.431490421295166, "lr": 0.000314, "tps": 12941, "wall": 3980.3} {"step": 786, "train_loss": 5.298947334289551, "lr": 0.0003144, "tps": 12941, "wall": 3985.5} {"step": 787, "train_loss": 5.373107433319092, "lr": 0.0003148, "tps": 12940, "wall": 3990.7} {"step": 788, "train_loss": 5.308611869812012, "lr": 0.0003152, "tps": 12940, "wall": 3995.8} {"step": 789, "train_loss": 5.322030544281006, "lr": 0.0003156, "tps": 12940, "wall": 4000.9} {"step": 790, "train_loss": 5.322301864624023, "lr": 0.000316, "tps": 12940, "wall": 4006.0} {"step": 791, "train_loss": 5.328780651092529, "lr": 0.0003164, "tps": 12940, "wall": 4011.2} {"step": 792, "train_loss": 5.275051593780518, "lr": 0.0003168, "tps": 12939, "wall": 4016.3} {"step": 793, "train_loss": 5.38682746887207, "lr": 0.0003172, "tps": 12939, "wall": 4021.4} {"step": 794, "train_loss": 5.40399694442749, "lr": 0.00031759999999999997, "tps": 12939, "wall": 4026.5} {"step": 795, "train_loss": 5.252516269683838, "lr": 0.00031800000000000003, "tps": 12939, "wall": 4031.7} {"step": 796, "train_loss": 5.406332969665527, "lr": 0.00031840000000000004, "tps": 12939, "wall": 4036.8} {"step": 797, "train_loss": 5.261051177978516, "lr": 0.00031880000000000005, "tps": 12938, "wall": 4041.9} {"step": 798, "train_loss": 5.337342262268066, "lr": 0.00031920000000000006, "tps": 12938, "wall": 4047.1} {"step": 799, "train_loss": 5.243715286254883, "lr": 0.0003196, "tps": 12938, "wall": 4052.3} {"step": 800, "train_loss": 5.395998954772949, "lr": 0.00032, "tps": 12937, "wall": 4057.4} {"step": 801, "train_loss": 5.341279029846191, "lr": 0.00032040000000000004, "tps": 12937, "wall": 4062.6} {"step": 802, "train_loss": 5.431926727294922, "lr": 0.00032080000000000005, "tps": 12937, "wall": 4067.7} {"step": 803, "train_loss": 5.354260444641113, "lr": 0.00032120000000000006, "tps": 12937, "wall": 4072.8} {"step": 804, "train_loss": 5.378561019897461, "lr": 0.0003216, "tps": 12937, "wall": 4077.9} {"step": 805, "train_loss": 5.461839199066162, "lr": 0.000322, "tps": 12936, "wall": 4083.0} {"step": 806, "train_loss": 5.2990827560424805, "lr": 0.00032240000000000003, "tps": 12936, "wall": 4088.2} {"step": 807, "train_loss": 5.300728797912598, "lr": 0.00032280000000000004, "tps": 12936, "wall": 4093.3} {"step": 808, "train_loss": 5.311367511749268, "lr": 0.00032320000000000005, "tps": 12936, "wall": 4098.4} {"step": 809, "train_loss": 5.324341297149658, "lr": 0.0003236, "tps": 12936, "wall": 4103.6} {"step": 810, "train_loss": 5.257938385009766, "lr": 0.000324, "tps": 12935, "wall": 4108.7} {"step": 811, "train_loss": 5.270914077758789, "lr": 0.0003244, "tps": 12935, "wall": 4113.9} {"step": 812, "train_loss": 5.127988815307617, "lr": 0.00032480000000000003, "tps": 12935, "wall": 4119.0} {"step": 813, "train_loss": 5.302048206329346, "lr": 0.0003252, "tps": 12935, "wall": 4124.1} {"step": 814, "train_loss": 5.339770317077637, "lr": 0.0003256, "tps": 12934, "wall": 4129.3} {"step": 815, "train_loss": 5.2749199867248535, "lr": 0.000326, "tps": 12934, "wall": 4134.4} {"step": 816, "train_loss": 5.354966163635254, "lr": 0.0003264, "tps": 12934, "wall": 4139.5} {"step": 817, "train_loss": 5.299873352050781, "lr": 0.00032680000000000003, "tps": 12934, "wall": 4144.7} {"step": 818, "train_loss": 5.336575508117676, "lr": 0.0003272, "tps": 12934, "wall": 4149.8} {"step": 819, "train_loss": 5.352538108825684, "lr": 0.0003276, "tps": 12933, "wall": 4154.9} {"step": 820, "train_loss": 5.275312900543213, "lr": 0.000328, "tps": 12933, "wall": 4160.1} {"step": 821, "train_loss": 5.2870073318481445, "lr": 0.0003284, "tps": 12933, "wall": 4165.3} {"step": 822, "train_loss": 5.243016719818115, "lr": 0.0003288, "tps": 12933, "wall": 4170.4} {"step": 823, "train_loss": 5.416879653930664, "lr": 0.0003292, "tps": 12932, "wall": 4175.5} {"step": 824, "train_loss": 5.299139022827148, "lr": 0.0003296, "tps": 12932, "wall": 4180.7} {"step": 825, "train_loss": 5.276993274688721, "lr": 0.00033, "tps": 12932, "wall": 4185.8} {"step": 826, "train_loss": 5.294687747955322, "lr": 0.0003304, "tps": 12932, "wall": 4191.0} {"step": 827, "train_loss": 5.339985370635986, "lr": 0.0003308, "tps": 12931, "wall": 4196.1} {"step": 828, "train_loss": 5.402297019958496, "lr": 0.0003312, "tps": 12931, "wall": 4201.3} {"step": 829, "train_loss": 5.347886085510254, "lr": 0.0003316, "tps": 12931, "wall": 4206.4} {"step": 830, "train_loss": 5.278829097747803, "lr": 0.000332, "tps": 12931, "wall": 4211.5} {"step": 831, "train_loss": 5.2288994789123535, "lr": 0.0003324, "tps": 12931, "wall": 4216.6} {"step": 832, "train_loss": 5.29140043258667, "lr": 0.00033280000000000007, "tps": 12931, "wall": 4221.8} {"step": 833, "train_loss": 5.346423149108887, "lr": 0.0003332, "tps": 12930, "wall": 4226.9} {"step": 834, "train_loss": 5.364577293395996, "lr": 0.00033360000000000003, "tps": 12930, "wall": 4232.1} {"step": 835, "train_loss": 5.256248950958252, "lr": 0.00033400000000000004, "tps": 12930, "wall": 4237.2} {"step": 836, "train_loss": 5.42708683013916, "lr": 0.00033440000000000005, "tps": 12930, "wall": 4242.3} {"step": 837, "train_loss": 5.256687641143799, "lr": 0.00033480000000000006, "tps": 12929, "wall": 4247.4} {"step": 838, "train_loss": 5.400329113006592, "lr": 0.0003352, "tps": 12929, "wall": 4252.6} {"step": 839, "train_loss": 5.29494047164917, "lr": 0.0003356, "tps": 12929, "wall": 4257.7} {"step": 840, "train_loss": 5.314636707305908, "lr": 0.00033600000000000004, "tps": 12929, "wall": 4262.8} {"step": 841, "train_loss": 5.214656352996826, "lr": 0.00033640000000000005, "tps": 12929, "wall": 4268.0} {"step": 842, "train_loss": 5.171053409576416, "lr": 0.00033680000000000006, "tps": 12929, "wall": 4273.1} {"step": 843, "train_loss": 5.21352481842041, "lr": 0.0003372, "tps": 12928, "wall": 4278.2} {"step": 844, "train_loss": 5.177850723266602, "lr": 0.0003376, "tps": 12928, "wall": 4283.4} {"step": 845, "train_loss": 5.213889122009277, "lr": 0.00033800000000000003, "tps": 12928, "wall": 4288.6} {"step": 846, "train_loss": 5.3076887130737305, "lr": 0.00033840000000000004, "tps": 12927, "wall": 4293.7} {"step": 847, "train_loss": 5.335256099700928, "lr": 0.0003388, "tps": 12927, "wall": 4298.8} {"step": 848, "train_loss": 5.25025749206543, "lr": 0.0003392, "tps": 12927, "wall": 4304.0} {"step": 849, "train_loss": 5.250413417816162, "lr": 0.0003396, "tps": 12927, "wall": 4309.1} {"step": 850, "train_loss": 5.207926273345947, "lr": 0.00034, "tps": 12927, "wall": 4314.2} {"step": 851, "train_loss": 5.263923168182373, "lr": 0.00034040000000000003, "tps": 12927, "wall": 4319.3} {"step": 852, "train_loss": 5.2844624519348145, "lr": 0.0003408, "tps": 12926, "wall": 4324.5} {"step": 853, "train_loss": 5.371564865112305, "lr": 0.0003412, "tps": 12926, "wall": 4329.6} {"step": 854, "train_loss": 5.224803924560547, "lr": 0.0003416, "tps": 12926, "wall": 4334.8} {"step": 855, "train_loss": 5.284096717834473, "lr": 0.000342, "tps": 12926, "wall": 4339.9} {"step": 856, "train_loss": 5.30938720703125, "lr": 0.00034240000000000003, "tps": 12925, "wall": 4345.1} {"step": 857, "train_loss": 5.249260902404785, "lr": 0.0003428, "tps": 12925, "wall": 4350.2} {"step": 858, "train_loss": 5.234516620635986, "lr": 0.0003432, "tps": 12925, "wall": 4355.4} {"step": 859, "train_loss": 5.244704723358154, "lr": 0.0003436, "tps": 12925, "wall": 4360.5} {"step": 860, "train_loss": 5.186657905578613, "lr": 0.000344, "tps": 12925, "wall": 4365.7} {"step": 861, "train_loss": 5.203670501708984, "lr": 0.0003444, "tps": 12924, "wall": 4370.8} {"step": 862, "train_loss": 5.186431407928467, "lr": 0.0003448, "tps": 12924, "wall": 4376.0} {"step": 863, "train_loss": 5.179869174957275, "lr": 0.0003452, "tps": 12924, "wall": 4381.1} {"step": 864, "train_loss": 5.227642059326172, "lr": 0.0003456, "tps": 12924, "wall": 4386.2} {"step": 865, "train_loss": 5.335268020629883, "lr": 0.000346, "tps": 12924, "wall": 4391.4} {"step": 866, "train_loss": 5.16691255569458, "lr": 0.0003464, "tps": 12923, "wall": 4396.5} {"step": 867, "train_loss": 5.302791595458984, "lr": 0.00034679999999999997, "tps": 12923, "wall": 4401.6} {"step": 868, "train_loss": 5.211005210876465, "lr": 0.0003472, "tps": 12923, "wall": 4406.8} {"step": 869, "train_loss": 5.201194763183594, "lr": 0.00034760000000000005, "tps": 12923, "wall": 4411.9} {"step": 870, "train_loss": 5.163672924041748, "lr": 0.00034800000000000006, "tps": 12923, "wall": 4417.0} {"step": 871, "train_loss": 5.226396083831787, "lr": 0.00034840000000000007, "tps": 12922, "wall": 4422.2} {"step": 872, "train_loss": 5.194231033325195, "lr": 0.0003488, "tps": 12922, "wall": 4427.3} {"step": 873, "train_loss": 5.206887245178223, "lr": 0.00034920000000000003, "tps": 12922, "wall": 4432.4} {"step": 874, "train_loss": 5.1826252937316895, "lr": 0.00034960000000000004, "tps": 12922, "wall": 4437.6} {"step": 875, "train_loss": 5.23326301574707, "lr": 0.00035000000000000005, "tps": 12922, "wall": 4442.7} {"step": 876, "train_loss": 5.256241798400879, "lr": 0.0003504, "tps": 12922, "wall": 4447.8} {"step": 877, "train_loss": 5.214084625244141, "lr": 0.0003508, "tps": 12921, "wall": 4453.0} {"step": 878, "train_loss": 5.249508857727051, "lr": 0.0003512, "tps": 12921, "wall": 4458.1} {"step": 879, "train_loss": 5.158962249755859, "lr": 0.00035160000000000004, "tps": 12921, "wall": 4463.2} {"step": 880, "train_loss": 5.152047157287598, "lr": 0.00035200000000000005, "tps": 12921, "wall": 4468.4} {"step": 881, "train_loss": 5.0853166580200195, "lr": 0.0003524, "tps": 12921, "wall": 4473.5} {"step": 882, "train_loss": 5.253781318664551, "lr": 0.0003528, "tps": 12920, "wall": 4478.7} {"step": 883, "train_loss": 5.241611957550049, "lr": 0.0003532, "tps": 12920, "wall": 4483.8} {"step": 884, "train_loss": 5.29595422744751, "lr": 0.00035360000000000003, "tps": 12920, "wall": 4488.9} {"step": 885, "train_loss": 5.181746482849121, "lr": 0.00035400000000000004, "tps": 12920, "wall": 4494.0} {"step": 886, "train_loss": 5.139272212982178, "lr": 0.0003544, "tps": 12920, "wall": 4499.2} {"step": 887, "train_loss": 5.100183963775635, "lr": 0.0003548, "tps": 12920, "wall": 4504.3} {"step": 888, "train_loss": 5.071255683898926, "lr": 0.0003552, "tps": 12919, "wall": 4509.4} {"step": 889, "train_loss": 5.1168012619018555, "lr": 0.0003556, "tps": 12919, "wall": 4514.6} {"step": 890, "train_loss": 5.32720947265625, "lr": 0.00035600000000000003, "tps": 12919, "wall": 4519.7} {"step": 891, "train_loss": 5.127945423126221, "lr": 0.0003564, "tps": 12919, "wall": 4524.9} {"step": 892, "train_loss": 5.120978832244873, "lr": 0.0003568, "tps": 12919, "wall": 4530.0} {"step": 893, "train_loss": 5.196165561676025, "lr": 0.0003572, "tps": 12918, "wall": 4535.1} {"step": 894, "train_loss": 5.125482559204102, "lr": 0.0003576, "tps": 12918, "wall": 4540.3} {"step": 895, "train_loss": 5.261534690856934, "lr": 0.00035800000000000003, "tps": 12918, "wall": 4545.4} {"step": 896, "train_loss": 5.237512588500977, "lr": 0.0003584, "tps": 12918, "wall": 4550.5} {"step": 897, "train_loss": 5.228179931640625, "lr": 0.0003588, "tps": 12918, "wall": 4555.7} {"step": 898, "train_loss": 5.171537399291992, "lr": 0.0003592, "tps": 12917, "wall": 4560.9} {"step": 899, "train_loss": 5.128933906555176, "lr": 0.0003596, "tps": 12917, "wall": 4566.0} {"step": 900, "train_loss": 5.156101226806641, "lr": 0.00036, "tps": 12917, "wall": 4571.1} {"step": 901, "train_loss": 5.227888107299805, "lr": 0.0003604, "tps": 12917, "wall": 4576.2} {"step": 902, "train_loss": 5.217113018035889, "lr": 0.0003608, "tps": 12917, "wall": 4581.3} {"step": 903, "train_loss": 5.205323219299316, "lr": 0.0003612, "tps": 12917, "wall": 4586.5} {"step": 904, "train_loss": 5.212242603302002, "lr": 0.0003616, "tps": 12916, "wall": 4591.7} {"step": 905, "train_loss": 5.174870491027832, "lr": 0.000362, "tps": 12916, "wall": 4596.8} {"step": 906, "train_loss": 5.155285835266113, "lr": 0.0003624, "tps": 12916, "wall": 4602.0} {"step": 907, "train_loss": 5.141669750213623, "lr": 0.00036280000000000004, "tps": 12916, "wall": 4607.1} {"step": 908, "train_loss": 5.096489906311035, "lr": 0.00036320000000000005, "tps": 12916, "wall": 4612.3} {"step": 909, "train_loss": 5.200392723083496, "lr": 0.00036360000000000006, "tps": 12915, "wall": 4617.4} {"step": 910, "train_loss": 5.174771785736084, "lr": 0.000364, "tps": 12915, "wall": 4622.5} {"step": 911, "train_loss": 5.160182952880859, "lr": 0.0003644, "tps": 12915, "wall": 4627.7} {"step": 912, "train_loss": 5.178170204162598, "lr": 0.00036480000000000003, "tps": 12915, "wall": 4632.8} {"step": 913, "train_loss": 5.17773962020874, "lr": 0.00036520000000000004, "tps": 12915, "wall": 4637.9} {"step": 914, "train_loss": 5.17728328704834, "lr": 0.00036560000000000005, "tps": 12915, "wall": 4643.1} {"step": 915, "train_loss": 5.172386169433594, "lr": 0.000366, "tps": 12914, "wall": 4648.3} {"step": 916, "train_loss": 5.239079475402832, "lr": 0.0003664, "tps": 12914, "wall": 4653.4} {"step": 917, "train_loss": 5.1782941818237305, "lr": 0.0003668, "tps": 12914, "wall": 4658.5} {"step": 918, "train_loss": 5.09865665435791, "lr": 0.00036720000000000004, "tps": 12914, "wall": 4663.6} {"step": 919, "train_loss": 5.19330358505249, "lr": 0.00036760000000000004, "tps": 12914, "wall": 4668.8} {"step": 920, "train_loss": 5.066971302032471, "lr": 0.000368, "tps": 12913, "wall": 4673.9} {"step": 921, "train_loss": 5.139760971069336, "lr": 0.0003684, "tps": 12913, "wall": 4679.0} {"step": 922, "train_loss": 5.091315746307373, "lr": 0.0003688, "tps": 12913, "wall": 4684.2} {"step": 923, "train_loss": 5.173414707183838, "lr": 0.00036920000000000003, "tps": 12913, "wall": 4689.3} {"step": 924, "train_loss": 5.197332382202148, "lr": 0.00036960000000000004, "tps": 12913, "wall": 4694.4} {"step": 925, "train_loss": 5.145449638366699, "lr": 0.00037, "tps": 12913, "wall": 4699.6} {"step": 926, "train_loss": 5.185613632202148, "lr": 0.0003704, "tps": 12912, "wall": 4704.8} {"step": 927, "train_loss": 5.086558818817139, "lr": 0.0003708, "tps": 12912, "wall": 4709.9} {"step": 928, "train_loss": 5.095090866088867, "lr": 0.0003712, "tps": 12912, "wall": 4715.1} {"step": 929, "train_loss": 5.084308624267578, "lr": 0.00037160000000000003, "tps": 12912, "wall": 4720.2} {"step": 930, "train_loss": 5.127131938934326, "lr": 0.000372, "tps": 12912, "wall": 4725.4} {"step": 931, "train_loss": 5.168671607971191, "lr": 0.0003724, "tps": 12911, "wall": 4730.5} {"step": 932, "train_loss": 5.201559066772461, "lr": 0.0003728, "tps": 12911, "wall": 4735.6} {"step": 933, "train_loss": 5.117642402648926, "lr": 0.0003732, "tps": 12911, "wall": 4740.8} {"step": 934, "train_loss": 5.084695816040039, "lr": 0.00037360000000000003, "tps": 12911, "wall": 4745.9} {"step": 935, "train_loss": 5.117243766784668, "lr": 0.000374, "tps": 12911, "wall": 4751.0} {"step": 936, "train_loss": 5.094130516052246, "lr": 0.0003744, "tps": 12911, "wall": 4756.2} {"step": 937, "train_loss": 5.048742294311523, "lr": 0.0003748, "tps": 12910, "wall": 4761.3} {"step": 938, "train_loss": 5.26018762588501, "lr": 0.0003752, "tps": 12910, "wall": 4766.5} {"step": 939, "train_loss": 5.150074481964111, "lr": 0.0003756, "tps": 12910, "wall": 4771.6} {"step": 940, "train_loss": 4.986924171447754, "lr": 0.000376, "tps": 12910, "wall": 4776.7} {"step": 941, "train_loss": 5.096118927001953, "lr": 0.0003764, "tps": 12910, "wall": 4781.9} {"step": 942, "train_loss": 5.140353679656982, "lr": 0.0003768, "tps": 12910, "wall": 4787.0} {"step": 943, "train_loss": 5.061984539031982, "lr": 0.00037720000000000006, "tps": 12909, "wall": 4792.1} {"step": 944, "train_loss": 5.092776298522949, "lr": 0.0003776, "tps": 12909, "wall": 4797.3} {"step": 945, "train_loss": 5.134352207183838, "lr": 0.000378, "tps": 12909, "wall": 4802.4} {"step": 946, "train_loss": 5.117870807647705, "lr": 0.00037840000000000004, "tps": 12909, "wall": 4807.5} {"step": 947, "train_loss": 5.218264579772949, "lr": 0.00037880000000000005, "tps": 12909, "wall": 4812.7} {"step": 948, "train_loss": 5.1242265701293945, "lr": 0.00037920000000000006, "tps": 12909, "wall": 4817.8} {"step": 949, "train_loss": 5.060122966766357, "lr": 0.0003796, "tps": 12908, "wall": 4823.0} {"step": 950, "train_loss": 5.055283546447754, "lr": 0.00038, "tps": 12908, "wall": 4828.2} {"step": 951, "train_loss": 5.0067667961120605, "lr": 0.00038040000000000003, "tps": 12908, "wall": 4833.3} {"step": 952, "train_loss": 5.085114479064941, "lr": 0.00038080000000000004, "tps": 12908, "wall": 4838.5} {"step": 953, "train_loss": 5.119616508483887, "lr": 0.00038120000000000005, "tps": 12907, "wall": 4843.6} {"step": 954, "train_loss": 5.100530624389648, "lr": 0.0003816, "tps": 12907, "wall": 4848.7} {"step": 955, "train_loss": 4.923511028289795, "lr": 0.000382, "tps": 12907, "wall": 4853.9} {"step": 956, "train_loss": 5.003081798553467, "lr": 0.0003824, "tps": 12907, "wall": 4859.0} {"step": 957, "train_loss": 5.099199295043945, "lr": 0.00038280000000000003, "tps": 12907, "wall": 4864.2} {"step": 958, "train_loss": 4.977171897888184, "lr": 0.00038320000000000004, "tps": 12907, "wall": 4869.3} {"step": 959, "train_loss": 5.03582763671875, "lr": 0.0003836, "tps": 12906, "wall": 4874.5} {"step": 960, "train_loss": 4.9712233543396, "lr": 0.000384, "tps": 12906, "wall": 4879.6} {"step": 961, "train_loss": 5.040082931518555, "lr": 0.0003844, "tps": 12906, "wall": 4884.8} {"step": 962, "train_loss": 4.985476016998291, "lr": 0.00038480000000000003, "tps": 12906, "wall": 4889.9} {"step": 963, "train_loss": 5.00779914855957, "lr": 0.00038520000000000004, "tps": 12906, "wall": 4895.1} {"step": 964, "train_loss": 5.012748718261719, "lr": 0.0003856, "tps": 12905, "wall": 4900.2} {"step": 965, "train_loss": 5.111207008361816, "lr": 0.000386, "tps": 12905, "wall": 4905.4} {"step": 966, "train_loss": 5.082116603851318, "lr": 0.0003864, "tps": 12905, "wall": 4910.5} {"step": 967, "train_loss": 5.042976379394531, "lr": 0.0003868, "tps": 12905, "wall": 4915.7} {"step": 968, "train_loss": 5.100941181182861, "lr": 0.00038720000000000003, "tps": 12905, "wall": 4920.8} {"step": 969, "train_loss": 4.96515417098999, "lr": 0.0003876, "tps": 12905, "wall": 4926.0} {"step": 970, "train_loss": 5.085428237915039, "lr": 0.000388, "tps": 12904, "wall": 4931.1} {"step": 971, "train_loss": 4.936301231384277, "lr": 0.0003884, "tps": 12904, "wall": 4936.2} {"step": 972, "train_loss": 5.0225830078125, "lr": 0.0003888, "tps": 12904, "wall": 4941.4} {"step": 973, "train_loss": 5.039892196655273, "lr": 0.00038920000000000003, "tps": 12904, "wall": 4946.6} {"step": 974, "train_loss": 5.02803373336792, "lr": 0.0003896, "tps": 12904, "wall": 4951.7} {"step": 975, "train_loss": 5.056571006774902, "lr": 0.00039, "tps": 12903, "wall": 4956.9} {"step": 976, "train_loss": 5.078827857971191, "lr": 0.0003904, "tps": 12903, "wall": 4962.0} {"step": 977, "train_loss": 4.953367710113525, "lr": 0.0003908, "tps": 12903, "wall": 4967.1} {"step": 978, "train_loss": 5.0864577293396, "lr": 0.00039119999999999997, "tps": 12903, "wall": 4972.3} {"step": 979, "train_loss": 5.002409934997559, "lr": 0.0003916, "tps": 12903, "wall": 4977.4} {"step": 980, "train_loss": 5.088358402252197, "lr": 0.00039200000000000004, "tps": 12903, "wall": 4982.5} {"step": 981, "train_loss": 4.967309951782227, "lr": 0.00039240000000000005, "tps": 12903, "wall": 4987.7} {"step": 982, "train_loss": 5.045736312866211, "lr": 0.00039280000000000006, "tps": 12902, "wall": 4992.8} {"step": 983, "train_loss": 4.999208450317383, "lr": 0.0003932, "tps": 12902, "wall": 4997.9} {"step": 984, "train_loss": 5.02837610244751, "lr": 0.0003936, "tps": 12902, "wall": 5003.1} {"step": 985, "train_loss": 4.960477352142334, "lr": 0.00039400000000000004, "tps": 12902, "wall": 5008.3} {"step": 986, "train_loss": 4.940474987030029, "lr": 0.00039440000000000005, "tps": 12902, "wall": 5013.4} {"step": 987, "train_loss": 5.008482933044434, "lr": 0.00039480000000000006, "tps": 12902, "wall": 5018.6} {"step": 988, "train_loss": 5.09538459777832, "lr": 0.0003952, "tps": 12901, "wall": 5023.7} {"step": 989, "train_loss": 5.009078502655029, "lr": 0.0003956, "tps": 12901, "wall": 5028.9} {"step": 990, "train_loss": 5.0546040534973145, "lr": 0.00039600000000000003, "tps": 12901, "wall": 5034.0} {"step": 991, "train_loss": 5.066396236419678, "lr": 0.00039640000000000004, "tps": 12901, "wall": 5039.1} {"step": 992, "train_loss": 5.028505802154541, "lr": 0.00039680000000000005, "tps": 12901, "wall": 5044.3} {"step": 993, "train_loss": 5.019338130950928, "lr": 0.0003972, "tps": 12901, "wall": 5049.4} {"step": 994, "train_loss": 4.982344150543213, "lr": 0.0003976, "tps": 12900, "wall": 5054.5} {"step": 995, "train_loss": 4.998553276062012, "lr": 0.000398, "tps": 12900, "wall": 5059.7} {"step": 996, "train_loss": 5.026206016540527, "lr": 0.00039840000000000003, "tps": 12900, "wall": 5064.9} {"step": 997, "train_loss": 4.895677089691162, "lr": 0.00039880000000000004, "tps": 12900, "wall": 5070.0} {"step": 998, "train_loss": 4.881150245666504, "lr": 0.0003992, "tps": 12900, "wall": 5075.2} {"step": 999, "train_loss": 4.932165145874023, "lr": 0.0003996, "tps": 12899, "wall": 5080.4} {"step": 1000, "train_loss": 4.946451663970947, "lr": 0.0004, "tps": 12899, "wall": 5085.5, "val_loss_monitor": 5.0032383646423275} {"step": 1001, "train_loss": 5.049793720245361, "lr": 0.00039999999898047517, "tps": 12773, "wall": 5140.8} {"step": 1002, "train_loss": 5.049690246582031, "lr": 0.00039999999592190056, "tps": 12773, "wall": 5146.0} {"step": 1003, "train_loss": 4.979762077331543, "lr": 0.00039999999082427625, "tps": 12773, "wall": 5151.3} {"step": 1004, "train_loss": 4.8603644371032715, "lr": 0.00039999998368760235, "tps": 12772, "wall": 5156.5} {"step": 1005, "train_loss": 4.935542106628418, "lr": 0.0003999999745118789, "tps": 12772, "wall": 5161.7} {"step": 1006, "train_loss": 5.018393516540527, "lr": 0.00039999996329710593, "tps": 12772, "wall": 5166.8} {"step": 1007, "train_loss": 5.131832599639893, "lr": 0.00039999995004328374, "tps": 12772, "wall": 5172.0} {"step": 1008, "train_loss": 4.953432559967041, "lr": 0.0003999999347504123, "tps": 12772, "wall": 5177.1} {"step": 1009, "train_loss": 4.972070217132568, "lr": 0.00039999991741849187, "tps": 12772, "wall": 5182.3} {"step": 1010, "train_loss": 5.111318588256836, "lr": 0.0003999998980475227, "tps": 12772, "wall": 5187.5} {"step": 1011, "train_loss": 4.9764723777771, "lr": 0.00039999987663750483, "tps": 12772, "wall": 5192.7} {"step": 1012, "train_loss": 4.964090824127197, "lr": 0.0003999998531884387, "tps": 12772, "wall": 5197.8} {"step": 1013, "train_loss": 4.919774055480957, "lr": 0.00039999982770032446, "tps": 12772, "wall": 5203.0} {"step": 1014, "train_loss": 5.030452728271484, "lr": 0.0003999998001731625, "tps": 12772, "wall": 5208.1} {"step": 1015, "train_loss": 4.955636024475098, "lr": 0.00039999977060695304, "tps": 12772, "wall": 5213.2} {"step": 1016, "train_loss": 4.948298454284668, "lr": 0.00039999973900169643, "tps": 12772, "wall": 5218.4} {"step": 1017, "train_loss": 4.913895606994629, "lr": 0.000399999705357393, "tps": 12772, "wall": 5223.5} {"step": 1018, "train_loss": 4.894491195678711, "lr": 0.0003999996696740432, "tps": 12772, "wall": 5228.7} {"step": 1019, "train_loss": 4.9469404220581055, "lr": 0.00039999963195164743, "tps": 12772, "wall": 5233.8} {"step": 1020, "train_loss": 5.047122001647949, "lr": 0.0003999995921902061, "tps": 12772, "wall": 5239.0} {"step": 1021, "train_loss": 5.043478965759277, "lr": 0.0003999995503897196, "tps": 12771, "wall": 5244.2} {"step": 1022, "train_loss": 4.925594329833984, "lr": 0.0003999995065501884, "tps": 12771, "wall": 5249.3} {"step": 1023, "train_loss": 5.04356575012207, "lr": 0.00039999946067161316, "tps": 12771, "wall": 5254.5} {"step": 1024, "train_loss": 4.895684719085693, "lr": 0.0003999994127539943, "tps": 12771, "wall": 5259.6} {"step": 1025, "train_loss": 4.978384971618652, "lr": 0.0003999993627973323, "tps": 12771, "wall": 5264.7} {"step": 1026, "train_loss": 4.970042705535889, "lr": 0.0003999993108016278, "tps": 12771, "wall": 5269.9} {"step": 1027, "train_loss": 4.869287967681885, "lr": 0.00039999925676688136, "tps": 12771, "wall": 5275.0} {"step": 1028, "train_loss": 4.995716094970703, "lr": 0.0003999992006930936, "tps": 12771, "wall": 5280.2} {"step": 1029, "train_loss": 5.053715229034424, "lr": 0.00039999914258026514, "tps": 12771, "wall": 5285.3} {"step": 1030, "train_loss": 4.9319353103637695, "lr": 0.0003999990824283967, "tps": 12771, "wall": 5290.4} {"step": 1031, "train_loss": 4.9501729011535645, "lr": 0.0003999990202374889, "tps": 12771, "wall": 5295.6} {"step": 1032, "train_loss": 4.966821670532227, "lr": 0.0003999989560075425, "tps": 12771, "wall": 5300.7} {"step": 1033, "train_loss": 4.91105842590332, "lr": 0.0003999988897385581, "tps": 12771, "wall": 5305.9} {"step": 1034, "train_loss": 4.943819046020508, "lr": 0.0003999988214305366, "tps": 12771, "wall": 5311.1} {"step": 1035, "train_loss": 5.064743995666504, "lr": 0.0003999987510834787, "tps": 12771, "wall": 5316.2} {"step": 1036, "train_loss": 5.010611534118652, "lr": 0.00039999867869738517, "tps": 12771, "wall": 5321.4} {"step": 1037, "train_loss": 4.948687553405762, "lr": 0.0003999986042722569, "tps": 12771, "wall": 5326.5} {"step": 1038, "train_loss": 4.961407661437988, "lr": 0.0003999985278080947, "tps": 12771, "wall": 5331.7} {"step": 1039, "train_loss": 4.92701530456543, "lr": 0.0003999984493048995, "tps": 12771, "wall": 5336.8} {"step": 1040, "train_loss": 4.95629358291626, "lr": 0.000399998368762672, "tps": 12771, "wall": 5341.9} {"step": 1041, "train_loss": 4.894410133361816, "lr": 0.00039999828618141335, "tps": 12771, "wall": 5347.1} {"step": 1042, "train_loss": 4.9772562980651855, "lr": 0.0003999982015611244, "tps": 12771, "wall": 5352.2} {"step": 1043, "train_loss": 4.877593994140625, "lr": 0.000399998114901806, "tps": 12771, "wall": 5357.3} {"step": 1044, "train_loss": 4.8648810386657715, "lr": 0.00039999802620345926, "tps": 12771, "wall": 5362.5} {"step": 1045, "train_loss": 4.831485271453857, "lr": 0.0003999979354660851, "tps": 12770, "wall": 5367.7} {"step": 1046, "train_loss": 4.93849515914917, "lr": 0.0003999978426896846, "tps": 12770, "wall": 5372.9} {"step": 1047, "train_loss": 4.913337230682373, "lr": 0.00039999774787425886, "tps": 12770, "wall": 5378.0} {"step": 1048, "train_loss": 4.889270782470703, "lr": 0.00039999765101980883, "tps": 12770, "wall": 5383.2} {"step": 1049, "train_loss": 4.891148090362549, "lr": 0.00039999755212633567, "tps": 12770, "wall": 5388.3} {"step": 1050, "train_loss": 4.915431022644043, "lr": 0.0003999974511938405, "tps": 12770, "wall": 5393.4} {"step": 1051, "train_loss": 4.8863444328308105, "lr": 0.00039999734822232454, "tps": 12770, "wall": 5398.5} {"step": 1052, "train_loss": 4.923586845397949, "lr": 0.00039999724321178884, "tps": 12770, "wall": 5403.7} {"step": 1053, "train_loss": 4.992121696472168, "lr": 0.0003999971361622346, "tps": 12770, "wall": 5408.8} {"step": 1054, "train_loss": 4.861593723297119, "lr": 0.0003999970270736631, "tps": 12770, "wall": 5413.9} {"step": 1055, "train_loss": 4.998296737670898, "lr": 0.00039999691594607556, "tps": 12770, "wall": 5419.0} {"step": 1056, "train_loss": 4.939348220825195, "lr": 0.0003999968027794731, "tps": 12770, "wall": 5424.2} {"step": 1057, "train_loss": 4.925835132598877, "lr": 0.00039999668757385724, "tps": 12770, "wall": 5429.3} {"step": 1058, "train_loss": 4.851971626281738, "lr": 0.0003999965703292291, "tps": 12770, "wall": 5434.5} {"step": 1059, "train_loss": 4.897090435028076, "lr": 0.00039999645104559016, "tps": 12770, "wall": 5439.6} {"step": 1060, "train_loss": 4.805217742919922, "lr": 0.0003999963297229416, "tps": 12770, "wall": 5444.8} {"step": 1061, "train_loss": 4.93387508392334, "lr": 0.00039999620636128495, "tps": 12770, "wall": 5449.9} {"step": 1062, "train_loss": 4.870651721954346, "lr": 0.00039999608096062146, "tps": 12770, "wall": 5455.1} {"step": 1063, "train_loss": 4.883062839508057, "lr": 0.0003999959535209527, "tps": 12770, "wall": 5460.2} {"step": 1064, "train_loss": 4.861430644989014, "lr": 0.00039999582404228, "tps": 12770, "wall": 5465.4} {"step": 1065, "train_loss": 4.887815475463867, "lr": 0.0003999956925246048, "tps": 12770, "wall": 5470.5} {"step": 1066, "train_loss": 4.836458206176758, "lr": 0.0003999955589679288, "tps": 12770, "wall": 5475.6} {"step": 1067, "train_loss": 4.97470235824585, "lr": 0.00039999542337225327, "tps": 12770, "wall": 5480.7} {"step": 1068, "train_loss": 4.941323757171631, "lr": 0.0003999952857375799, "tps": 12770, "wall": 5485.9} {"step": 1069, "train_loss": 4.882184982299805, "lr": 0.00039999514606391015, "tps": 12770, "wall": 5491.1} {"step": 1070, "train_loss": 4.849297046661377, "lr": 0.00039999500435124565, "tps": 12770, "wall": 5496.2} {"step": 1071, "train_loss": 4.868265151977539, "lr": 0.00039999486059958805, "tps": 12770, "wall": 5501.3} {"step": 1072, "train_loss": 4.8336968421936035, "lr": 0.0003999947148089389, "tps": 12770, "wall": 5506.5} {"step": 1073, "train_loss": 4.881011962890625, "lr": 0.0003999945669792999, "tps": 12770, "wall": 5511.6} {"step": 1074, "train_loss": 4.897332668304443, "lr": 0.0003999944171106727, "tps": 12770, "wall": 5516.8} {"step": 1075, "train_loss": 4.882025718688965, "lr": 0.000399994265203059, "tps": 12770, "wall": 5521.9} {"step": 1076, "train_loss": 4.909471035003662, "lr": 0.0003999941112564605, "tps": 12770, "wall": 5527.0} {"step": 1077, "train_loss": 4.835838317871094, "lr": 0.000399993955270879, "tps": 12770, "wall": 5532.1} {"step": 1078, "train_loss": 4.86014461517334, "lr": 0.00039999379724631624, "tps": 12770, "wall": 5537.2} {"step": 1079, "train_loss": 4.804996013641357, "lr": 0.000399993637182774, "tps": 12770, "wall": 5542.3} {"step": 1080, "train_loss": 4.7709059715271, "lr": 0.00039999347508025407, "tps": 12770, "wall": 5547.5} {"step": 1081, "train_loss": 4.839055061340332, "lr": 0.00039999331093875843, "tps": 12770, "wall": 5552.7} {"step": 1082, "train_loss": 4.970308303833008, "lr": 0.0003999931447582887, "tps": 12770, "wall": 5557.8} {"step": 1083, "train_loss": 4.859161376953125, "lr": 0.0003999929765388469, "tps": 12770, "wall": 5562.9} {"step": 1084, "train_loss": 4.90802526473999, "lr": 0.00039999280628043494, "tps": 12770, "wall": 5568.1} {"step": 1085, "train_loss": 4.885679721832275, "lr": 0.00039999263398305475, "tps": 12770, "wall": 5573.2} {"step": 1086, "train_loss": 4.923105239868164, "lr": 0.0003999924596467083, "tps": 12770, "wall": 5578.4} {"step": 1087, "train_loss": 4.836508750915527, "lr": 0.0003999922832713975, "tps": 12770, "wall": 5583.5} {"step": 1088, "train_loss": 4.891693592071533, "lr": 0.0003999921048571244, "tps": 12770, "wall": 5588.7} {"step": 1089, "train_loss": 4.996591091156006, "lr": 0.00039999192440389093, "tps": 12770, "wall": 5593.8} {"step": 1090, "train_loss": 4.836562156677246, "lr": 0.0003999917419116992, "tps": 12770, "wall": 5598.9} {"step": 1091, "train_loss": 4.9182610511779785, "lr": 0.00039999155738055137, "tps": 12770, "wall": 5604.1} {"step": 1092, "train_loss": 4.791420936584473, "lr": 0.00039999137081044944, "tps": 12770, "wall": 5609.2} {"step": 1093, "train_loss": 4.8734450340271, "lr": 0.00039999118220139545, "tps": 12770, "wall": 5614.3} {"step": 1094, "train_loss": 4.862732410430908, "lr": 0.0003999909915533916, "tps": 12770, "wall": 5619.5} {"step": 1095, "train_loss": 4.832159042358398, "lr": 0.00039999079886644015, "tps": 12770, "wall": 5624.6} {"step": 1096, "train_loss": 4.83639669418335, "lr": 0.00039999060414054317, "tps": 12770, "wall": 5629.7} {"step": 1097, "train_loss": 4.918414115905762, "lr": 0.0003999904073757028, "tps": 12770, "wall": 5634.8} {"step": 1098, "train_loss": 4.796321392059326, "lr": 0.0003999902085719215, "tps": 12770, "wall": 5639.9} {"step": 1099, "train_loss": 4.920832633972168, "lr": 0.00039999000772920126, "tps": 12770, "wall": 5645.1} {"step": 1100, "train_loss": 4.822110652923584, "lr": 0.00039998980484754447, "tps": 12770, "wall": 5650.2} {"step": 1101, "train_loss": 4.718808650970459, "lr": 0.0003999895999269535, "tps": 12770, "wall": 5655.3} {"step": 1102, "train_loss": 4.7953877449035645, "lr": 0.0003999893929674306, "tps": 12770, "wall": 5660.4} {"step": 1103, "train_loss": 4.873287677764893, "lr": 0.0003999891839689781, "tps": 12770, "wall": 5665.6} {"step": 1104, "train_loss": 4.821014881134033, "lr": 0.00039998897293159834, "tps": 12770, "wall": 5670.7} {"step": 1105, "train_loss": 4.715718746185303, "lr": 0.0003999887598552938, "tps": 12770, "wall": 5675.8} {"step": 1106, "train_loss": 4.78839111328125, "lr": 0.0003999885447400669, "tps": 12770, "wall": 5680.9} {"step": 1107, "train_loss": 4.747080326080322, "lr": 0.00039998832758592, "tps": 12770, "wall": 5686.1} {"step": 1108, "train_loss": 4.756779193878174, "lr": 0.00039998810839285556, "tps": 12770, "wall": 5691.2} {"step": 1109, "train_loss": 4.769546031951904, "lr": 0.0003999878871608761, "tps": 12770, "wall": 5696.3} {"step": 1110, "train_loss": 4.856611728668213, "lr": 0.00039998766388998414, "tps": 12770, "wall": 5701.4} {"step": 1111, "train_loss": 4.781309604644775, "lr": 0.00039998743858018213, "tps": 12770, "wall": 5706.5} {"step": 1112, "train_loss": 4.804653167724609, "lr": 0.0003999872112314727, "tps": 12770, "wall": 5711.7} {"step": 1113, "train_loss": 4.812324523925781, "lr": 0.00039998698184385846, "tps": 12770, "wall": 5716.8} {"step": 1114, "train_loss": 4.818443298339844, "lr": 0.00039998675041734194, "tps": 12770, "wall": 5721.9} {"step": 1115, "train_loss": 4.887302398681641, "lr": 0.0003999865169519257, "tps": 12770, "wall": 5727.0} {"step": 1116, "train_loss": 4.854024887084961, "lr": 0.0003999862814476125, "tps": 12770, "wall": 5732.2} {"step": 1117, "train_loss": 4.842877388000488, "lr": 0.00039998604390440503, "tps": 12770, "wall": 5737.3} {"step": 1118, "train_loss": 4.7593584060668945, "lr": 0.00039998580432230586, "tps": 12770, "wall": 5742.4} {"step": 1119, "train_loss": 4.788496971130371, "lr": 0.00039998556270131767, "tps": 12770, "wall": 5747.5} {"step": 1120, "train_loss": 4.86453104019165, "lr": 0.0003999853190414434, "tps": 12770, "wall": 5752.6} {"step": 1121, "train_loss": 4.829160213470459, "lr": 0.0003999850733426857, "tps": 12770, "wall": 5757.8} {"step": 1122, "train_loss": 4.916670322418213, "lr": 0.00039998482560504737, "tps": 12770, "wall": 5762.9} {"step": 1123, "train_loss": 4.880051612854004, "lr": 0.00039998457582853116, "tps": 12770, "wall": 5768.0} {"step": 1124, "train_loss": 4.902279376983643, "lr": 0.0003999843240131399, "tps": 12770, "wall": 5773.1} {"step": 1125, "train_loss": 4.903446674346924, "lr": 0.0003999840701588765, "tps": 12771, "wall": 5778.2} {"step": 1126, "train_loss": 4.8494110107421875, "lr": 0.00039998381426574383, "tps": 12770, "wall": 5783.3} {"step": 1127, "train_loss": 4.83381462097168, "lr": 0.00039998355633374483, "tps": 12770, "wall": 5788.5} {"step": 1128, "train_loss": 4.701363563537598, "lr": 0.00039998329636288234, "tps": 12770, "wall": 5793.6} {"step": 1129, "train_loss": 4.784160614013672, "lr": 0.00039998303435315923, "tps": 12771, "wall": 5798.7} {"step": 1130, "train_loss": 4.758096694946289, "lr": 0.0003999827703045787, "tps": 12771, "wall": 5803.8} {"step": 1131, "train_loss": 5.006762504577637, "lr": 0.0003999825042171435, "tps": 12771, "wall": 5808.9} {"step": 1132, "train_loss": 4.789880275726318, "lr": 0.0003999822360908569, "tps": 12771, "wall": 5814.1} {"step": 1133, "train_loss": 4.8459672927856445, "lr": 0.0003999819659257217, "tps": 12771, "wall": 5819.2} {"step": 1134, "train_loss": 4.913975238800049, "lr": 0.00039998169372174107, "tps": 12771, "wall": 5824.3} {"step": 1135, "train_loss": 4.8183274269104, "lr": 0.00039998141947891806, "tps": 12771, "wall": 5829.4} {"step": 1136, "train_loss": 4.816446781158447, "lr": 0.00039998114319725575, "tps": 12771, "wall": 5834.5} {"step": 1137, "train_loss": 4.822370529174805, "lr": 0.00039998086487675737, "tps": 12771, "wall": 5839.6} {"step": 1138, "train_loss": 4.678377151489258, "lr": 0.000399980584517426, "tps": 12771, "wall": 5844.8} {"step": 1139, "train_loss": 4.78424072265625, "lr": 0.00039998030211926486, "tps": 12771, "wall": 5849.9} {"step": 1140, "train_loss": 4.761247634887695, "lr": 0.0003999800176822771, "tps": 12771, "wall": 5855.0} {"step": 1141, "train_loss": 4.819069862365723, "lr": 0.000399979731206466, "tps": 12771, "wall": 5860.2} {"step": 1142, "train_loss": 4.7489094734191895, "lr": 0.00039997944269183476, "tps": 12771, "wall": 5865.3} {"step": 1143, "train_loss": 4.829094886779785, "lr": 0.0003999791521383866, "tps": 12771, "wall": 5870.4} {"step": 1144, "train_loss": 4.819544315338135, "lr": 0.00039997885954612487, "tps": 12771, "wall": 5875.5} {"step": 1145, "train_loss": 4.765462875366211, "lr": 0.00039997856491505294, "tps": 12771, "wall": 5880.7} {"step": 1146, "train_loss": 4.8217010498046875, "lr": 0.00039997826824517406, "tps": 12771, "wall": 5885.8} {"step": 1147, "train_loss": 4.751864910125732, "lr": 0.0003999779695364916, "tps": 12771, "wall": 5890.9} {"step": 1148, "train_loss": 4.815444469451904, "lr": 0.000399977668789009, "tps": 12771, "wall": 5896.0} {"step": 1149, "train_loss": 4.717094421386719, "lr": 0.00039997736600272957, "tps": 12771, "wall": 5901.1} {"step": 1150, "train_loss": 4.750498294830322, "lr": 0.0003999770611776569, "tps": 12771, "wall": 5906.3} {"step": 1151, "train_loss": 4.762548923492432, "lr": 0.0003999767543137943, "tps": 12771, "wall": 5911.5} {"step": 1152, "train_loss": 4.766170024871826, "lr": 0.00039997644541114527, "tps": 12771, "wall": 5916.6} {"step": 1153, "train_loss": 4.767514228820801, "lr": 0.0003999761344697134, "tps": 12771, "wall": 5921.8} {"step": 1154, "train_loss": 4.799758434295654, "lr": 0.0003999758214895021, "tps": 12771, "wall": 5926.9} {"step": 1155, "train_loss": 4.781227111816406, "lr": 0.0003999755064705149, "tps": 12771, "wall": 5932.0} {"step": 1156, "train_loss": 4.778460502624512, "lr": 0.00039997518941275545, "tps": 12771, "wall": 5937.1} {"step": 1157, "train_loss": 4.789222240447998, "lr": 0.00039997487031622733, "tps": 12771, "wall": 5942.2} {"step": 1158, "train_loss": 4.70097017288208, "lr": 0.00039997454918093417, "tps": 12771, "wall": 5947.3} {"step": 1159, "train_loss": 4.7989630699157715, "lr": 0.00039997422600687954, "tps": 12771, "wall": 5952.5} {"step": 1160, "train_loss": 4.74877405166626, "lr": 0.0003999739007940672, "tps": 12771, "wall": 5957.6} {"step": 1161, "train_loss": 4.834374904632568, "lr": 0.00039997357354250074, "tps": 12771, "wall": 5962.7} {"step": 1162, "train_loss": 4.705407619476318, "lr": 0.00039997324425218383, "tps": 12771, "wall": 5968.0} {"step": 1163, "train_loss": 4.726304054260254, "lr": 0.00039997291292312036, "tps": 12771, "wall": 5973.1} {"step": 1164, "train_loss": 4.743198871612549, "lr": 0.00039997257955531396, "tps": 12771, "wall": 5978.2} {"step": 1165, "train_loss": 4.705380439758301, "lr": 0.00039997224414876843, "tps": 12771, "wall": 5983.3} {"step": 1166, "train_loss": 4.774308204650879, "lr": 0.0003999719067034877, "tps": 12771, "wall": 5988.4} {"step": 1167, "train_loss": 4.656162261962891, "lr": 0.0003999715672194754, "tps": 12771, "wall": 5993.5} {"step": 1168, "train_loss": 4.765331268310547, "lr": 0.00039997122569673533, "tps": 12771, "wall": 5998.6} {"step": 1169, "train_loss": 4.639427185058594, "lr": 0.00039997088213527166, "tps": 12771, "wall": 6003.8} {"step": 1170, "train_loss": 4.837304592132568, "lr": 0.000399970536535088, "tps": 12771, "wall": 6008.9} {"step": 1171, "train_loss": 4.687198638916016, "lr": 0.00039997018889618844, "tps": 12771, "wall": 6014.0} {"step": 1172, "train_loss": 4.788760185241699, "lr": 0.00039996983921857676, "tps": 12771, "wall": 6019.1} {"step": 1173, "train_loss": 4.786526203155518, "lr": 0.00039996948750225706, "tps": 12771, "wall": 6024.3} {"step": 1174, "train_loss": 4.746749401092529, "lr": 0.0003999691337472333, "tps": 12771, "wall": 6029.4} {"step": 1175, "train_loss": 4.774167060852051, "lr": 0.00039996877795350934, "tps": 12771, "wall": 6034.6} {"step": 1176, "train_loss": 4.726655960083008, "lr": 0.0003999684201210894, "tps": 12771, "wall": 6039.7} {"step": 1177, "train_loss": 4.753310680389404, "lr": 0.00039996806024997743, "tps": 12771, "wall": 6044.8} {"step": 1178, "train_loss": 4.72355842590332, "lr": 0.0003999676983401776, "tps": 12771, "wall": 6049.9} {"step": 1179, "train_loss": 4.660004138946533, "lr": 0.0003999673343916939, "tps": 12771, "wall": 6055.0} {"step": 1180, "train_loss": 4.740949630737305, "lr": 0.00039996696840453053, "tps": 12771, "wall": 6060.2} {"step": 1181, "train_loss": 4.666282653808594, "lr": 0.00039996660037869156, "tps": 12771, "wall": 6065.3} {"step": 1182, "train_loss": 4.732138633728027, "lr": 0.00039996623031418127, "tps": 12771, "wall": 6070.4} {"step": 1183, "train_loss": 4.670233726501465, "lr": 0.00039996585821100374, "tps": 12771, "wall": 6075.6} {"step": 1184, "train_loss": 4.702626705169678, "lr": 0.00039996548406916324, "tps": 12771, "wall": 6080.7} {"step": 1185, "train_loss": 4.815526008605957, "lr": 0.000399965107888664, "tps": 12771, "wall": 6085.9} {"step": 1186, "train_loss": 4.721435070037842, "lr": 0.0003999647296695103, "tps": 12771, "wall": 6091.0} {"step": 1187, "train_loss": 4.5716872215271, "lr": 0.0003999643494117064, "tps": 12771, "wall": 6096.1} {"step": 1188, "train_loss": 4.859239101409912, "lr": 0.00039996396711525656, "tps": 12771, "wall": 6101.2} {"step": 1189, "train_loss": 4.777340412139893, "lr": 0.00039996358278016525, "tps": 12771, "wall": 6106.3} {"step": 1190, "train_loss": 4.6903204917907715, "lr": 0.00039996319640643667, "tps": 12771, "wall": 6111.4} {"step": 1191, "train_loss": 4.68683385848999, "lr": 0.00039996280799407526, "tps": 12771, "wall": 6116.6} {"step": 1192, "train_loss": 4.65671443939209, "lr": 0.00039996241754308546, "tps": 12771, "wall": 6121.7} {"step": 1193, "train_loss": 4.726699352264404, "lr": 0.00039996202505347163, "tps": 12771, "wall": 6126.8} {"step": 1194, "train_loss": 4.707906723022461, "lr": 0.00039996163052523836, "tps": 12771, "wall": 6131.9} {"step": 1195, "train_loss": 4.837495803833008, "lr": 0.0003999612339583898, "tps": 12771, "wall": 6137.0} {"step": 1196, "train_loss": 4.794319152832031, "lr": 0.0003999608353529308, "tps": 12771, "wall": 6142.1} {"step": 1197, "train_loss": 4.692215442657471, "lr": 0.0003999604347088657, "tps": 12771, "wall": 6147.3} {"step": 1198, "train_loss": 4.8342485427856445, "lr": 0.00039996003202619906, "tps": 12771, "wall": 6152.5} {"step": 1199, "train_loss": 4.758050918579102, "lr": 0.00039995962730493545, "tps": 12771, "wall": 6157.6} {"step": 1200, "train_loss": 4.837338447570801, "lr": 0.00039995922054507935, "tps": 12771, "wall": 6162.7} {"step": 1201, "train_loss": 4.667311668395996, "lr": 0.0003999588117466356, "tps": 12771, "wall": 6167.8} {"step": 1202, "train_loss": 4.754823684692383, "lr": 0.00039995840090960863, "tps": 12771, "wall": 6173.0} {"step": 1203, "train_loss": 4.754995346069336, "lr": 0.00039995798803400313, "tps": 12771, "wall": 6178.1} {"step": 1204, "train_loss": 4.797717094421387, "lr": 0.00039995757311982384, "tps": 12771, "wall": 6183.2} {"step": 1205, "train_loss": 4.70149564743042, "lr": 0.0003999571561670754, "tps": 12771, "wall": 6188.3} {"step": 1206, "train_loss": 4.722011566162109, "lr": 0.0003999567371757626, "tps": 12771, "wall": 6193.4} {"step": 1207, "train_loss": 4.784695148468018, "lr": 0.0003999563161458901, "tps": 12771, "wall": 6198.6} {"step": 1208, "train_loss": 4.70099401473999, "lr": 0.00039995589307746275, "tps": 12771, "wall": 6203.7} {"step": 1209, "train_loss": 4.668002605438232, "lr": 0.0003999554679704853, "tps": 12771, "wall": 6208.9} {"step": 1210, "train_loss": 4.6821370124816895, "lr": 0.00039995504082496257, "tps": 12771, "wall": 6214.0} {"step": 1211, "train_loss": 4.664642333984375, "lr": 0.00039995461164089944, "tps": 12771, "wall": 6219.1} {"step": 1212, "train_loss": 4.678645133972168, "lr": 0.00039995418041830063, "tps": 12771, "wall": 6224.3} {"step": 1213, "train_loss": 4.726269721984863, "lr": 0.00039995374715717124, "tps": 12771, "wall": 6229.4} {"step": 1214, "train_loss": 4.700240135192871, "lr": 0.00039995331185751603, "tps": 12771, "wall": 6234.5} {"step": 1215, "train_loss": 4.671250343322754, "lr": 0.00039995287451933994, "tps": 12771, "wall": 6239.6} {"step": 1216, "train_loss": 4.759413242340088, "lr": 0.00039995243514264796, "tps": 12771, "wall": 6244.7} {"step": 1217, "train_loss": 4.809291839599609, "lr": 0.00039995199372744506, "tps": 12772, "wall": 6249.8} {"step": 1218, "train_loss": 4.669630527496338, "lr": 0.00039995155027373625, "tps": 12772, "wall": 6254.9} {"step": 1219, "train_loss": 4.7022247314453125, "lr": 0.0003999511047815265, "tps": 12772, "wall": 6260.0} {"step": 1220, "train_loss": 4.691649913787842, "lr": 0.000399950657250821, "tps": 12771, "wall": 6265.3} {"step": 1221, "train_loss": 4.683464050292969, "lr": 0.00039995020768162466, "tps": 12771, "wall": 6270.4} {"step": 1222, "train_loss": 4.786229133605957, "lr": 0.00039994975607394263, "tps": 12771, "wall": 6275.5} {"step": 1223, "train_loss": 4.7082929611206055, "lr": 0.00039994930242778, "tps": 12771, "wall": 6280.7} {"step": 1224, "train_loss": 4.733307838439941, "lr": 0.000399948846743142, "tps": 12771, "wall": 6285.8} {"step": 1225, "train_loss": 4.7260661125183105, "lr": 0.0003999483890200337, "tps": 12771, "wall": 6290.9} {"step": 1226, "train_loss": 4.682936191558838, "lr": 0.0003999479292584603, "tps": 12771, "wall": 6296.0} {"step": 1227, "train_loss": 4.925856113433838, "lr": 0.00039994746745842705, "tps": 12771, "wall": 6301.2} {"step": 1228, "train_loss": 4.656347751617432, "lr": 0.00039994700361993914, "tps": 12771, "wall": 6306.3} {"step": 1229, "train_loss": 4.69148063659668, "lr": 0.00039994653774300186, "tps": 12772, "wall": 6311.4} {"step": 1230, "train_loss": 4.675397872924805, "lr": 0.0003999460698276204, "tps": 12772, "wall": 6316.5} {"step": 1231, "train_loss": 4.664364337921143, "lr": 0.0003999455998738002, "tps": 12772, "wall": 6321.6} {"step": 1232, "train_loss": 4.577954292297363, "lr": 0.00039994512788154646, "tps": 12771, "wall": 6326.8} {"step": 1233, "train_loss": 4.6761274337768555, "lr": 0.0003999446538508646, "tps": 12771, "wall": 6331.9} {"step": 1234, "train_loss": 4.665307521820068, "lr": 0.00039994417778175997, "tps": 12771, "wall": 6337.1} {"step": 1235, "train_loss": 4.728941917419434, "lr": 0.00039994369967423797, "tps": 12771, "wall": 6342.2} {"step": 1236, "train_loss": 4.756099224090576, "lr": 0.000399943219528304, "tps": 12771, "wall": 6347.4} {"step": 1237, "train_loss": 4.754831314086914, "lr": 0.0003999427373439635, "tps": 12771, "wall": 6352.5} {"step": 1238, "train_loss": 4.668278217315674, "lr": 0.00039994225312122187, "tps": 12771, "wall": 6357.7} {"step": 1239, "train_loss": 4.677672386169434, "lr": 0.0003999417668600848, "tps": 12771, "wall": 6362.8} {"step": 1240, "train_loss": 4.67462158203125, "lr": 0.00039994127856055755, "tps": 12771, "wall": 6367.9} {"step": 1241, "train_loss": 4.665664196014404, "lr": 0.00039994078822264573, "tps": 12771, "wall": 6373.0} {"step": 1242, "train_loss": 4.717581748962402, "lr": 0.00039994029584635506, "tps": 12771, "wall": 6378.2} {"step": 1243, "train_loss": 4.724104881286621, "lr": 0.00039993980143169085, "tps": 12771, "wall": 6383.3} {"step": 1244, "train_loss": 4.716249465942383, "lr": 0.0003999393049786589, "tps": 12771, "wall": 6388.5} {"step": 1245, "train_loss": 4.847477912902832, "lr": 0.0003999388064872648, "tps": 12771, "wall": 6393.6} {"step": 1246, "train_loss": 4.8182759284973145, "lr": 0.0003999383059575141, "tps": 12771, "wall": 6398.7} {"step": 1247, "train_loss": 4.757062911987305, "lr": 0.0003999378033894126, "tps": 12771, "wall": 6403.9} {"step": 1248, "train_loss": 4.740340232849121, "lr": 0.0003999372987829659, "tps": 12771, "wall": 6409.0} {"step": 1249, "train_loss": 4.634732246398926, "lr": 0.00039993679213817974, "tps": 12771, "wall": 6414.1} {"step": 1250, "train_loss": 4.722637176513672, "lr": 0.00039993628345505987, "tps": 12771, "wall": 6419.2} {"step": 1251, "train_loss": 4.722565650939941, "lr": 0.0003999357727336121, "tps": 12771, "wall": 6424.4} {"step": 1252, "train_loss": 4.654738426208496, "lr": 0.00039993525997384207, "tps": 12771, "wall": 6429.5} {"step": 1253, "train_loss": 4.665098667144775, "lr": 0.0003999347451757557, "tps": 12771, "wall": 6434.6} {"step": 1254, "train_loss": 4.690162658691406, "lr": 0.00039993422833935877, "tps": 12771, "wall": 6439.7} {"step": 1255, "train_loss": 4.633540630340576, "lr": 0.0003999337094646572, "tps": 12771, "wall": 6444.9} {"step": 1256, "train_loss": 4.638603210449219, "lr": 0.00039993318855165687, "tps": 12771, "wall": 6450.0} {"step": 1257, "train_loss": 4.616635322570801, "lr": 0.0003999326656003637, "tps": 12771, "wall": 6455.1} {"step": 1258, "train_loss": 4.727721691131592, "lr": 0.00039993214061078347, "tps": 12771, "wall": 6460.3} {"step": 1259, "train_loss": 4.631913661956787, "lr": 0.0003999316135829222, "tps": 12771, "wall": 6465.4} {"step": 1260, "train_loss": 4.688093662261963, "lr": 0.00039993108451678595, "tps": 12771, "wall": 6470.6} {"step": 1261, "train_loss": 4.7502593994140625, "lr": 0.00039993055341238054, "tps": 12771, "wall": 6475.7} {"step": 1262, "train_loss": 4.636571884155273, "lr": 0.0003999300202697122, "tps": 12771, "wall": 6480.8} {"step": 1263, "train_loss": 4.619159698486328, "lr": 0.0003999294850887868, "tps": 12771, "wall": 6485.9} {"step": 1264, "train_loss": 4.614790916442871, "lr": 0.00039992894786961046, "tps": 12771, "wall": 6491.1} {"step": 1265, "train_loss": 4.673666954040527, "lr": 0.00039992840861218925, "tps": 12771, "wall": 6496.2} {"step": 1266, "train_loss": 4.642418384552002, "lr": 0.0003999278673165293, "tps": 12771, "wall": 6501.3} {"step": 1267, "train_loss": 4.573925018310547, "lr": 0.00039992732398263673, "tps": 12771, "wall": 6506.5} {"step": 1268, "train_loss": 4.612142562866211, "lr": 0.0003999267786105178, "tps": 12771, "wall": 6511.6} {"step": 1269, "train_loss": 4.779352188110352, "lr": 0.00039992623120017846, "tps": 12771, "wall": 6516.7} {"step": 1270, "train_loss": 4.6002302169799805, "lr": 0.0003999256817516251, "tps": 12771, "wall": 6521.9} {"step": 1271, "train_loss": 4.66124963760376, "lr": 0.0003999251302648638, "tps": 12771, "wall": 6527.0} {"step": 1272, "train_loss": 4.683802127838135, "lr": 0.00039992457673990097, "tps": 12771, "wall": 6532.1} {"step": 1273, "train_loss": 4.669313430786133, "lr": 0.00039992402117674283, "tps": 12771, "wall": 6537.3} {"step": 1274, "train_loss": 4.66254186630249, "lr": 0.00039992346357539557, "tps": 12771, "wall": 6542.4} {"step": 1275, "train_loss": 4.674232006072998, "lr": 0.0003999229039358656, "tps": 12771, "wall": 6547.5} {"step": 1276, "train_loss": 4.707489013671875, "lr": 0.00039992234225815924, "tps": 12771, "wall": 6552.6} {"step": 1277, "train_loss": 4.69706916809082, "lr": 0.00039992177854228286, "tps": 12771, "wall": 6557.8} {"step": 1278, "train_loss": 4.647855758666992, "lr": 0.00039992121278824283, "tps": 12771, "wall": 6562.9} {"step": 1279, "train_loss": 4.730147361755371, "lr": 0.0003999206449960456, "tps": 12771, "wall": 6568.1} {"step": 1280, "train_loss": 4.546052932739258, "lr": 0.00039992007516569757, "tps": 12771, "wall": 6573.2} {"step": 1281, "train_loss": 4.606112003326416, "lr": 0.00039991950329720517, "tps": 12771, "wall": 6578.3} {"step": 1282, "train_loss": 4.604608535766602, "lr": 0.00039991892939057495, "tps": 12771, "wall": 6583.4} {"step": 1283, "train_loss": 4.68628454208374, "lr": 0.0003999183534458133, "tps": 12771, "wall": 6588.6} {"step": 1284, "train_loss": 4.631690502166748, "lr": 0.00039991777546292685, "tps": 12771, "wall": 6593.7} {"step": 1285, "train_loss": 4.652411460876465, "lr": 0.0003999171954419221, "tps": 12771, "wall": 6598.8} {"step": 1286, "train_loss": 4.652868747711182, "lr": 0.0003999166133828056, "tps": 12771, "wall": 6604.0} {"step": 1287, "train_loss": 4.592573165893555, "lr": 0.000399916029285584, "tps": 12771, "wall": 6609.1} {"step": 1288, "train_loss": 4.672699451446533, "lr": 0.00039991544315026386, "tps": 12771, "wall": 6614.2} {"step": 1289, "train_loss": 4.709750175476074, "lr": 0.0003999148549768518, "tps": 12771, "wall": 6619.3} {"step": 1290, "train_loss": 4.666558265686035, "lr": 0.0003999142647653546, "tps": 12771, "wall": 6624.5} {"step": 1291, "train_loss": 4.652181625366211, "lr": 0.0003999136725157789, "tps": 12771, "wall": 6629.6} {"step": 1292, "train_loss": 4.679716110229492, "lr": 0.00039991307822813133, "tps": 12771, "wall": 6634.7} {"step": 1293, "train_loss": 4.655666351318359, "lr": 0.00039991248190241873, "tps": 12771, "wall": 6639.8} {"step": 1294, "train_loss": 4.616402626037598, "lr": 0.00039991188353864776, "tps": 12771, "wall": 6644.9} {"step": 1295, "train_loss": 4.654811382293701, "lr": 0.00039991128313682526, "tps": 12772, "wall": 6650.0} {"step": 1296, "train_loss": 4.662698745727539, "lr": 0.000399910680696958, "tps": 12772, "wall": 6655.1} {"step": 1297, "train_loss": 4.621395587921143, "lr": 0.00039991007621905284, "tps": 12772, "wall": 6660.2} {"step": 1298, "train_loss": 4.602444648742676, "lr": 0.0003999094697031165, "tps": 12772, "wall": 6665.3} {"step": 1299, "train_loss": 4.643848896026611, "lr": 0.0003999088611491561, "tps": 12772, "wall": 6670.4} {"step": 1300, "train_loss": 4.7029523849487305, "lr": 0.00039990825055717834, "tps": 12772, "wall": 6675.5} {"step": 1301, "train_loss": 4.550281524658203, "lr": 0.00039990763792719015, "tps": 12772, "wall": 6680.6} {"step": 1302, "train_loss": 4.686648368835449, "lr": 0.00039990702325919857, "tps": 12772, "wall": 6685.8} {"step": 1303, "train_loss": 4.677287578582764, "lr": 0.0003999064065532104, "tps": 12772, "wall": 6690.9} {"step": 1304, "train_loss": 4.57882022857666, "lr": 0.00039990578780923277, "tps": 12772, "wall": 6695.9} {"step": 1305, "train_loss": 4.597957134246826, "lr": 0.00039990516702727264, "tps": 12772, "wall": 6701.0} {"step": 1306, "train_loss": 4.678347587585449, "lr": 0.0003999045442073371, "tps": 12772, "wall": 6706.1} {"step": 1307, "train_loss": 4.610104560852051, "lr": 0.00039990391934943307, "tps": 12772, "wall": 6711.2} {"step": 1308, "train_loss": 4.6391167640686035, "lr": 0.0003999032924535677, "tps": 12772, "wall": 6716.3} {"step": 1309, "train_loss": 4.671017646789551, "lr": 0.0003999026635197482, "tps": 12773, "wall": 6721.4} {"step": 1310, "train_loss": 4.590185642242432, "lr": 0.0003999020325479815, "tps": 12773, "wall": 6726.4} {"step": 1311, "train_loss": 4.627499580383301, "lr": 0.0003999013995382749, "tps": 12773, "wall": 6731.5} {"step": 1312, "train_loss": 4.566246032714844, "lr": 0.0003999007644906355, "tps": 12773, "wall": 6736.6} {"step": 1313, "train_loss": 4.639101982116699, "lr": 0.0003999001274050705, "tps": 12773, "wall": 6741.7} {"step": 1314, "train_loss": 4.676661968231201, "lr": 0.0003998994882815871, "tps": 12773, "wall": 6746.8} {"step": 1315, "train_loss": 4.642645359039307, "lr": 0.0003998988471201926, "tps": 12773, "wall": 6751.9} {"step": 1316, "train_loss": 4.733956336975098, "lr": 0.0003998982039208942, "tps": 12773, "wall": 6756.9} {"step": 1317, "train_loss": 4.67344331741333, "lr": 0.00039989755868369926, "tps": 12773, "wall": 6762.0} {"step": 1318, "train_loss": 4.55921745300293, "lr": 0.00039989691140861504, "tps": 12773, "wall": 6767.1} {"step": 1319, "train_loss": 4.686806678771973, "lr": 0.00039989626209564885, "tps": 12773, "wall": 6772.2} {"step": 1320, "train_loss": 4.600241184234619, "lr": 0.00039989561074480807, "tps": 12773, "wall": 6777.3} {"step": 1321, "train_loss": 4.664916515350342, "lr": 0.0003998949573561, "tps": 12774, "wall": 6782.4} {"step": 1322, "train_loss": 4.672172546386719, "lr": 0.00039989430192953224, "tps": 12773, "wall": 6787.6} {"step": 1323, "train_loss": 4.541329383850098, "lr": 0.00039989364446511204, "tps": 12773, "wall": 6792.7} {"step": 1324, "train_loss": 4.674524784088135, "lr": 0.00039989298496284696, "tps": 12773, "wall": 6797.8} {"step": 1325, "train_loss": 4.629478931427002, "lr": 0.00039989232342274437, "tps": 12773, "wall": 6803.0} {"step": 1326, "train_loss": 4.58253288269043, "lr": 0.0003998916598448118, "tps": 12773, "wall": 6808.2} {"step": 1327, "train_loss": 4.573537826538086, "lr": 0.0003998909942290568, "tps": 12773, "wall": 6813.4} {"step": 1328, "train_loss": 4.770662307739258, "lr": 0.0003998903265754869, "tps": 12773, "wall": 6818.6} {"step": 1329, "train_loss": 4.566864967346191, "lr": 0.0003998896568841096, "tps": 12773, "wall": 6823.8} {"step": 1330, "train_loss": 4.632777690887451, "lr": 0.00039988898515493256, "tps": 12773, "wall": 6828.9} {"step": 1331, "train_loss": 4.607237815856934, "lr": 0.0003998883113879633, "tps": 12773, "wall": 6834.1} {"step": 1332, "train_loss": 4.6067585945129395, "lr": 0.0003998876355832096, "tps": 12773, "wall": 6839.3} {"step": 1333, "train_loss": 4.530730724334717, "lr": 0.00039988695774067904, "tps": 12772, "wall": 6844.5} {"step": 1334, "train_loss": 4.546127796173096, "lr": 0.00039988627786037925, "tps": 12772, "wall": 6849.8} {"step": 1335, "train_loss": 4.583500862121582, "lr": 0.000399885595942318, "tps": 12772, "wall": 6855.0} {"step": 1336, "train_loss": 4.6235504150390625, "lr": 0.00039988491198650295, "tps": 12772, "wall": 6860.2} {"step": 1337, "train_loss": 4.522752285003662, "lr": 0.00039988422599294195, "tps": 12772, "wall": 6865.5} {"step": 1338, "train_loss": 4.658148288726807, "lr": 0.00039988353796164265, "tps": 12771, "wall": 6870.7} {"step": 1339, "train_loss": 4.458678245544434, "lr": 0.0003998828478926129, "tps": 12771, "wall": 6876.0} {"step": 1340, "train_loss": 4.657999515533447, "lr": 0.00039988215578586045, "tps": 12771, "wall": 6881.2} {"step": 1341, "train_loss": 4.657474994659424, "lr": 0.0003998814616413934, "tps": 12771, "wall": 6886.5} {"step": 1342, "train_loss": 4.722978115081787, "lr": 0.0003998807654592193, "tps": 12771, "wall": 6891.7} {"step": 1343, "train_loss": 4.538326263427734, "lr": 0.0003998800672393461, "tps": 12770, "wall": 6897.0} {"step": 1344, "train_loss": 4.572133541107178, "lr": 0.0003998793669817819, "tps": 12770, "wall": 6902.3} {"step": 1345, "train_loss": 4.61840295791626, "lr": 0.00039987866468653443, "tps": 12770, "wall": 6907.5} {"step": 1346, "train_loss": 4.674093246459961, "lr": 0.00039987796035361166, "tps": 12770, "wall": 6912.8} {"step": 1347, "train_loss": 4.558664798736572, "lr": 0.0003998772539830217, "tps": 12769, "wall": 6918.0} {"step": 1348, "train_loss": 4.676955223083496, "lr": 0.0003998765455747725, "tps": 12769, "wall": 6923.3} {"step": 1349, "train_loss": 4.521111965179443, "lr": 0.000399875835128872, "tps": 12769, "wall": 6928.7} {"step": 1350, "train_loss": 4.685002326965332, "lr": 0.00039987512264532836, "tps": 12768, "wall": 6933.9} {"step": 1351, "train_loss": 4.606853008270264, "lr": 0.0003998744081241495, "tps": 12768, "wall": 6939.2} {"step": 1352, "train_loss": 4.505911350250244, "lr": 0.0003998736915653437, "tps": 12768, "wall": 6944.5} {"step": 1353, "train_loss": 4.665674686431885, "lr": 0.00039987297296891904, "tps": 12768, "wall": 6949.7} {"step": 1354, "train_loss": 4.562932968139648, "lr": 0.0003998722523348835, "tps": 12767, "wall": 6955.0} {"step": 1355, "train_loss": 4.543036937713623, "lr": 0.00039987152966324544, "tps": 12767, "wall": 6960.3} {"step": 1356, "train_loss": 4.549561500549316, "lr": 0.0003998708049540128, "tps": 12767, "wall": 6965.6} {"step": 1357, "train_loss": 4.511806488037109, "lr": 0.0003998700782071941, "tps": 12767, "wall": 6970.9} {"step": 1358, "train_loss": 4.639093399047852, "lr": 0.00039986934942279746, "tps": 12766, "wall": 6976.2} {"step": 1359, "train_loss": 4.656639099121094, "lr": 0.000399868618600831, "tps": 12766, "wall": 6981.5} {"step": 1360, "train_loss": 4.586856842041016, "lr": 0.00039986788574130315, "tps": 12766, "wall": 6986.8} {"step": 1361, "train_loss": 4.577460289001465, "lr": 0.0003998671508442221, "tps": 12765, "wall": 6992.1} {"step": 1362, "train_loss": 4.60463285446167, "lr": 0.0003998664139095963, "tps": 12765, "wall": 6997.3} {"step": 1363, "train_loss": 4.537853717803955, "lr": 0.000399865674937434, "tps": 12765, "wall": 7002.6} {"step": 1364, "train_loss": 4.567083835601807, "lr": 0.00039986493392774367, "tps": 12765, "wall": 7007.9} {"step": 1365, "train_loss": 4.577589988708496, "lr": 0.00039986419088053354, "tps": 12764, "wall": 7013.2} {"step": 1366, "train_loss": 4.589782238006592, "lr": 0.00039986344579581213, "tps": 12764, "wall": 7018.4} {"step": 1367, "train_loss": 4.669239044189453, "lr": 0.0003998626986735879, "tps": 12764, "wall": 7023.7} {"step": 1368, "train_loss": 4.584951877593994, "lr": 0.00039986194951386933, "tps": 12764, "wall": 7029.0} {"step": 1369, "train_loss": 4.520655632019043, "lr": 0.00039986119831666485, "tps": 12763, "wall": 7034.2} {"step": 1370, "train_loss": 4.527613639831543, "lr": 0.00039986044508198297, "tps": 12763, "wall": 7039.5} {"step": 1371, "train_loss": 4.53052282333374, "lr": 0.00039985968980983216, "tps": 12763, "wall": 7044.9} {"step": 1372, "train_loss": 4.59139347076416, "lr": 0.00039985893250022114, "tps": 12763, "wall": 7050.1} {"step": 1373, "train_loss": 4.580715179443359, "lr": 0.00039985817315315843, "tps": 12762, "wall": 7055.4} {"step": 1374, "train_loss": 4.571547508239746, "lr": 0.0003998574117686526, "tps": 12762, "wall": 7060.7} {"step": 1375, "train_loss": 4.5145182609558105, "lr": 0.0003998566483467122, "tps": 12762, "wall": 7066.0} {"step": 1376, "train_loss": 4.551911354064941, "lr": 0.00039985588288734604, "tps": 12761, "wall": 7071.3} {"step": 1377, "train_loss": 4.554067611694336, "lr": 0.0003998551153905627, "tps": 12761, "wall": 7076.5} {"step": 1378, "train_loss": 4.538896560668945, "lr": 0.0003998543458563708, "tps": 12761, "wall": 7081.9} {"step": 1379, "train_loss": 4.6040472984313965, "lr": 0.00039985357428477916, "tps": 12761, "wall": 7087.1} {"step": 1380, "train_loss": 4.605306625366211, "lr": 0.0003998528006757965, "tps": 12760, "wall": 7092.4} {"step": 1381, "train_loss": 4.568838596343994, "lr": 0.0003998520250294317, "tps": 12760, "wall": 7097.6} {"step": 1382, "train_loss": 4.5660247802734375, "lr": 0.00039985124734569336, "tps": 12760, "wall": 7102.9} {"step": 1383, "train_loss": 4.492321968078613, "lr": 0.0003998504676245903, "tps": 12760, "wall": 7108.3} {"step": 1384, "train_loss": 4.593102931976318, "lr": 0.0003998496858661315, "tps": 12759, "wall": 7113.5} {"step": 1385, "train_loss": 4.608883380889893, "lr": 0.0003998489020703257, "tps": 12759, "wall": 7118.8} {"step": 1386, "train_loss": 4.673956394195557, "lr": 0.0003998481162371818, "tps": 12759, "wall": 7124.1} {"step": 1387, "train_loss": 4.517642498016357, "lr": 0.0003998473283667087, "tps": 12759, "wall": 7129.4} {"step": 1388, "train_loss": 4.676481246948242, "lr": 0.00039984653845891535, "tps": 12758, "wall": 7134.6} {"step": 1389, "train_loss": 4.566210746765137, "lr": 0.0003998457465138107, "tps": 12758, "wall": 7139.9} {"step": 1390, "train_loss": 4.630331039428711, "lr": 0.0003998449525314037, "tps": 12758, "wall": 7145.2} {"step": 1391, "train_loss": 4.569022178649902, "lr": 0.0003998441565117033, "tps": 12758, "wall": 7150.4} {"step": 1392, "train_loss": 4.5280351638793945, "lr": 0.0003998433584547186, "tps": 12757, "wall": 7155.7} {"step": 1393, "train_loss": 4.590216159820557, "lr": 0.00039984255836045864, "tps": 12757, "wall": 7161.0} {"step": 1394, "train_loss": 4.546241760253906, "lr": 0.00039984175622893235, "tps": 12757, "wall": 7166.3} {"step": 1395, "train_loss": 4.547207832336426, "lr": 0.000399840952060149, "tps": 12757, "wall": 7171.5} {"step": 1396, "train_loss": 4.570201873779297, "lr": 0.00039984014585411757, "tps": 12756, "wall": 7176.8} {"step": 1397, "train_loss": 4.536874771118164, "lr": 0.00039983933761084724, "tps": 12756, "wall": 7182.1} {"step": 1398, "train_loss": 4.555885314941406, "lr": 0.0003998385273303472, "tps": 12756, "wall": 7187.3} {"step": 1399, "train_loss": 4.556177139282227, "lr": 0.00039983771501262664, "tps": 12756, "wall": 7192.6} {"step": 1400, "train_loss": 4.5600080490112305, "lr": 0.0003998369006576946, "tps": 12756, "wall": 7197.8} {"step": 1401, "train_loss": 4.529140949249268, "lr": 0.0003998360842655605, "tps": 12755, "wall": 7203.1} {"step": 1402, "train_loss": 4.578239917755127, "lr": 0.0003998352658362335, "tps": 12755, "wall": 7208.4} {"step": 1403, "train_loss": 4.511876106262207, "lr": 0.0003998344453697228, "tps": 12755, "wall": 7213.6} {"step": 1404, "train_loss": 4.524331092834473, "lr": 0.0003998336228660379, "tps": 12755, "wall": 7218.8} {"step": 1405, "train_loss": 4.460886001586914, "lr": 0.0003998327983251879, "tps": 12754, "wall": 7224.2} {"step": 1406, "train_loss": 4.490845203399658, "lr": 0.00039983197174718225, "tps": 12754, "wall": 7229.4} {"step": 1407, "train_loss": 4.64471435546875, "lr": 0.00039983114313203033, "tps": 12754, "wall": 7234.7} {"step": 1408, "train_loss": 4.513208389282227, "lr": 0.00039983031247974146, "tps": 12754, "wall": 7240.0} {"step": 1409, "train_loss": 4.5252580642700195, "lr": 0.0003998294797903251, "tps": 12754, "wall": 7245.2} {"step": 1410, "train_loss": 4.623366355895996, "lr": 0.00039982864506379065, "tps": 12753, "wall": 7250.4} {"step": 1411, "train_loss": 4.646259307861328, "lr": 0.0003998278083001476, "tps": 12753, "wall": 7255.8} {"step": 1412, "train_loss": 4.454761028289795, "lr": 0.0003998269694994054, "tps": 12753, "wall": 7261.1} {"step": 1413, "train_loss": 4.579720497131348, "lr": 0.0003998261286615735, "tps": 12753, "wall": 7266.3} {"step": 1414, "train_loss": 4.508602619171143, "lr": 0.00039982528578666156, "tps": 12752, "wall": 7271.7} {"step": 1415, "train_loss": 4.578019618988037, "lr": 0.000399824440874679, "tps": 12752, "wall": 7277.1} {"step": 1001, "train_loss": 4.946249961853027, "lr": 0.00039999999898047517, "tps": 14000075, "wall": 4.7} {"step": 1002, "train_loss": 4.988781452178955, "lr": 0.00039999999592190056, "tps": 7412272, "wall": 8.9} {"step": 1003, "train_loss": 4.899431228637695, "lr": 0.00039999999082427625, "tps": 5007761, "wall": 13.1} {"step": 1004, "train_loss": 5.062699317932129, "lr": 0.00039999998368760235, "tps": 3748306, "wall": 17.6} {"step": 1005, "train_loss": 4.930610179901123, "lr": 0.0003999999745118789, "tps": 2989892, "wall": 22.1} {"step": 1006, "train_loss": 5.0265793800354, "lr": 0.00039999996329710593, "tps": 2481824, "wall": 26.6} {"step": 1007, "train_loss": 4.952437400817871, "lr": 0.00039999995004328374, "tps": 2119993, "wall": 31.2} {"step": 1008, "train_loss": 5.096253871917725, "lr": 0.0003999999347504123, "tps": 1851745, "wall": 35.7} {"step": 1009, "train_loss": 4.990782737731934, "lr": 0.00039999991741849187, "tps": 1643579, "wall": 40.3} {"step": 1010, "train_loss": 5.021570682525635, "lr": 0.0003999998980475227, "tps": 1476526, "wall": 44.9} {"step": 1011, "train_loss": 4.929018497467041, "lr": 0.00039999987663750483, "tps": 1340620, "wall": 49.5} {"step": 1012, "train_loss": 4.992334365844727, "lr": 0.0003999998531884387, "tps": 1227545, "wall": 54.1} {"step": 1013, "train_loss": 4.950827121734619, "lr": 0.00039999982770032446, "tps": 1132264, "wall": 58.7} {"step": 1014, "train_loss": 4.974678993225098, "lr": 0.0003999998001731625, "tps": 1050477, "wall": 63.3} {"step": 1015, "train_loss": 5.053749084472656, "lr": 0.00039999977060695304, "tps": 980229, "wall": 67.9} {"step": 1016, "train_loss": 4.959734916687012, "lr": 0.00039999973900169643, "tps": 918570, "wall": 72.6} {"step": 1017, "train_loss": 4.905055522918701, "lr": 0.000399999705357393, "tps": 864374, "wall": 77.2} {"step": 1018, "train_loss": 5.016406536102295, "lr": 0.0003999996696740432, "tps": 816512, "wall": 81.8} {"step": 1019, "train_loss": 4.97929573059082, "lr": 0.00039999963195164743, "tps": 773229, "wall": 86.5} {"step": 1020, "train_loss": 4.978377819061279, "lr": 0.0003999995921902061, "tps": 734554, "wall": 91.1} {"step": 1021, "train_loss": 5.0283684730529785, "lr": 0.0003999995503897196, "tps": 699720, "wall": 95.7} {"step": 1022, "train_loss": 5.0132317543029785, "lr": 0.0003999995065501884, "tps": 667972, "wall": 100.4} {"step": 1023, "train_loss": 4.997824192047119, "lr": 0.00039999946067161316, "tps": 639129, "wall": 105.0} {"step": 1024, "train_loss": 4.897250175476074, "lr": 0.0003999994127539943, "tps": 612517, "wall": 109.7} {"step": 1025, "train_loss": 4.909379959106445, "lr": 0.0003999993627973323, "tps": 588144, "wall": 114.3} {"step": 1026, "train_loss": 4.96248722076416, "lr": 0.0003999993108016278, "tps": 565602, "wall": 119.0} {"step": 1027, "train_loss": 5.032212257385254, "lr": 0.00039999925676688136, "tps": 544785, "wall": 123.7} {"step": 1028, "train_loss": 5.049559593200684, "lr": 0.0003999992006930936, "tps": 525492, "wall": 128.3} {"step": 1029, "train_loss": 4.955166339874268, "lr": 0.00039999914258026514, "tps": 507523, "wall": 133.0} {"step": 1030, "train_loss": 4.95694637298584, "lr": 0.0003999990824283967, "tps": 490755, "wall": 137.7} {"step": 1031, "train_loss": 4.881662845611572, "lr": 0.0003999990202374889, "tps": 474999, "wall": 142.4} {"step": 1032, "train_loss": 4.9904046058654785, "lr": 0.0003999989560075425, "tps": 460200, "wall": 147.1} {"step": 1033, "train_loss": 4.957696914672852, "lr": 0.0003999988897385581, "tps": 446455, "wall": 151.8} {"step": 1034, "train_loss": 4.857043743133545, "lr": 0.0003999988214305366, "tps": 433505, "wall": 156.5} {"step": 1035, "train_loss": 4.997043609619141, "lr": 0.0003999987510834787, "tps": 421293, "wall": 161.2} {"step": 1036, "train_loss": 4.952486038208008, "lr": 0.00039999867869738517, "tps": 409753, "wall": 165.9} {"step": 1037, "train_loss": 4.999503135681152, "lr": 0.0003999986042722569, "tps": 398854, "wall": 170.6} {"step": 1038, "train_loss": 4.901011943817139, "lr": 0.0003999985278080947, "tps": 388495, "wall": 175.3} {"step": 1039, "train_loss": 4.843657970428467, "lr": 0.0003999984493048995, "tps": 378710, "wall": 180.0} {"step": 1040, "train_loss": 4.932975769042969, "lr": 0.000399998368762672, "tps": 369390, "wall": 184.7} {"step": 1041, "train_loss": 4.873388767242432, "lr": 0.00039999828618141335, "tps": 360549, "wall": 189.4} {"step": 1042, "train_loss": 4.966788291931152, "lr": 0.0003999982015611244, "tps": 352120, "wall": 194.1} {"step": 1043, "train_loss": 4.846796989440918, "lr": 0.000399998114901806, "tps": 344084, "wall": 198.8} {"step": 1044, "train_loss": 4.999252796173096, "lr": 0.00039999802620345926, "tps": 336443, "wall": 203.6} {"step": 1045, "train_loss": 4.871524810791016, "lr": 0.0003999979354660851, "tps": 329071, "wall": 208.3} {"step": 1046, "train_loss": 4.932421684265137, "lr": 0.0003999978426896846, "tps": 322070, "wall": 213.0} {"step": 1047, "train_loss": 4.808749675750732, "lr": 0.00039999774787425886, "tps": 315344, "wall": 217.8} {"step": 1048, "train_loss": 5.033149719238281, "lr": 0.00039999765101980883, "tps": 308951, "wall": 222.5} {"step": 1049, "train_loss": 4.972644805908203, "lr": 0.00039999755212633567, "tps": 302825, "wall": 227.2} {"step": 1050, "train_loss": 4.88274621963501, "lr": 0.0003999974511938405, "tps": 296590, "wall": 232.2} {"step": 1051, "train_loss": 4.87001895904541, "lr": 0.00039999734822232454, "tps": 290886, "wall": 237.0} {"step": 1052, "train_loss": 4.963575839996338, "lr": 0.00039999724321178884, "tps": 285322, "wall": 241.9} {"step": 1053, "train_loss": 5.012842655181885, "lr": 0.0003999971361622346, "tps": 279969, "wall": 246.7} {"step": 1054, "train_loss": 4.928402900695801, "lr": 0.0003999970270736631, "tps": 274969, "wall": 251.4} {"step": 1055, "train_loss": 4.9027910232543945, "lr": 0.00039999691594607556, "tps": 270040, "wall": 256.3} {"step": 1056, "train_loss": 4.8687825202941895, "lr": 0.0003999968027794731, "tps": 265236, "wall": 261.2} {"step": 1057, "train_loss": 4.903493881225586, "lr": 0.00039999668757385724, "tps": 260668, "wall": 266.0} {"step": 1058, "train_loss": 4.938985824584961, "lr": 0.0003999965703292291, "tps": 256308, "wall": 270.8} {"step": 1059, "train_loss": 4.900143146514893, "lr": 0.00039999645104559016, "tps": 252106, "wall": 275.6} {"step": 1060, "train_loss": 5.011448860168457, "lr": 0.0003999963297229416, "tps": 248034, "wall": 280.3} {"step": 1061, "train_loss": 4.954051494598389, "lr": 0.00039999620636128495, "tps": 244045, "wall": 285.2} {"step": 1062, "train_loss": 4.920457363128662, "lr": 0.00039999608096062146, "tps": 240233, "wall": 290.0} {"step": 1063, "train_loss": 4.993807315826416, "lr": 0.0003999959535209527, "tps": 236530, "wall": 294.8} {"step": 1064, "train_loss": 4.90762996673584, "lr": 0.00039999582404228, "tps": 232897, "wall": 299.7} {"step": 1065, "train_loss": 4.837579727172852, "lr": 0.0003999956925246048, "tps": 229365, "wall": 304.6} {"step": 1066, "train_loss": 4.969509124755859, "lr": 0.0003999955589679288, "tps": 225992, "wall": 309.4} {"step": 1067, "train_loss": 4.937496185302734, "lr": 0.00039999542337225327, "tps": 222708, "wall": 314.3} {"step": 1068, "train_loss": 4.847822189331055, "lr": 0.0003999952857375799, "tps": 219515, "wall": 319.1} {"step": 1069, "train_loss": 4.867393493652344, "lr": 0.00039999514606391015, "tps": 216377, "wall": 324.1} {"step": 1070, "train_loss": 4.997208595275879, "lr": 0.00039999500435124565, "tps": 213282, "wall": 329.1} {"step": 1071, "train_loss": 4.913311004638672, "lr": 0.00039999486059958805, "tps": 210341, "wall": 334.0} {"step": 1072, "train_loss": 4.851856708526611, "lr": 0.0003999947148089389, "tps": 207499, "wall": 338.9} {"step": 1073, "train_loss": 4.922671318054199, "lr": 0.0003999945669792999, "tps": 204719, "wall": 343.8} {"step": 1074, "train_loss": 4.811698913574219, "lr": 0.0003999944171106727, "tps": 202017, "wall": 348.7} {"step": 1075, "train_loss": 4.950202941894531, "lr": 0.000399994265203059, "tps": 199380, "wall": 353.7} {"step": 1076, "train_loss": 4.942966461181641, "lr": 0.0003999941112564605, "tps": 196874, "wall": 358.5} {"step": 1077, "train_loss": 4.882843971252441, "lr": 0.000399993955270879, "tps": 194423, "wall": 363.4} {"step": 1078, "train_loss": 5.0107645988464355, "lr": 0.00039999379724631624, "tps": 192032, "wall": 368.2} {"step": 1079, "train_loss": 5.014845848083496, "lr": 0.000399993637182774, "tps": 189703, "wall": 373.1} {"step": 1080, "train_loss": 4.770176410675049, "lr": 0.00039999347508025407, "tps": 187437, "wall": 378.0} {"step": 1081, "train_loss": 4.858062267303467, "lr": 0.00039999331093875843, "tps": 185224, "wall": 382.8} {"step": 1082, "train_loss": 4.890530109405518, "lr": 0.0003999931447582887, "tps": 183047, "wall": 387.7} {"step": 1083, "train_loss": 4.891350269317627, "lr": 0.0003999929765388469, "tps": 180941, "wall": 392.6} {"step": 1084, "train_loss": 4.895115375518799, "lr": 0.00039999280628043494, "tps": 178868, "wall": 397.5} {"step": 1085, "train_loss": 4.9148945808410645, "lr": 0.00039999263398305475, "tps": 176807, "wall": 402.5} {"step": 1086, "train_loss": 4.880542278289795, "lr": 0.0003999924596467083, "tps": 174777, "wall": 407.6} {"step": 1087, "train_loss": 4.833627223968506, "lr": 0.0003999922832713975, "tps": 172798, "wall": 412.6} {"step": 1088, "train_loss": 4.919712543487549, "lr": 0.0003999921048571244, "tps": 170897, "wall": 417.6} {"step": 1089, "train_loss": 4.935518264770508, "lr": 0.00039999192440389093, "tps": 169024, "wall": 422.6} {"step": 1090, "train_loss": 4.863096237182617, "lr": 0.0003999917419116992, "tps": 167193, "wall": 427.6} {"step": 1091, "train_loss": 4.8575358390808105, "lr": 0.00039999155738055137, "tps": 165415, "wall": 432.6} {"step": 1092, "train_loss": 4.866370677947998, "lr": 0.00039999137081044944, "tps": 163661, "wall": 437.7} {"step": 1093, "train_loss": 4.8623433113098145, "lr": 0.00039999118220139545, "tps": 161956, "wall": 442.7} {"step": 1094, "train_loss": 4.871519088745117, "lr": 0.0003999909915533916, "tps": 160254, "wall": 447.8} {"step": 1095, "train_loss": 4.8419389724731445, "lr": 0.00039999079886644015, "tps": 158601, "wall": 452.9} {"step": 1096, "train_loss": 4.815539360046387, "lr": 0.00039999060414054317, "tps": 156997, "wall": 457.9} {"step": 1097, "train_loss": 4.812204360961914, "lr": 0.0003999904073757028, "tps": 155398, "wall": 463.1} {"step": 1098, "train_loss": 4.8817901611328125, "lr": 0.0003999902085719215, "tps": 153869, "wall": 468.1} {"step": 1099, "train_loss": 4.874334812164307, "lr": 0.00039999000772920126, "tps": 152370, "wall": 473.1} {"step": 1100, "train_loss": 4.863745212554932, "lr": 0.00039998980484754447, "tps": 150895, "wall": 478.2} {"step": 1101, "train_loss": 4.727312088012695, "lr": 0.0003999895999269535, "tps": 149453, "wall": 483.2} {"step": 1102, "train_loss": 4.808712482452393, "lr": 0.0003999893929674306, "tps": 148029, "wall": 488.3} {"step": 1103, "train_loss": 4.786268711090088, "lr": 0.0003999891839689781, "tps": 146643, "wall": 493.4} {"step": 1104, "train_loss": 4.849895000457764, "lr": 0.00039998897293159834, "tps": 145277, "wall": 498.5} {"step": 1105, "train_loss": 4.875755310058594, "lr": 0.0003999887598552938, "tps": 143873, "wall": 503.8} {"step": 1106, "train_loss": 4.929468154907227, "lr": 0.0003999885447400669, "tps": 142520, "wall": 509.0} {"step": 1107, "train_loss": 4.831131458282471, "lr": 0.00039998832758592, "tps": 141198, "wall": 514.3} {"step": 1108, "train_loss": 4.8796820640563965, "lr": 0.00039998810839285556, "tps": 139913, "wall": 519.5} {"step": 1109, "train_loss": 4.830845355987549, "lr": 0.0003999878871608761, "tps": 138618, "wall": 524.8} {"step": 1110, "train_loss": 4.85062313079834, "lr": 0.00039998766388998414, "tps": 137359, "wall": 530.1} {"step": 1111, "train_loss": 4.8187665939331055, "lr": 0.00039998743858018213, "tps": 136149, "wall": 535.3} {"step": 1001, "train_loss": 4.946249961853027, "lr": 0.00039999999898047517, "tps": 14002636, "wall": 4.7} {"step": 1002, "train_loss": 4.988781452178955, "lr": 0.00039999999592190056, "tps": 7384559, "wall": 8.9} {"step": 1003, "train_loss": 4.899431228637695, "lr": 0.00039999999082427625, "tps": 4999171, "wall": 13.2} {"step": 1004, "train_loss": 5.062699317932129, "lr": 0.00039999998368760235, "tps": 3757249, "wall": 17.5} {"step": 1005, "train_loss": 4.930610179901123, "lr": 0.0003999999745118789, "tps": 2998911, "wall": 22.0} {"step": 1006, "train_loss": 5.0265793800354, "lr": 0.00039999996329710593, "tps": 2492693, "wall": 26.5} {"step": 1007, "train_loss": 4.952437400817871, "lr": 0.00039999995004328374, "tps": 2131809, "wall": 31.0} {"step": 1008, "train_loss": 5.096253871917725, "lr": 0.0003999999347504123, "tps": 1862121, "wall": 35.5} {"step": 1009, "train_loss": 4.990782737731934, "lr": 0.00039999991741849187, "tps": 1652753, "wall": 40.0} {"step": 1010, "train_loss": 5.021570682525635, "lr": 0.0003999998980475227, "tps": 1485330, "wall": 44.6} {"step": 1011, "train_loss": 4.929018497467041, "lr": 0.00039999987663750483, "tps": 1348755, "wall": 49.2} {"step": 1012, "train_loss": 4.992334365844727, "lr": 0.0003999998531884387, "tps": 1234272, "wall": 53.8} {"step": 1013, "train_loss": 4.950827121734619, "lr": 0.00039999982770032446, "tps": 1138439, "wall": 58.4} {"step": 1014, "train_loss": 4.974678993225098, "lr": 0.0003999998001731625, "tps": 1056282, "wall": 63.0} {"step": 1015, "train_loss": 5.053749084472656, "lr": 0.00039999977060695304, "tps": 985525, "wall": 67.6} {"step": 1016, "train_loss": 4.959734916687012, "lr": 0.00039999973900169643, "tps": 923565, "wall": 72.2} {"step": 1017, "train_loss": 4.905055522918701, "lr": 0.000399999705357393, "tps": 868998, "wall": 76.8} {"step": 1018, "train_loss": 5.016406536102295, "lr": 0.0003999996696740432, "tps": 820558, "wall": 81.4} {"step": 1019, "train_loss": 4.97929573059082, "lr": 0.00039999963195164743, "tps": 777181, "wall": 86.0} {"step": 1020, "train_loss": 4.978377819061279, "lr": 0.0003999995921902061, "tps": 738303, "wall": 90.6} {"step": 1021, "train_loss": 5.0283684730529785, "lr": 0.0003999995503897196, "tps": 703186, "wall": 95.2} {"step": 1022, "train_loss": 5.0132317543029785, "lr": 0.0003999995065501884, "tps": 671256, "wall": 99.9} {"step": 1023, "train_loss": 4.997824192047119, "lr": 0.00039999946067161316, "tps": 642183, "wall": 104.5} {"step": 1024, "train_loss": 4.897250175476074, "lr": 0.0003999994127539943, "tps": 615541, "wall": 109.1} {"step": 1025, "train_loss": 4.909379959106445, "lr": 0.0003999993627973323, "tps": 590743, "wall": 113.8} {"step": 1026, "train_loss": 4.96248722076416, "lr": 0.0003999993108016278, "tps": 568160, "wall": 118.5} {"step": 1027, "train_loss": 5.032212257385254, "lr": 0.00039999925676688136, "tps": 547264, "wall": 123.1} {"step": 1028, "train_loss": 5.049559593200684, "lr": 0.0003999992006930936, "tps": 527762, "wall": 127.8} {"step": 1029, "train_loss": 4.955166339874268, "lr": 0.00039999914258026514, "tps": 509763, "wall": 132.4} {"step": 1030, "train_loss": 4.95694637298584, "lr": 0.0003999990824283967, "tps": 492969, "wall": 137.1} {"step": 1031, "train_loss": 4.881662845611572, "lr": 0.0003999990202374889, "tps": 477272, "wall": 141.7} {"step": 1032, "train_loss": 4.9904046058654785, "lr": 0.0003999989560075425, "tps": 462560, "wall": 146.4} {"step": 1033, "train_loss": 4.957696914672852, "lr": 0.0003999988897385581, "tps": 448723, "wall": 151.0} {"step": 1034, "train_loss": 4.857043743133545, "lr": 0.0003999988214305366, "tps": 435715, "wall": 155.7} {"step": 1035, "train_loss": 4.997043609619141, "lr": 0.0003999987510834787, "tps": 423499, "wall": 160.3} {"step": 1036, "train_loss": 4.952486038208008, "lr": 0.00039999867869738517, "tps": 411952, "wall": 165.0} {"step": 1037, "train_loss": 4.999503135681152, "lr": 0.0003999986042722569, "tps": 401044, "wall": 169.6} {"step": 1038, "train_loss": 4.901011943817139, "lr": 0.0003999985278080947, "tps": 390531, "wall": 174.4} {"step": 1039, "train_loss": 4.843657970428467, "lr": 0.0003999984493048995, "tps": 380695, "wall": 179.0} {"step": 1040, "train_loss": 4.932975769042969, "lr": 0.000399998368762672, "tps": 371376, "wall": 183.7} {"step": 1041, "train_loss": 4.873388767242432, "lr": 0.00039999828618141335, "tps": 362524, "wall": 188.4} {"step": 1042, "train_loss": 4.966788291931152, "lr": 0.0003999982015611244, "tps": 354080, "wall": 193.0} {"step": 1043, "train_loss": 4.846796989440918, "lr": 0.000399998114901806, "tps": 346045, "wall": 197.7} {"step": 1044, "train_loss": 4.999252796173096, "lr": 0.00039999802620345926, "tps": 338336, "wall": 202.4} {"step": 1045, "train_loss": 4.871524810791016, "lr": 0.0003999979354660851, "tps": 331023, "wall": 207.1} {"step": 1046, "train_loss": 4.932421684265137, "lr": 0.0003999978426896846, "tps": 324021, "wall": 211.8} {"step": 1047, "train_loss": 4.808749675750732, "lr": 0.00039999774787425886, "tps": 317317, "wall": 216.4} {"step": 1048, "train_loss": 5.033149719238281, "lr": 0.00039999765101980883, "tps": 310891, "wall": 221.1} {"step": 1049, "train_loss": 4.972644805908203, "lr": 0.00039999755212633567, "tps": 304727, "wall": 225.8} {"step": 1050, "train_loss": 4.88274621963501, "lr": 0.0003999974511938405, "tps": 298807, "wall": 230.5} {"step": 1051, "train_loss": 4.87001895904541, "lr": 0.00039999734822232454, "tps": 293034, "wall": 235.3} {"step": 1052, "train_loss": 4.963575839996338, "lr": 0.00039999724321178884, "tps": 287595, "wall": 240.0} {"step": 1053, "train_loss": 5.012842655181885, "lr": 0.0003999971361622346, "tps": 282341, "wall": 244.7} {"step": 1054, "train_loss": 4.928402900695801, "lr": 0.0003999970270736631, "tps": 277292, "wall": 249.3} {"step": 1055, "train_loss": 4.9027910232543945, "lr": 0.00039999691594607556, "tps": 272419, "wall": 254.0} {"step": 1056, "train_loss": 4.8687825202941895, "lr": 0.0003999968027794731, "tps": 267699, "wall": 258.8} {"step": 1057, "train_loss": 4.903493881225586, "lr": 0.00039999668757385724, "tps": 263176, "wall": 263.5} {"step": 1058, "train_loss": 4.938985824584961, "lr": 0.0003999965703292291, "tps": 258800, "wall": 268.2} {"step": 1059, "train_loss": 4.900143146514893, "lr": 0.00039999645104559016, "tps": 254572, "wall": 272.9} {"step": 1060, "train_loss": 5.011448860168457, "lr": 0.0003999963297229416, "tps": 250488, "wall": 277.6} {"step": 1061, "train_loss": 4.954051494598389, "lr": 0.00039999620636128495, "tps": 246541, "wall": 282.3} {"step": 1062, "train_loss": 4.920457363128662, "lr": 0.00039999608096062146, "tps": 242722, "wall": 287.0} {"step": 1063, "train_loss": 4.993807315826416, "lr": 0.0003999959535209527, "tps": 238964, "wall": 291.8} {"step": 1064, "train_loss": 4.90762996673584, "lr": 0.00039999582404228, "tps": 235401, "wall": 296.5} {"step": 1065, "train_loss": 4.837579727172852, "lr": 0.0003999956925246048, "tps": 231931, "wall": 301.2} {"step": 1066, "train_loss": 4.969509124755859, "lr": 0.0003999955589679288, "tps": 228566, "wall": 305.9} {"step": 1067, "train_loss": 4.937496185302734, "lr": 0.00039999542337225327, "tps": 225316, "wall": 310.6} {"step": 1068, "train_loss": 4.847822189331055, "lr": 0.0003999952857375799, "tps": 222148, "wall": 315.4} {"step": 1069, "train_loss": 4.867393493652344, "lr": 0.00039999514606391015, "tps": 219075, "wall": 320.1} {"step": 1070, "train_loss": 4.997208595275879, "lr": 0.00039999500435124565, "tps": 216083, "wall": 324.8} {"step": 1071, "train_loss": 4.913311004638672, "lr": 0.00039999486059958805, "tps": 213185, "wall": 329.5} {"step": 1072, "train_loss": 4.851856708526611, "lr": 0.0003999947148089389, "tps": 210362, "wall": 334.3} {"step": 1073, "train_loss": 4.922671318054199, "lr": 0.0003999945669792999, "tps": 207626, "wall": 339.0} {"step": 1074, "train_loss": 4.811698913574219, "lr": 0.0003999944171106727, "tps": 204971, "wall": 343.7} {"step": 1075, "train_loss": 4.950202941894531, "lr": 0.000399994265203059, "tps": 202384, "wall": 348.4} {"step": 1076, "train_loss": 4.942966461181641, "lr": 0.0003999941112564605, "tps": 199828, "wall": 353.2} {"step": 1077, "train_loss": 4.882843971252441, "lr": 0.000399993955270879, "tps": 197362, "wall": 358.0} {"step": 1078, "train_loss": 5.0107645988464355, "lr": 0.00039999379724631624, "tps": 194962, "wall": 362.7} {"step": 1079, "train_loss": 5.014845848083496, "lr": 0.000399993637182774, "tps": 192623, "wall": 367.4} {"step": 1080, "train_loss": 4.770176410675049, "lr": 0.00039999347508025407, "tps": 190353, "wall": 372.2} {"step": 1081, "train_loss": 4.858062267303467, "lr": 0.00039999331093875843, "tps": 188137, "wall": 376.9} {"step": 1082, "train_loss": 4.890530109405518, "lr": 0.0003999931447582887, "tps": 185979, "wall": 381.6} {"step": 1083, "train_loss": 4.891350269317627, "lr": 0.0003999929765388469, "tps": 183871, "wall": 386.4} {"step": 1084, "train_loss": 4.895115375518799, "lr": 0.00039999280628043494, "tps": 181808, "wall": 391.1} {"step": 1085, "train_loss": 4.9148945808410645, "lr": 0.00039999263398305475, "tps": 179800, "wall": 395.8} {"step": 1086, "train_loss": 4.880542278289795, "lr": 0.0003999924596467083, "tps": 177836, "wall": 400.6} {"step": 1087, "train_loss": 4.833627223968506, "lr": 0.0003999922832713975, "tps": 175919, "wall": 405.3} {"step": 1088, "train_loss": 4.919712543487549, "lr": 0.0003999921048571244, "tps": 174039, "wall": 410.1} {"step": 1089, "train_loss": 4.935518264770508, "lr": 0.00039999192440389093, "tps": 172180, "wall": 414.9} {"step": 1090, "train_loss": 4.863096237182617, "lr": 0.0003999917419116992, "tps": 170395, "wall": 419.6} {"step": 1091, "train_loss": 4.8575358390808105, "lr": 0.00039999155738055137, "tps": 168639, "wall": 424.4} {"step": 1092, "train_loss": 4.866370677947998, "lr": 0.00039999137081044944, "tps": 166925, "wall": 429.1} {"step": 1093, "train_loss": 4.8623433113098145, "lr": 0.00039999118220139545, "tps": 165247, "wall": 433.9} {"step": 1094, "train_loss": 4.871519088745117, "lr": 0.0003999909915533916, "tps": 163605, "wall": 438.6} {"step": 1095, "train_loss": 4.8419389724731445, "lr": 0.00039999079886644015, "tps": 161998, "wall": 443.4} {"step": 1096, "train_loss": 4.815539360046387, "lr": 0.00039999060414054317, "tps": 160427, "wall": 448.1} {"step": 1097, "train_loss": 4.812204360961914, "lr": 0.0003999904073757028, "tps": 158890, "wall": 452.9} {"step": 1098, "train_loss": 4.8817901611328125, "lr": 0.0003999902085719215, "tps": 157383, "wall": 457.6} {"step": 1099, "train_loss": 4.874334812164307, "lr": 0.00039999000772920126, "tps": 155903, "wall": 462.4} {"step": 1100, "train_loss": 4.863745212554932, "lr": 0.00039998980484754447, "tps": 154453, "wall": 467.2} {"step": 1101, "train_loss": 4.727312088012695, "lr": 0.0003999895999269535, "tps": 153008, "wall": 472.0} {"step": 1102, "train_loss": 4.808712482452393, "lr": 0.0003999893929674306, "tps": 151614, "wall": 476.8} {"step": 1103, "train_loss": 4.786268711090088, "lr": 0.0003999891839689781, "tps": 150248, "wall": 481.5} {"step": 1104, "train_loss": 4.849895000457764, "lr": 0.00039998897293159834, "tps": 148901, "wall": 486.3} {"step": 1105, "train_loss": 4.875755310058594, "lr": 0.0003999887598552938, "tps": 147580, "wall": 491.1} {"step": 1106, "train_loss": 4.929468154907227, "lr": 0.0003999885447400669, "tps": 146286, "wall": 495.9} {"step": 1107, "train_loss": 4.831131458282471, "lr": 0.00039998832758592, "tps": 145009, "wall": 500.8} {"step": 1108, "train_loss": 4.8796820640563965, "lr": 0.00039998810839285556, "tps": 143753, "wall": 505.6} {"step": 1109, "train_loss": 4.830845355987549, "lr": 0.0003999878871608761, "tps": 142529, "wall": 510.4} {"step": 1110, "train_loss": 4.85062313079834, "lr": 0.00039998766388998414, "tps": 141317, "wall": 515.2} {"step": 1111, "train_loss": 4.8187665939331055, "lr": 0.00039998743858018213, "tps": 140140, "wall": 520.0} {"step": 1112, "train_loss": 4.8372883796691895, "lr": 0.0003999872112314727, "tps": 138988, "wall": 524.8} {"step": 1113, "train_loss": 4.8739824295043945, "lr": 0.00039998698184385846, "tps": 137849, "wall": 529.6} {"step": 1114, "train_loss": 4.776785850524902, "lr": 0.00039998675041734194, "tps": 136724, "wall": 534.5} {"step": 1115, "train_loss": 4.842484951019287, "lr": 0.0003999865169519257, "tps": 135628, "wall": 539.3} {"step": 1116, "train_loss": 4.776174545288086, "lr": 0.0003999862814476125, "tps": 134553, "wall": 544.0} {"step": 1117, "train_loss": 4.829901695251465, "lr": 0.00039998604390440503, "tps": 133496, "wall": 548.8} {"step": 1118, "train_loss": 4.788071632385254, "lr": 0.00039998580432230586, "tps": 132456, "wall": 553.7} {"step": 1119, "train_loss": 4.8868207931518555, "lr": 0.00039998556270131767, "tps": 131432, "wall": 558.5} {"step": 1120, "train_loss": 4.878384113311768, "lr": 0.0003999853190414434, "tps": 130426, "wall": 563.3} {"step": 1121, "train_loss": 4.833227157592773, "lr": 0.0003999850733426857, "tps": 129438, "wall": 568.1} {"step": 1122, "train_loss": 4.847841262817383, "lr": 0.00039998482560504737, "tps": 128466, "wall": 572.9} {"step": 1123, "train_loss": 4.861566066741943, "lr": 0.00039998457582853116, "tps": 127509, "wall": 577.7} {"step": 1124, "train_loss": 4.829439640045166, "lr": 0.0003999843240131399, "tps": 126572, "wall": 582.5} {"step": 1125, "train_loss": 4.8038458824157715, "lr": 0.0003999840701588765, "tps": 125650, "wall": 587.3} {"step": 1126, "train_loss": 4.851208209991455, "lr": 0.00039998381426574383, "tps": 124729, "wall": 592.2} {"step": 1127, "train_loss": 4.830570220947266, "lr": 0.00039998355633374483, "tps": 123839, "wall": 596.9} {"step": 1128, "train_loss": 4.761490345001221, "lr": 0.00039998329636288234, "tps": 122957, "wall": 601.8} {"step": 1129, "train_loss": 4.825746059417725, "lr": 0.00039998303435315923, "tps": 122091, "wall": 606.6} {"step": 1130, "train_loss": 4.8517866134643555, "lr": 0.0003999827703045787, "tps": 121236, "wall": 611.4} {"step": 1131, "train_loss": 4.834341526031494, "lr": 0.0003999825042171435, "tps": 120397, "wall": 616.2} {"step": 1132, "train_loss": 4.9035539627075195, "lr": 0.0003999822360908569, "tps": 119567, "wall": 621.0} {"step": 1133, "train_loss": 4.754521369934082, "lr": 0.0003999819659257217, "tps": 118747, "wall": 625.8} {"step": 1134, "train_loss": 4.744677543640137, "lr": 0.00039998169372174107, "tps": 117942, "wall": 630.7} {"step": 1135, "train_loss": 4.707732200622559, "lr": 0.00039998141947891806, "tps": 117152, "wall": 635.5} {"step": 1136, "train_loss": 4.960798263549805, "lr": 0.00039998114319725575, "tps": 116374, "wall": 640.3} {"step": 1137, "train_loss": 4.850599765777588, "lr": 0.00039998086487675737, "tps": 115606, "wall": 645.1} {"step": 1138, "train_loss": 4.752962589263916, "lr": 0.000399980584517426, "tps": 114852, "wall": 649.9} {"step": 1139, "train_loss": 4.86557149887085, "lr": 0.00039998030211926486, "tps": 114102, "wall": 654.8} {"step": 1140, "train_loss": 4.703927516937256, "lr": 0.0003999800176822771, "tps": 113370, "wall": 659.6} {"step": 1141, "train_loss": 4.795825481414795, "lr": 0.000399979731206466, "tps": 112647, "wall": 664.4} {"step": 1142, "train_loss": 4.80592155456543, "lr": 0.00039997944269183476, "tps": 111934, "wall": 669.2} {"step": 1143, "train_loss": 4.903641223907471, "lr": 0.0003999791521383866, "tps": 111228, "wall": 674.0} {"step": 1144, "train_loss": 4.882521152496338, "lr": 0.00039997885954612487, "tps": 110533, "wall": 678.9} {"step": 1145, "train_loss": 4.8396806716918945, "lr": 0.00039997856491505294, "tps": 109851, "wall": 683.7} {"step": 1146, "train_loss": 4.711197853088379, "lr": 0.00039997826824517406, "tps": 109176, "wall": 688.5} {"step": 1147, "train_loss": 4.744325160980225, "lr": 0.0003999779695364916, "tps": 108509, "wall": 693.4} {"step": 1148, "train_loss": 4.759660243988037, "lr": 0.000399977668789009, "tps": 107852, "wall": 698.2} {"step": 1149, "train_loss": 4.759189605712891, "lr": 0.00039997736600272957, "tps": 107204, "wall": 703.0} {"step": 1150, "train_loss": 4.645319938659668, "lr": 0.0003999770611776569, "tps": 106566, "wall": 707.8} {"step": 1151, "train_loss": 4.765787124633789, "lr": 0.0003999767543137943, "tps": 105927, "wall": 712.7} {"step": 1152, "train_loss": 4.792457580566406, "lr": 0.00039997644541114527, "tps": 105303, "wall": 717.6} {"step": 1153, "train_loss": 4.814796447753906, "lr": 0.0003999761344697134, "tps": 104688, "wall": 722.4} {"step": 1154, "train_loss": 4.750810623168945, "lr": 0.0003999758214895021, "tps": 104082, "wall": 727.3} {"step": 1155, "train_loss": 4.714654922485352, "lr": 0.0003999755064705149, "tps": 103482, "wall": 732.1} {"step": 1156, "train_loss": 4.754089832305908, "lr": 0.00039997518941275545, "tps": 102890, "wall": 736.9} {"step": 1157, "train_loss": 4.747649192810059, "lr": 0.00039997487031622733, "tps": 102307, "wall": 741.8} {"step": 1158, "train_loss": 4.8458733558654785, "lr": 0.00039997454918093417, "tps": 101725, "wall": 746.7} {"step": 1159, "train_loss": 4.73002290725708, "lr": 0.00039997422600687954, "tps": 101156, "wall": 751.5} {"step": 1160, "train_loss": 4.748664855957031, "lr": 0.0003999739007940672, "tps": 100593, "wall": 756.4} {"step": 1161, "train_loss": 4.9080657958984375, "lr": 0.00039997357354250074, "tps": 100038, "wall": 761.2} {"step": 1162, "train_loss": 4.6996283531188965, "lr": 0.00039997324425218383, "tps": 99490, "wall": 766.1} {"step": 1163, "train_loss": 4.766323566436768, "lr": 0.00039997291292312036, "tps": 98943, "wall": 771.0} {"step": 1164, "train_loss": 4.688066482543945, "lr": 0.00039997257955531396, "tps": 98405, "wall": 775.9} {"step": 1165, "train_loss": 4.712065696716309, "lr": 0.00039997224414876843, "tps": 97878, "wall": 780.7} {"step": 1166, "train_loss": 4.906067848205566, "lr": 0.0003999719067034877, "tps": 97356, "wall": 785.6} {"step": 1167, "train_loss": 4.691905498504639, "lr": 0.0003999715672194754, "tps": 96841, "wall": 790.4} {"step": 1168, "train_loss": 4.728294849395752, "lr": 0.00039997122569673533, "tps": 96331, "wall": 795.3} {"step": 1169, "train_loss": 4.750223159790039, "lr": 0.00039997088213527166, "tps": 95823, "wall": 800.2} {"step": 1170, "train_loss": 4.8370184898376465, "lr": 0.000399970536535088, "tps": 95325, "wall": 805.1} {"step": 1171, "train_loss": 4.76344633102417, "lr": 0.00039997018889618844, "tps": 94834, "wall": 809.9} {"step": 1172, "train_loss": 4.836026191711426, "lr": 0.00039996983921857676, "tps": 94348, "wall": 814.8} {"step": 1173, "train_loss": 4.637042045593262, "lr": 0.00039996948750225706, "tps": 93868, "wall": 819.7} {"step": 1174, "train_loss": 4.7211432456970215, "lr": 0.0003999691337472333, "tps": 93392, "wall": 824.5} {"step": 1175, "train_loss": 4.825125217437744, "lr": 0.00039996877795350934, "tps": 92923, "wall": 829.4} {"step": 1176, "train_loss": 4.734600067138672, "lr": 0.0003999684201210894, "tps": 92454, "wall": 834.3} {"step": 1177, "train_loss": 4.762845993041992, "lr": 0.00039996806024997743, "tps": 91992, "wall": 839.2} {"step": 1178, "train_loss": 4.728160858154297, "lr": 0.0003999676983401776, "tps": 91539, "wall": 844.1} {"step": 1179, "train_loss": 4.77366304397583, "lr": 0.0003999673343916939, "tps": 91090, "wall": 849.0} {"step": 1180, "train_loss": 4.652709007263184, "lr": 0.00039996696840453053, "tps": 90646, "wall": 853.8} {"step": 1181, "train_loss": 4.819474220275879, "lr": 0.00039996660037869156, "tps": 90207, "wall": 858.7} {"step": 1182, "train_loss": 4.722229480743408, "lr": 0.00039996623031418127, "tps": 89774, "wall": 863.6} {"step": 1183, "train_loss": 4.773453712463379, "lr": 0.00039996585821100374, "tps": 89344, "wall": 868.5} {"step": 1184, "train_loss": 4.749451160430908, "lr": 0.00039996548406916324, "tps": 88920, "wall": 873.4} {"step": 1185, "train_loss": 4.775318622589111, "lr": 0.000399965107888664, "tps": 88501, "wall": 878.2} {"step": 1186, "train_loss": 4.867807388305664, "lr": 0.0003999647296695103, "tps": 88087, "wall": 883.1} {"step": 1187, "train_loss": 4.783457279205322, "lr": 0.0003999643494117064, "tps": 87677, "wall": 888.0} {"step": 1188, "train_loss": 4.8035969734191895, "lr": 0.00039996396711525656, "tps": 87266, "wall": 892.9} {"step": 1189, "train_loss": 4.809825897216797, "lr": 0.00039996358278016525, "tps": 86864, "wall": 897.8} {"step": 1190, "train_loss": 4.627274036407471, "lr": 0.00039996319640643667, "tps": 86466, "wall": 902.7} {"step": 1191, "train_loss": 4.90110445022583, "lr": 0.00039996280799407526, "tps": 86073, "wall": 907.6} {"step": 1192, "train_loss": 4.639273643493652, "lr": 0.00039996241754308546, "tps": 85684, "wall": 912.5} {"step": 1193, "train_loss": 4.608239650726318, "lr": 0.00039996202505347163, "tps": 85299, "wall": 917.4} {"step": 1194, "train_loss": 4.720376491546631, "lr": 0.00039996163052523836, "tps": 84919, "wall": 922.2} {"step": 1195, "train_loss": 4.65869665145874, "lr": 0.0003999612339583898, "tps": 84543, "wall": 927.1} {"step": 1196, "train_loss": 4.768554210662842, "lr": 0.0003999608353529308, "tps": 84169, "wall": 932.0} {"step": 1197, "train_loss": 4.658349990844727, "lr": 0.0003999604347088657, "tps": 83801, "wall": 936.9} {"step": 1198, "train_loss": 4.732334136962891, "lr": 0.00039996003202619906, "tps": 83436, "wall": 941.8} {"step": 1199, "train_loss": 4.839376926422119, "lr": 0.00039995962730493545, "tps": 83074, "wall": 946.7} {"step": 1200, "train_loss": 4.784080505371094, "lr": 0.00039995922054507935, "tps": 82709, "wall": 951.6} {"step": 1201, "train_loss": 4.816163063049316, "lr": 0.0003999588117466356, "tps": 82354, "wall": 956.5} {"step": 1202, "train_loss": 4.765105724334717, "lr": 0.00039995840090960863, "tps": 82004, "wall": 961.4} {"step": 1203, "train_loss": 4.752877712249756, "lr": 0.00039995798803400313, "tps": 81657, "wall": 966.3} {"step": 1204, "train_loss": 4.61608362197876, "lr": 0.00039995757311982384, "tps": 81313, "wall": 971.2} {"step": 1205, "train_loss": 4.696308612823486, "lr": 0.0003999571561670754, "tps": 80974, "wall": 976.1} {"step": 1206, "train_loss": 4.7512006759643555, "lr": 0.0003999567371757626, "tps": 80638, "wall": 981.0} {"step": 1207, "train_loss": 4.729006767272949, "lr": 0.0003999563161458901, "tps": 80305, "wall": 985.8} {"step": 1208, "train_loss": 4.664820671081543, "lr": 0.00039995589307746275, "tps": 79975, "wall": 990.7} {"step": 1209, "train_loss": 4.742294788360596, "lr": 0.0003999554679704853, "tps": 79649, "wall": 995.6} {"step": 1210, "train_loss": 4.615843772888184, "lr": 0.00039995504082496257, "tps": 79327, "wall": 1000.5} {"step": 1211, "train_loss": 4.7004499435424805, "lr": 0.00039995461164089944, "tps": 79008, "wall": 1005.3} {"step": 1212, "train_loss": 4.642458915710449, "lr": 0.00039995418041830063, "tps": 78690, "wall": 1010.2} {"step": 1213, "train_loss": 4.673859596252441, "lr": 0.00039995374715717124, "tps": 78371, "wall": 1015.2} {"step": 1214, "train_loss": 4.637346267700195, "lr": 0.00039995331185751603, "tps": 78058, "wall": 1020.1} {"step": 1215, "train_loss": 4.769390106201172, "lr": 0.00039995287451933994, "tps": 77750, "wall": 1025.0} {"step": 1216, "train_loss": 4.732454299926758, "lr": 0.00039995243514264796, "tps": 77445, "wall": 1029.8} {"step": 1217, "train_loss": 4.726252555847168, "lr": 0.00039995199372744506, "tps": 77143, "wall": 1034.7} {"step": 1218, "train_loss": 4.734901428222656, "lr": 0.00039995155027373625, "tps": 76842, "wall": 1039.6} {"step": 1219, "train_loss": 4.686056613922119, "lr": 0.0003999511047815265, "tps": 76545, "wall": 1044.5} {"step": 1220, "train_loss": 4.759585380554199, "lr": 0.000399950657250821, "tps": 76251, "wall": 1049.4} {"step": 1221, "train_loss": 4.710699558258057, "lr": 0.00039995020768162466, "tps": 75959, "wall": 1054.3} {"step": 1222, "train_loss": 4.764553546905518, "lr": 0.00039994975607394263, "tps": 75671, "wall": 1059.2} {"step": 1223, "train_loss": 4.729687690734863, "lr": 0.00039994930242778, "tps": 75385, "wall": 1064.1} {"step": 1224, "train_loss": 4.806064605712891, "lr": 0.000399948846743142, "tps": 75101, "wall": 1069.0} {"step": 1225, "train_loss": 4.7959771156311035, "lr": 0.0003999483890200337, "tps": 74815, "wall": 1073.9} {"step": 1226, "train_loss": 4.683816432952881, "lr": 0.0003999479292584603, "tps": 74536, "wall": 1078.8} {"step": 1227, "train_loss": 4.644733905792236, "lr": 0.00039994746745842705, "tps": 74260, "wall": 1083.7} {"step": 1228, "train_loss": 4.7096076011657715, "lr": 0.00039994700361993914, "tps": 73986, "wall": 1088.6} {"step": 1229, "train_loss": 4.761719703674316, "lr": 0.00039994653774300186, "tps": 73715, "wall": 1093.5} {"step": 1230, "train_loss": 4.628067970275879, "lr": 0.0003999460698276204, "tps": 73443, "wall": 1098.5} {"step": 1231, "train_loss": 4.681777000427246, "lr": 0.0003999455998738002, "tps": 73175, "wall": 1103.4} {"step": 1232, "train_loss": 4.646113872528076, "lr": 0.00039994512788154646, "tps": 72910, "wall": 1108.3} {"step": 1233, "train_loss": 4.678154468536377, "lr": 0.0003999446538508646, "tps": 72648, "wall": 1113.2} {"step": 1234, "train_loss": 4.74930477142334, "lr": 0.00039994417778175997, "tps": 72389, "wall": 1118.1} {"step": 1235, "train_loss": 4.638510227203369, "lr": 0.00039994369967423797, "tps": 72131, "wall": 1123.0} {"step": 1236, "train_loss": 4.690528392791748, "lr": 0.000399943219528304, "tps": 71876, "wall": 1127.9} {"step": 1237, "train_loss": 4.721004962921143, "lr": 0.0003999427373439635, "tps": 71619, "wall": 1132.8} {"step": 1238, "train_loss": 4.744695663452148, "lr": 0.00039994225312122187, "tps": 71368, "wall": 1137.8} {"step": 1239, "train_loss": 4.6590189933776855, "lr": 0.0003999417668600848, "tps": 71119, "wall": 1142.7} {"step": 1240, "train_loss": 4.686022758483887, "lr": 0.00039994127856055755, "tps": 70873, "wall": 1147.5} {"step": 1241, "train_loss": 4.654062271118164, "lr": 0.00039994078822264573, "tps": 70626, "wall": 1152.5} {"step": 1242, "train_loss": 4.678635597229004, "lr": 0.00039994029584635506, "tps": 70383, "wall": 1157.4} {"step": 1243, "train_loss": 4.720662593841553, "lr": 0.00039993980143169085, "tps": 70143, "wall": 1162.3} {"step": 1244, "train_loss": 4.654045581817627, "lr": 0.0003999393049786589, "tps": 69905, "wall": 1167.2} {"step": 1245, "train_loss": 4.729598522186279, "lr": 0.0003999388064872648, "tps": 69670, "wall": 1172.1} {"step": 1246, "train_loss": 4.687628269195557, "lr": 0.0003999383059575141, "tps": 69436, "wall": 1177.0} {"step": 1247, "train_loss": 4.703118324279785, "lr": 0.0003999378033894126, "tps": 69203, "wall": 1181.9} {"step": 1248, "train_loss": 4.656728744506836, "lr": 0.0003999372987829659, "tps": 68973, "wall": 1186.8} {"step": 1249, "train_loss": 4.701832294464111, "lr": 0.00039993679213817974, "tps": 68739, "wall": 1191.7} {"step": 1250, "train_loss": 4.6896867752075195, "lr": 0.00039993628345505987, "tps": 68513, "wall": 1196.6} {"step": 1251, "train_loss": 4.6346564292907715, "lr": 0.0003999357727336121, "tps": 68289, "wall": 1201.5} {"step": 1252, "train_loss": 4.6235575675964355, "lr": 0.00039993525997384207, "tps": 68066, "wall": 1206.4} {"step": 1253, "train_loss": 4.628199577331543, "lr": 0.0003999347451757557, "tps": 67845, "wall": 1211.3} {"step": 1254, "train_loss": 4.767936706542969, "lr": 0.00039993422833935877, "tps": 67625, "wall": 1216.2} {"step": 1255, "train_loss": 4.717453956604004, "lr": 0.0003999337094646572, "tps": 67407, "wall": 1221.1} {"step": 1256, "train_loss": 4.688146114349365, "lr": 0.00039993318855165687, "tps": 67191, "wall": 1226.0} {"step": 1257, "train_loss": 4.569314002990723, "lr": 0.0003999326656003637, "tps": 66977, "wall": 1230.9} {"step": 1258, "train_loss": 4.724424839019775, "lr": 0.00039993214061078347, "tps": 66764, "wall": 1235.8} {"step": 1259, "train_loss": 4.754143714904785, "lr": 0.0003999316135829222, "tps": 66553, "wall": 1240.7} {"step": 1260, "train_loss": 4.559446811676025, "lr": 0.00039993108451678595, "tps": 66343, "wall": 1245.7} {"step": 1261, "train_loss": 4.627029895782471, "lr": 0.00039993055341238054, "tps": 66136, "wall": 1250.5} {"step": 1262, "train_loss": 4.720188140869141, "lr": 0.0003999300202697122, "tps": 65928, "wall": 1255.5} {"step": 1263, "train_loss": 4.74894905090332, "lr": 0.0003999294850887868, "tps": 65723, "wall": 1260.4} {"step": 1264, "train_loss": 4.711122035980225, "lr": 0.00039992894786961046, "tps": 65520, "wall": 1265.3} {"step": 1265, "train_loss": 4.534266471862793, "lr": 0.00039992840861218925, "tps": 65319, "wall": 1270.2} {"step": 1266, "train_loss": 4.61533784866333, "lr": 0.0003999278673165293, "tps": 65119, "wall": 1275.1} {"step": 1267, "train_loss": 4.665241241455078, "lr": 0.00039992732398263673, "tps": 64921, "wall": 1280.0} {"step": 1268, "train_loss": 4.67249059677124, "lr": 0.0003999267786105178, "tps": 64724, "wall": 1284.9} {"step": 1269, "train_loss": 4.606163024902344, "lr": 0.00039992623120017846, "tps": 64529, "wall": 1289.8} {"step": 1270, "train_loss": 4.645265102386475, "lr": 0.0003999256817516251, "tps": 64334, "wall": 1294.7} {"step": 1271, "train_loss": 4.6709136962890625, "lr": 0.0003999251302648638, "tps": 64142, "wall": 1299.6} {"step": 1272, "train_loss": 4.641697406768799, "lr": 0.00039992457673990097, "tps": 63951, "wall": 1304.5} {"step": 1273, "train_loss": 4.572587966918945, "lr": 0.00039992402117674283, "tps": 63762, "wall": 1309.4} {"step": 1274, "train_loss": 4.738323211669922, "lr": 0.00039992346357539557, "tps": 63571, "wall": 1314.4} {"step": 1275, "train_loss": 4.604058742523193, "lr": 0.0003999229039358656, "tps": 63383, "wall": 1319.3} {"step": 1276, "train_loss": 4.65369987487793, "lr": 0.00039992234225815924, "tps": 63198, "wall": 1324.2} {"step": 1277, "train_loss": 4.864614486694336, "lr": 0.00039992177854228286, "tps": 63011, "wall": 1329.2} {"step": 1278, "train_loss": 4.668481826782227, "lr": 0.00039992121278824283, "tps": 62829, "wall": 1334.1} {"step": 1279, "train_loss": 4.711302280426025, "lr": 0.0003999206449960456, "tps": 62648, "wall": 1339.0} {"step": 1280, "train_loss": 4.776585578918457, "lr": 0.00039992007516569757, "tps": 62467, "wall": 1343.9} {"step": 1281, "train_loss": 4.601125717163086, "lr": 0.00039991950329720517, "tps": 62288, "wall": 1348.8} {"step": 1282, "train_loss": 4.6540093421936035, "lr": 0.00039991892939057495, "tps": 62111, "wall": 1353.7} {"step": 1283, "train_loss": 4.605147838592529, "lr": 0.0003999183534458133, "tps": 61935, "wall": 1358.6} {"step": 1284, "train_loss": 4.66188907623291, "lr": 0.00039991777546292685, "tps": 61760, "wall": 1363.5} {"step": 1285, "train_loss": 4.686729431152344, "lr": 0.0003999171954419221, "tps": 61587, "wall": 1368.5} {"step": 1286, "train_loss": 4.663834095001221, "lr": 0.0003999166133828056, "tps": 61412, "wall": 1373.4} {"step": 1287, "train_loss": 4.69584321975708, "lr": 0.000399916029285584, "tps": 61241, "wall": 1378.3} {"step": 1288, "train_loss": 4.634556770324707, "lr": 0.00039991544315026386, "tps": 61071, "wall": 1383.2} {"step": 1289, "train_loss": 4.628905296325684, "lr": 0.0003999148549768518, "tps": 60903, "wall": 1388.1} {"step": 1290, "train_loss": 4.676016330718994, "lr": 0.0003999142647653546, "tps": 60735, "wall": 1393.0} {"step": 1291, "train_loss": 4.733148574829102, "lr": 0.0003999136725157789, "tps": 60569, "wall": 1397.9} {"step": 1292, "train_loss": 4.614426136016846, "lr": 0.00039991307822813133, "tps": 60403, "wall": 1402.9} {"step": 1293, "train_loss": 4.656604290008545, "lr": 0.00039991248190241873, "tps": 60239, "wall": 1407.8} {"step": 1294, "train_loss": 4.690710544586182, "lr": 0.00039991188353864776, "tps": 60075, "wall": 1412.7} {"step": 1295, "train_loss": 4.617526531219482, "lr": 0.00039991128313682526, "tps": 59913, "wall": 1417.6} {"step": 1296, "train_loss": 4.64365291595459, "lr": 0.000399910680696958, "tps": 59752, "wall": 1422.5} {"step": 1297, "train_loss": 4.682845592498779, "lr": 0.00039991007621905284, "tps": 59593, "wall": 1427.4} {"step": 1298, "train_loss": 4.7030253410339355, "lr": 0.0003999094697031165, "tps": 59432, "wall": 1432.4} {"step": 1299, "train_loss": 4.707547187805176, "lr": 0.0003999088611491561, "tps": 59274, "wall": 1437.3} {"step": 1300, "train_loss": 4.558964252471924, "lr": 0.00039990825055717834, "tps": 59118, "wall": 1442.2} {"step": 1301, "train_loss": 4.680548667907715, "lr": 0.00039990763792719015, "tps": 58963, "wall": 1447.1} {"step": 1302, "train_loss": 4.628995895385742, "lr": 0.00039990702325919857, "tps": 58810, "wall": 1452.0} {"step": 1303, "train_loss": 4.584903240203857, "lr": 0.0003999064065532104, "tps": 58657, "wall": 1456.9} {"step": 1304, "train_loss": 4.576442718505859, "lr": 0.00039990578780923277, "tps": 58505, "wall": 1461.8} {"step": 1305, "train_loss": 4.618996620178223, "lr": 0.00039990516702727264, "tps": 58353, "wall": 1466.7} {"step": 1306, "train_loss": 4.59958553314209, "lr": 0.0003999045442073371, "tps": 58204, "wall": 1471.6} {"step": 1307, "train_loss": 4.546566009521484, "lr": 0.00039990391934943307, "tps": 58054, "wall": 1476.6} {"step": 1308, "train_loss": 4.6218953132629395, "lr": 0.0003999032924535677, "tps": 57906, "wall": 1481.5} {"step": 1309, "train_loss": 4.653003692626953, "lr": 0.0003999026635197482, "tps": 57759, "wall": 1486.4} {"step": 1310, "train_loss": 4.501714706420898, "lr": 0.0003999020325479815, "tps": 57610, "wall": 1491.4} {"step": 1311, "train_loss": 4.644724369049072, "lr": 0.0003999013995382749, "tps": 57465, "wall": 1496.3} {"step": 1312, "train_loss": 4.621045112609863, "lr": 0.0003999007644906355, "tps": 57321, "wall": 1501.2} {"step": 1313, "train_loss": 4.676820755004883, "lr": 0.0003999001274050705, "tps": 57177, "wall": 1506.1} {"step": 1314, "train_loss": 4.691351890563965, "lr": 0.0003998994882815871, "tps": 57035, "wall": 1511.0} {"step": 1315, "train_loss": 4.614520072937012, "lr": 0.0003998988471201926, "tps": 56893, "wall": 1515.9} {"step": 1316, "train_loss": 4.558149814605713, "lr": 0.0003998982039208942, "tps": 56753, "wall": 1520.8} {"step": 1317, "train_loss": 4.669447422027588, "lr": 0.00039989755868369926, "tps": 56613, "wall": 1525.7} {"step": 1318, "train_loss": 4.540246486663818, "lr": 0.00039989691140861504, "tps": 56475, "wall": 1530.6} {"step": 1319, "train_loss": 4.630648612976074, "lr": 0.00039989626209564885, "tps": 56337, "wall": 1535.5} {"step": 1320, "train_loss": 4.524071216583252, "lr": 0.00039989561074480807, "tps": 56200, "wall": 1540.4} {"step": 1321, "train_loss": 4.67475700378418, "lr": 0.0003998949573561, "tps": 56063, "wall": 1545.4} {"step": 1322, "train_loss": 4.585197448730469, "lr": 0.00039989430192953224, "tps": 55929, "wall": 1550.3} {"step": 1323, "train_loss": 4.550561428070068, "lr": 0.00039989364446511204, "tps": 55792, "wall": 1555.2} {"step": 1324, "train_loss": 4.4931793212890625, "lr": 0.00039989298496284696, "tps": 55658, "wall": 1560.1} {"step": 1325, "train_loss": 4.5664567947387695, "lr": 0.00039989232342274437, "tps": 55525, "wall": 1565.1} {"step": 1326, "train_loss": 4.688346862792969, "lr": 0.0003998916598448118, "tps": 55393, "wall": 1570.0} {"step": 1327, "train_loss": 4.701613426208496, "lr": 0.0003998909942290568, "tps": 55262, "wall": 1574.9} {"step": 1328, "train_loss": 4.566756725311279, "lr": 0.0003998903265754869, "tps": 55133, "wall": 1579.8} {"step": 1329, "train_loss": 4.55023193359375, "lr": 0.0003998896568841096, "tps": 55002, "wall": 1584.7} {"step": 1330, "train_loss": 4.5369038581848145, "lr": 0.00039988898515493256, "tps": 54874, "wall": 1589.6} {"step": 1331, "train_loss": 4.681216716766357, "lr": 0.0003998883113879633, "tps": 54746, "wall": 1594.5} {"step": 1332, "train_loss": 4.549868106842041, "lr": 0.0003998876355832096, "tps": 54617, "wall": 1599.5} {"step": 1333, "train_loss": 4.580176830291748, "lr": 0.00039988695774067904, "tps": 54490, "wall": 1604.4} {"step": 1334, "train_loss": 4.49027681350708, "lr": 0.00039988627786037925, "tps": 54365, "wall": 1609.3} {"step": 1335, "train_loss": 4.6838178634643555, "lr": 0.000399885595942318, "tps": 54239, "wall": 1614.3} {"step": 1336, "train_loss": 4.58165168762207, "lr": 0.00039988491198650295, "tps": 54114, "wall": 1619.2} {"step": 1337, "train_loss": 4.623272895812988, "lr": 0.00039988422599294195, "tps": 53991, "wall": 1624.1} {"step": 1338, "train_loss": 4.639877796173096, "lr": 0.00039988353796164265, "tps": 53868, "wall": 1629.0} {"step": 1339, "train_loss": 4.504405498504639, "lr": 0.0003998828478926129, "tps": 53746, "wall": 1633.9} {"step": 1340, "train_loss": 4.544501781463623, "lr": 0.00039988215578586045, "tps": 53625, "wall": 1638.8} {"step": 1341, "train_loss": 4.590455532073975, "lr": 0.0003998814616413934, "tps": 53505, "wall": 1643.7} {"step": 1342, "train_loss": 4.799252510070801, "lr": 0.0003998807654592193, "tps": 53385, "wall": 1648.7} {"step": 1343, "train_loss": 4.629047393798828, "lr": 0.0003998800672393461, "tps": 53266, "wall": 1653.6} {"step": 1344, "train_loss": 4.571049213409424, "lr": 0.0003998793669817819, "tps": 53148, "wall": 1658.5} {"step": 1345, "train_loss": 4.617059707641602, "lr": 0.00039987866468653443, "tps": 53031, "wall": 1663.4} {"step": 1346, "train_loss": 4.575624942779541, "lr": 0.00039987796035361166, "tps": 52914, "wall": 1668.3} {"step": 1347, "train_loss": 4.579472064971924, "lr": 0.0003998772539830217, "tps": 52795, "wall": 1673.3} {"step": 1348, "train_loss": 4.5523600578308105, "lr": 0.0003998765455747725, "tps": 52679, "wall": 1678.2} {"step": 1349, "train_loss": 4.52830171585083, "lr": 0.000399875835128872, "tps": 52565, "wall": 1683.1} {"step": 1350, "train_loss": 4.522387504577637, "lr": 0.00039987512264532836, "tps": 52451, "wall": 1688.0} {"step": 1351, "train_loss": 4.6328206062316895, "lr": 0.0003998744081241495, "tps": 52337, "wall": 1692.9} {"step": 1352, "train_loss": 4.523361682891846, "lr": 0.0003998736915653437, "tps": 52224, "wall": 1697.9} {"step": 1353, "train_loss": 4.668751239776611, "lr": 0.00039987297296891904, "tps": 52112, "wall": 1702.8} {"step": 1354, "train_loss": 4.616785049438477, "lr": 0.0003998722523348835, "tps": 51999, "wall": 1707.7} {"step": 1355, "train_loss": 4.6514081954956055, "lr": 0.00039987152966324544, "tps": 51888, "wall": 1712.6} {"step": 1356, "train_loss": 4.531893253326416, "lr": 0.0003998708049540128, "tps": 51777, "wall": 1717.6} {"step": 1357, "train_loss": 4.587674617767334, "lr": 0.0003998700782071941, "tps": 51666, "wall": 1722.5} {"step": 1358, "train_loss": 4.559559345245361, "lr": 0.00039986934942279746, "tps": 51557, "wall": 1727.4} {"step": 1359, "train_loss": 4.544008255004883, "lr": 0.000399868618600831, "tps": 51447, "wall": 1732.4} {"step": 1360, "train_loss": 4.574918270111084, "lr": 0.00039986788574130315, "tps": 51339, "wall": 1737.3} {"step": 1361, "train_loss": 4.556431770324707, "lr": 0.0003998671508442221, "tps": 51232, "wall": 1742.3} {"step": 1362, "train_loss": 4.589485168457031, "lr": 0.0003998664139095963, "tps": 51125, "wall": 1747.2} {"step": 1363, "train_loss": 4.520368576049805, "lr": 0.000399865674937434, "tps": 51019, "wall": 1752.1} {"step": 1364, "train_loss": 4.554105281829834, "lr": 0.00039986493392774367, "tps": 50914, "wall": 1757.0} {"step": 1365, "train_loss": 4.586728096008301, "lr": 0.00039986419088053354, "tps": 50809, "wall": 1761.9} {"step": 1366, "train_loss": 4.521640777587891, "lr": 0.00039986344579581213, "tps": 50703, "wall": 1766.9} {"step": 1367, "train_loss": 4.6954264640808105, "lr": 0.0003998626986735879, "tps": 50600, "wall": 1771.8} {"step": 1368, "train_loss": 4.468796730041504, "lr": 0.00039986194951386933, "tps": 50496, "wall": 1776.7} {"step": 1369, "train_loss": 4.518811225891113, "lr": 0.00039986119831666485, "tps": 50394, "wall": 1781.6} {"step": 1370, "train_loss": 4.495624542236328, "lr": 0.00039986044508198297, "tps": 50292, "wall": 1786.5} {"step": 1371, "train_loss": 4.514124870300293, "lr": 0.00039985968980983216, "tps": 50189, "wall": 1791.5} {"step": 1372, "train_loss": 4.4580159187316895, "lr": 0.00039985893250022114, "tps": 50088, "wall": 1796.4} {"step": 1373, "train_loss": 4.566763401031494, "lr": 0.00039985817315315843, "tps": 49988, "wall": 1801.4} {"step": 1374, "train_loss": 4.474162578582764, "lr": 0.0003998574117686526, "tps": 49888, "wall": 1806.3} {"step": 1375, "train_loss": 4.4496989250183105, "lr": 0.0003998566483467122, "tps": 49789, "wall": 1811.2} {"step": 1376, "train_loss": 4.632296085357666, "lr": 0.00039985588288734604, "tps": 49690, "wall": 1816.1} {"step": 1377, "train_loss": 4.613598823547363, "lr": 0.0003998551153905627, "tps": 49592, "wall": 1821.0} {"step": 1378, "train_loss": 4.628142356872559, "lr": 0.0003998543458563708, "tps": 49494, "wall": 1825.9} {"step": 1379, "train_loss": 4.627649307250977, "lr": 0.00039985357428477916, "tps": 49397, "wall": 1830.9} {"step": 1380, "train_loss": 4.664977073669434, "lr": 0.0003998528006757965, "tps": 49301, "wall": 1835.8} {"step": 1381, "train_loss": 4.50976037979126, "lr": 0.0003998520250294317, "tps": 49205, "wall": 1840.7} {"step": 1382, "train_loss": 4.560602188110352, "lr": 0.00039985124734569336, "tps": 49110, "wall": 1845.6} {"step": 1383, "train_loss": 4.588864803314209, "lr": 0.0003998504676245903, "tps": 49014, "wall": 1850.5} {"step": 1384, "train_loss": 4.6306867599487305, "lr": 0.0003998496858661315, "tps": 48919, "wall": 1855.5} {"step": 1385, "train_loss": 4.464302062988281, "lr": 0.0003998489020703257, "tps": 48825, "wall": 1860.4} {"step": 1386, "train_loss": 4.5656938552856445, "lr": 0.0003998481162371818, "tps": 48730, "wall": 1865.3} {"step": 1387, "train_loss": 4.559319972991943, "lr": 0.0003998473283667087, "tps": 48637, "wall": 1870.2} {"step": 1388, "train_loss": 4.599039554595947, "lr": 0.00039984653845891535, "tps": 48545, "wall": 1875.2} {"step": 1389, "train_loss": 4.476394176483154, "lr": 0.0003998457465138107, "tps": 48452, "wall": 1880.1} {"step": 1390, "train_loss": 4.651638984680176, "lr": 0.0003998449525314037, "tps": 48361, "wall": 1885.0} {"step": 1391, "train_loss": 4.615943908691406, "lr": 0.0003998441565117033, "tps": 48270, "wall": 1889.9} {"step": 1392, "train_loss": 4.604959487915039, "lr": 0.0003998433584547186, "tps": 48179, "wall": 1894.8} {"step": 1393, "train_loss": 4.456634521484375, "lr": 0.00039984255836045864, "tps": 48088, "wall": 1899.8} {"step": 1394, "train_loss": 4.546645164489746, "lr": 0.00039984175622893235, "tps": 47998, "wall": 1904.7} {"step": 1395, "train_loss": 4.6144537925720215, "lr": 0.000399840952060149, "tps": 47909, "wall": 1909.6} {"step": 1396, "train_loss": 4.537128448486328, "lr": 0.00039984014585411757, "tps": 47818, "wall": 1914.6} {"step": 1397, "train_loss": 4.581592082977295, "lr": 0.00039983933761084724, "tps": 47730, "wall": 1919.5} {"step": 1398, "train_loss": 4.540223598480225, "lr": 0.0003998385273303472, "tps": 47641, "wall": 1924.5} {"step": 1399, "train_loss": 4.589783191680908, "lr": 0.00039983771501262664, "tps": 47554, "wall": 1929.4} {"step": 1400, "train_loss": 4.472585678100586, "lr": 0.0003998369006576946, "tps": 47467, "wall": 1934.3} {"step": 1401, "train_loss": 4.524109840393066, "lr": 0.0003998360842655605, "tps": 47381, "wall": 1939.2} {"step": 1402, "train_loss": 4.5580878257751465, "lr": 0.0003998352658362335, "tps": 47295, "wall": 1944.1} {"step": 1403, "train_loss": 4.566802024841309, "lr": 0.0003998344453697228, "tps": 47209, "wall": 1949.0} {"step": 1404, "train_loss": 4.647909164428711, "lr": 0.0003998336228660379, "tps": 47124, "wall": 1953.9} {"step": 1405, "train_loss": 4.52377986907959, "lr": 0.0003998327983251879, "tps": 47039, "wall": 1958.8} {"step": 1406, "train_loss": 4.592807292938232, "lr": 0.00039983197174718225, "tps": 46954, "wall": 1963.8} {"step": 1407, "train_loss": 4.499632358551025, "lr": 0.00039983114313203033, "tps": 46870, "wall": 1968.7} {"step": 1408, "train_loss": 4.611354351043701, "lr": 0.00039983031247974146, "tps": 46785, "wall": 1973.7} {"step": 1409, "train_loss": 4.688358783721924, "lr": 0.0003998294797903251, "tps": 46701, "wall": 1978.6} {"step": 1410, "train_loss": 4.514547824859619, "lr": 0.00039982864506379065, "tps": 46618, "wall": 1983.6} {"step": 1411, "train_loss": 4.550152778625488, "lr": 0.0003998278083001476, "tps": 46536, "wall": 1988.5} {"step": 1412, "train_loss": 4.4255547523498535, "lr": 0.0003998269694994054, "tps": 46455, "wall": 1993.4} {"step": 1413, "train_loss": 4.4842939376831055, "lr": 0.0003998261286615735, "tps": 46373, "wall": 1998.3} {"step": 1414, "train_loss": 4.53053617477417, "lr": 0.00039982528578666156, "tps": 46291, "wall": 2003.2} {"step": 1415, "train_loss": 4.66476583480835, "lr": 0.000399824440874679, "tps": 46210, "wall": 2008.2} {"step": 1416, "train_loss": 4.615541458129883, "lr": 0.00039982359392563556, "tps": 46130, "wall": 2013.1} {"step": 1417, "train_loss": 4.529441833496094, "lr": 0.0003998227449395406, "tps": 46050, "wall": 2018.0} {"step": 1418, "train_loss": 4.459108352661133, "lr": 0.0003998218939164039, "tps": 45970, "wall": 2022.9} {"step": 1419, "train_loss": 4.585306167602539, "lr": 0.00039982104085623503, "tps": 45891, "wall": 2027.8} {"step": 1420, "train_loss": 4.419863700866699, "lr": 0.0003998201857590437, "tps": 45811, "wall": 2032.8} {"step": 1421, "train_loss": 4.560238361358643, "lr": 0.00039981932862483957, "tps": 45732, "wall": 2037.7} {"step": 1422, "train_loss": 4.497608184814453, "lr": 0.0003998184694536324, "tps": 45655, "wall": 2042.7} {"step": 1423, "train_loss": 4.499667644500732, "lr": 0.00039981760824543184, "tps": 45577, "wall": 2047.6} {"step": 1424, "train_loss": 4.565336227416992, "lr": 0.0003998167450002477, "tps": 45499, "wall": 2052.5} {"step": 1425, "train_loss": 4.424074172973633, "lr": 0.00039981587971808975, "tps": 45423, "wall": 2057.4} {"step": 1426, "train_loss": 4.567027568817139, "lr": 0.0003998150123989678, "tps": 45346, "wall": 2062.3} {"step": 1427, "train_loss": 4.629752159118652, "lr": 0.0003998141430428916, "tps": 45270, "wall": 2067.2} {"step": 1428, "train_loss": 4.58975887298584, "lr": 0.0003998132716498711, "tps": 45195, "wall": 2072.2} {"step": 1429, "train_loss": 4.568757057189941, "lr": 0.0003998123982199161, "tps": 45111, "wall": 2077.5} {"step": 1430, "train_loss": 4.589269161224365, "lr": 0.00039981152275303663, "tps": 45034, "wall": 2082.4} {"step": 1431, "train_loss": 4.517363548278809, "lr": 0.0003998106452492424, "tps": 44958, "wall": 2087.4} {"step": 1432, "train_loss": 4.479729175567627, "lr": 0.0003998097657085435, "tps": 44881, "wall": 2092.5} {"step": 1433, "train_loss": 4.5830607414245605, "lr": 0.0003998088841309498, "tps": 44807, "wall": 2097.4} {"step": 1434, "train_loss": 4.632790565490723, "lr": 0.0003998080005164714, "tps": 44733, "wall": 2102.3} {"step": 1435, "train_loss": 4.564676284790039, "lr": 0.0003998071148651182, "tps": 44660, "wall": 2107.2} {"step": 1436, "train_loss": 4.547706604003906, "lr": 0.00039980622717690023, "tps": 44587, "wall": 2112.2} {"step": 1437, "train_loss": 4.52226448059082, "lr": 0.00039980533745182764, "tps": 44514, "wall": 2117.1} {"step": 1438, "train_loss": 4.532492637634277, "lr": 0.00039980444568991046, "tps": 44442, "wall": 2122.0} {"step": 1439, "train_loss": 4.4899582862854, "lr": 0.0003998035518911588, "tps": 44368, "wall": 2127.0} {"step": 1440, "train_loss": 4.480623245239258, "lr": 0.00039980265605558274, "tps": 44297, "wall": 2131.9} {"step": 1441, "train_loss": 4.541476249694824, "lr": 0.00039980175818319253, "tps": 44226, "wall": 2136.8} {"step": 1442, "train_loss": 4.419096946716309, "lr": 0.0003998008582739983, "tps": 44154, "wall": 2141.7} {"step": 1443, "train_loss": 4.5070013999938965, "lr": 0.0003997999563280101, "tps": 44083, "wall": 2146.7} {"step": 1444, "train_loss": 4.545703887939453, "lr": 0.00039979905234523833, "tps": 44011, "wall": 2151.7} {"step": 1445, "train_loss": 4.449830532073975, "lr": 0.00039979814632569314, "tps": 43931, "wall": 2157.1} {"step": 1446, "train_loss": 4.5596923828125, "lr": 0.0003997972382693849, "tps": 43851, "wall": 2162.5} {"step": 1447, "train_loss": 4.488410949707031, "lr": 0.0003997963281763238, "tps": 43776, "wall": 2167.7} {"step": 1448, "train_loss": 4.589617729187012, "lr": 0.0003997954160465201, "tps": 43706, "wall": 2172.7} {"step": 1449, "train_loss": 4.509510517120361, "lr": 0.0003997945018799842, "tps": 43635, "wall": 2177.8} {"step": 1450, "train_loss": 4.483712196350098, "lr": 0.0003997935856767265, "tps": 43555, "wall": 2183.2} {"step": 1451, "train_loss": 4.638399600982666, "lr": 0.00039979266743675733, "tps": 43480, "wall": 2188.5} {"step": 1452, "train_loss": 4.563316345214844, "lr": 0.0003997917471600871, "tps": 43403, "wall": 2193.9} {"step": 1453, "train_loss": 4.540190696716309, "lr": 0.0003997908248467262, "tps": 43330, "wall": 2199.1} {"step": 1454, "train_loss": 4.5244011878967285, "lr": 0.00039978990049668514, "tps": 43259, "wall": 2204.3} {"step": 1455, "train_loss": 4.632892608642578, "lr": 0.0003997889741099743, "tps": 43190, "wall": 2209.3} {"step": 1456, "train_loss": 4.487123489379883, "lr": 0.00039978804568660434, "tps": 43122, "wall": 2214.3} {"step": 1457, "train_loss": 4.543103218078613, "lr": 0.0003997871152265856, "tps": 43056, "wall": 2219.2} {"step": 1458, "train_loss": 4.471795082092285, "lr": 0.00039978618272992875, "tps": 42989, "wall": 2224.2} {"step": 1459, "train_loss": 4.448863983154297, "lr": 0.0003997852481966442, "tps": 42923, "wall": 2229.2} {"step": 1460, "train_loss": 4.462702751159668, "lr": 0.00039978431162674273, "tps": 42857, "wall": 2234.1} {"step": 1461, "train_loss": 4.525228977203369, "lr": 0.0003997833730202348, "tps": 42791, "wall": 2239.1} {"step": 1462, "train_loss": 4.409585952758789, "lr": 0.00039978243237713106, "tps": 42726, "wall": 2244.0} {"step": 1463, "train_loss": 4.479317665100098, "lr": 0.0003997814896974423, "tps": 42661, "wall": 2249.0} {"step": 1464, "train_loss": 4.434996128082275, "lr": 0.000399780544981179, "tps": 42596, "wall": 2254.0} {"step": 1465, "train_loss": 4.526790142059326, "lr": 0.00039977959822835206, "tps": 42531, "wall": 2258.9} {"step": 1466, "train_loss": 4.50493049621582, "lr": 0.00039977864943897205, "tps": 42468, "wall": 2263.9} {"step": 1467, "train_loss": 4.508723258972168, "lr": 0.00039977769861304977, "tps": 42404, "wall": 2268.8} {"step": 1468, "train_loss": 4.544611930847168, "lr": 0.000399776745750596, "tps": 42340, "wall": 2273.8} {"step": 1469, "train_loss": 4.563932418823242, "lr": 0.00039977579085162155, "tps": 42277, "wall": 2278.7} {"step": 1470, "train_loss": 4.552842617034912, "lr": 0.0003997748339161372, "tps": 42215, "wall": 2283.6} {"step": 1471, "train_loss": 4.439580917358398, "lr": 0.00039977387494415377, "tps": 42152, "wall": 2288.6} {"step": 1472, "train_loss": 4.588212013244629, "lr": 0.0003997729139356822, "tps": 42091, "wall": 2293.5} {"step": 1473, "train_loss": 4.4836297035217285, "lr": 0.0003997719508907333, "tps": 42028, "wall": 2298.4} {"step": 1474, "train_loss": 4.477836608886719, "lr": 0.00039977098580931805, "tps": 41966, "wall": 2303.4} {"step": 1475, "train_loss": 4.420412540435791, "lr": 0.0003997700186914473, "tps": 41904, "wall": 2308.4} {"step": 1476, "train_loss": 4.560955047607422, "lr": 0.0003997690495371321, "tps": 41841, "wall": 2313.4} {"step": 1477, "train_loss": 4.509968280792236, "lr": 0.0003997680783463834, "tps": 41780, "wall": 2318.4} {"step": 1478, "train_loss": 4.475714683532715, "lr": 0.00039976710511921215, "tps": 41717, "wall": 2323.4} {"step": 1479, "train_loss": 4.557614803314209, "lr": 0.00039976612985562936, "tps": 41654, "wall": 2328.5} {"step": 1480, "train_loss": 4.4366135597229, "lr": 0.0003997651525556462, "tps": 41591, "wall": 2333.6} {"step": 1481, "train_loss": 4.454329967498779, "lr": 0.0003997641732192736, "tps": 41531, "wall": 2338.6} {"step": 1482, "train_loss": 4.472235679626465, "lr": 0.0003997631918465228, "tps": 41470, "wall": 2343.6} {"step": 1483, "train_loss": 4.586488723754883, "lr": 0.0003997622084374048, "tps": 41410, "wall": 2348.6} {"step": 1484, "train_loss": 4.528948783874512, "lr": 0.0003997612229919308, "tps": 41350, "wall": 2353.6} {"step": 1485, "train_loss": 4.433725357055664, "lr": 0.00039976023551011194, "tps": 41290, "wall": 2358.6} {"step": 1486, "train_loss": 4.5311174392700195, "lr": 0.00039975924599195935, "tps": 41231, "wall": 2363.6} {"step": 1487, "train_loss": 4.526597023010254, "lr": 0.0003997582544374843, "tps": 41171, "wall": 2368.5} {"step": 1488, "train_loss": 4.555842399597168, "lr": 0.00039975726084669807, "tps": 41114, "wall": 2373.5} {"step": 1489, "train_loss": 4.588586330413818, "lr": 0.00039975626521961187, "tps": 41056, "wall": 2378.4} {"step": 1490, "train_loss": 4.460793972015381, "lr": 0.00039975526755623694, "tps": 40998, "wall": 2383.3} {"step": 1491, "train_loss": 4.507551670074463, "lr": 0.00039975426785658467, "tps": 40941, "wall": 2388.3} {"step": 1492, "train_loss": 4.554073810577393, "lr": 0.0003997532661206662, "tps": 40883, "wall": 2393.3} {"step": 1493, "train_loss": 4.476772308349609, "lr": 0.00039975226234849315, "tps": 40826, "wall": 2398.2} {"step": 1494, "train_loss": 4.559906959533691, "lr": 0.00039975125654007667, "tps": 40770, "wall": 2403.1} {"step": 1495, "train_loss": 4.451772212982178, "lr": 0.0003997502486954283, "tps": 40714, "wall": 2408.0} {"step": 1496, "train_loss": 4.487111568450928, "lr": 0.0003997492388145593, "tps": 40658, "wall": 2413.0} {"step": 1497, "train_loss": 4.540968894958496, "lr": 0.0003997482268974813, "tps": 40601, "wall": 2418.0} {"step": 1498, "train_loss": 4.44438362121582, "lr": 0.0003997472129442055, "tps": 40545, "wall": 2422.9} {"step": 1499, "train_loss": 4.465389251708984, "lr": 0.00039974619695474367, "tps": 40487, "wall": 2428.0} {"step": 1500, "train_loss": 4.483725547790527, "lr": 0.00039974517892910717, "tps": 40429, "wall": 2433.1} {"step": 1501, "train_loss": 4.553088188171387, "lr": 0.00039974415886730755, "tps": 40369, "wall": 2438.4} {"step": 1502, "train_loss": 4.454956531524658, "lr": 0.0003997431367693564, "tps": 40312, "wall": 2443.4} {"step": 1503, "train_loss": 4.401609897613525, "lr": 0.0003997421126352653, "tps": 40258, "wall": 2448.4} {"step": 1504, "train_loss": 4.454351425170898, "lr": 0.00039974108646504574, "tps": 40203, "wall": 2453.3} {"step": 1505, "train_loss": 4.5373687744140625, "lr": 0.0003997400582587095, "tps": 40148, "wall": 2458.3} {"step": 1506, "train_loss": 4.426568984985352, "lr": 0.0003997390280162681, "tps": 40095, "wall": 2463.2} {"step": 1507, "train_loss": 4.40841817855835, "lr": 0.0003997379957377333, "tps": 40041, "wall": 2468.1} {"step": 1508, "train_loss": 4.319911003112793, "lr": 0.0003997369614231168, "tps": 39987, "wall": 2473.1} {"step": 1509, "train_loss": 4.534554958343506, "lr": 0.00039973592507243025, "tps": 39934, "wall": 2478.1} {"step": 1510, "train_loss": 4.484653472900391, "lr": 0.00039973488668568533, "tps": 39880, "wall": 2483.0} {"step": 1511, "train_loss": 4.4298601150512695, "lr": 0.000399733846262894, "tps": 39826, "wall": 2488.0} {"step": 1512, "train_loss": 4.433861255645752, "lr": 0.0003997328038040679, "tps": 39773, "wall": 2493.0} {"step": 1513, "train_loss": 4.601797103881836, "lr": 0.00039973175930921887, "tps": 39720, "wall": 2498.0} {"step": 1514, "train_loss": 4.498847484588623, "lr": 0.00039973071277835874, "tps": 39667, "wall": 2503.0} {"step": 1515, "train_loss": 4.446008682250977, "lr": 0.00039972966421149937, "tps": 39612, "wall": 2508.1} {"step": 1516, "train_loss": 4.560943126678467, "lr": 0.0003997286136086527, "tps": 39557, "wall": 2513.2} {"step": 1517, "train_loss": 4.42204475402832, "lr": 0.0003997275609698305, "tps": 39503, "wall": 2518.3} {"step": 1518, "train_loss": 4.479740619659424, "lr": 0.0003997265062950447, "tps": 39451, "wall": 2523.4} {"step": 1519, "train_loss": 4.43463134765625, "lr": 0.00039972544958430747, "tps": 39399, "wall": 2528.3} {"step": 1520, "train_loss": 4.4159722328186035, "lr": 0.00039972439083763055, "tps": 39348, "wall": 2533.2} {"step": 1521, "train_loss": 4.440151691436768, "lr": 0.00039972333005502606, "tps": 39298, "wall": 2538.2} {"step": 1522, "train_loss": 4.391430854797363, "lr": 0.00039972226723650585, "tps": 39247, "wall": 2543.1} {"step": 1523, "train_loss": 4.50594425201416, "lr": 0.0003997212023820822, "tps": 39196, "wall": 2548.1} {"step": 1524, "train_loss": 4.475657939910889, "lr": 0.00039972013549176695, "tps": 39146, "wall": 2553.0} {"step": 1525, "train_loss": 4.494799613952637, "lr": 0.0003997190665655723, "tps": 39096, "wall": 2558.0} {"step": 1526, "train_loss": 4.381046295166016, "lr": 0.0003997179956035104, "tps": 39046, "wall": 2563.0} {"step": 1527, "train_loss": 4.460398197174072, "lr": 0.00039971692260559326, "tps": 38995, "wall": 2568.0} {"step": 1528, "train_loss": 4.3433918952941895, "lr": 0.00039971584757183317, "tps": 38942, "wall": 2573.1} {"step": 1529, "train_loss": 4.353096961975098, "lr": 0.00039971477050224216, "tps": 38891, "wall": 2578.2} {"step": 1530, "train_loss": 4.477878570556641, "lr": 0.0003997136913968325, "tps": 38840, "wall": 2583.3} {"step": 1531, "train_loss": 4.467311859130859, "lr": 0.00039971261025561653, "tps": 38790, "wall": 2588.3} {"step": 1532, "train_loss": 4.466419219970703, "lr": 0.0003997115270786063, "tps": 38741, "wall": 2593.3} {"step": 1533, "train_loss": 4.515496253967285, "lr": 0.00039971044186581424, "tps": 38692, "wall": 2598.3} {"step": 1534, "train_loss": 4.439355373382568, "lr": 0.0003997093546172525, "tps": 38643, "wall": 2603.2} {"step": 1535, "train_loss": 4.493413925170898, "lr": 0.0003997082653329335, "tps": 38592, "wall": 2608.3} {"step": 1536, "train_loss": 4.398372650146484, "lr": 0.0003997071740128695, "tps": 38543, "wall": 2613.4} {"step": 1537, "train_loss": 4.524842739105225, "lr": 0.0003997060806570729, "tps": 38493, "wall": 2618.4} {"step": 1538, "train_loss": 4.405954360961914, "lr": 0.0003997049852655562, "tps": 38444, "wall": 2623.5} {"step": 1539, "train_loss": 4.448719024658203, "lr": 0.0003997038878383316, "tps": 38395, "wall": 2628.6} {"step": 1540, "train_loss": 4.528096675872803, "lr": 0.0003997027883754117, "tps": 38347, "wall": 2633.6} {"step": 1541, "train_loss": 4.355472564697266, "lr": 0.00039970168687680893, "tps": 38299, "wall": 2638.6} {"step": 1542, "train_loss": 4.3926849365234375, "lr": 0.0003997005833425357, "tps": 38251, "wall": 2643.6} {"step": 1543, "train_loss": 4.5679216384887695, "lr": 0.0003996994777726045, "tps": 38205, "wall": 2648.5} {"step": 1544, "train_loss": 4.4427571296691895, "lr": 0.00039969837016702787, "tps": 38158, "wall": 2653.5} {"step": 1545, "train_loss": 4.4841837882995605, "lr": 0.00039969726052581844, "tps": 38112, "wall": 2658.4} {"step": 1546, "train_loss": 4.4844231605529785, "lr": 0.0003996961488489887, "tps": 38065, "wall": 2663.4} {"step": 1547, "train_loss": 4.4594268798828125, "lr": 0.00039969503513655126, "tps": 38019, "wall": 2668.4} {"step": 1548, "train_loss": 4.439815044403076, "lr": 0.0003996939193885187, "tps": 37972, "wall": 2673.4} {"step": 1549, "train_loss": 4.41752815246582, "lr": 0.0003996928016049038, "tps": 37926, "wall": 2678.3} {"step": 1550, "train_loss": 4.496631145477295, "lr": 0.00039969168178571906, "tps": 37881, "wall": 2683.3} {"step": 1551, "train_loss": 4.389902591705322, "lr": 0.00039969055993097725, "tps": 37834, "wall": 2688.3} {"step": 1552, "train_loss": 4.486880302429199, "lr": 0.000399689436040691, "tps": 37786, "wall": 2693.5} {"step": 1553, "train_loss": 4.404509544372559, "lr": 0.00039968831011487317, "tps": 37739, "wall": 2698.6} {"step": 1554, "train_loss": 4.428417205810547, "lr": 0.0003996871821535364, "tps": 37693, "wall": 2703.6} {"step": 1555, "train_loss": 4.44374942779541, "lr": 0.0003996860521566935, "tps": 37648, "wall": 2708.6} {"step": 1556, "train_loss": 4.502384662628174, "lr": 0.0003996849201243574, "tps": 37603, "wall": 2713.6} {"step": 1557, "train_loss": 4.316831111907959, "lr": 0.0003996837860565407, "tps": 37558, "wall": 2718.5} {"step": 1558, "train_loss": 4.315889358520508, "lr": 0.00039968264995325636, "tps": 37514, "wall": 2723.5} {"step": 1559, "train_loss": 4.466758728027344, "lr": 0.0003996815118145173, "tps": 37470, "wall": 2728.5} {"step": 1560, "train_loss": 4.366588592529297, "lr": 0.0003996803716403362, "tps": 37425, "wall": 2733.5} {"step": 1561, "train_loss": 4.459178924560547, "lr": 0.00039967922943072627, "tps": 37380, "wall": 2738.5} {"step": 1562, "train_loss": 4.3930253982543945, "lr": 0.00039967808518570023, "tps": 37336, "wall": 2743.5} {"step": 1563, "train_loss": 4.392908096313477, "lr": 0.0003996769389052712, "tps": 37291, "wall": 2748.6} {"step": 1564, "train_loss": 4.512956619262695, "lr": 0.00039967579058945203, "tps": 37246, "wall": 2753.7} {"step": 1565, "train_loss": 4.36842155456543, "lr": 0.0003996746402382558, "tps": 37202, "wall": 2758.7} {"step": 1566, "train_loss": 4.387256145477295, "lr": 0.0003996734878516955, "tps": 37159, "wall": 2763.7} {"step": 1567, "train_loss": 4.367649555206299, "lr": 0.0003996723334297842, "tps": 37116, "wall": 2768.6} {"step": 1568, "train_loss": 4.543716907501221, "lr": 0.0003996711769725351, "tps": 37072, "wall": 2773.6} {"step": 1569, "train_loss": 4.323988914489746, "lr": 0.000399670018479961, "tps": 37029, "wall": 2778.6} {"step": 1570, "train_loss": 4.456528186798096, "lr": 0.0003996688579520754, "tps": 36986, "wall": 2783.6} {"step": 1571, "train_loss": 4.300152778625488, "lr": 0.0003996676953888911, "tps": 36944, "wall": 2788.6} {"step": 1572, "train_loss": 4.355687141418457, "lr": 0.0003996665307904215, "tps": 36901, "wall": 2793.6} {"step": 1573, "train_loss": 4.304507255554199, "lr": 0.00039966536415667975, "tps": 36858, "wall": 2798.6} {"step": 1574, "train_loss": 4.5149664878845215, "lr": 0.000399664195487679, "tps": 36815, "wall": 2803.7} {"step": 1575, "train_loss": 4.408788204193115, "lr": 0.0003996630247834325, "tps": 36773, "wall": 2808.7} {"step": 1576, "train_loss": 4.424988269805908, "lr": 0.0003996618520439536, "tps": 36730, "wall": 2813.7} {"step": 1577, "train_loss": 4.483428478240967, "lr": 0.00039966067726925547, "tps": 36686, "wall": 2818.9} {"step": 1578, "train_loss": 4.324524879455566, "lr": 0.0003996595004593515, "tps": 36644, "wall": 2823.9} {"step": 1579, "train_loss": 4.412740230560303, "lr": 0.0003996583216142549, "tps": 36602, "wall": 2828.9} {"step": 1580, "train_loss": 4.44163179397583, "lr": 0.0003996571407339792, "tps": 36560, "wall": 2834.0} {"step": 1581, "train_loss": 4.436939716339111, "lr": 0.00039965595781853765, "tps": 36518, "wall": 2839.1} {"step": 1582, "train_loss": 4.520476341247559, "lr": 0.0003996547728679437, "tps": 36476, "wall": 2844.1} {"step": 1583, "train_loss": 4.437027454376221, "lr": 0.0003996535858822108, "tps": 36435, "wall": 2849.1} {"step": 1584, "train_loss": 4.488655090332031, "lr": 0.0003996523968613524, "tps": 36394, "wall": 2854.1} {"step": 1585, "train_loss": 4.400790691375732, "lr": 0.00039965120580538185, "tps": 36353, "wall": 2859.1} {"step": 1586, "train_loss": 4.375764846801758, "lr": 0.0003996500127143127, "tps": 36312, "wall": 2864.2} {"step": 1587, "train_loss": 4.453415870666504, "lr": 0.00039964881758815853, "tps": 36272, "wall": 2869.2} {"step": 1588, "train_loss": 4.305355548858643, "lr": 0.0003996476204269328, "tps": 36230, "wall": 2874.2} {"step": 1589, "train_loss": 4.374646186828613, "lr": 0.0003996464212306492, "tps": 36188, "wall": 2879.4} {"step": 1590, "train_loss": 4.4063239097595215, "lr": 0.00039964521999932113, "tps": 36145, "wall": 2884.7} {"step": 1591, "train_loss": 4.329312324523926, "lr": 0.0003996440167329623, "tps": 36103, "wall": 2889.8} {"step": 1592, "train_loss": 4.450156211853027, "lr": 0.00039964281143158633, "tps": 36060, "wall": 2895.1} {"step": 1593, "train_loss": 4.386294364929199, "lr": 0.0003996416040952069, "tps": 36017, "wall": 2900.4} {"step": 1594, "train_loss": 4.529315948486328, "lr": 0.0003996403947238377, "tps": 35974, "wall": 2905.7} {"step": 1595, "train_loss": 4.456387519836426, "lr": 0.0003996391833174923, "tps": 35931, "wall": 2910.9} {"step": 1596, "train_loss": 4.364620685577393, "lr": 0.00039963796987618457, "tps": 35889, "wall": 2916.2} {"step": 1597, "train_loss": 4.301333427429199, "lr": 0.00039963675439992814, "tps": 35846, "wall": 2921.5} {"step": 1598, "train_loss": 4.442251205444336, "lr": 0.00039963553688873694, "tps": 35803, "wall": 2926.8} {"step": 1599, "train_loss": 4.528414726257324, "lr": 0.0003996343173426246, "tps": 35760, "wall": 2932.2} {"step": 1600, "train_loss": 4.3645477294921875, "lr": 0.00039963309576160496, "tps": 35718, "wall": 2937.5} {"step": 1601, "train_loss": 4.500576972961426, "lr": 0.000399631872145692, "tps": 35677, "wall": 2942.7} {"step": 1602, "train_loss": 4.404322624206543, "lr": 0.0003996306464948994, "tps": 35634, "wall": 2948.1} {"step": 1603, "train_loss": 4.534109592437744, "lr": 0.0003996294188092411, "tps": 35592, "wall": 2953.4} {"step": 1604, "train_loss": 4.376331329345703, "lr": 0.00039962818908873107, "tps": 35551, "wall": 2958.7} {"step": 1605, "train_loss": 4.371925354003906, "lr": 0.0003996269573333831, "tps": 35510, "wall": 2964.0} {"step": 1606, "train_loss": 4.411931991577148, "lr": 0.00039962572354321137, "tps": 35469, "wall": 2969.2} {"step": 1607, "train_loss": 4.370966911315918, "lr": 0.0003996244877182297, "tps": 35428, "wall": 2974.5} {"step": 1608, "train_loss": 4.361026763916016, "lr": 0.00039962324985845206, "tps": 35390, "wall": 2979.5} {"step": 1609, "train_loss": 4.473392486572266, "lr": 0.00039962200996389253, "tps": 35352, "wall": 2984.6} {"step": 1610, "train_loss": 4.232689380645752, "lr": 0.0003996207680345652, "tps": 35314, "wall": 2989.6} {"step": 1611, "train_loss": 4.419716835021973, "lr": 0.00039961952407048404, "tps": 35276, "wall": 2994.7} {"step": 1612, "train_loss": 4.351780414581299, "lr": 0.00039961827807166327, "tps": 35239, "wall": 2999.7} {"step": 1613, "train_loss": 4.369827747344971, "lr": 0.00039961703003811686, "tps": 35202, "wall": 3004.7} {"step": 1614, "train_loss": 4.45803165435791, "lr": 0.0003996157799698591, "tps": 35165, "wall": 3009.8} {"step": 1615, "train_loss": 4.348379611968994, "lr": 0.00039961452786690396, "tps": 35128, "wall": 3014.8} {"step": 1616, "train_loss": 4.481117248535156, "lr": 0.00039961327372926576, "tps": 35092, "wall": 3019.8} {"step": 1617, "train_loss": 4.436183929443359, "lr": 0.00039961201755695874, "tps": 35056, "wall": 3024.8} {"step": 1618, "train_loss": 4.462871551513672, "lr": 0.00039961075934999695, "tps": 35019, "wall": 3029.8} {"step": 1619, "train_loss": 4.38419771194458, "lr": 0.00039960949910839485, "tps": 34983, "wall": 3034.8} {"step": 1620, "train_loss": 4.439187526702881, "lr": 0.00039960823683216664, "tps": 34947, "wall": 3039.8} {"step": 1621, "train_loss": 4.491281986236572, "lr": 0.0003996069725213266, "tps": 34909, "wall": 3045.0} {"step": 1622, "train_loss": 4.43365478515625, "lr": 0.000399605706175889, "tps": 34874, "wall": 3049.9} {"step": 1623, "train_loss": 4.343208312988281, "lr": 0.00039960443779586837, "tps": 34838, "wall": 3055.0} {"step": 1624, "train_loss": 4.423102378845215, "lr": 0.0003996031673812788, "tps": 34801, "wall": 3060.1} {"step": 1625, "train_loss": 4.442417144775391, "lr": 0.00039960189493213493, "tps": 34766, "wall": 3065.1} {"step": 1626, "train_loss": 4.377791404724121, "lr": 0.00039960062044845104, "tps": 34731, "wall": 3070.1} {"step": 1627, "train_loss": 4.358612060546875, "lr": 0.0003995993439302416, "tps": 34694, "wall": 3075.2} {"step": 1628, "train_loss": 4.4799041748046875, "lr": 0.0003995980653775211, "tps": 34659, "wall": 3080.2} {"step": 1629, "train_loss": 4.417383193969727, "lr": 0.0003995967847903039, "tps": 34624, "wall": 3085.2} {"step": 1630, "train_loss": 4.409145355224609, "lr": 0.00039959550216860475, "tps": 34589, "wall": 3090.3} {"step": 1631, "train_loss": 4.466989040374756, "lr": 0.000399594217512438, "tps": 34554, "wall": 3095.3} {"step": 1632, "train_loss": 4.386610507965088, "lr": 0.00039959293082181827, "tps": 34517, "wall": 3100.5} {"step": 1633, "train_loss": 4.399353504180908, "lr": 0.00039959164209676, "tps": 34479, "wall": 3105.7} {"step": 1634, "train_loss": 4.356419563293457, "lr": 0.00039959035133727797, "tps": 34442, "wall": 3111.0} {"step": 1635, "train_loss": 4.353126049041748, "lr": 0.00039958905854338666, "tps": 34404, "wall": 3116.3} {"step": 1636, "train_loss": 4.466837406158447, "lr": 0.00039958776371510084, "tps": 34367, "wall": 3121.6} {"step": 1637, "train_loss": 4.395802974700928, "lr": 0.0003995864668524351, "tps": 34330, "wall": 3126.9} {"step": 1638, "train_loss": 4.406604290008545, "lr": 0.0003995851679554042, "tps": 34294, "wall": 3132.1} {"step": 1639, "train_loss": 4.328527450561523, "lr": 0.0003995838670240227, "tps": 34257, "wall": 3137.4} {"step": 1640, "train_loss": 4.503905296325684, "lr": 0.0003995825640583055, "tps": 34220, "wall": 3142.7} {"step": 1641, "train_loss": 4.32539176940918, "lr": 0.0003995812590582672, "tps": 34184, "wall": 3147.9} {"step": 1642, "train_loss": 4.254655361175537, "lr": 0.00039957995202392275, "tps": 34148, "wall": 3153.2} {"step": 1643, "train_loss": 4.353536605834961, "lr": 0.000399578642955287, "tps": 34112, "wall": 3158.4} {"step": 1644, "train_loss": 4.431143283843994, "lr": 0.00039957733185237455, "tps": 34077, "wall": 3163.5} {"step": 1645, "train_loss": 4.4108052253723145, "lr": 0.0003995760187152004, "tps": 34044, "wall": 3168.5} {"step": 1646, "train_loss": 4.3851728439331055, "lr": 0.00039957470354377937, "tps": 34011, "wall": 3173.6} {"step": 1647, "train_loss": 4.319056987762451, "lr": 0.0003995733863381264, "tps": 33977, "wall": 3178.6} {"step": 1648, "train_loss": 4.453478813171387, "lr": 0.00039957206709825637, "tps": 33944, "wall": 3183.7} {"step": 1649, "train_loss": 4.44297456741333, "lr": 0.0003995707458241843, "tps": 33912, "wall": 3188.7} {"step": 1650, "train_loss": 4.301326274871826, "lr": 0.0003995694225159251, "tps": 33879, "wall": 3193.7} {"step": 1651, "train_loss": 4.434067249298096, "lr": 0.00039956809717349375, "tps": 33847, "wall": 3198.6} {"step": 1652, "train_loss": 4.396337032318115, "lr": 0.0003995667697969052, "tps": 33815, "wall": 3203.6} {"step": 1653, "train_loss": 4.444315433502197, "lr": 0.0003995654403861747, "tps": 33783, "wall": 3208.6} {"step": 1654, "train_loss": 4.479344844818115, "lr": 0.0003995641089413171, "tps": 33750, "wall": 3213.6} {"step": 1655, "train_loss": 4.438673496246338, "lr": 0.0003995627754623476, "tps": 33718, "wall": 3218.7} {"step": 1656, "train_loss": 4.428854465484619, "lr": 0.00039956143994928126, "tps": 33683, "wall": 3223.9} {"step": 1657, "train_loss": 4.420041084289551, "lr": 0.0003995601024021332, "tps": 33652, "wall": 3228.9} {"step": 1658, "train_loss": 4.366519927978516, "lr": 0.00039955876282091857, "tps": 33619, "wall": 3233.9} {"step": 1659, "train_loss": 4.368251800537109, "lr": 0.0003995574212056526, "tps": 33588, "wall": 3238.9} {"step": 1660, "train_loss": 4.325380325317383, "lr": 0.0003995560775563504, "tps": 33556, "wall": 3243.9} {"step": 1661, "train_loss": 4.318100929260254, "lr": 0.0003995547318730273, "tps": 33524, "wall": 3249.0} {"step": 1662, "train_loss": 4.361179351806641, "lr": 0.00039955338415569844, "tps": 33492, "wall": 3254.0} {"step": 1663, "train_loss": 4.338093280792236, "lr": 0.00039955203440437915, "tps": 33461, "wall": 3259.0} {"step": 1664, "train_loss": 4.418118953704834, "lr": 0.00039955068261908467, "tps": 33430, "wall": 3264.0} {"step": 1665, "train_loss": 4.3706560134887695, "lr": 0.0003995493287998303, "tps": 33399, "wall": 3269.0} {"step": 1666, "train_loss": 4.309211254119873, "lr": 0.00039954797294663156, "tps": 33368, "wall": 3274.0} {"step": 1667, "train_loss": 4.424280166625977, "lr": 0.00039954661505950357, "tps": 33338, "wall": 3278.9} {"step": 1668, "train_loss": 4.460779190063477, "lr": 0.0003995452551384619, "tps": 33305, "wall": 3284.1} {"step": 1669, "train_loss": 4.338419437408447, "lr": 0.00039954389318352175, "tps": 33275, "wall": 3289.1} {"step": 1670, "train_loss": 4.345612525939941, "lr": 0.00039954252919469877, "tps": 33243, "wall": 3294.2} {"step": 1671, "train_loss": 4.400362968444824, "lr": 0.0003995411631720082, "tps": 33213, "wall": 3299.2} {"step": 1672, "train_loss": 4.327606678009033, "lr": 0.0003995397951154657, "tps": 33182, "wall": 3304.2} {"step": 1673, "train_loss": 4.3157148361206055, "lr": 0.0003995384250250867, "tps": 33152, "wall": 3309.2} {"step": 1674, "train_loss": 4.4177021980285645, "lr": 0.0003995370529008866, "tps": 33121, "wall": 3314.2} {"step": 1675, "train_loss": 4.347601890563965, "lr": 0.00039953567874288114, "tps": 33090, "wall": 3319.4} {"step": 1676, "train_loss": 4.375204086303711, "lr": 0.00039953430255108575, "tps": 33060, "wall": 3324.3} {"step": 1677, "train_loss": 4.3099188804626465, "lr": 0.0003995329243255161, "tps": 33030, "wall": 3329.3} {"step": 1678, "train_loss": 4.3282928466796875, "lr": 0.0003995315440661878, "tps": 33000, "wall": 3334.3} {"step": 1679, "train_loss": 4.42563009262085, "lr": 0.00039953016177311643, "tps": 32971, "wall": 3339.3} {"step": 1680, "train_loss": 4.406462669372559, "lr": 0.0003995287774463177, "tps": 32940, "wall": 3344.4} {"step": 1681, "train_loss": 4.460346221923828, "lr": 0.00039952739108580724, "tps": 32905, "wall": 3349.9} {"step": 1682, "train_loss": 4.397539138793945, "lr": 0.0003995260026916007, "tps": 32871, "wall": 3355.4} {"step": 1683, "train_loss": 4.290114402770996, "lr": 0.000399524612263714, "tps": 32841, "wall": 3360.4} {"step": 1684, "train_loss": 4.281014442443848, "lr": 0.00039952321980216273, "tps": 32812, "wall": 3365.5} {"step": 1685, "train_loss": 4.345415115356445, "lr": 0.00039952182530696276, "tps": 32782, "wall": 3370.5} {"step": 1686, "train_loss": 4.3732452392578125, "lr": 0.0003995204287781298, "tps": 32751, "wall": 3375.7} {"step": 1687, "train_loss": 4.472524642944336, "lr": 0.00039951903021567977, "tps": 32720, "wall": 3380.9} {"step": 1688, "train_loss": 4.408173084259033, "lr": 0.0003995176296196284, "tps": 32691, "wall": 3385.9} {"step": 1689, "train_loss": 4.301271915435791, "lr": 0.0003995162269899916, "tps": 32658, "wall": 3391.3} {"step": 1690, "train_loss": 4.412435531616211, "lr": 0.0003995148223267853, "tps": 32629, "wall": 3396.3} {"step": 1691, "train_loss": 4.285093307495117, "lr": 0.0003995134156300254, "tps": 32601, "wall": 3401.3} {"step": 1692, "train_loss": 4.433287143707275, "lr": 0.0003995120068997278, "tps": 32570, "wall": 3406.6} {"step": 1693, "train_loss": 4.350786209106445, "lr": 0.00039951059613590843, "tps": 32540, "wall": 3411.7} {"step": 1694, "train_loss": 4.374648571014404, "lr": 0.0003995091833385833, "tps": 32507, "wall": 3417.2} {"step": 1695, "train_loss": 4.376314640045166, "lr": 0.0003995077685077685, "tps": 32476, "wall": 3422.4} {"step": 1696, "train_loss": 4.4586310386657715, "lr": 0.00039950635164347995, "tps": 32446, "wall": 3427.7} {"step": 1697, "train_loss": 4.331438064575195, "lr": 0.00039950493274573375, "tps": 32415, "wall": 3433.0} {"step": 1698, "train_loss": 4.307926177978516, "lr": 0.000399503511814546, "tps": 32384, "wall": 3438.3} {"step": 1699, "train_loss": 4.400822162628174, "lr": 0.0003995020888499327, "tps": 32353, "wall": 3443.6} {"step": 1700, "train_loss": 4.389965534210205, "lr": 0.00039950066385191003, "tps": 32322, "wall": 3448.9} {"step": 1701, "train_loss": 4.3835272789001465, "lr": 0.00039949923682049414, "tps": 32292, "wall": 3454.2} {"step": 1702, "train_loss": 4.349606990814209, "lr": 0.0003994978077557012, "tps": 32260, "wall": 3459.6} {"step": 1703, "train_loss": 4.398512840270996, "lr": 0.0003994963766575474, "tps": 32229, "wall": 3464.9} {"step": 1704, "train_loss": 4.311205863952637, "lr": 0.00039949494352604887, "tps": 32198, "wall": 3470.3} {"step": 1705, "train_loss": 4.362549781799316, "lr": 0.000399493508361222, "tps": 32167, "wall": 3475.7} {"step": 1706, "train_loss": 4.433620929718018, "lr": 0.00039949207116308285, "tps": 32137, "wall": 3481.0} {"step": 1707, "train_loss": 4.311748027801514, "lr": 0.00039949063193164786, "tps": 32107, "wall": 3486.3} {"step": 1708, "train_loss": 4.402691841125488, "lr": 0.00039948919066693325, "tps": 32077, "wall": 3491.5} {"step": 1709, "train_loss": 4.2576751708984375, "lr": 0.0003994877473689555, "tps": 32048, "wall": 3496.8} {"step": 1710, "train_loss": 4.432242393493652, "lr": 0.00039948630203773066, "tps": 32019, "wall": 3502.0} {"step": 1711, "train_loss": 4.370244979858398, "lr": 0.0003994848546732754, "tps": 31990, "wall": 3507.2} {"step": 1712, "train_loss": 4.3888258934021, "lr": 0.00039948340527560595, "tps": 31963, "wall": 3512.2} {"step": 1713, "train_loss": 4.29171895980835, "lr": 0.0003994819538447388, "tps": 31936, "wall": 3517.2} {"step": 1714, "train_loss": 4.320587635040283, "lr": 0.00039948050038069035, "tps": 31906, "wall": 3522.6} {"step": 1715, "train_loss": 4.426654815673828, "lr": 0.00039947904488347704, "tps": 31879, "wall": 3527.6} {"step": 1716, "train_loss": 4.406039714813232, "lr": 0.0003994775873531155, "tps": 31850, "wall": 3533.0} {"step": 1717, "train_loss": 4.307332992553711, "lr": 0.00039947612778962205, "tps": 31822, "wall": 3538.1} {"step": 1718, "train_loss": 4.390197277069092, "lr": 0.00039947466619301344, "tps": 31795, "wall": 3543.1} {"step": 1719, "train_loss": 4.287144660949707, "lr": 0.000399473202563306, "tps": 31769, "wall": 3548.1} {"step": 1720, "train_loss": 4.365734100341797, "lr": 0.00039947173690051634, "tps": 31740, "wall": 3553.4} {"step": 1721, "train_loss": 4.441973686218262, "lr": 0.0003994702692046613, "tps": 31711, "wall": 3558.8} {"step": 1722, "train_loss": 4.379111289978027, "lr": 0.00039946879947575723, "tps": 31683, "wall": 3564.0} {"step": 1723, "train_loss": 4.2939453125, "lr": 0.0003994673277138209, "tps": 31655, "wall": 3569.2} {"step": 1724, "train_loss": 4.372567176818848, "lr": 0.000399465853918869, "tps": 31625, "wall": 3574.6} {"step": 1725, "train_loss": 4.339035511016846, "lr": 0.0003994643780909182, "tps": 31597, "wall": 3579.8} {"step": 1726, "train_loss": 4.4185471534729, "lr": 0.00039946290022998523, "tps": 31570, "wall": 3585.0} {"step": 1727, "train_loss": 4.395648002624512, "lr": 0.0003994614203360868, "tps": 31542, "wall": 3590.2} {"step": 1728, "train_loss": 4.315542697906494, "lr": 0.00039945993840923965, "tps": 31514, "wall": 3595.5} {"step": 1729, "train_loss": 4.352089881896973, "lr": 0.0003994584544494607, "tps": 31487, "wall": 3600.7} {"step": 1730, "train_loss": 4.331515789031982, "lr": 0.0003994569684567666, "tps": 31460, "wall": 3605.9} {"step": 1731, "train_loss": 4.297792434692383, "lr": 0.0003994554804311743, "tps": 31432, "wall": 3611.2} {"step": 1732, "train_loss": 4.359083652496338, "lr": 0.0003994539903727005, "tps": 31405, "wall": 3616.4} {"step": 1733, "train_loss": 4.293667316436768, "lr": 0.0003994524982813623, "tps": 31380, "wall": 3621.4} {"step": 1734, "train_loss": 4.344047546386719, "lr": 0.00039945100415717644, "tps": 31355, "wall": 3626.3} {"step": 1735, "train_loss": 4.355501651763916, "lr": 0.00039944950800015997, "tps": 31330, "wall": 3631.3} {"step": 1736, "train_loss": 4.431325435638428, "lr": 0.00039944800981032963, "tps": 31305, "wall": 3636.3} {"step": 1737, "train_loss": 4.32811164855957, "lr": 0.0003994465095877026, "tps": 31278, "wall": 3641.6} {"step": 1738, "train_loss": 4.288454055786133, "lr": 0.00039944500733229586, "tps": 31251, "wall": 3646.8} {"step": 1739, "train_loss": 4.374111175537109, "lr": 0.0003994435030441263, "tps": 31224, "wall": 3652.1} {"step": 1740, "train_loss": 4.400799751281738, "lr": 0.0003994419967232111, "tps": 31197, "wall": 3657.3} {"step": 1741, "train_loss": 4.244153022766113, "lr": 0.0003994404883695672, "tps": 31170, "wall": 3662.5} {"step": 1742, "train_loss": 4.332793712615967, "lr": 0.00039943897798321173, "tps": 31144, "wall": 3667.7} {"step": 1743, "train_loss": 4.3617353439331055, "lr": 0.0003994374655641618, "tps": 31117, "wall": 3673.0} {"step": 1744, "train_loss": 4.346472263336182, "lr": 0.0003994359511124346, "tps": 31091, "wall": 3678.2} {"step": 1745, "train_loss": 4.440155506134033, "lr": 0.00039943443462804725, "tps": 31065, "wall": 3683.4} {"step": 1746, "train_loss": 4.249179363250732, "lr": 0.0003994329161110169, "tps": 31039, "wall": 3688.6} {"step": 1747, "train_loss": 4.361294269561768, "lr": 0.0003994313955613607, "tps": 31012, "wall": 3693.9} {"step": 1748, "train_loss": 4.465287685394287, "lr": 0.000399429872979096, "tps": 30985, "wall": 3699.2} {"step": 1749, "train_loss": 4.323521137237549, "lr": 0.0003994283483642399, "tps": 30961, "wall": 3704.2} {"step": 1750, "train_loss": 4.320242881774902, "lr": 0.0003994268217168099, "tps": 30937, "wall": 3709.2} {"step": 1751, "train_loss": 4.369041442871094, "lr": 0.0003994252930368231, "tps": 30913, "wall": 3714.2} {"step": 1752, "train_loss": 4.29787015914917, "lr": 0.0003994237623242969, "tps": 30889, "wall": 3719.2} {"step": 1753, "train_loss": 4.2804388999938965, "lr": 0.0003994222295792486, "tps": 30866, "wall": 3724.2} {"step": 1754, "train_loss": 4.272406578063965, "lr": 0.0003994206948016956, "tps": 30842, "wall": 3729.2} {"step": 1755, "train_loss": 4.2644147872924805, "lr": 0.0003994191579916552, "tps": 30818, "wall": 3734.1} {"step": 1756, "train_loss": 4.444793224334717, "lr": 0.00039941761914914493, "tps": 30795, "wall": 3739.1} {"step": 1757, "train_loss": 4.332823753356934, "lr": 0.00039941607827418215, "tps": 30771, "wall": 3744.1} {"step": 1758, "train_loss": 4.294529914855957, "lr": 0.0003994145353667843, "tps": 30746, "wall": 3749.4} {"step": 1759, "train_loss": 4.366275310516357, "lr": 0.00039941299042696893, "tps": 30721, "wall": 3754.5} {"step": 1760, "train_loss": 4.2759270668029785, "lr": 0.00039941144345475346, "tps": 30696, "wall": 3759.7} {"step": 1761, "train_loss": 4.364970684051514, "lr": 0.0003994098944501555, "tps": 30671, "wall": 3764.9} {"step": 1762, "train_loss": 4.326752185821533, "lr": 0.0003994083434131925, "tps": 30646, "wall": 3770.1} {"step": 1763, "train_loss": 4.3698601722717285, "lr": 0.0003994067903438821, "tps": 30620, "wall": 3775.4} {"step": 1764, "train_loss": 4.189781665802002, "lr": 0.0003994052352422418, "tps": 30595, "wall": 3780.6} {"step": 1765, "train_loss": 4.358157157897949, "lr": 0.0003994036781082894, "tps": 30570, "wall": 3785.9} {"step": 1766, "train_loss": 4.361883640289307, "lr": 0.0003994021189420424, "tps": 30545, "wall": 3791.1} {"step": 1767, "train_loss": 4.31028938293457, "lr": 0.0003994005577435184, "tps": 30520, "wall": 3796.4} {"step": 1768, "train_loss": 4.338536739349365, "lr": 0.0003993989945127353, "tps": 30495, "wall": 3801.7} {"step": 1769, "train_loss": 4.389545440673828, "lr": 0.00039939742924971066, "tps": 30470, "wall": 3806.9} {"step": 1770, "train_loss": 4.305353164672852, "lr": 0.00039939586195446216, "tps": 30445, "wall": 3812.2} {"step": 1771, "train_loss": 4.299271583557129, "lr": 0.0003993942926270077, "tps": 30420, "wall": 3817.4} {"step": 1772, "train_loss": 4.322881698608398, "lr": 0.000399392721267365, "tps": 30395, "wall": 3822.7} {"step": 1773, "train_loss": 4.289611339569092, "lr": 0.00039939114787555184, "tps": 30372, "wall": 3827.8} {"step": 1774, "train_loss": 4.266219615936279, "lr": 0.000399389572451586, "tps": 30349, "wall": 3832.8} {"step": 1775, "train_loss": 4.3864874839782715, "lr": 0.00039938799499548543, "tps": 30327, "wall": 3837.8} {"step": 1776, "train_loss": 4.4204535484313965, "lr": 0.00039938641550726797, "tps": 30305, "wall": 3842.8} {"step": 1777, "train_loss": 4.368368625640869, "lr": 0.0003993848339869514, "tps": 30283, "wall": 3847.7} {"step": 1778, "train_loss": 4.420487403869629, "lr": 0.0003993832504345538, "tps": 30261, "wall": 3852.7} {"step": 1779, "train_loss": 4.275766372680664, "lr": 0.00039938166485009303, "tps": 30239, "wall": 3857.7} {"step": 1780, "train_loss": 4.249674320220947, "lr": 0.000399380077233587, "tps": 30215, "wall": 3862.9} {"step": 1781, "train_loss": 4.286487102508545, "lr": 0.0003993784875850538, "tps": 30192, "wall": 3868.1} {"step": 1782, "train_loss": 4.363354682922363, "lr": 0.0003993768959045114, "tps": 30168, "wall": 3873.3} {"step": 1783, "train_loss": 4.238293647766113, "lr": 0.00039937530219197776, "tps": 30144, "wall": 3878.6} {"step": 1784, "train_loss": 4.4116411209106445, "lr": 0.00039937370644747106, "tps": 30119, "wall": 3883.9} {"step": 1785, "train_loss": 4.26014518737793, "lr": 0.0003993721086710093, "tps": 30095, "wall": 3889.2} {"step": 1786, "train_loss": 4.488839626312256, "lr": 0.00039937050886261054, "tps": 30071, "wall": 3894.5} {"step": 1787, "train_loss": 4.280060768127441, "lr": 0.000399368907022293, "tps": 30047, "wall": 3899.8} {"step": 1788, "train_loss": 4.378693103790283, "lr": 0.00039936730315007473, "tps": 30023, "wall": 3905.1} {"step": 1789, "train_loss": 4.304776668548584, "lr": 0.000399365697245974, "tps": 29998, "wall": 3910.5} {"step": 1790, "train_loss": 4.324399471282959, "lr": 0.0003993640893100089, "tps": 29974, "wall": 3915.9} {"step": 1791, "train_loss": 4.3341965675354, "lr": 0.0003993624793421977, "tps": 29950, "wall": 3921.2} {"step": 1792, "train_loss": 4.341606140136719, "lr": 0.00039936086734255864, "tps": 29926, "wall": 3926.4} {"step": 1793, "train_loss": 4.272013187408447, "lr": 0.00039935925331111005, "tps": 29902, "wall": 3931.9} {"step": 1794, "train_loss": 4.337986946105957, "lr": 0.00039935763724787006, "tps": 29877, "wall": 3937.3} {"step": 1795, "train_loss": 4.366614818572998, "lr": 0.000399356019152857, "tps": 29854, "wall": 3942.5} {"step": 1796, "train_loss": 4.2375383377075195, "lr": 0.00039935439902608934, "tps": 29831, "wall": 3947.8} {"step": 1797, "train_loss": 4.414261341094971, "lr": 0.0003993527768675853, "tps": 29807, "wall": 3953.2} {"step": 1798, "train_loss": 4.260814666748047, "lr": 0.0003993511526773633, "tps": 29785, "wall": 3958.3} {"step": 1799, "train_loss": 4.351545333862305, "lr": 0.0003993495264554418, "tps": 29763, "wall": 3963.4} {"step": 1800, "train_loss": 4.208061695098877, "lr": 0.0003993478982018391, "tps": 29741, "wall": 3968.6} {"step": 1801, "train_loss": 4.376336574554443, "lr": 0.00039934626791657366, "tps": 29718, "wall": 3973.8} {"step": 1802, "train_loss": 4.3240180015563965, "lr": 0.0003993446355996641, "tps": 29695, "wall": 3979.0} {"step": 1803, "train_loss": 4.4280009269714355, "lr": 0.00039934300125112873, "tps": 29675, "wall": 3984.0} {"step": 1804, "train_loss": 4.3537397384643555, "lr": 0.0003993413648709862, "tps": 29653, "wall": 3989.2} {"step": 1805, "train_loss": 4.332210063934326, "lr": 0.00039933972645925497, "tps": 29627, "wall": 3994.9} {"step": 1806, "train_loss": 4.374983787536621, "lr": 0.0003993380860159536, "tps": 29603, "wall": 4000.3} {"step": 1807, "train_loss": 4.262181282043457, "lr": 0.00039933644354110074, "tps": 29582, "wall": 4005.4} {"step": 1808, "train_loss": 4.296293258666992, "lr": 0.00039933479903471485, "tps": 29558, "wall": 4010.9} {"step": 1809, "train_loss": 4.321403980255127, "lr": 0.0003993331524968147, "tps": 29535, "wall": 4016.2} {"step": 1810, "train_loss": 4.345311641693115, "lr": 0.0003993315039274189, "tps": 29511, "wall": 4021.7} {"step": 1811, "train_loss": 4.2800116539001465, "lr": 0.0003993298533265461, "tps": 29487, "wall": 4027.1} {"step": 1812, "train_loss": 4.248198509216309, "lr": 0.00039932820069421505, "tps": 29464, "wall": 4032.5} {"step": 1813, "train_loss": 4.164215564727783, "lr": 0.00039932654603044447, "tps": 29442, "wall": 4037.8} {"step": 1814, "train_loss": 4.286027431488037, "lr": 0.000399324889335253, "tps": 29419, "wall": 4043.2} {"step": 1815, "train_loss": 4.342743873596191, "lr": 0.00039932323060865954, "tps": 29396, "wall": 4048.5} {"step": 1816, "train_loss": 4.2619218826293945, "lr": 0.00039932156985068276, "tps": 29373, "wall": 4053.9} {"step": 1817, "train_loss": 4.342997074127197, "lr": 0.0003993199070613416, "tps": 29351, "wall": 4059.2} {"step": 1818, "train_loss": 4.302964687347412, "lr": 0.00039931824224065485, "tps": 29329, "wall": 4064.5} {"step": 1819, "train_loss": 4.356937408447266, "lr": 0.0003993165753886413, "tps": 29308, "wall": 4069.7} {"step": 1820, "train_loss": 4.317519187927246, "lr": 0.00039931490650531987, "tps": 29286, "wall": 4075.0} {"step": 1821, "train_loss": 4.31289529800415, "lr": 0.0003993132355907095, "tps": 29264, "wall": 4080.2} {"step": 1822, "train_loss": 4.354696273803711, "lr": 0.0003993115626448291, "tps": 29243, "wall": 4085.5} {"step": 1823, "train_loss": 4.30264949798584, "lr": 0.00039930988766769763, "tps": 29223, "wall": 4090.4} {"step": 1824, "train_loss": 4.466497898101807, "lr": 0.000399308210659334, "tps": 29204, "wall": 4095.4} {"step": 1825, "train_loss": 4.335977554321289, "lr": 0.00039930653161975737, "tps": 29184, "wall": 4100.4} {"step": 1826, "train_loss": 4.262021541595459, "lr": 0.0003993048505489865, "tps": 29165, "wall": 4105.4} {"step": 1827, "train_loss": 4.268893718719482, "lr": 0.0003993031674470407, "tps": 29145, "wall": 4110.4} {"step": 1828, "train_loss": 4.345900535583496, "lr": 0.00039930148231393886, "tps": 29126, "wall": 4115.3} {"step": 1829, "train_loss": 4.440033435821533, "lr": 0.0003992997951497002, "tps": 29106, "wall": 4120.4} {"step": 1830, "train_loss": 4.3764238357543945, "lr": 0.0003992981059543437, "tps": 29087, "wall": 4125.3} {"step": 1831, "train_loss": 4.330908298492432, "lr": 0.0003992964147278885, "tps": 29068, "wall": 4130.3} {"step": 1832, "train_loss": 4.250420093536377, "lr": 0.0003992947214703539, "tps": 29047, "wall": 4135.6} {"step": 1833, "train_loss": 4.305638313293457, "lr": 0.000399293026181759, "tps": 29026, "wall": 4140.8} {"step": 1834, "train_loss": 4.395424842834473, "lr": 0.000399291328862123, "tps": 29005, "wall": 4146.0} {"step": 1835, "train_loss": 4.324113845825195, "lr": 0.0003992896295114651, "tps": 28985, "wall": 4151.2} {"step": 1836, "train_loss": 4.298093795776367, "lr": 0.0003992879281298045, "tps": 28964, "wall": 4156.5} {"step": 1837, "train_loss": 4.332225322723389, "lr": 0.00039928622471716073, "tps": 28943, "wall": 4161.7} {"step": 1838, "train_loss": 4.300453186035156, "lr": 0.0003992845192735528, "tps": 28922, "wall": 4167.0} {"step": 1839, "train_loss": 4.460129261016846, "lr": 0.00039928281179900014, "tps": 28902, "wall": 4172.2} {"step": 1840, "train_loss": 4.312843322753906, "lr": 0.00039928110229352204, "tps": 28880, "wall": 4177.6} {"step": 1841, "train_loss": 4.361216068267822, "lr": 0.00039927939075713796, "tps": 28859, "wall": 4182.9} {"step": 1842, "train_loss": 4.2386932373046875, "lr": 0.0003992776771898673, "tps": 28839, "wall": 4188.1} {"step": 1843, "train_loss": 4.225980758666992, "lr": 0.00039927596159172935, "tps": 28818, "wall": 4193.4} {"step": 1844, "train_loss": 4.269289016723633, "lr": 0.0003992742439627436, "tps": 28797, "wall": 4198.7} {"step": 1845, "train_loss": 4.2173919677734375, "lr": 0.00039927252430292957, "tps": 28777, "wall": 4204.0} {"step": 1846, "train_loss": 4.256932735443115, "lr": 0.00039927080261230666, "tps": 28756, "wall": 4209.3} {"step": 1847, "train_loss": 4.335192680358887, "lr": 0.00039926907889089436, "tps": 28736, "wall": 4214.5} {"step": 1848, "train_loss": 4.338057994842529, "lr": 0.0003992673531387123, "tps": 28715, "wall": 4219.9} {"step": 1849, "train_loss": 4.2995195388793945, "lr": 0.0003992656253557799, "tps": 28695, "wall": 4225.2} {"step": 1850, "train_loss": 4.29888916015625, "lr": 0.0003992638955421168, "tps": 28675, "wall": 4230.3} {"step": 1851, "train_loss": 4.2089433670043945, "lr": 0.0003992621636977427, "tps": 28657, "wall": 4235.3} {"step": 1852, "train_loss": 4.318658828735352, "lr": 0.00039926042982267704, "tps": 28638, "wall": 4240.3} {"step": 1853, "train_loss": 4.376907825469971, "lr": 0.0003992586939169395, "tps": 28620, "wall": 4245.4} {"step": 1854, "train_loss": 4.420835018157959, "lr": 0.0003992569559805498, "tps": 28600, "wall": 4250.6} {"step": 1855, "train_loss": 4.302666664123535, "lr": 0.00039925521601352765, "tps": 28577, "wall": 4256.3} {"step": 1856, "train_loss": 4.3225812911987305, "lr": 0.00039925347401589264, "tps": 28555, "wall": 4261.8} {"step": 1857, "train_loss": 4.380767345428467, "lr": 0.0003992517299876646, "tps": 28535, "wall": 4267.2} {"step": 1858, "train_loss": 4.304220676422119, "lr": 0.0003992499839288633, "tps": 28515, "wall": 4272.5} {"step": 1859, "train_loss": 4.329195022583008, "lr": 0.00039924823583950845, "tps": 28495, "wall": 4277.8} {"step": 1860, "train_loss": 4.3322529792785645, "lr": 0.0003992464857196199, "tps": 28474, "wall": 4283.1} {"step": 1861, "train_loss": 4.250975131988525, "lr": 0.00039924473356921746, "tps": 28454, "wall": 4288.5} {"step": 1862, "train_loss": 4.255090713500977, "lr": 0.000399242979388321, "tps": 28436, "wall": 4293.5} {"step": 1863, "train_loss": 4.275110721588135, "lr": 0.0003992412231769504, "tps": 28419, "wall": 4298.4} {"step": 1864, "train_loss": 4.28231954574585, "lr": 0.0003992394649351255, "tps": 28401, "wall": 4303.5} {"step": 1865, "train_loss": 4.276708126068115, "lr": 0.0003992377046628662, "tps": 28382, "wall": 4308.6} {"step": 1866, "train_loss": 4.402408599853516, "lr": 0.00039923594236019255, "tps": 28364, "wall": 4313.6} {"step": 1867, "train_loss": 4.223294734954834, "lr": 0.0003992341780271244, "tps": 28347, "wall": 4318.6} {"step": 1868, "train_loss": 4.3497443199157715, "lr": 0.00039923241166368184, "tps": 28329, "wall": 4323.6} {"step": 1869, "train_loss": 4.2797017097473145, "lr": 0.0003992306432698847, "tps": 28312, "wall": 4328.6} {"step": 1870, "train_loss": 4.266819953918457, "lr": 0.00039922887284575326, "tps": 28294, "wall": 4333.6} {"step": 1871, "train_loss": 4.263851642608643, "lr": 0.0003992271003913074, "tps": 28277, "wall": 4338.5} {"step": 1872, "train_loss": 4.280048370361328, "lr": 0.0003992253259065673, "tps": 28260, "wall": 4343.5} {"step": 1873, "train_loss": 4.251438617706299, "lr": 0.00039922354939155296, "tps": 28243, "wall": 4348.5} {"step": 1874, "train_loss": 4.326575756072998, "lr": 0.0003992217708462846, "tps": 28225, "wall": 4353.6} {"step": 1875, "train_loss": 4.256434440612793, "lr": 0.0003992199902707823, "tps": 28207, "wall": 4358.7} {"step": 1876, "train_loss": 4.336190700531006, "lr": 0.0003992182076650662, "tps": 28189, "wall": 4363.8} {"step": 1877, "train_loss": 4.286298751831055, "lr": 0.00039921642302915666, "tps": 28171, "wall": 4368.8} {"step": 1878, "train_loss": 4.307191371917725, "lr": 0.0003992146363630737, "tps": 28153, "wall": 4373.9} {"step": 1879, "train_loss": 4.246586322784424, "lr": 0.0003992128476668377, "tps": 28136, "wall": 4378.9} {"step": 1880, "train_loss": 4.219140529632568, "lr": 0.0003992110569404688, "tps": 28119, "wall": 4384.0} {"step": 1881, "train_loss": 4.24991512298584, "lr": 0.0003992092641839874, "tps": 28101, "wall": 4389.0} {"step": 1882, "train_loss": 4.183224678039551, "lr": 0.00039920746939741373, "tps": 28084, "wall": 4394.0} {"step": 1883, "train_loss": 4.352125644683838, "lr": 0.0003992056725807682, "tps": 28067, "wall": 4399.1} {"step": 1884, "train_loss": 4.318936347961426, "lr": 0.0003992038737340711, "tps": 28049, "wall": 4404.1} {"step": 1885, "train_loss": 4.3492231369018555, "lr": 0.00039920207285734275, "tps": 28032, "wall": 4409.2} {"step": 1886, "train_loss": 4.260662078857422, "lr": 0.0003992002699506037, "tps": 28015, "wall": 4414.3} {"step": 1887, "train_loss": 4.257899284362793, "lr": 0.0003991984650138743, "tps": 27997, "wall": 4419.3} {"step": 1888, "train_loss": 4.20151948928833, "lr": 0.00039919665804717496, "tps": 27981, "wall": 4424.3} {"step": 1889, "train_loss": 4.181796550750732, "lr": 0.00039919484905052624, "tps": 27964, "wall": 4429.3} {"step": 1890, "train_loss": 4.238351345062256, "lr": 0.0003991930380239485, "tps": 27946, "wall": 4434.4} {"step": 1891, "train_loss": 4.44590950012207, "lr": 0.0003991912249674624, "tps": 27930, "wall": 4439.4} {"step": 1892, "train_loss": 4.196640968322754, "lr": 0.00039918940988108837, "tps": 27913, "wall": 4444.4} {"step": 1893, "train_loss": 4.22296142578125, "lr": 0.000399187592764847, "tps": 27896, "wall": 4449.4} {"step": 1894, "train_loss": 4.312655925750732, "lr": 0.0003991857736187589, "tps": 27880, "wall": 4454.4} {"step": 1895, "train_loss": 4.218646049499512, "lr": 0.00039918395244284465, "tps": 27862, "wall": 4459.7} {"step": 1896, "train_loss": 4.387688636779785, "lr": 0.00039918212923712495, "tps": 27844, "wall": 4464.9} {"step": 1897, "train_loss": 4.37492561340332, "lr": 0.0003991803040016203, "tps": 27827, "wall": 4469.9} {"step": 1898, "train_loss": 4.298669338226318, "lr": 0.00039917847673635155, "tps": 27811, "wall": 4474.8} {"step": 1899, "train_loss": 4.262752532958984, "lr": 0.0003991766474413393, "tps": 27795, "wall": 4479.8} {"step": 1900, "train_loss": 4.267268180847168, "lr": 0.0003991748161166043, "tps": 27779, "wall": 4484.7} {"step": 1901, "train_loss": 4.258801460266113, "lr": 0.00039917298276216727, "tps": 27763, "wall": 4489.7} {"step": 1902, "train_loss": 4.325536251068115, "lr": 0.000399171147378049, "tps": 27747, "wall": 4494.7} {"step": 1903, "train_loss": 4.3369245529174805, "lr": 0.0003991693099642703, "tps": 27731, "wall": 4499.7} {"step": 1904, "train_loss": 4.339516639709473, "lr": 0.00039916747052085196, "tps": 27714, "wall": 4504.7} {"step": 1905, "train_loss": 4.310155868530273, "lr": 0.0003991656290478148, "tps": 27697, "wall": 4509.8} {"step": 1906, "train_loss": 4.253225326538086, "lr": 0.0003991637855451797, "tps": 27681, "wall": 4514.8} {"step": 1907, "train_loss": 4.243506908416748, "lr": 0.00039916194001296757, "tps": 27665, "wall": 4519.9} {"step": 1908, "train_loss": 4.261056423187256, "lr": 0.0003991600924511993, "tps": 27648, "wall": 4524.9} {"step": 1909, "train_loss": 4.24220085144043, "lr": 0.0003991582428598958, "tps": 27632, "wall": 4529.9} {"step": 1910, "train_loss": 4.28787899017334, "lr": 0.00039915639123907804, "tps": 27616, "wall": 4534.9} {"step": 1911, "train_loss": 4.25684118270874, "lr": 0.00039915453758876694, "tps": 27600, "wall": 4539.9} {"step": 1912, "train_loss": 4.253540992736816, "lr": 0.00039915268190898355, "tps": 27585, "wall": 4544.9} {"step": 1913, "train_loss": 4.3095316886901855, "lr": 0.000399150824199749, "tps": 27569, "wall": 4549.8} {"step": 1914, "train_loss": 4.321671009063721, "lr": 0.00039914896446108407, "tps": 27553, "wall": 4554.8} {"step": 1915, "train_loss": 4.283848762512207, "lr": 0.00039914710269301005, "tps": 27538, "wall": 4559.8} {"step": 1916, "train_loss": 4.258824348449707, "lr": 0.000399145238895548, "tps": 27522, "wall": 4564.7} {"step": 1917, "train_loss": 4.315642356872559, "lr": 0.0003991433730687189, "tps": 27507, "wall": 4569.7} {"step": 1918, "train_loss": 4.330719947814941, "lr": 0.000399141505212544, "tps": 27491, "wall": 4574.6} {"step": 1919, "train_loss": 4.212517738342285, "lr": 0.0003991396353270445, "tps": 27476, "wall": 4579.5} {"step": 1920, "train_loss": 4.260885238647461, "lr": 0.00039913776341224145, "tps": 27461, "wall": 4584.5} {"step": 1921, "train_loss": 4.205421447753906, "lr": 0.0003991358894681562, "tps": 27445, "wall": 4589.4} {"step": 1922, "train_loss": 4.254768371582031, "lr": 0.0003991340134948098, "tps": 27430, "wall": 4594.4} {"step": 1923, "train_loss": 4.209268569946289, "lr": 0.00039913213549222374, "tps": 27414, "wall": 4599.4} {"step": 1924, "train_loss": 4.2938456535339355, "lr": 0.000399130255460419, "tps": 27399, "wall": 4604.3} {"step": 1925, "train_loss": 4.3491926193237305, "lr": 0.0003991283733994172, "tps": 27384, "wall": 4609.3} {"step": 1926, "train_loss": 4.263005256652832, "lr": 0.0003991264893092394, "tps": 27368, "wall": 4614.3} {"step": 1927, "train_loss": 4.338296890258789, "lr": 0.00039912460318990704, "tps": 27353, "wall": 4619.2} {"step": 1928, "train_loss": 4.180665969848633, "lr": 0.0003991227150414415, "tps": 27338, "wall": 4624.2} {"step": 1929, "train_loss": 4.245059967041016, "lr": 0.00039912082486386416, "tps": 27323, "wall": 4629.1} {"step": 1930, "train_loss": 4.2427849769592285, "lr": 0.00039911893265719644, "tps": 27308, "wall": 4634.1} {"step": 1931, "train_loss": 4.245390892028809, "lr": 0.0003991170384214597, "tps": 27293, "wall": 4639.0} {"step": 1932, "train_loss": 4.272307395935059, "lr": 0.00039911514215667555, "tps": 27278, "wall": 4644.0} {"step": 1933, "train_loss": 4.2772321701049805, "lr": 0.0003991132438628653, "tps": 27263, "wall": 4648.9} {"step": 1934, "train_loss": 4.232913017272949, "lr": 0.00039911134354005053, "tps": 27248, "wall": 4653.8} {"step": 1935, "train_loss": 4.201873779296875, "lr": 0.00039910944118825285, "tps": 27234, "wall": 4658.8} {"step": 1936, "train_loss": 4.303892135620117, "lr": 0.00039910753680749364, "tps": 27219, "wall": 4663.7} {"step": 1937, "train_loss": 4.30410623550415, "lr": 0.0003991056303977946, "tps": 27204, "wall": 4668.7} {"step": 1938, "train_loss": 4.1613006591796875, "lr": 0.0003991037219591773, "tps": 27189, "wall": 4673.7} {"step": 1939, "train_loss": 4.407108783721924, "lr": 0.0003991018114916634, "tps": 27174, "wall": 4678.6} {"step": 1940, "train_loss": 4.285360336303711, "lr": 0.0003990998989952744, "tps": 27159, "wall": 4683.6} {"step": 1941, "train_loss": 4.171177387237549, "lr": 0.0003990979844700321, "tps": 27145, "wall": 4688.5} {"step": 1942, "train_loss": 4.244608402252197, "lr": 0.0003990960679159581, "tps": 27130, "wall": 4693.5} {"step": 1943, "train_loss": 4.245172500610352, "lr": 0.0003990941493330742, "tps": 27115, "wall": 4698.5} {"step": 1944, "train_loss": 4.260507583618164, "lr": 0.00039909222872140204, "tps": 27100, "wall": 4703.4} {"step": 1945, "train_loss": 4.29356575012207, "lr": 0.00039909030608096353, "tps": 27086, "wall": 4708.4} {"step": 1946, "train_loss": 4.312390327453613, "lr": 0.0003990883814117802, "tps": 27072, "wall": 4713.3} {"step": 1947, "train_loss": 4.222968578338623, "lr": 0.0003990864547138741, "tps": 27057, "wall": 4718.2} {"step": 1948, "train_loss": 4.413747787475586, "lr": 0.0003990845259872669, "tps": 27043, "wall": 4723.2} {"step": 1949, "train_loss": 4.280021667480469, "lr": 0.0003990825952319805, "tps": 27028, "wall": 4728.1} {"step": 1950, "train_loss": 4.231388092041016, "lr": 0.0003990806624480368, "tps": 27013, "wall": 4733.1} {"step": 1951, "train_loss": 4.268215179443359, "lr": 0.00039907872763545767, "tps": 26999, "wall": 4738.1} {"step": 1952, "train_loss": 4.1854095458984375, "lr": 0.00039907679079426503, "tps": 26985, "wall": 4743.0} {"step": 1953, "train_loss": 4.250424861907959, "lr": 0.0003990748519244808, "tps": 26970, "wall": 4748.0} {"step": 1954, "train_loss": 4.310706615447998, "lr": 0.000399072911026127, "tps": 26956, "wall": 4752.9} {"step": 1955, "train_loss": 4.236047744750977, "lr": 0.0003990709680992255, "tps": 26942, "wall": 4757.8} {"step": 1956, "train_loss": 4.121511459350586, "lr": 0.00039906902314379845, "tps": 26928, "wall": 4762.8} {"step": 1957, "train_loss": 4.181057929992676, "lr": 0.0003990670761598677, "tps": 26913, "wall": 4767.8} {"step": 1958, "train_loss": 4.316096782684326, "lr": 0.0003990651271474556, "tps": 26899, "wall": 4772.7} {"step": 1959, "train_loss": 4.149025917053223, "lr": 0.00039906317610658397, "tps": 26885, "wall": 4777.7} {"step": 1960, "train_loss": 4.200543403625488, "lr": 0.000399061223037275, "tps": 26871, "wall": 4782.6} {"step": 1961, "train_loss": 4.139656066894531, "lr": 0.0003990592679395508, "tps": 26857, "wall": 4787.6} {"step": 1962, "train_loss": 4.185357093811035, "lr": 0.0003990573108134335, "tps": 26843, "wall": 4792.6} {"step": 1963, "train_loss": 4.217287063598633, "lr": 0.00039905535165894534, "tps": 26829, "wall": 4797.5} {"step": 1964, "train_loss": 4.172221660614014, "lr": 0.00039905339047610844, "tps": 26815, "wall": 4802.5} {"step": 1965, "train_loss": 4.225429058074951, "lr": 0.00039905142726494503, "tps": 26801, "wall": 4807.4} {"step": 1966, "train_loss": 4.310910224914551, "lr": 0.00039904946202547745, "tps": 26787, "wall": 4812.3} {"step": 1967, "train_loss": 4.241264343261719, "lr": 0.0003990474947577278, "tps": 26773, "wall": 4817.3} {"step": 1968, "train_loss": 4.23159646987915, "lr": 0.00039904552546171846, "tps": 26759, "wall": 4822.2} {"step": 1969, "train_loss": 4.27298641204834, "lr": 0.0003990435541374717, "tps": 26745, "wall": 4827.1} {"step": 1970, "train_loss": 4.186271667480469, "lr": 0.00039904158078500997, "tps": 26732, "wall": 4832.1} {"step": 1971, "train_loss": 4.2890095710754395, "lr": 0.0003990396054043554, "tps": 26718, "wall": 4837.0} {"step": 1972, "train_loss": 4.147002220153809, "lr": 0.00039903762799553056, "tps": 26704, "wall": 4842.0} {"step": 1973, "train_loss": 4.251232147216797, "lr": 0.0003990356485585578, "tps": 26690, "wall": 4846.9} {"step": 1974, "train_loss": 4.214112281799316, "lr": 0.00039903366709345955, "tps": 26676, "wall": 4851.9} {"step": 1975, "train_loss": 4.223443984985352, "lr": 0.00039903168360025816, "tps": 26663, "wall": 4856.8} {"step": 1976, "train_loss": 4.221012115478516, "lr": 0.0003990296980789762, "tps": 26649, "wall": 4861.8} {"step": 1977, "train_loss": 4.296561241149902, "lr": 0.00039902771052963614, "tps": 26635, "wall": 4866.8} {"step": 1978, "train_loss": 4.162383079528809, "lr": 0.0003990257209522605, "tps": 26622, "wall": 4871.7} {"step": 1979, "train_loss": 4.258190631866455, "lr": 0.0003990237293468717, "tps": 26608, "wall": 4876.6} {"step": 1980, "train_loss": 4.210620880126953, "lr": 0.0003990217357134925, "tps": 26595, "wall": 4881.6} {"step": 1981, "train_loss": 4.2768168449401855, "lr": 0.0003990197400521454, "tps": 26581, "wall": 4886.5} {"step": 1982, "train_loss": 4.147484302520752, "lr": 0.000399017742362853, "tps": 26568, "wall": 4891.4} {"step": 1983, "train_loss": 4.238974571228027, "lr": 0.0003990157426456379, "tps": 26554, "wall": 4896.4} {"step": 1984, "train_loss": 4.236141204833984, "lr": 0.0003990137409005229, "tps": 26541, "wall": 4901.3} {"step": 1985, "train_loss": 4.249655723571777, "lr": 0.0003990117371275304, "tps": 26528, "wall": 4906.3} {"step": 1986, "train_loss": 4.137585639953613, "lr": 0.0003990097313266833, "tps": 26514, "wall": 4911.3} {"step": 1987, "train_loss": 4.136044979095459, "lr": 0.00039900772349800434, "tps": 26500, "wall": 4916.3} {"step": 1988, "train_loss": 4.222810745239258, "lr": 0.0003990057136415162, "tps": 26487, "wall": 4921.2} {"step": 1989, "train_loss": 4.299720764160156, "lr": 0.00039900370175724155, "tps": 26474, "wall": 4926.1} {"step": 1990, "train_loss": 4.227293491363525, "lr": 0.0003990016878452034, "tps": 26461, "wall": 4931.1} {"step": 1991, "train_loss": 4.234063148498535, "lr": 0.00039899967190542434, "tps": 26447, "wall": 4936.1} {"step": 1992, "train_loss": 4.284236431121826, "lr": 0.0003989976539379274, "tps": 26434, "wall": 4941.1} {"step": 1993, "train_loss": 4.248186111450195, "lr": 0.00039899563394273535, "tps": 26420, "wall": 4946.0} {"step": 1994, "train_loss": 4.223628044128418, "lr": 0.00039899361191987105, "tps": 26407, "wall": 4951.0} {"step": 1995, "train_loss": 4.206341743469238, "lr": 0.0003989915878693574, "tps": 26394, "wall": 4955.9} {"step": 1996, "train_loss": 4.217950820922852, "lr": 0.0003989895617912174, "tps": 26381, "wall": 4960.8} {"step": 1997, "train_loss": 4.2257399559021, "lr": 0.0003989875336854739, "tps": 26368, "wall": 4965.8} {"step": 1998, "train_loss": 4.118034839630127, "lr": 0.00039898550355215, "tps": 26355, "wall": 4970.7} {"step": 1999, "train_loss": 4.1337056159973145, "lr": 0.0003989834713912687, "tps": 26342, "wall": 4975.7} {"step": 2000, "train_loss": 4.193576335906982, "lr": 0.00039898143720285277, "tps": 26329, "wall": 4980.6, "val_loss_monitor": 4.262918593329563} {"step": 2001, "train_loss": 4.17180061340332, "lr": 0.00039897940098692557, "tps": 26064, "wall": 5033.7} {"step": 2002, "train_loss": 4.301549911499023, "lr": 0.00039897736274350994, "tps": 26052, "wall": 5038.6} {"step": 2003, "train_loss": 4.273933410644531, "lr": 0.0003989753224726292, "tps": 26039, "wall": 5043.6} {"step": 2004, "train_loss": 4.249141693115234, "lr": 0.00039897328017430623, "tps": 26027, "wall": 5048.5} {"step": 2005, "train_loss": 4.102210998535156, "lr": 0.0003989712358485643, "tps": 26014, "wall": 5053.5} {"step": 2006, "train_loss": 4.211825370788574, "lr": 0.00039896918949542645, "tps": 26002, "wall": 5058.4} {"step": 2007, "train_loss": 4.298422336578369, "lr": 0.00039896714111491605, "tps": 25990, "wall": 5063.3} {"step": 2008, "train_loss": 4.394797325134277, "lr": 0.00039896509070705606, "tps": 25977, "wall": 5068.3} {"step": 2009, "train_loss": 4.223546981811523, "lr": 0.00039896303827186995, "tps": 25965, "wall": 5073.2} {"step": 2010, "train_loss": 4.260069847106934, "lr": 0.0003989609838093809, "tps": 25952, "wall": 5078.2} {"step": 2011, "train_loss": 4.37169885635376, "lr": 0.00039895892731961203, "tps": 25940, "wall": 5083.1} {"step": 2012, "train_loss": 4.24716329574585, "lr": 0.0003989568688025868, "tps": 25928, "wall": 5088.1} {"step": 2013, "train_loss": 4.2209954261779785, "lr": 0.00039895480825832846, "tps": 25915, "wall": 5093.1} {"step": 2014, "train_loss": 4.229895114898682, "lr": 0.0003989527456868604, "tps": 25902, "wall": 5098.1} {"step": 2015, "train_loss": 4.333627700805664, "lr": 0.00039895068108820593, "tps": 25890, "wall": 5103.1} {"step": 2016, "train_loss": 4.251418590545654, "lr": 0.00039894861446238846, "tps": 25878, "wall": 5108.0} {"step": 2017, "train_loss": 4.271282196044922, "lr": 0.0003989465458094314, "tps": 25865, "wall": 5113.0} {"step": 2018, "train_loss": 4.212242126464844, "lr": 0.0003989444751293582, "tps": 25853, "wall": 5117.9} {"step": 2019, "train_loss": 4.215031147003174, "lr": 0.00039894240242219236, "tps": 25841, "wall": 5122.9} {"step": 2020, "train_loss": 4.256705284118652, "lr": 0.0003989403276879572, "tps": 25829, "wall": 5127.8} {"step": 2021, "train_loss": 4.323338031768799, "lr": 0.00039893825092667635, "tps": 25817, "wall": 5132.8} {"step": 2022, "train_loss": 4.367508888244629, "lr": 0.0003989361721383734, "tps": 25805, "wall": 5137.7} {"step": 2023, "train_loss": 4.206281661987305, "lr": 0.00039893409132307176, "tps": 25792, "wall": 5142.7} {"step": 2024, "train_loss": 4.373320579528809, "lr": 0.000398932008480795, "tps": 25780, "wall": 5147.6} {"step": 2025, "train_loss": 4.152259826660156, "lr": 0.00039892992361156685, "tps": 25768, "wall": 5152.6} {"step": 2026, "train_loss": 4.275361061096191, "lr": 0.0003989278367154108, "tps": 25756, "wall": 5157.6} {"step": 2027, "train_loss": 4.264655113220215, "lr": 0.0003989257477923505, "tps": 25744, "wall": 5162.5} {"step": 2028, "train_loss": 4.2172112464904785, "lr": 0.00039892365684240976, "tps": 25732, "wall": 5167.5} {"step": 2029, "train_loss": 4.283203125, "lr": 0.0003989215638656121, "tps": 25720, "wall": 5172.4} {"step": 2030, "train_loss": 4.356799602508545, "lr": 0.0003989194688619812, "tps": 25708, "wall": 5177.4} {"step": 2031, "train_loss": 4.255491733551025, "lr": 0.0003989173718315411, "tps": 25696, "wall": 5182.3} {"step": 2032, "train_loss": 4.252995491027832, "lr": 0.0003989152727743151, "tps": 25685, "wall": 5187.2} {"step": 2033, "train_loss": 4.2976155281066895, "lr": 0.0003989131716903273, "tps": 25673, "wall": 5192.2} {"step": 2034, "train_loss": 4.214825630187988, "lr": 0.0003989110685796014, "tps": 25661, "wall": 5197.1} {"step": 2035, "train_loss": 4.277390003204346, "lr": 0.00039890896344216124, "tps": 25649, "wall": 5202.0} {"step": 2036, "train_loss": 4.34000301361084, "lr": 0.0003989068562780307, "tps": 25637, "wall": 5207.0} {"step": 2037, "train_loss": 4.305586814880371, "lr": 0.00039890474708723355, "tps": 25625, "wall": 5212.1} {"step": 2038, "train_loss": 4.294500350952148, "lr": 0.0003989026358697938, "tps": 25614, "wall": 5217.0} {"step": 2039, "train_loss": 4.273901462554932, "lr": 0.00039890052262573527, "tps": 25602, "wall": 5221.9} {"step": 2040, "train_loss": 4.219332218170166, "lr": 0.000398898407355082, "tps": 25590, "wall": 5226.9} {"step": 2041, "train_loss": 4.231800079345703, "lr": 0.00039889629005785787, "tps": 25579, "wall": 5231.8} {"step": 2042, "train_loss": 4.1867876052856445, "lr": 0.0003988941707340868, "tps": 25567, "wall": 5236.7} {"step": 2043, "train_loss": 4.27499532699585, "lr": 0.000398892049383793, "tps": 25555, "wall": 5241.7} {"step": 2044, "train_loss": 4.19374418258667, "lr": 0.0003988899260070004, "tps": 25544, "wall": 5246.6} {"step": 2045, "train_loss": 4.177026271820068, "lr": 0.00039888780060373294, "tps": 25532, "wall": 5251.6} {"step": 2046, "train_loss": 4.118022441864014, "lr": 0.0003988856731740148, "tps": 25521, "wall": 5256.5} {"step": 2047, "train_loss": 4.269385814666748, "lr": 0.00039888354371787015, "tps": 25509, "wall": 5261.4} {"step": 2048, "train_loss": 4.229022979736328, "lr": 0.00039888141223532304, "tps": 25498, "wall": 5266.4} {"step": 2049, "train_loss": 4.2377142906188965, "lr": 0.00039887927872639764, "tps": 25486, "wall": 5271.4} {"step": 2050, "train_loss": 4.225353717803955, "lr": 0.000398877143191118, "tps": 25474, "wall": 5276.4} {"step": 2051, "train_loss": 4.247504711151123, "lr": 0.00039887500562950845, "tps": 25463, "wall": 5281.3} {"step": 2052, "train_loss": 4.225198268890381, "lr": 0.00039887286604159313, "tps": 25451, "wall": 5286.3} {"step": 2053, "train_loss": 4.285288333892822, "lr": 0.00039887072442739633, "tps": 25440, "wall": 5291.2} {"step": 2054, "train_loss": 4.327747821807861, "lr": 0.0003988685807869422, "tps": 25429, "wall": 5296.2} {"step": 2055, "train_loss": 4.188930988311768, "lr": 0.0003988664351202553, "tps": 25417, "wall": 5301.1} {"step": 2056, "train_loss": 4.320054054260254, "lr": 0.0003988642874273596, "tps": 25405, "wall": 5306.1} {"step": 2057, "train_loss": 4.251389503479004, "lr": 0.00039886213770827967, "tps": 25394, "wall": 5311.1} {"step": 2058, "train_loss": 4.27994966506958, "lr": 0.00039885998596303967, "tps": 25383, "wall": 5316.0} {"step": 2059, "train_loss": 4.227316856384277, "lr": 0.0003988578321916641, "tps": 25372, "wall": 5321.0} {"step": 2060, "train_loss": 4.223508834838867, "lr": 0.00039885567639417736, "tps": 25360, "wall": 5325.9} {"step": 2061, "train_loss": 4.139392852783203, "lr": 0.00039885351857060384, "tps": 25349, "wall": 5330.9} {"step": 2062, "train_loss": 4.2624735832214355, "lr": 0.000398851358720968, "tps": 25338, "wall": 5335.9} {"step": 2063, "train_loss": 4.1562089920043945, "lr": 0.00039884919684529424, "tps": 25326, "wall": 5340.8} {"step": 2064, "train_loss": 4.218754768371582, "lr": 0.0003988470329436072, "tps": 25315, "wall": 5345.8} {"step": 2065, "train_loss": 4.228000640869141, "lr": 0.0003988448670159312, "tps": 25304, "wall": 5350.7} {"step": 2066, "train_loss": 4.211795806884766, "lr": 0.00039884269906229086, "tps": 25293, "wall": 5355.6} {"step": 2067, "train_loss": 4.184022903442383, "lr": 0.0003988405290827108, "tps": 25282, "wall": 5360.6} {"step": 2068, "train_loss": 4.326233863830566, "lr": 0.00039883835707721555, "tps": 25271, "wall": 5365.5} {"step": 2069, "train_loss": 4.2513298988342285, "lr": 0.0003988361830458297, "tps": 25260, "wall": 5370.5} {"step": 2070, "train_loss": 4.211841106414795, "lr": 0.00039883400698857794, "tps": 25249, "wall": 5375.4} {"step": 2071, "train_loss": 4.218588352203369, "lr": 0.00039883182890548477, "tps": 25238, "wall": 5380.3} {"step": 2072, "train_loss": 4.198173522949219, "lr": 0.000398829648796575, "tps": 25227, "wall": 5385.3} {"step": 2073, "train_loss": 4.167183876037598, "lr": 0.0003988274666618734, "tps": 25216, "wall": 5390.2} {"step": 2074, "train_loss": 4.234774589538574, "lr": 0.0003988252825014045, "tps": 25205, "wall": 5395.2} {"step": 2075, "train_loss": 4.243930339813232, "lr": 0.00039882309631519315, "tps": 25194, "wall": 5400.2} {"step": 2076, "train_loss": 4.227947235107422, "lr": 0.00039882090810326406, "tps": 25183, "wall": 5405.1} {"step": 2077, "train_loss": 4.2744035720825195, "lr": 0.0003988187178656421, "tps": 25172, "wall": 5410.1} {"step": 2078, "train_loss": 4.215571403503418, "lr": 0.000398816525602352, "tps": 25161, "wall": 5415.0} {"step": 2079, "train_loss": 4.219164848327637, "lr": 0.00039881433131341864, "tps": 25150, "wall": 5420.0} {"step": 2080, "train_loss": 4.143466472625732, "lr": 0.0003988121349988668, "tps": 25139, "wall": 5424.9} {"step": 2081, "train_loss": 4.152566432952881, "lr": 0.0003988099366587214, "tps": 25128, "wall": 5429.9} {"step": 2082, "train_loss": 4.124814510345459, "lr": 0.00039880773629300746, "tps": 25118, "wall": 5434.8} {"step": 2083, "train_loss": 4.305178165435791, "lr": 0.0003988055339017498, "tps": 25107, "wall": 5439.7} {"step": 2084, "train_loss": 4.235455513000488, "lr": 0.00039880332948497336, "tps": 25096, "wall": 5444.7} {"step": 2085, "train_loss": 4.264429092407227, "lr": 0.00039880112304270315, "tps": 25085, "wall": 5449.6} {"step": 2086, "train_loss": 4.251245498657227, "lr": 0.00039879891457496406, "tps": 25075, "wall": 5454.6} {"step": 2087, "train_loss": 4.301164627075195, "lr": 0.00039879670408178125, "tps": 25064, "wall": 5459.5} {"step": 2088, "train_loss": 4.1994452476501465, "lr": 0.0003987944915631797, "tps": 25053, "wall": 5464.5} {"step": 2089, "train_loss": 4.255986213684082, "lr": 0.00039879227701918453, "tps": 25043, "wall": 5469.4} {"step": 2090, "train_loss": 4.358621120452881, "lr": 0.0003987900604498207, "tps": 25032, "wall": 5474.3} {"step": 2091, "train_loss": 4.1956610679626465, "lr": 0.00039878784185511345, "tps": 25021, "wall": 5479.3} {"step": 2092, "train_loss": 4.28975772857666, "lr": 0.0003987856212350878, "tps": 25011, "wall": 5484.2} {"step": 2093, "train_loss": 4.165652275085449, "lr": 0.000398783398589769, "tps": 25000, "wall": 5489.2} {"step": 2094, "train_loss": 4.241561412811279, "lr": 0.0003987811739191822, "tps": 24989, "wall": 5494.1} {"step": 2095, "train_loss": 4.250617027282715, "lr": 0.00039877894722335257, "tps": 24979, "wall": 5499.1} {"step": 2096, "train_loss": 4.211790084838867, "lr": 0.00039877671850230533, "tps": 24968, "wall": 5504.0} {"step": 2097, "train_loss": 4.208183288574219, "lr": 0.00039877448775606575, "tps": 24958, "wall": 5508.9} {"step": 2098, "train_loss": 4.313817024230957, "lr": 0.00039877225498465913, "tps": 24947, "wall": 5513.9} {"step": 2099, "train_loss": 4.193565845489502, "lr": 0.00039877002018811074, "tps": 24937, "wall": 5518.9} {"step": 2100, "train_loss": 4.282032012939453, "lr": 0.0003987677833664459, "tps": 24926, "wall": 5523.8} {"step": 2101, "train_loss": 4.1986083984375, "lr": 0.00039876554451968984, "tps": 24916, "wall": 5528.8} {"step": 2102, "train_loss": 4.055494785308838, "lr": 0.00039876330364786814, "tps": 24906, "wall": 5533.7} {"step": 2103, "train_loss": 4.1750078201293945, "lr": 0.000398761060751006, "tps": 24895, "wall": 5538.6} {"step": 2104, "train_loss": 4.233186721801758, "lr": 0.00039875881582912895, "tps": 24885, "wall": 5543.6} {"step": 2105, "train_loss": 4.222773551940918, "lr": 0.00039875656888226226, "tps": 24874, "wall": 5548.5} {"step": 2106, "train_loss": 4.123814105987549, "lr": 0.0003987543199104316, "tps": 24864, "wall": 5553.4} {"step": 2107, "train_loss": 4.190736293792725, "lr": 0.0003987520689136623, "tps": 24854, "wall": 5558.4} {"step": 2108, "train_loss": 4.116138935089111, "lr": 0.0003987498158919799, "tps": 24843, "wall": 5563.3} {"step": 2109, "train_loss": 4.122593879699707, "lr": 0.00039874756084540985, "tps": 24833, "wall": 5568.3} {"step": 2110, "train_loss": 4.168935775756836, "lr": 0.0003987453037739778, "tps": 24823, "wall": 5573.3} {"step": 2111, "train_loss": 4.239680767059326, "lr": 0.0003987430446777093, "tps": 24812, "wall": 5578.2} {"step": 2112, "train_loss": 4.157285213470459, "lr": 0.0003987407835566299, "tps": 24802, "wall": 5583.1} {"step": 2113, "train_loss": 4.172138214111328, "lr": 0.0003987385204107652, "tps": 24792, "wall": 5588.1} {"step": 2114, "train_loss": 4.182948112487793, "lr": 0.00039873625524014094, "tps": 24782, "wall": 5593.0} {"step": 2115, "train_loss": 4.229063987731934, "lr": 0.0003987339880447827, "tps": 24772, "wall": 5598.0} {"step": 2116, "train_loss": 4.288242340087891, "lr": 0.00039873171882471616, "tps": 24761, "wall": 5603.0} {"step": 2117, "train_loss": 4.2547760009765625, "lr": 0.000398729447579967, "tps": 24751, "wall": 5607.9} {"step": 2118, "train_loss": 4.225443363189697, "lr": 0.00039872717431056103, "tps": 24741, "wall": 5612.8} {"step": 2119, "train_loss": 4.154662132263184, "lr": 0.00039872489901652397, "tps": 24731, "wall": 5617.8} {"step": 2120, "train_loss": 4.170115947723389, "lr": 0.00039872262169788155, "tps": 24721, "wall": 5622.7} {"step": 2121, "train_loss": 4.286673069000244, "lr": 0.0003987203423546596, "tps": 24711, "wall": 5627.7} {"step": 2122, "train_loss": 4.238572120666504, "lr": 0.000398718060986884, "tps": 24700, "wall": 5632.7} {"step": 2123, "train_loss": 4.327249526977539, "lr": 0.0003987157775945805, "tps": 24690, "wall": 5637.6} {"step": 2124, "train_loss": 4.271082878112793, "lr": 0.000398713492177775, "tps": 24680, "wall": 5642.6} {"step": 2125, "train_loss": 4.328929424285889, "lr": 0.00039871120473649344, "tps": 24669, "wall": 5648.0} {"step": 2126, "train_loss": 4.311124801635742, "lr": 0.00039870891527076164, "tps": 24658, "wall": 5653.0} {"step": 2127, "train_loss": 4.257226943969727, "lr": 0.0003987066237806056, "tps": 24648, "wall": 5658.0} {"step": 2128, "train_loss": 4.237849235534668, "lr": 0.0003987043302660512, "tps": 24638, "wall": 5663.0} {"step": 2129, "train_loss": 4.125154495239258, "lr": 0.0003987020347271245, "tps": 24628, "wall": 5667.9} {"step": 2130, "train_loss": 4.194787979125977, "lr": 0.0003986997371638515, "tps": 24618, "wall": 5672.9} {"step": 2131, "train_loss": 4.154729843139648, "lr": 0.0003986974375762582, "tps": 24608, "wall": 5677.9} {"step": 2132, "train_loss": 4.421645164489746, "lr": 0.0003986951359643707, "tps": 24598, "wall": 5682.9} {"step": 2133, "train_loss": 4.2026777267456055, "lr": 0.000398692832328215, "tps": 24588, "wall": 5687.9} {"step": 2134, "train_loss": 4.239333629608154, "lr": 0.00039869052666781726, "tps": 24577, "wall": 5693.1} {"step": 2135, "train_loss": 4.343109607696533, "lr": 0.00039868821898320355, "tps": 24565, "wall": 5698.4} {"step": 2136, "train_loss": 4.221776485443115, "lr": 0.0003986859092744, "tps": 24555, "wall": 5703.5} {"step": 2137, "train_loss": 4.238811016082764, "lr": 0.00039868359754143283, "tps": 24544, "wall": 5708.7} {"step": 2138, "train_loss": 4.236555099487305, "lr": 0.0003986812837843282, "tps": 24533, "wall": 5713.8} {"step": 2139, "train_loss": 4.096495151519775, "lr": 0.0003986789680031123, "tps": 24523, "wall": 5719.0} {"step": 2140, "train_loss": 4.19309139251709, "lr": 0.0003986766501978114, "tps": 24510, "wall": 5724.5} {"step": 2141, "train_loss": 4.169948101043701, "lr": 0.0003986743303684517, "tps": 24500, "wall": 5729.7} {"step": 2142, "train_loss": 4.235049247741699, "lr": 0.00039867200851505957, "tps": 24489, "wall": 5734.9} {"step": 2143, "train_loss": 4.111078262329102, "lr": 0.0003986696846376612, "tps": 24478, "wall": 5740.1} {"step": 2144, "train_loss": 4.236575603485107, "lr": 0.0003986673587362831, "tps": 24467, "wall": 5745.3} {"step": 2145, "train_loss": 4.260641098022461, "lr": 0.00039866503081095137, "tps": 24457, "wall": 5750.3} {"step": 2146, "train_loss": 4.190168857574463, "lr": 0.00039866270086169256, "tps": 24447, "wall": 5755.4} {"step": 2147, "train_loss": 4.245349884033203, "lr": 0.00039866036888853306, "tps": 24436, "wall": 5760.8} {"step": 2148, "train_loss": 4.1834716796875, "lr": 0.0003986580348914991, "tps": 24425, "wall": 5766.1} {"step": 2149, "train_loss": 4.2566046714782715, "lr": 0.0003986556988706174, "tps": 24414, "wall": 5771.3} {"step": 2150, "train_loss": 4.131813049316406, "lr": 0.0003986533608259142, "tps": 24403, "wall": 5776.6} {"step": 2151, "train_loss": 4.171356201171875, "lr": 0.00039865102075741605, "tps": 24392, "wall": 5781.9} {"step": 2152, "train_loss": 4.190388202667236, "lr": 0.0003986486786651495, "tps": 24381, "wall": 5787.0} {"step": 2153, "train_loss": 4.204498767852783, "lr": 0.00039864633454914105, "tps": 24372, "wall": 5792.1} {"step": 2154, "train_loss": 4.217040538787842, "lr": 0.00039864398840941726, "tps": 24361, "wall": 5797.2} {"step": 2155, "train_loss": 4.231989860534668, "lr": 0.0003986416402460047, "tps": 24351, "wall": 5802.3} {"step": 2156, "train_loss": 4.217475891113281, "lr": 0.00039863929005892995, "tps": 24341, "wall": 5807.3} {"step": 2157, "train_loss": 4.239704132080078, "lr": 0.0003986369378482198, "tps": 24331, "wall": 5812.4} {"step": 2158, "train_loss": 4.206092357635498, "lr": 0.00039863458361390057, "tps": 24322, "wall": 5817.4} {"step": 2159, "train_loss": 4.102049350738525, "lr": 0.0003986322273559992, "tps": 24312, "wall": 5822.4} {"step": 2160, "train_loss": 4.245900630950928, "lr": 0.0003986298690745423, "tps": 24302, "wall": 5827.4} {"step": 2161, "train_loss": 4.171222686767578, "lr": 0.0003986275087695565, "tps": 24293, "wall": 5832.4} {"step": 2162, "train_loss": 4.2903947830200195, "lr": 0.0003986251464410687, "tps": 24284, "wall": 5837.4} {"step": 2163, "train_loss": 4.161416530609131, "lr": 0.00039862278208910556, "tps": 24274, "wall": 5842.3} {"step": 2164, "train_loss": 4.172352313995361, "lr": 0.00039862041571369386, "tps": 24265, "wall": 5847.2} {"step": 2165, "train_loss": 4.193544387817383, "lr": 0.0003986180473148604, "tps": 24256, "wall": 5852.2} {"step": 2166, "train_loss": 4.142586708068848, "lr": 0.0003986156768926321, "tps": 24246, "wall": 5857.2} {"step": 2167, "train_loss": 4.201904296875, "lr": 0.0003986133044470358, "tps": 24234, "wall": 5862.7} {"step": 2168, "train_loss": 4.0836944580078125, "lr": 0.00039861092997809825, "tps": 24224, "wall": 5867.9} {"step": 2169, "train_loss": 4.205025672912598, "lr": 0.00039860855348584635, "tps": 24214, "wall": 5873.1} {"step": 2170, "train_loss": 4.083793640136719, "lr": 0.0003986061749703072, "tps": 24204, "wall": 5878.2} {"step": 2171, "train_loss": 4.24100923538208, "lr": 0.0003986037944315076, "tps": 24194, "wall": 5883.2} {"step": 2172, "train_loss": 4.133788585662842, "lr": 0.00039860141186947456, "tps": 24184, "wall": 5888.4} {"step": 2173, "train_loss": 4.244924068450928, "lr": 0.00039859902728423506, "tps": 24175, "wall": 5893.4} {"step": 2174, "train_loss": 4.245997428894043, "lr": 0.00039859664067581614, "tps": 24166, "wall": 5898.3} {"step": 2175, "train_loss": 4.170986175537109, "lr": 0.0003985942520442448, "tps": 24157, "wall": 5903.2} {"step": 2176, "train_loss": 4.193185329437256, "lr": 0.0003985918613895481, "tps": 24148, "wall": 5908.2} {"step": 2177, "train_loss": 4.170263767242432, "lr": 0.00039858946871175314, "tps": 24139, "wall": 5913.1} {"step": 2178, "train_loss": 4.193732261657715, "lr": 0.00039858707401088704, "tps": 24129, "wall": 5918.1} {"step": 2179, "train_loss": 4.159667015075684, "lr": 0.00039858467728697683, "tps": 24120, "wall": 5923.0} {"step": 2180, "train_loss": 4.100841522216797, "lr": 0.00039858227854004983, "tps": 24111, "wall": 5928.0} {"step": 2181, "train_loss": 4.20305061340332, "lr": 0.00039857987777013303, "tps": 24102, "wall": 5933.0} {"step": 2182, "train_loss": 4.1272101402282715, "lr": 0.0003985774749772537, "tps": 24093, "wall": 5938.0} {"step": 2183, "train_loss": 4.189205646514893, "lr": 0.0003985750701614392, "tps": 24083, "wall": 5943.0} {"step": 2184, "train_loss": 4.113404273986816, "lr": 0.00039857266332271656, "tps": 24074, "wall": 5948.1} {"step": 2185, "train_loss": 4.129210948944092, "lr": 0.00039857025446111315, "tps": 24064, "wall": 5953.2} {"step": 2186, "train_loss": 4.275636196136475, "lr": 0.0003985678435766562, "tps": 24055, "wall": 5958.3} {"step": 2187, "train_loss": 4.184187889099121, "lr": 0.0003985654306693731, "tps": 24045, "wall": 5963.3} {"step": 2188, "train_loss": 4.033634185791016, "lr": 0.0003985630157392911, "tps": 24036, "wall": 5968.4} {"step": 2189, "train_loss": 4.322726726531982, "lr": 0.00039856059878643765, "tps": 24027, "wall": 5973.4} {"step": 2190, "train_loss": 4.259921073913574, "lr": 0.0003985581798108401, "tps": 24017, "wall": 5978.5} {"step": 2191, "train_loss": 4.135268211364746, "lr": 0.00039855575881252576, "tps": 24008, "wall": 5983.5} {"step": 2192, "train_loss": 4.13263463973999, "lr": 0.0003985533357915221, "tps": 23999, "wall": 5988.5} {"step": 2193, "train_loss": 4.129622459411621, "lr": 0.00039855091074785664, "tps": 23990, "wall": 5993.5} {"step": 2194, "train_loss": 4.203586578369141, "lr": 0.0003985484836815568, "tps": 23981, "wall": 5998.5} {"step": 2195, "train_loss": 4.187114238739014, "lr": 0.00039854605459265006, "tps": 23972, "wall": 6003.5} {"step": 2196, "train_loss": 4.269785404205322, "lr": 0.000398543623481164, "tps": 23963, "wall": 6008.5} {"step": 2197, "train_loss": 4.254212379455566, "lr": 0.0003985411903471261, "tps": 23954, "wall": 6013.5} {"step": 2198, "train_loss": 4.136228084564209, "lr": 0.0003985387551905639, "tps": 23945, "wall": 6018.4} {"step": 2199, "train_loss": 4.314896583557129, "lr": 0.00039853631801150505, "tps": 23936, "wall": 6023.4} {"step": 2200, "train_loss": 4.2374348640441895, "lr": 0.00039853387880997717, "tps": 23927, "wall": 6028.3} {"step": 2201, "train_loss": 4.29736852645874, "lr": 0.0003985314375860078, "tps": 23919, "wall": 6033.3} {"step": 2202, "train_loss": 4.137351989746094, "lr": 0.0003985289943396246, "tps": 23910, "wall": 6038.3} {"step": 2203, "train_loss": 4.214961528778076, "lr": 0.00039852654907085536, "tps": 23900, "wall": 6043.3} {"step": 2204, "train_loss": 4.228050231933594, "lr": 0.0003985241017797277, "tps": 23891, "wall": 6048.4} {"step": 2205, "train_loss": 4.25838565826416, "lr": 0.0003985216524662694, "tps": 23881, "wall": 6053.6} {"step": 2206, "train_loss": 4.185886859893799, "lr": 0.0003985192011305081, "tps": 23872, "wall": 6058.7} {"step": 2207, "train_loss": 4.191597938537598, "lr": 0.0003985167477724717, "tps": 23863, "wall": 6063.7} {"step": 2208, "train_loss": 4.259490966796875, "lr": 0.00039851429239218787, "tps": 23854, "wall": 6068.8} {"step": 2209, "train_loss": 4.161901473999023, "lr": 0.00039851183498968443, "tps": 23845, "wall": 6073.8} {"step": 2210, "train_loss": 4.132375717163086, "lr": 0.00039850937556498933, "tps": 23837, "wall": 6078.7} {"step": 2211, "train_loss": 4.171863079071045, "lr": 0.0003985069141181304, "tps": 23828, "wall": 6083.7} {"step": 2212, "train_loss": 4.132766246795654, "lr": 0.00039850445064913546, "tps": 23819, "wall": 6088.8} {"step": 2213, "train_loss": 4.170736312866211, "lr": 0.0003985019851580324, "tps": 23810, "wall": 6093.8} {"step": 2214, "train_loss": 4.218798637390137, "lr": 0.00039849951764484926, "tps": 23800, "wall": 6099.0} {"step": 2215, "train_loss": 4.167418956756592, "lr": 0.0003984970481096139, "tps": 23791, "wall": 6104.2} {"step": 2216, "train_loss": 4.160340309143066, "lr": 0.0003984945765523543, "tps": 23782, "wall": 6109.3} {"step": 2217, "train_loss": 4.214831352233887, "lr": 0.0003984921029730985, "tps": 23772, "wall": 6114.5} {"step": 2218, "train_loss": 4.27443790435791, "lr": 0.00039848962737187453, "tps": 23763, "wall": 6119.7} {"step": 2219, "train_loss": 4.135254859924316, "lr": 0.0003984871497487104, "tps": 23754, "wall": 6124.9} {"step": 2220, "train_loss": 4.17414665222168, "lr": 0.0003984846701036341, "tps": 23744, "wall": 6130.1} {"step": 2221, "train_loss": 4.183805465698242, "lr": 0.0003984821884366739, "tps": 23735, "wall": 6135.2} {"step": 2222, "train_loss": 4.152887344360352, "lr": 0.00039847970474785776, "tps": 23725, "wall": 6140.5} {"step": 2223, "train_loss": 4.259446144104004, "lr": 0.0003984772190372139, "tps": 23716, "wall": 6145.6} {"step": 2224, "train_loss": 4.194024562835693, "lr": 0.00039847473130477044, "tps": 23706, "wall": 6150.8} {"step": 2225, "train_loss": 4.216022491455078, "lr": 0.0003984722415505556, "tps": 23697, "wall": 6156.0} {"step": 2226, "train_loss": 4.217890739440918, "lr": 0.0003984697497745974, "tps": 23688, "wall": 6161.1} {"step": 2227, "train_loss": 4.173247814178467, "lr": 0.0003984672559769244, "tps": 23679, "wall": 6166.2} {"step": 2228, "train_loss": 4.41049861907959, "lr": 0.0003984647601575646, "tps": 23671, "wall": 6171.2} {"step": 2229, "train_loss": 4.146505832672119, "lr": 0.00039846226231654634, "tps": 23662, "wall": 6176.3} {"step": 2230, "train_loss": 4.192919731140137, "lr": 0.0003984597624538979, "tps": 23653, "wall": 6181.4} {"step": 2231, "train_loss": 4.139851093292236, "lr": 0.00039845726056964763, "tps": 23644, "wall": 6186.6} {"step": 2232, "train_loss": 4.16512393951416, "lr": 0.0003984547566638239, "tps": 23635, "wall": 6191.7} {"step": 2233, "train_loss": 4.0638532638549805, "lr": 0.00039845225073645497, "tps": 23626, "wall": 6196.9} {"step": 2234, "train_loss": 4.175962448120117, "lr": 0.0003984497427875693, "tps": 23616, "wall": 6202.1} {"step": 2235, "train_loss": 4.158538341522217, "lr": 0.00039844723281719533, "tps": 23607, "wall": 6207.3} {"step": 2236, "train_loss": 4.209556579589844, "lr": 0.00039844472082536145, "tps": 23598, "wall": 6212.4} {"step": 2237, "train_loss": 4.22653341293335, "lr": 0.00039844220681209603, "tps": 23589, "wall": 6217.5} {"step": 2238, "train_loss": 4.2502617835998535, "lr": 0.00039843969077742777, "tps": 23580, "wall": 6222.7} {"step": 2239, "train_loss": 4.120421409606934, "lr": 0.00039843717272138496, "tps": 23571, "wall": 6227.9} {"step": 2240, "train_loss": 4.166348934173584, "lr": 0.0003984346526439962, "tps": 23562, "wall": 6233.1} {"step": 2241, "train_loss": 4.152825832366943, "lr": 0.00039843213054529007, "tps": 23553, "wall": 6238.1} {"step": 2242, "train_loss": 4.171315670013428, "lr": 0.00039842960642529513, "tps": 23545, "wall": 6243.1} {"step": 2243, "train_loss": 4.200644493103027, "lr": 0.0003984270802840399, "tps": 23537, "wall": 6248.0} {"step": 2244, "train_loss": 4.214011192321777, "lr": 0.00039842455212155315, "tps": 23529, "wall": 6252.9} {"step": 2245, "train_loss": 4.188699245452881, "lr": 0.0003984220219378633, "tps": 23521, "wall": 6257.9} {"step": 2246, "train_loss": 4.332430362701416, "lr": 0.00039841948973299917, "tps": 23513, "wall": 6262.8} {"step": 2247, "train_loss": 4.315519332885742, "lr": 0.0003984169555069894, "tps": 23504, "wall": 6267.9} {"step": 2248, "train_loss": 4.272455215454102, "lr": 0.00039841441925986276, "tps": 23496, "wall": 6273.0} {"step": 2249, "train_loss": 4.234203338623047, "lr": 0.00039841188099164784, "tps": 23487, "wall": 6278.1} {"step": 2250, "train_loss": 4.135230541229248, "lr": 0.0003984093407023736, "tps": 23479, "wall": 6283.1} {"step": 2251, "train_loss": 4.228139400482178, "lr": 0.0003984067983920686, "tps": 23470, "wall": 6288.2} {"step": 2252, "train_loss": 4.220699310302734, "lr": 0.0003984042540607618, "tps": 23462, "wall": 6293.2} {"step": 2253, "train_loss": 4.180903434753418, "lr": 0.00039840170770848193, "tps": 23454, "wall": 6298.1} {"step": 2254, "train_loss": 4.152677536010742, "lr": 0.0003983991593352579, "tps": 23446, "wall": 6303.1} {"step": 2255, "train_loss": 4.181769371032715, "lr": 0.0003983966089411185, "tps": 23438, "wall": 6308.1} {"step": 2256, "train_loss": 4.134932518005371, "lr": 0.0003983940565260926, "tps": 23429, "wall": 6313.1} {"step": 2257, "train_loss": 4.143166542053223, "lr": 0.00039839150209020925, "tps": 23421, "wall": 6318.1} {"step": 2258, "train_loss": 4.110906600952148, "lr": 0.0003983889456334973, "tps": 23413, "wall": 6323.1} {"step": 2259, "train_loss": 4.247061729431152, "lr": 0.00039838638715598574, "tps": 23405, "wall": 6328.0} {"step": 2260, "train_loss": 4.146907806396484, "lr": 0.00039838382665770354, "tps": 23397, "wall": 6333.0} {"step": 2261, "train_loss": 4.196885585784912, "lr": 0.0003983812641386797, "tps": 23389, "wall": 6338.0} {"step": 2262, "train_loss": 4.235968589782715, "lr": 0.0003983786995989432, "tps": 23381, "wall": 6343.0} {"step": 2263, "train_loss": 4.132602214813232, "lr": 0.00039837613303852316, "tps": 23373, "wall": 6347.9} {"step": 2264, "train_loss": 4.133055210113525, "lr": 0.0003983735644574487, "tps": 23365, "wall": 6352.9} {"step": 2265, "train_loss": 4.080944538116455, "lr": 0.00039837099385574883, "tps": 23357, "wall": 6357.9} {"step": 2266, "train_loss": 4.158501625061035, "lr": 0.00039836842123345265, "tps": 23349, "wall": 6362.8} {"step": 2267, "train_loss": 4.1450371742248535, "lr": 0.0003983658465905893, "tps": 23340, "wall": 6368.1} {"step": 2268, "train_loss": 4.079074382781982, "lr": 0.00039836326992718807, "tps": 23332, "wall": 6373.2} {"step": 2269, "train_loss": 4.121734142303467, "lr": 0.00039836069124327806, "tps": 23323, "wall": 6378.3} {"step": 2270, "train_loss": 4.278011322021484, "lr": 0.0003983581105388885, "tps": 23315, "wall": 6383.4} {"step": 2271, "train_loss": 4.110222816467285, "lr": 0.0003983555278140486, "tps": 23307, "wall": 6388.5} {"step": 2272, "train_loss": 4.179203033447266, "lr": 0.0003983529430687876, "tps": 23298, "wall": 6393.6} {"step": 2273, "train_loss": 4.197866916656494, "lr": 0.00039835035630313484, "tps": 23291, "wall": 6398.5} {"step": 2274, "train_loss": 4.197138786315918, "lr": 0.00039834776751711964, "tps": 23283, "wall": 6403.5} {"step": 2275, "train_loss": 4.1735944747924805, "lr": 0.00039834517671077116, "tps": 23275, "wall": 6408.5} {"step": 2276, "train_loss": 4.199955463409424, "lr": 0.00039834258388411894, "tps": 23267, "wall": 6413.6} {"step": 2277, "train_loss": 4.215126991271973, "lr": 0.0003983399890371923, "tps": 23259, "wall": 6418.6} {"step": 2278, "train_loss": 4.233345985412598, "lr": 0.0003983373921700206, "tps": 23250, "wall": 6423.7} {"step": 2279, "train_loss": 4.148767948150635, "lr": 0.0003983347932826333, "tps": 23242, "wall": 6429.0} {"step": 2280, "train_loss": 4.242886066436768, "lr": 0.0003983321923750598, "tps": 23233, "wall": 6434.2} {"step": 2281, "train_loss": 4.080551624298096, "lr": 0.00039832958944732954, "tps": 23225, "wall": 6439.3} {"step": 2282, "train_loss": 4.125716209411621, "lr": 0.0003983269844994721, "tps": 23217, "wall": 6444.3} {"step": 2283, "train_loss": 4.1264848709106445, "lr": 0.0003983243775315169, "tps": 23208, "wall": 6449.5} {"step": 2284, "train_loss": 4.222044467926025, "lr": 0.0003983217685434935, "tps": 23200, "wall": 6454.5} {"step": 2285, "train_loss": 4.132097244262695, "lr": 0.0003983191575354315, "tps": 23192, "wall": 6459.5} {"step": 2286, "train_loss": 4.179708003997803, "lr": 0.0003983165445073604, "tps": 23184, "wall": 6464.6} {"step": 2287, "train_loss": 4.169672966003418, "lr": 0.00039831392945930983, "tps": 23176, "wall": 6469.8} {"step": 2288, "train_loss": 4.116988182067871, "lr": 0.0003983113123913094, "tps": 23167, "wall": 6475.0} {"step": 2289, "train_loss": 4.194650173187256, "lr": 0.0003983086933033888, "tps": 23159, "wall": 6480.1} {"step": 2290, "train_loss": 4.225072860717773, "lr": 0.0003983060721955777, "tps": 23151, "wall": 6485.2} {"step": 2291, "train_loss": 4.17474889755249, "lr": 0.00039830344906790577, "tps": 23143, "wall": 6490.2} {"step": 2292, "train_loss": 4.159670352935791, "lr": 0.0003983008239204027, "tps": 23135, "wall": 6495.3} {"step": 2293, "train_loss": 4.204775810241699, "lr": 0.00039829819675309824, "tps": 23127, "wall": 6500.4} {"step": 2294, "train_loss": 4.165791988372803, "lr": 0.00039829556756602213, "tps": 23119, "wall": 6505.5} {"step": 2295, "train_loss": 4.135049343109131, "lr": 0.00039829293635920427, "tps": 23111, "wall": 6510.5} {"step": 2296, "train_loss": 4.164262294769287, "lr": 0.0003982903031326743, "tps": 23104, "wall": 6515.6} {"step": 2297, "train_loss": 4.192076206207275, "lr": 0.0003982876678864622, "tps": 23095, "wall": 6520.7} {"step": 2298, "train_loss": 4.141305923461914, "lr": 0.0003982850306205977, "tps": 23087, "wall": 6526.0} {"step": 2299, "train_loss": 4.1239399909973145, "lr": 0.0003982823913351108, "tps": 23079, "wall": 6531.1} {"step": 2300, "train_loss": 4.148039817810059, "lr": 0.00039827975003003133, "tps": 23070, "wall": 6536.5} {"step": 2301, "train_loss": 4.224367141723633, "lr": 0.0003982771067053891, "tps": 23061, "wall": 6541.7} {"step": 2302, "train_loss": 4.064767837524414, "lr": 0.0003982744613612142, "tps": 23054, "wall": 6546.7} {"step": 2303, "train_loss": 4.2054877281188965, "lr": 0.00039827181399753665, "tps": 23046, "wall": 6551.9} {"step": 2304, "train_loss": 4.227352142333984, "lr": 0.00039826916461438623, "tps": 23038, "wall": 6557.0} {"step": 2305, "train_loss": 4.112133502960205, "lr": 0.0003982665132117931, "tps": 23030, "wall": 6562.0} {"step": 2306, "train_loss": 4.108081817626953, "lr": 0.00039826385978978726, "tps": 23022, "wall": 6567.1} {"step": 2307, "train_loss": 4.212860107421875, "lr": 0.00039826120434839884, "tps": 23014, "wall": 6572.3} {"step": 2308, "train_loss": 4.146687984466553, "lr": 0.00039825854688765774, "tps": 23006, "wall": 6577.4} {"step": 2309, "train_loss": 4.167816162109375, "lr": 0.0003982558874075942, "tps": 22998, "wall": 6582.4} {"step": 2310, "train_loss": 4.187829971313477, "lr": 0.00039825322590823846, "tps": 22991, "wall": 6587.5} {"step": 2311, "train_loss": 4.097725868225098, "lr": 0.0003982505623896204, "tps": 22982, "wall": 6592.7} {"step": 2312, "train_loss": 4.169797420501709, "lr": 0.0003982478968517704, "tps": 22974, "wall": 6597.9} {"step": 2313, "train_loss": 4.112185955047607, "lr": 0.0003982452292947185, "tps": 22966, "wall": 6603.0} {"step": 2314, "train_loss": 4.176955699920654, "lr": 0.000398242559718495, "tps": 22958, "wall": 6608.3} {"step": 2315, "train_loss": 4.224526882171631, "lr": 0.0003982398881231302, "tps": 22950, "wall": 6613.4} {"step": 2316, "train_loss": 4.161284446716309, "lr": 0.0003982372145086543, "tps": 22942, "wall": 6618.5} {"step": 2317, "train_loss": 4.265270233154297, "lr": 0.00039823453887509756, "tps": 22934, "wall": 6623.7} {"step": 2318, "train_loss": 4.217494964599609, "lr": 0.0003982318612224904, "tps": 22926, "wall": 6628.8} {"step": 2319, "train_loss": 4.099971771240234, "lr": 0.000398229181550863, "tps": 22919, "wall": 6633.9} {"step": 2320, "train_loss": 4.248048305511475, "lr": 0.00039822649986024576, "tps": 22911, "wall": 6639.0} {"step": 2321, "train_loss": 4.152885437011719, "lr": 0.0003982238161506692, "tps": 22903, "wall": 6644.3} {"step": 2322, "train_loss": 4.21742582321167, "lr": 0.0003982211304221635, "tps": 22893, "wall": 6649.9} {"step": 2323, "train_loss": 4.215578556060791, "lr": 0.00039821844267475925, "tps": 22885, "wall": 6655.2} {"step": 2324, "train_loss": 4.0969319343566895, "lr": 0.00039821575290848685, "tps": 22876, "wall": 6660.5} {"step": 2325, "train_loss": 4.202164649963379, "lr": 0.00039821306112337667, "tps": 22868, "wall": 6665.9} {"step": 2326, "train_loss": 4.18597936630249, "lr": 0.0003982103673194594, "tps": 22859, "wall": 6671.2} {"step": 2327, "train_loss": 4.123092174530029, "lr": 0.0003982076714967654, "tps": 22851, "wall": 6676.6} {"step": 2328, "train_loss": 4.123964786529541, "lr": 0.00039820497365532524, "tps": 22842, "wall": 6681.9} {"step": 2329, "train_loss": 4.326158046722412, "lr": 0.00039820227379516954, "tps": 22834, "wall": 6687.2} {"step": 2330, "train_loss": 4.112051963806152, "lr": 0.0003981995719163288, "tps": 22825, "wall": 6692.6} {"step": 2331, "train_loss": 4.202146053314209, "lr": 0.00039819686801883364, "tps": 22817, "wall": 6698.0} {"step": 2332, "train_loss": 4.175683498382568, "lr": 0.0003981941621027148, "tps": 22808, "wall": 6703.3} {"step": 2333, "train_loss": 4.150146961212158, "lr": 0.0003981914541680028, "tps": 22800, "wall": 6708.7} {"step": 2334, "train_loss": 4.081786155700684, "lr": 0.0003981887442147284, "tps": 22791, "wall": 6714.2} {"step": 2335, "train_loss": 4.089069843292236, "lr": 0.0003981860322429223, "tps": 22782, "wall": 6719.6} {"step": 2336, "train_loss": 4.1268086433410645, "lr": 0.0003981833182526151, "tps": 22774, "wall": 6725.0} {"step": 2337, "train_loss": 4.170955657958984, "lr": 0.0003981806022438377, "tps": 22766, "wall": 6730.3} {"step": 2338, "train_loss": 4.083677291870117, "lr": 0.00039817788421662076, "tps": 22757, "wall": 6735.7} {"step": 2339, "train_loss": 4.205501556396484, "lr": 0.00039817516417099506, "tps": 22749, "wall": 6741.1} {"step": 2340, "train_loss": 4.004969596862793, "lr": 0.0003981724421069916, "tps": 22741, "wall": 6746.3} {"step": 2341, "train_loss": 4.192336082458496, "lr": 0.00039816971802464097, "tps": 22733, "wall": 6751.4} {"step": 2342, "train_loss": 4.222536087036133, "lr": 0.00039816699192397415, "tps": 22726, "wall": 6756.4} {"step": 2343, "train_loss": 4.28530216217041, "lr": 0.000398164263805022, "tps": 22719, "wall": 6761.5} {"step": 2344, "train_loss": 4.0840229988098145, "lr": 0.00039816153366781546, "tps": 22712, "wall": 6766.5} {"step": 2345, "train_loss": 4.118182182312012, "lr": 0.00039815880151238545, "tps": 22704, "wall": 6771.5} {"step": 2346, "train_loss": 4.1641998291015625, "lr": 0.0003981560673387628, "tps": 22697, "wall": 6776.5} {"step": 2347, "train_loss": 4.220409870147705, "lr": 0.0003981533311469787, "tps": 22690, "wall": 6781.6} {"step": 2348, "train_loss": 4.111013889312744, "lr": 0.000398150592937064, "tps": 22683, "wall": 6786.6} {"step": 2349, "train_loss": 4.234275817871094, "lr": 0.0003981478527090497, "tps": 22676, "wall": 6791.6} {"step": 2350, "train_loss": 4.085146427154541, "lr": 0.0003981451104629669, "tps": 22669, "wall": 6796.6} {"step": 2351, "train_loss": 4.248698711395264, "lr": 0.0003981423661988466, "tps": 22661, "wall": 6801.8} {"step": 2352, "train_loss": 4.179862022399902, "lr": 0.00039813961991672, "tps": 22653, "wall": 6807.1} {"step": 2353, "train_loss": 4.06132173538208, "lr": 0.0003981368716166182, "tps": 22646, "wall": 6812.3} {"step": 2354, "train_loss": 4.247921943664551, "lr": 0.00039813412129857217, "tps": 22638, "wall": 6817.6} {"step": 2355, "train_loss": 4.144309043884277, "lr": 0.00039813136896261326, "tps": 22630, "wall": 6822.9} {"step": 2356, "train_loss": 4.104317665100098, "lr": 0.00039812861460877255, "tps": 22622, "wall": 6828.2} {"step": 2357, "train_loss": 4.106605529785156, "lr": 0.0003981258582370812, "tps": 22614, "wall": 6833.5} {"step": 2358, "train_loss": 4.075496673583984, "lr": 0.00039812309984757054, "tps": 22606, "wall": 6838.8} {"step": 2359, "train_loss": 4.186791896820068, "lr": 0.00039812033944027175, "tps": 22598, "wall": 6844.1} {"step": 2360, "train_loss": 4.223620891571045, "lr": 0.0003981175770152162, "tps": 22590, "wall": 6849.4} {"step": 2361, "train_loss": 4.152922630310059, "lr": 0.000398114812572435, "tps": 22582, "wall": 6854.7} {"step": 2362, "train_loss": 4.135481834411621, "lr": 0.00039811204611195963, "tps": 22574, "wall": 6860.0} {"step": 2363, "train_loss": 4.154295444488525, "lr": 0.0003981092776338213, "tps": 22566, "wall": 6865.3} {"step": 2364, "train_loss": 4.098006248474121, "lr": 0.00039810650713805146, "tps": 22558, "wall": 6870.7} {"step": 2365, "train_loss": 4.131411075592041, "lr": 0.00039810373462468153, "tps": 22550, "wall": 6876.0} {"step": 2366, "train_loss": 4.15318489074707, "lr": 0.00039810096009374276, "tps": 22542, "wall": 6881.3} {"step": 2367, "train_loss": 4.139683246612549, "lr": 0.00039809818354526676, "tps": 22534, "wall": 6886.7} {"step": 2368, "train_loss": 4.2284746170043945, "lr": 0.0003980954049792849, "tps": 22526, "wall": 6892.1} {"step": 2369, "train_loss": 4.160971164703369, "lr": 0.0003980926243958286, "tps": 22518, "wall": 6897.4} {"step": 2370, "train_loss": 4.078701019287109, "lr": 0.00039808984179492946, "tps": 22511, "wall": 6902.5} {"step": 2371, "train_loss": 4.091320514678955, "lr": 0.000398087057176619, "tps": 22504, "wall": 6907.5} {"step": 2372, "train_loss": 4.099003791809082, "lr": 0.00039808427054092863, "tps": 22497, "wall": 6912.5} {"step": 2373, "train_loss": 4.15256404876709, "lr": 0.00039808148188789005, "tps": 22491, "wall": 6917.5} {"step": 2374, "train_loss": 4.158524990081787, "lr": 0.0003980786912175348, "tps": 22484, "wall": 6922.4} {"step": 2375, "train_loss": 4.161896228790283, "lr": 0.0003980758985298945, "tps": 22478, "wall": 6927.4} {"step": 2376, "train_loss": 4.084024429321289, "lr": 0.0003980731038250008, "tps": 22471, "wall": 6932.4} {"step": 2377, "train_loss": 4.143935203552246, "lr": 0.0003980703071028854, "tps": 22463, "wall": 6937.7} {"step": 2378, "train_loss": 4.1359148025512695, "lr": 0.00039806750836357985, "tps": 22456, "wall": 6942.9} {"step": 2379, "train_loss": 4.1125946044921875, "lr": 0.00039806470760711597, "tps": 22449, "wall": 6948.0} {"step": 2380, "train_loss": 4.1659464836120605, "lr": 0.0003980619048335254, "tps": 22441, "wall": 6953.1} {"step": 2381, "train_loss": 4.17466926574707, "lr": 0.00039805910004284, "tps": 22435, "wall": 6958.2} {"step": 2382, "train_loss": 4.112886428833008, "lr": 0.0003980562932350914, "tps": 22428, "wall": 6963.1} {"step": 2383, "train_loss": 4.140937805175781, "lr": 0.00039805348441031155, "tps": 22421, "wall": 6968.2} {"step": 2384, "train_loss": 4.064267158508301, "lr": 0.00039805067356853217, "tps": 22414, "wall": 6973.4} {"step": 2385, "train_loss": 4.169035911560059, "lr": 0.00039804786070978513, "tps": 22406, "wall": 6978.6} {"step": 2386, "train_loss": 4.184805393218994, "lr": 0.00039804504583410233, "tps": 22399, "wall": 6983.8} {"step": 2387, "train_loss": 4.250523090362549, "lr": 0.0003980422289415156, "tps": 22392, "wall": 6988.9} {"step": 2388, "train_loss": 4.087191581726074, "lr": 0.00039803941003205685, "tps": 22384, "wall": 6994.3} {"step": 2389, "train_loss": 4.248891830444336, "lr": 0.00039803658910575804, "tps": 22377, "wall": 6999.4} {"step": 2390, "train_loss": 4.153651237487793, "lr": 0.00039803376616265107, "tps": 22370, "wall": 7004.6} {"step": 2391, "train_loss": 4.181820869445801, "lr": 0.000398030941202768, "tps": 22363, "wall": 7009.8} {"step": 2392, "train_loss": 4.139571189880371, "lr": 0.00039802811422614084, "tps": 22356, "wall": 7014.9} {"step": 2393, "train_loss": 4.096069812774658, "lr": 0.0003980252852328015, "tps": 22349, "wall": 7020.0} {"step": 2394, "train_loss": 4.151823043823242, "lr": 0.00039802245422278215, "tps": 22342, "wall": 7025.1} {"step": 2395, "train_loss": 4.1352715492248535, "lr": 0.0003980196211961148, "tps": 22334, "wall": 7030.4} {"step": 2396, "train_loss": 4.144407272338867, "lr": 0.00039801678615283153, "tps": 22328, "wall": 7035.4} {"step": 2397, "train_loss": 4.15283203125, "lr": 0.0003980139490929645, "tps": 22321, "wall": 7040.6} {"step": 2398, "train_loss": 4.102527618408203, "lr": 0.0003980111100165458, "tps": 22314, "wall": 7045.6} {"step": 2399, "train_loss": 4.115420341491699, "lr": 0.00039800826892360765, "tps": 22307, "wall": 7050.8} {"step": 2400, "train_loss": 4.142559051513672, "lr": 0.0003980054258141822, "tps": 22300, "wall": 7055.9} {"step": 2401, "train_loss": 4.150705814361572, "lr": 0.0003980025806883016, "tps": 22293, "wall": 7061.0} {"step": 2402, "train_loss": 4.1017560958862305, "lr": 0.0003979997335459982, "tps": 22287, "wall": 7066.0} {"step": 2403, "train_loss": 4.168484687805176, "lr": 0.0003979968843873041, "tps": 22280, "wall": 7071.1} {"step": 2404, "train_loss": 4.096842288970947, "lr": 0.0003979940332122517, "tps": 22274, "wall": 7076.1} {"step": 2405, "train_loss": 4.109105587005615, "lr": 0.0003979911800208733, "tps": 22267, "wall": 7081.2} {"step": 2406, "train_loss": 4.047446250915527, "lr": 0.0003979883248132012, "tps": 22260, "wall": 7086.4} {"step": 2407, "train_loss": 4.076653480529785, "lr": 0.0003979854675892677, "tps": 22253, "wall": 7091.6} {"step": 2408, "train_loss": 4.230548858642578, "lr": 0.0003979826083491052, "tps": 22245, "wall": 7097.0} {"step": 2409, "train_loss": 4.11431884765625, "lr": 0.0003979797470927461, "tps": 22238, "wall": 7102.2} {"step": 2410, "train_loss": 4.122410297393799, "lr": 0.0003979768838202227, "tps": 22231, "wall": 7107.2} {"step": 2411, "train_loss": 4.222010612487793, "lr": 0.00039797401853156766, "tps": 22225, "wall": 7112.3} {"step": 2412, "train_loss": 4.223146438598633, "lr": 0.0003979711512268132, "tps": 22219, "wall": 7117.2} {"step": 2413, "train_loss": 4.036041259765625, "lr": 0.000397968281905992, "tps": 22212, "wall": 7122.3} {"step": 2414, "train_loss": 4.181729316711426, "lr": 0.00039796541056913643, "tps": 22206, "wall": 7127.3} {"step": 2415, "train_loss": 4.098945140838623, "lr": 0.0003979625372162791, "tps": 22199, "wall": 7132.4} {"step": 2416, "train_loss": 4.154166221618652, "lr": 0.00039795966184745247, "tps": 22193, "wall": 7137.3} {"step": 2417, "train_loss": 4.124453067779541, "lr": 0.0003979567844626892, "tps": 22187, "wall": 7142.3} {"step": 2418, "train_loss": 4.215703010559082, "lr": 0.0003979539050620218, "tps": 22180, "wall": 7147.2} {"step": 2419, "train_loss": 4.082813739776611, "lr": 0.00039795102364548294, "tps": 22174, "wall": 7152.2} {"step": 2420, "train_loss": 4.0920023918151855, "lr": 0.00039794814021310536, "tps": 22168, "wall": 7157.2} {"step": 2421, "train_loss": 4.135451793670654, "lr": 0.0003979452547649215, "tps": 22161, "wall": 7162.2} {"step": 2422, "train_loss": 4.119929313659668, "lr": 0.00039794236730096425, "tps": 22155, "wall": 7167.2} {"step": 2423, "train_loss": 4.07441520690918, "lr": 0.00039793947782126616, "tps": 22149, "wall": 7172.2} {"step": 2424, "train_loss": 4.067679405212402, "lr": 0.00039793658632586014, "tps": 22142, "wall": 7177.3} {"step": 2425, "train_loss": 4.102788925170898, "lr": 0.00039793369281477875, "tps": 22136, "wall": 7182.2} {"step": 2426, "train_loss": 4.118897438049316, "lr": 0.0003979307972880549, "tps": 22130, "wall": 7187.2} {"step": 2427, "train_loss": 4.078593730926514, "lr": 0.00039792789974572136, "tps": 22123, "wall": 7192.3} {"step": 2428, "train_loss": 4.194128513336182, "lr": 0.0003979250001878109, "tps": 22117, "wall": 7197.3} {"step": 2429, "train_loss": 4.081964015960693, "lr": 0.00039792209861435647, "tps": 22110, "wall": 7202.4} {"step": 2430, "train_loss": 4.221147537231445, "lr": 0.00039791919502539085, "tps": 22104, "wall": 7207.5} {"step": 2431, "train_loss": 4.0988874435424805, "lr": 0.00039791628942094696, "tps": 22098, "wall": 7212.5} {"step": 2432, "train_loss": 4.1859283447265625, "lr": 0.0003979133818010577, "tps": 22092, "wall": 7217.5} {"step": 2433, "train_loss": 4.167438507080078, "lr": 0.0003979104721657561, "tps": 22086, "wall": 7222.4} {"step": 2434, "train_loss": 4.11838436126709, "lr": 0.00039790756051507497, "tps": 22079, "wall": 7227.4} {"step": 2435, "train_loss": 4.146953105926514, "lr": 0.0003979046468490474, "tps": 22073, "wall": 7232.4} {"step": 2436, "train_loss": 4.134777069091797, "lr": 0.0003979017311677064, "tps": 22067, "wall": 7237.5} {"step": 2437, "train_loss": 4.075746536254883, "lr": 0.0003978988134710849, "tps": 22060, "wall": 7242.7} {"step": 2438, "train_loss": 4.088364124298096, "lr": 0.00039789589375921605, "tps": 22054, "wall": 7247.8} {"step": 2439, "train_loss": 4.0461907386779785, "lr": 0.0003978929720321329, "tps": 22047, "wall": 7253.0} {"step": 2440, "train_loss": 4.065670013427734, "lr": 0.0003978900482898685, "tps": 22040, "wall": 7258.0} {"step": 2441, "train_loss": 3.9225378036499023, "lr": 0.00039788712253245606, "tps": 22034, "wall": 7263.1} {"step": 2442, "train_loss": 4.092479705810547, "lr": 0.00039788419475992866, "tps": 22028, "wall": 7268.1} {"step": 2443, "train_loss": 4.103142261505127, "lr": 0.00039788126497231947, "tps": 22022, "wall": 7273.1} {"step": 2444, "train_loss": 3.995633125305176, "lr": 0.0003978783331696617, "tps": 22016, "wall": 7278.1} {"step": 2445, "train_loss": 4.141013145446777, "lr": 0.00039787539935198855, "tps": 22010, "wall": 7283.0} {"step": 2446, "train_loss": 4.109850883483887, "lr": 0.00039787246351933323, "tps": 22004, "wall": 7288.0} {"step": 2447, "train_loss": 4.177218437194824, "lr": 0.000397869525671729, "tps": 21997, "wall": 7293.0} {"step": 2448, "train_loss": 4.132113456726074, "lr": 0.00039786658580920917, "tps": 21991, "wall": 7298.1} {"step": 2449, "train_loss": 3.9957175254821777, "lr": 0.0003978636439318071, "tps": 21985, "wall": 7303.3} {"step": 2450, "train_loss": 4.047698020935059, "lr": 0.000397860700039556, "tps": 21978, "wall": 7308.4} {"step": 2451, "train_loss": 4.120065689086914, "lr": 0.0003978577541324892, "tps": 21971, "wall": 7313.7} {"step": 2452, "train_loss": 4.07927942276001, "lr": 0.0003978548062106403, "tps": 21965, "wall": 7318.7} {"step": 2453, "train_loss": 4.089033603668213, "lr": 0.0003978518562740424, "tps": 21958, "wall": 7323.9} {"step": 2454, "train_loss": 3.9499547481536865, "lr": 0.0003978489043227291, "tps": 21952, "wall": 7329.1} {"step": 2455, "train_loss": 4.160537242889404, "lr": 0.00039784595035673376, "tps": 21945, "wall": 7334.2} {"step": 2456, "train_loss": 4.038674831390381, "lr": 0.0003978429943760899, "tps": 21939, "wall": 7339.4} {"step": 2457, "train_loss": 4.082968235015869, "lr": 0.000397840036380831, "tps": 21933, "wall": 7344.4} {"step": 2458, "train_loss": 4.1854777336120605, "lr": 0.0003978370763709905, "tps": 21926, "wall": 7349.5} {"step": 2459, "train_loss": 4.165750503540039, "lr": 0.000397834114346602, "tps": 21920, "wall": 7354.6} {"step": 2460, "train_loss": 4.1720662117004395, "lr": 0.0003978311503076991, "tps": 21914, "wall": 7359.7} {"step": 2461, "train_loss": 4.076130390167236, "lr": 0.0003978281842543152, "tps": 21908, "wall": 7364.8} {"step": 2462, "train_loss": 4.1923699378967285, "lr": 0.000397825216186484, "tps": 21901, "wall": 7369.9} {"step": 2463, "train_loss": 4.062188148498535, "lr": 0.00039782224610423924, "tps": 21895, "wall": 7375.1} {"step": 2464, "train_loss": 4.0833353996276855, "lr": 0.00039781927400761434, "tps": 21888, "wall": 7380.3} {"step": 2465, "train_loss": 4.1523213386535645, "lr": 0.0003978162998966431, "tps": 21882, "wall": 7385.3} {"step": 2466, "train_loss": 4.176755428314209, "lr": 0.00039781332377135934, "tps": 21876, "wall": 7390.5} {"step": 2467, "train_loss": 4.101668357849121, "lr": 0.00039781034563179647, "tps": 21870, "wall": 7395.6} {"step": 2468, "train_loss": 4.235613822937012, "lr": 0.0003978073654779885, "tps": 21864, "wall": 7400.6} {"step": 2469, "train_loss": 4.083695888519287, "lr": 0.00039780438330996897, "tps": 21858, "wall": 7405.7} {"step": 2470, "train_loss": 4.0741095542907715, "lr": 0.00039780139912777183, "tps": 21852, "wall": 7410.7} {"step": 2471, "train_loss": 4.074440956115723, "lr": 0.0003977984129314308, "tps": 21845, "wall": 7415.8} {"step": 2472, "train_loss": 4.10938835144043, "lr": 0.00039779542472097974, "tps": 21839, "wall": 7420.9} {"step": 2473, "train_loss": 4.034804821014404, "lr": 0.00039779243449645244, "tps": 21833, "wall": 7425.9} {"step": 2474, "train_loss": 4.185244560241699, "lr": 0.0003977894422578829, "tps": 21827, "wall": 7431.0} {"step": 2475, "train_loss": 4.205108642578125, "lr": 0.0003977864480053049, "tps": 21821, "wall": 7436.1} {"step": 2476, "train_loss": 4.057154178619385, "lr": 0.0003977834517387524, "tps": 21815, "wall": 7441.2} {"step": 2477, "train_loss": 4.056127071380615, "lr": 0.00039778045345825936, "tps": 21809, "wall": 7446.2} {"step": 2478, "train_loss": 4.191216945648193, "lr": 0.0003977774531638597, "tps": 21803, "wall": 7451.4} {"step": 2479, "train_loss": 4.132208824157715, "lr": 0.0003977744508555874, "tps": 21796, "wall": 7456.5} {"step": 2480, "train_loss": 4.06885290145874, "lr": 0.0003977714465334766, "tps": 21791, "wall": 7461.5} {"step": 2481, "train_loss": 4.086809158325195, "lr": 0.0003977684401975612, "tps": 21785, "wall": 7466.6} {"step": 2482, "train_loss": 4.071873664855957, "lr": 0.00039776543184787523, "tps": 21778, "wall": 7471.7} {"step": 2483, "train_loss": 4.043920516967773, "lr": 0.0003977624214844529, "tps": 21772, "wall": 7477.0} {"step": 2484, "train_loss": 4.044325351715088, "lr": 0.0003977594091073282, "tps": 21766, "wall": 7482.0} {"step": 2485, "train_loss": 4.103478908538818, "lr": 0.00039775639471653537, "tps": 21760, "wall": 7487.1} {"step": 2486, "train_loss": 4.056735992431641, "lr": 0.00039775337831210835, "tps": 21754, "wall": 7492.2} {"step": 2487, "train_loss": 4.005931854248047, "lr": 0.0003977503598940816, "tps": 21748, "wall": 7497.3} {"step": 2488, "train_loss": 4.036367893218994, "lr": 0.00039774733946248904, "tps": 21742, "wall": 7502.3} {"step": 2489, "train_loss": 4.095246315002441, "lr": 0.000397744317017365, "tps": 21736, "wall": 7507.5} {"step": 2490, "train_loss": 4.123754501342773, "lr": 0.0003977412925587438, "tps": 21730, "wall": 7512.6} {"step": 2491, "train_loss": 4.139729022979736, "lr": 0.0003977382660866596, "tps": 21724, "wall": 7517.6} {"step": 2492, "train_loss": 4.017740726470947, "lr": 0.00039773523760114674, "tps": 21718, "wall": 7522.7} {"step": 2493, "train_loss": 4.124941825866699, "lr": 0.0003977322071022394, "tps": 21712, "wall": 7527.8} {"step": 2494, "train_loss": 3.982241153717041, "lr": 0.0003977291745899721, "tps": 21706, "wall": 7532.9} {"step": 2495, "train_loss": 4.139747142791748, "lr": 0.000397726140064379, "tps": 21700, "wall": 7537.9} {"step": 2496, "train_loss": 4.017815589904785, "lr": 0.00039772310352549465, "tps": 21694, "wall": 7542.9} {"step": 2497, "train_loss": 4.077424049377441, "lr": 0.00039772006497335326, "tps": 21689, "wall": 7548.0} {"step": 2498, "train_loss": 4.129836559295654, "lr": 0.0003977170244079895, "tps": 21683, "wall": 7553.1} {"step": 2499, "train_loss": 4.122888088226318, "lr": 0.0003977139818294376, "tps": 21677, "wall": 7558.1} {"step": 2500, "train_loss": 3.946248769760132, "lr": 0.0003977109372377321, "tps": 21671, "wall": 7563.1} {"step": 2501, "train_loss": 4.072510242462158, "lr": 0.0003977078906329075, "tps": 21665, "wall": 7568.4} {"step": 2502, "train_loss": 4.083756446838379, "lr": 0.0003977048420149983, "tps": 21659, "wall": 7573.4} {"step": 2503, "train_loss": 4.129255294799805, "lr": 0.000397701791384039, "tps": 21653, "wall": 7578.4} {"step": 2504, "train_loss": 4.074782371520996, "lr": 0.0003976987387400643, "tps": 21648, "wall": 7583.5} {"step": 2505, "train_loss": 3.9735593795776367, "lr": 0.00039769568408310857, "tps": 21642, "wall": 7588.5} {"step": 2506, "train_loss": 3.9419167041778564, "lr": 0.0003976926274132065, "tps": 21636, "wall": 7593.5} {"step": 2507, "train_loss": 4.065645217895508, "lr": 0.00039768956873039287, "tps": 21630, "wall": 7598.6} {"step": 2508, "train_loss": 4.091573715209961, "lr": 0.00039768650803470205, "tps": 21625, "wall": 7603.6} {"step": 2509, "train_loss": 4.159687042236328, "lr": 0.0003976834453261689, "tps": 21619, "wall": 7608.7} {"step": 2510, "train_loss": 4.057530879974365, "lr": 0.0003976803806048281, "tps": 21613, "wall": 7613.8} {"step": 2511, "train_loss": 4.081940650939941, "lr": 0.0003976773138707143, "tps": 21607, "wall": 7618.8} {"step": 2512, "train_loss": 4.1350860595703125, "lr": 0.0003976742451238623, "tps": 21602, "wall": 7623.8} {"step": 2513, "train_loss": 4.183622360229492, "lr": 0.00039767117436430684, "tps": 21596, "wall": 7628.8} {"step": 2514, "train_loss": 4.089633941650391, "lr": 0.0003976681015920827, "tps": 21591, "wall": 7633.8} {"step": 2515, "train_loss": 4.201956272125244, "lr": 0.00039766502680722463, "tps": 21585, "wall": 7638.8} {"step": 2516, "train_loss": 4.0787272453308105, "lr": 0.00039766195000976763, "tps": 21580, "wall": 7643.7} {"step": 2517, "train_loss": 4.128678798675537, "lr": 0.0003976588711997464, "tps": 21574, "wall": 7648.7} {"step": 2518, "train_loss": 4.185877799987793, "lr": 0.00039765579037719583, "tps": 21569, "wall": 7653.6} {"step": 2519, "train_loss": 3.969668388366699, "lr": 0.0003976527075421509, "tps": 21564, "wall": 7658.6} {"step": 2520, "train_loss": 4.093975067138672, "lr": 0.0003976496226946465, "tps": 21558, "wall": 7663.6} {"step": 2521, "train_loss": 4.200504779815674, "lr": 0.00039764653583471756, "tps": 21552, "wall": 7668.7} {"step": 2522, "train_loss": 4.065242767333984, "lr": 0.00039764344696239905, "tps": 21546, "wall": 7673.9} {"step": 2523, "train_loss": 4.111008167266846, "lr": 0.00039764035607772595, "tps": 21540, "wall": 7679.2} {"step": 2524, "train_loss": 4.107122421264648, "lr": 0.00039763726318073323, "tps": 21534, "wall": 7684.3} {"step": 2525, "train_loss": 4.030006408691406, "lr": 0.0003976341682714561, "tps": 21529, "wall": 7689.3} {"step": 2526, "train_loss": 4.002840042114258, "lr": 0.00039763107134992945, "tps": 21523, "wall": 7694.2} {"step": 2527, "train_loss": 4.070673942565918, "lr": 0.0003976279724161883, "tps": 21518, "wall": 7699.4} {"step": 2528, "train_loss": 4.10346794128418, "lr": 0.0003976248714702681, "tps": 21512, "wall": 7704.4} {"step": 2529, "train_loss": 4.161854267120361, "lr": 0.0003976217685122036, "tps": 21506, "wall": 7709.4} {"step": 2530, "train_loss": 4.131313323974609, "lr": 0.0003976186635420301, "tps": 21501, "wall": 7714.6} {"step": 2531, "train_loss": 4.123477935791016, "lr": 0.00039761555655978283, "tps": 21495, "wall": 7719.6} {"step": 2532, "train_loss": 4.084355354309082, "lr": 0.0003976124475654968, "tps": 21490, "wall": 7724.6} {"step": 2533, "train_loss": 4.133862495422363, "lr": 0.00039760933655920747, "tps": 21484, "wall": 7729.6} {"step": 2534, "train_loss": 4.013723373413086, "lr": 0.0003976062235409499, "tps": 21478, "wall": 7734.7} {"step": 2535, "train_loss": 4.096464157104492, "lr": 0.00039760310851075947, "tps": 21473, "wall": 7739.7} {"step": 2536, "train_loss": 4.016295433044434, "lr": 0.00039759999146867143, "tps": 21468, "wall": 7744.7} {"step": 2537, "train_loss": 4.093896865844727, "lr": 0.00039759687241472104, "tps": 21462, "wall": 7749.9} {"step": 2538, "train_loss": 4.083765983581543, "lr": 0.0003975937513489437, "tps": 21456, "wall": 7754.9} {"step": 2539, "train_loss": 4.072469711303711, "lr": 0.0003975906282713747, "tps": 21451, "wall": 7760.1} {"step": 2540, "train_loss": 4.041876792907715, "lr": 0.0003975875031820495, "tps": 21445, "wall": 7765.1} {"step": 2541, "train_loss": 4.050976753234863, "lr": 0.00039758437608100345, "tps": 21440, "wall": 7770.1} {"step": 2542, "train_loss": 4.136040687561035, "lr": 0.00039758124696827194, "tps": 21434, "wall": 7775.1} {"step": 2543, "train_loss": 4.108788013458252, "lr": 0.00039757811584389046, "tps": 21429, "wall": 7780.1} {"step": 2544, "train_loss": 4.046133041381836, "lr": 0.00039757498270789454, "tps": 21424, "wall": 7785.1} {"step": 2545, "train_loss": 4.075910568237305, "lr": 0.00039757184756031955, "tps": 21418, "wall": 7790.1} {"step": 2546, "train_loss": 4.0671892166137695, "lr": 0.0003975687104012011, "tps": 21413, "wall": 7795.2} {"step": 2547, "train_loss": 4.143986225128174, "lr": 0.0003975655712305747, "tps": 21407, "wall": 7800.4} {"step": 2548, "train_loss": 4.076683044433594, "lr": 0.00039756243004847585, "tps": 21401, "wall": 7805.5} {"step": 2549, "train_loss": 4.1477861404418945, "lr": 0.0003975592868549402, "tps": 21396, "wall": 7810.6} {"step": 2550, "train_loss": 4.1343207359313965, "lr": 0.0003975561416500034, "tps": 21390, "wall": 7815.7} {"step": 2551, "train_loss": 4.130528450012207, "lr": 0.00039755299443370093, "tps": 21384, "wall": 7820.8} {"step": 2552, "train_loss": 4.096024513244629, "lr": 0.00039754984520606857, "tps": 21379, "wall": 7826.0} {"step": 2553, "train_loss": 4.148059368133545, "lr": 0.000397546693967142, "tps": 21373, "wall": 7831.1} {"step": 2554, "train_loss": 4.113572120666504, "lr": 0.00039754354071695687, "tps": 21368, "wall": 7836.2} {"step": 2555, "train_loss": 4.090190887451172, "lr": 0.0003975403854555489, "tps": 21362, "wall": 7841.3} {"step": 2556, "train_loss": 4.1318488121032715, "lr": 0.00039753722818295376, "tps": 21356, "wall": 7846.4} {"step": 2557, "train_loss": 4.050023078918457, "lr": 0.0003975340688992074, "tps": 21351, "wall": 7851.6} {"step": 2558, "train_loss": 4.0687055587768555, "lr": 0.00039753090760434546, "tps": 21345, "wall": 7856.7} {"step": 2559, "train_loss": 4.1838459968566895, "lr": 0.0003975277442984038, "tps": 21340, "wall": 7861.8} {"step": 2560, "train_loss": 4.023836135864258, "lr": 0.0003975245789814182, "tps": 21334, "wall": 7866.9} {"step": 2561, "train_loss": 4.036800384521484, "lr": 0.00039752141165342464, "tps": 21329, "wall": 7872.0} {"step": 2562, "train_loss": 4.063875198364258, "lr": 0.0003975182423144589, "tps": 21323, "wall": 7877.0} {"step": 2563, "train_loss": 3.99530029296875, "lr": 0.0003975150709645569, "tps": 21318, "wall": 7882.2} {"step": 2564, "train_loss": 4.133736610412598, "lr": 0.00039751189760375453, "tps": 21312, "wall": 7887.4} {"step": 2565, "train_loss": 4.145654678344727, "lr": 0.00039750872223208786, "tps": 21306, "wall": 7892.6} {"step": 2566, "train_loss": 3.992515802383423, "lr": 0.0003975055448495927, "tps": 21301, "wall": 7897.7} {"step": 2567, "train_loss": 4.108889102935791, "lr": 0.00039750236545630524, "tps": 21295, "wall": 7902.8} {"step": 2568, "train_loss": 4.120832443237305, "lr": 0.0003974991840522613, "tps": 21290, "wall": 7907.9} {"step": 2569, "train_loss": 4.1043477058410645, "lr": 0.00039749600063749706, "tps": 21284, "wall": 7913.2} {"step": 2570, "train_loss": 4.025639057159424, "lr": 0.0003974928152120484, "tps": 21279, "wall": 7918.2} {"step": 2571, "train_loss": 4.102860450744629, "lr": 0.0003974896277759516, "tps": 21273, "wall": 7923.3} {"step": 2572, "train_loss": 4.111416339874268, "lr": 0.0003974864383292427, "tps": 21268, "wall": 7928.3} {"step": 2573, "train_loss": 4.1348876953125, "lr": 0.0003974832468719578, "tps": 21263, "wall": 7933.3} {"step": 2574, "train_loss": 4.100612640380859, "lr": 0.00039748005340413314, "tps": 21258, "wall": 7938.3} {"step": 2575, "train_loss": 4.15061092376709, "lr": 0.0003974768579258048, "tps": 21253, "wall": 7943.3} {"step": 2576, "train_loss": 4.148410320281982, "lr": 0.00039747366043700903, "tps": 21247, "wall": 7948.4} {"step": 2577, "train_loss": 4.125531196594238, "lr": 0.00039747046093778195, "tps": 21242, "wall": 7953.4} {"step": 2578, "train_loss": 4.073232173919678, "lr": 0.00039746725942816, "tps": 21237, "wall": 7958.4} {"step": 2579, "train_loss": 4.05157470703125, "lr": 0.0003974640559081793, "tps": 21232, "wall": 7963.5} {"step": 2580, "train_loss": 4.094862461090088, "lr": 0.0003974608503778761, "tps": 21226, "wall": 7968.6} {"step": 2581, "train_loss": 4.089151382446289, "lr": 0.00039745764283728686, "tps": 21221, "wall": 7973.7} {"step": 2582, "train_loss": 4.063229560852051, "lr": 0.00039745443328644784, "tps": 21216, "wall": 7978.7} {"step": 2583, "train_loss": 4.113819122314453, "lr": 0.00039745122172539537, "tps": 21211, "wall": 7983.7} {"step": 2584, "train_loss": 4.091238498687744, "lr": 0.0003974480081541658, "tps": 21205, "wall": 7989.0} {"step": 2585, "train_loss": 4.1401543617248535, "lr": 0.0003974447925727957, "tps": 21199, "wall": 7994.2} {"step": 2586, "train_loss": 4.072414875030518, "lr": 0.0003974415749813214, "tps": 21194, "wall": 7999.3} {"step": 2587, "train_loss": 4.1962995529174805, "lr": 0.0003974383553797793, "tps": 21189, "wall": 8004.4} {"step": 2588, "train_loss": 4.072877407073975, "lr": 0.0003974351337682059, "tps": 21183, "wall": 8009.5} {"step": 2589, "train_loss": 4.063174247741699, "lr": 0.0003974319101466377, "tps": 21178, "wall": 8014.6} {"step": 2590, "train_loss": 4.173984527587891, "lr": 0.0003974286845151112, "tps": 21173, "wall": 8019.7} {"step": 2591, "train_loss": 4.23234748840332, "lr": 0.000397425456873663, "tps": 21167, "wall": 8024.8} {"step": 2592, "train_loss": 4.058722972869873, "lr": 0.0003974222272223297, "tps": 21162, "wall": 8030.0} {"step": 2593, "train_loss": 4.105127811431885, "lr": 0.0003974189955611477, "tps": 21156, "wall": 8035.2} {"step": 2594, "train_loss": 4.1070966720581055, "lr": 0.00039741576189015375, "tps": 21151, "wall": 8040.3} {"step": 2595, "train_loss": 4.096620082855225, "lr": 0.0003974125262093844, "tps": 21146, "wall": 8045.4} {"step": 2596, "train_loss": 4.027905464172363, "lr": 0.0003974092885188764, "tps": 21141, "wall": 8050.5} {"step": 2597, "train_loss": 4.066583633422852, "lr": 0.00039740604881866644, "tps": 21135, "wall": 8055.8} {"step": 2598, "train_loss": 4.122525691986084, "lr": 0.0003974028071087911, "tps": 21129, "wall": 8061.0} {"step": 2599, "train_loss": 4.1441779136657715, "lr": 0.0003973995633892872, "tps": 21124, "wall": 8066.1} {"step": 2600, "train_loss": 4.1486029624938965, "lr": 0.0003973963176601914, "tps": 21119, "wall": 8071.3} {"step": 2601, "train_loss": 4.076050758361816, "lr": 0.00039739306992154057, "tps": 21114, "wall": 8076.3} {"step": 2602, "train_loss": 4.131633758544922, "lr": 0.00039738982017337144, "tps": 21108, "wall": 8081.5} {"step": 2603, "train_loss": 4.033036231994629, "lr": 0.0003973865684157208, "tps": 21103, "wall": 8086.6} {"step": 2604, "train_loss": 4.242002487182617, "lr": 0.00039738331464862553, "tps": 21098, "wall": 8091.7} {"step": 2605, "train_loss": 4.0684332847595215, "lr": 0.00039738005887212253, "tps": 21093, "wall": 8096.7} {"step": 2606, "train_loss": 4.0320329666137695, "lr": 0.0003973768010862485, "tps": 21088, "wall": 8101.7} {"step": 2607, "train_loss": 4.0912933349609375, "lr": 0.00039737354129104055, "tps": 21083, "wall": 8106.7} {"step": 2608, "train_loss": 4.13183069229126, "lr": 0.00039737027948653556, "tps": 21078, "wall": 8111.6} {"step": 2609, "train_loss": 3.9924609661102295, "lr": 0.0003973670156727704, "tps": 21073, "wall": 8116.7} {"step": 2610, "train_loss": 4.156560897827148, "lr": 0.00039736374984978206, "tps": 21068, "wall": 8122.0} {"step": 2611, "train_loss": 4.0080413818359375, "lr": 0.00039736048201760766, "tps": 21062, "wall": 8127.1} {"step": 2612, "train_loss": 4.05855655670166, "lr": 0.000397357212176284, "tps": 21058, "wall": 8132.1} {"step": 2613, "train_loss": 4.142321586608887, "lr": 0.00039735394032584836, "tps": 21053, "wall": 8137.0} {"step": 2614, "train_loss": 4.038442611694336, "lr": 0.00039735066646633767, "tps": 21048, "wall": 8142.0} {"step": 2615, "train_loss": 4.014187335968018, "lr": 0.00039734739059778896, "tps": 21043, "wall": 8147.0} {"step": 2616, "train_loss": 3.971508502960205, "lr": 0.00039734411272023955, "tps": 21038, "wall": 8152.0} {"step": 2617, "train_loss": 3.996741771697998, "lr": 0.00039734083283372634, "tps": 21033, "wall": 8157.1} {"step": 2618, "train_loss": 4.113707065582275, "lr": 0.0003973375509382865, "tps": 21028, "wall": 8162.2} {"step": 2619, "train_loss": 4.073171615600586, "lr": 0.00039733426703395745, "tps": 21023, "wall": 8167.3} {"step": 2620, "train_loss": 4.189111232757568, "lr": 0.00039733098112077614, "tps": 21018, "wall": 8172.4} {"step": 2621, "train_loss": 4.042574882507324, "lr": 0.0003973276931987799, "tps": 21013, "wall": 8177.4} {"step": 2622, "train_loss": 4.037102699279785, "lr": 0.000397324403268006, "tps": 21008, "wall": 8182.4} {"step": 2623, "train_loss": 4.036942005157471, "lr": 0.0003973211113284916, "tps": 21003, "wall": 8187.5} {"step": 2624, "train_loss": 4.046918869018555, "lr": 0.0003973178173802741, "tps": 20998, "wall": 8192.6} {"step": 2625, "train_loss": 3.9828124046325684, "lr": 0.0003973145214233908, "tps": 20993, "wall": 8197.7} {"step": 2626, "train_loss": 4.066481590270996, "lr": 0.00039731122345787896, "tps": 20988, "wall": 8202.8} {"step": 2627, "train_loss": 4.170711040496826, "lr": 0.000397307923483776, "tps": 20983, "wall": 8207.9} {"step": 2628, "train_loss": 4.099956035614014, "lr": 0.00039730462150111925, "tps": 20978, "wall": 8212.9} {"step": 2629, "train_loss": 4.105802059173584, "lr": 0.0003973013175099462, "tps": 20973, "wall": 8218.0} {"step": 2630, "train_loss": 3.9996092319488525, "lr": 0.00039729801151029427, "tps": 20968, "wall": 8222.9} {"step": 2631, "train_loss": 4.098786354064941, "lr": 0.0003972947035022008, "tps": 20964, "wall": 8227.9} {"step": 2632, "train_loss": 4.1113715171813965, "lr": 0.0003972913934857034, "tps": 20959, "wall": 8232.9} {"step": 2633, "train_loss": 4.071430206298828, "lr": 0.0003972880814608394, "tps": 20954, "wall": 8237.9} {"step": 2634, "train_loss": 4.01413631439209, "lr": 0.0003972847674276466, "tps": 20949, "wall": 8242.9} {"step": 2635, "train_loss": 4.062966346740723, "lr": 0.00039728145138616226, "tps": 20945, "wall": 8247.9} {"step": 2636, "train_loss": 3.8820273876190186, "lr": 0.000397278133336424, "tps": 20940, "wall": 8252.9} {"step": 2637, "train_loss": 4.14815616607666, "lr": 0.0003972748132784695, "tps": 20935, "wall": 8258.0} {"step": 2638, "train_loss": 3.9776408672332764, "lr": 0.0003972714912123363, "tps": 20930, "wall": 8263.2} {"step": 2639, "train_loss": 4.084587097167969, "lr": 0.0003972681671380621, "tps": 20924, "wall": 8268.4} {"step": 2640, "train_loss": 4.058457851409912, "lr": 0.00039726484105568455, "tps": 20919, "wall": 8273.6} {"step": 2641, "train_loss": 4.0608954429626465, "lr": 0.00039726151296524124, "tps": 20914, "wall": 8278.6} {"step": 2642, "train_loss": 4.068848609924316, "lr": 0.00039725818286676985, "tps": 20909, "wall": 8283.8} {"step": 2643, "train_loss": 4.030008792877197, "lr": 0.00039725485076030833, "tps": 20904, "wall": 8288.9} {"step": 2644, "train_loss": 4.095519065856934, "lr": 0.00039725151664589414, "tps": 20899, "wall": 8294.1} {"step": 2645, "train_loss": 4.125998497009277, "lr": 0.0003972481805235652, "tps": 20894, "wall": 8299.3} {"step": 2646, "train_loss": 4.107272148132324, "lr": 0.0003972448423933593, "tps": 20889, "wall": 8304.5} {"step": 2647, "train_loss": 4.040040016174316, "lr": 0.00039724150225531427, "tps": 20883, "wall": 8309.7} {"step": 2648, "train_loss": 4.1106486320495605, "lr": 0.00039723816010946785, "tps": 20878, "wall": 8314.9} {"step": 2649, "train_loss": 4.098642349243164, "lr": 0.00039723481595585805, "tps": 20873, "wall": 8320.2} {"step": 2650, "train_loss": 4.167261123657227, "lr": 0.00039723146979452257, "tps": 20867, "wall": 8325.6} {"step": 2651, "train_loss": 4.181147575378418, "lr": 0.0003972281216254995, "tps": 20862, "wall": 8330.8} {"step": 2652, "train_loss": 4.078821182250977, "lr": 0.00039722477144882664, "tps": 20856, "wall": 8336.2} {"step": 2653, "train_loss": 4.142765998840332, "lr": 0.000397221419264542, "tps": 20851, "wall": 8341.5} {"step": 2654, "train_loss": 4.071717262268066, "lr": 0.00039721806507268353, "tps": 20846, "wall": 8346.8} {"step": 2655, "train_loss": 4.068688869476318, "lr": 0.0003972147088732892, "tps": 20840, "wall": 8352.1} {"step": 2656, "train_loss": 3.9982967376708984, "lr": 0.00039721135066639703, "tps": 20835, "wall": 8357.4} {"step": 2657, "train_loss": 3.9758052825927734, "lr": 0.00039720799045204515, "tps": 20829, "wall": 8362.8} {"step": 2658, "train_loss": 3.9861817359924316, "lr": 0.0003972046282302716, "tps": 20824, "wall": 8368.1} {"step": 2659, "train_loss": 4.086933612823486, "lr": 0.0003972012640011144, "tps": 20818, "wall": 8373.5} {"step": 2660, "train_loss": 3.9634158611297607, "lr": 0.0003971978977646117, "tps": 20813, "wall": 8378.9} {"step": 2661, "train_loss": 4.10870885848999, "lr": 0.0003971945295208016, "tps": 20807, "wall": 8384.3} {"step": 2662, "train_loss": 4.126817226409912, "lr": 0.00039719115926972233, "tps": 20801, "wall": 8389.7} {"step": 2663, "train_loss": 4.116102695465088, "lr": 0.00039718778701141195, "tps": 20796, "wall": 8395.1} {"step": 2664, "train_loss": 4.0578460693359375, "lr": 0.00039718441274590876, "tps": 20791, "wall": 8400.4} {"step": 2665, "train_loss": 4.142160892486572, "lr": 0.000397181036473251, "tps": 20786, "wall": 8405.5} {"step": 2666, "train_loss": 4.082467079162598, "lr": 0.00039717765819347685, "tps": 20781, "wall": 8410.6} {"step": 2667, "train_loss": 3.9887475967407227, "lr": 0.00039717427790662455, "tps": 20776, "wall": 8415.6} {"step": 2668, "train_loss": 4.101167678833008, "lr": 0.0003971708956127325, "tps": 20772, "wall": 8420.7} {"step": 2669, "train_loss": 4.079847812652588, "lr": 0.0003971675113118389, "tps": 20767, "wall": 8425.8} {"step": 2670, "train_loss": 4.077150344848633, "lr": 0.0003971641250039823, "tps": 20761, "wall": 8431.2} {"step": 2671, "train_loss": 4.053782939910889, "lr": 0.0003971607366892008, "tps": 20756, "wall": 8436.6} {"step": 2672, "train_loss": 4.03740119934082, "lr": 0.00039715734636753294, "tps": 20751, "wall": 8441.9} {"step": 2673, "train_loss": 4.034191608428955, "lr": 0.000397153954039017, "tps": 20745, "wall": 8447.2} {"step": 2674, "train_loss": 4.0264739990234375, "lr": 0.0003971505597036915, "tps": 20741, "wall": 8452.2} {"step": 2675, "train_loss": 4.059682846069336, "lr": 0.00039714716336159496, "tps": 20736, "wall": 8457.3} {"step": 2676, "train_loss": 4.103010177612305, "lr": 0.0003971437650127656, "tps": 20731, "wall": 8462.6} {"step": 2677, "train_loss": 3.945969581604004, "lr": 0.00039714036465724226, "tps": 20725, "wall": 8468.0} {"step": 2678, "train_loss": 4.114070415496826, "lr": 0.00039713696229506316, "tps": 20720, "wall": 8473.3} {"step": 2679, "train_loss": 4.010655403137207, "lr": 0.000397133557926267, "tps": 20715, "wall": 8478.7} {"step": 2680, "train_loss": 3.9767966270446777, "lr": 0.00039713015155089243, "tps": 20709, "wall": 8484.0} {"step": 2681, "train_loss": 4.064781188964844, "lr": 0.0003971267431689778, "tps": 20704, "wall": 8489.4} {"step": 2682, "train_loss": 4.054059982299805, "lr": 0.0003971233327805619, "tps": 20699, "wall": 8494.7} {"step": 2683, "train_loss": 4.062769889831543, "lr": 0.0003971199203856833, "tps": 20693, "wall": 8500.0} {"step": 2684, "train_loss": 3.950685739517212, "lr": 0.00039711650598438057, "tps": 20688, "wall": 8505.4} {"step": 2685, "train_loss": 4.123423099517822, "lr": 0.0003971130895766925, "tps": 20683, "wall": 8510.8} {"step": 2686, "train_loss": 4.108415603637695, "lr": 0.0003971096711626579, "tps": 20677, "wall": 8516.1} {"step": 2687, "train_loss": 4.109241485595703, "lr": 0.00039710625074231525, "tps": 20672, "wall": 8521.5} {"step": 2688, "train_loss": 4.039707660675049, "lr": 0.00039710282831570344, "tps": 20667, "wall": 8526.8} {"step": 2689, "train_loss": 4.073833465576172, "lr": 0.00039709940388286117, "tps": 20662, "wall": 8532.1} {"step": 2690, "train_loss": 4.097310543060303, "lr": 0.00039709597744382735, "tps": 20657, "wall": 8537.4} {"step": 2691, "train_loss": 4.066011905670166, "lr": 0.00039709254899864064, "tps": 20651, "wall": 8542.8} {"step": 2692, "train_loss": 4.123096466064453, "lr": 0.00039708911854734, "tps": 20646, "wall": 8548.2} {"step": 2693, "train_loss": 4.030142784118652, "lr": 0.00039708568608996423, "tps": 20641, "wall": 8553.5} {"step": 2694, "train_loss": 4.054027080535889, "lr": 0.00039708225162655227, "tps": 20636, "wall": 8558.7} {"step": 2695, "train_loss": 4.100077152252197, "lr": 0.00039707881515714294, "tps": 20631, "wall": 8564.0} {"step": 2696, "train_loss": 4.027022361755371, "lr": 0.00039707537668177517, "tps": 20626, "wall": 8569.1} {"step": 2697, "train_loss": 4.093452453613281, "lr": 0.00039707193620048804, "tps": 20621, "wall": 8574.3} {"step": 2698, "train_loss": 4.109945774078369, "lr": 0.0003970684937133204, "tps": 20617, "wall": 8579.2} {"step": 2699, "train_loss": 4.067776679992676, "lr": 0.00039706504922031125, "tps": 20612, "wall": 8584.3} {"step": 2700, "train_loss": 4.061275005340576, "lr": 0.0003970616027214997, "tps": 20608, "wall": 8589.4} {"step": 2701, "train_loss": 4.014925003051758, "lr": 0.0003970581542169247, "tps": 20603, "wall": 8594.5} {"step": 2702, "train_loss": 4.128720283508301, "lr": 0.00039705470370662534, "tps": 20599, "wall": 8599.5} {"step": 2703, "train_loss": 4.073971271514893, "lr": 0.0003970512511906408, "tps": 20594, "wall": 8604.6} {"step": 2704, "train_loss": 4.191133975982666, "lr": 0.00039704779666901004, "tps": 20589, "wall": 8610.0} {"step": 2705, "train_loss": 4.073030471801758, "lr": 0.00039704434014177227, "tps": 20583, "wall": 8615.7} {"step": 2706, "train_loss": 4.070072174072266, "lr": 0.00039704088160896664, "tps": 20578, "wall": 8620.9} {"step": 2707, "train_loss": 3.9824376106262207, "lr": 0.00039703742107063234, "tps": 20573, "wall": 8626.1} {"step": 2708, "train_loss": 4.135499477386475, "lr": 0.00039703395852680847, "tps": 20568, "wall": 8631.4} {"step": 2709, "train_loss": 3.9929304122924805, "lr": 0.0003970304939775344, "tps": 20563, "wall": 8636.8} {"step": 2710, "train_loss": 4.15130615234375, "lr": 0.0003970270274228494, "tps": 20557, "wall": 8642.5} {"step": 2711, "train_loss": 4.107576370239258, "lr": 0.00039702355886279256, "tps": 20552, "wall": 8647.6} {"step": 2712, "train_loss": 4.121581077575684, "lr": 0.0003970200882974033, "tps": 20548, "wall": 8652.7} {"step": 2713, "train_loss": 4.066164493560791, "lr": 0.00039701661572672084, "tps": 20543, "wall": 8657.9} {"step": 2714, "train_loss": 4.068453788757324, "lr": 0.0003970131411507847, "tps": 20538, "wall": 8663.2} {"step": 2715, "train_loss": 3.99413800239563, "lr": 0.00039700966456963406, "tps": 20534, "wall": 8668.3} {"step": 2716, "train_loss": 4.01097297668457, "lr": 0.00039700618598330833, "tps": 20529, "wall": 8673.5} {"step": 2717, "train_loss": 3.9874868392944336, "lr": 0.00039700270539184696, "tps": 20525, "wall": 8678.5} {"step": 2718, "train_loss": 4.094785213470459, "lr": 0.0003969992227952894, "tps": 20520, "wall": 8683.5} {"step": 2719, "train_loss": 4.017531394958496, "lr": 0.0003969957381936751, "tps": 20516, "wall": 8688.5} {"step": 2720, "train_loss": 3.918562889099121, "lr": 0.0003969922515870434, "tps": 20512, "wall": 8693.6} {"step": 2721, "train_loss": 3.996701717376709, "lr": 0.000396988762975434, "tps": 20507, "wall": 8698.6} {"step": 2722, "train_loss": 4.07423210144043, "lr": 0.0003969852723588863, "tps": 20503, "wall": 8703.6} {"step": 2723, "train_loss": 3.9308323860168457, "lr": 0.00039698177973743984, "tps": 20498, "wall": 8709.0} {"step": 2724, "train_loss": 4.165657043457031, "lr": 0.00039697828511113417, "tps": 20493, "wall": 8714.3} {"step": 2725, "train_loss": 3.914515495300293, "lr": 0.0003969747884800089, "tps": 20488, "wall": 8719.7} {"step": 2726, "train_loss": 4.149572849273682, "lr": 0.00039697128984410367, "tps": 20483, "wall": 8724.8} {"step": 2727, "train_loss": 4.06733512878418, "lr": 0.00039696778920345814, "tps": 20479, "wall": 8730.0} {"step": 2728, "train_loss": 4.109750747680664, "lr": 0.0003969642865581119, "tps": 20474, "wall": 8735.3} {"step": 2729, "train_loss": 4.019064903259277, "lr": 0.00039696078190810464, "tps": 20469, "wall": 8740.5} {"step": 2730, "train_loss": 4.020113945007324, "lr": 0.0003969572752534761, "tps": 20464, "wall": 8745.7} {"step": 2731, "train_loss": 4.11685848236084, "lr": 0.00039695376659426595, "tps": 20460, "wall": 8750.9} {"step": 2732, "train_loss": 4.025729179382324, "lr": 0.0003969502559305139, "tps": 20455, "wall": 8756.1} {"step": 2733, "train_loss": 4.149321556091309, "lr": 0.0003969467432622599, "tps": 20451, "wall": 8761.2} {"step": 2734, "train_loss": 4.067617893218994, "lr": 0.0003969432285895435, "tps": 20446, "wall": 8766.2} {"step": 2735, "train_loss": 4.076785087585449, "lr": 0.00039693971191240475, "tps": 20442, "wall": 8771.3} {"step": 2736, "train_loss": 4.040739059448242, "lr": 0.0003969361932308833, "tps": 20438, "wall": 8776.4} {"step": 2737, "train_loss": 4.062636375427246, "lr": 0.00039693267254501904, "tps": 20433, "wall": 8781.4} {"step": 2738, "train_loss": 4.037981033325195, "lr": 0.00039692914985485196, "tps": 20429, "wall": 8786.5} {"step": 2739, "train_loss": 4.037241458892822, "lr": 0.00039692562516042187, "tps": 20425, "wall": 8791.5} {"step": 2740, "train_loss": 4.076350212097168, "lr": 0.00039692209846176876, "tps": 20420, "wall": 8796.6} {"step": 2741, "train_loss": 4.041306972503662, "lr": 0.00039691856975893254, "tps": 20416, "wall": 8801.6} {"step": 2742, "train_loss": 4.03443717956543, "lr": 0.00039691503905195315, "tps": 20412, "wall": 8806.6} {"step": 2743, "train_loss": 4.055820465087891, "lr": 0.00039691150634087066, "tps": 20408, "wall": 8811.7} {"step": 2744, "train_loss": 4.052046298980713, "lr": 0.000396907971625725, "tps": 20403, "wall": 8816.8} {"step": 2745, "train_loss": 4.0942511558532715, "lr": 0.00039690443490655636, "tps": 20399, "wall": 8821.7} {"step": 2746, "train_loss": 3.9347710609436035, "lr": 0.00039690089618340467, "tps": 20395, "wall": 8826.7} {"step": 2747, "train_loss": 4.08039665222168, "lr": 0.00039689735545631006, "tps": 20391, "wall": 8831.7} {"step": 2748, "train_loss": 3.9550280570983887, "lr": 0.0003968938127253126, "tps": 20387, "wall": 8836.7} {"step": 2749, "train_loss": 4.0425615310668945, "lr": 0.00039689026799045253, "tps": 20383, "wall": 8841.6} {"step": 2750, "train_loss": 4.026216983795166, "lr": 0.0003968867212517699, "tps": 20379, "wall": 8846.6} {"step": 2751, "train_loss": 4.013617515563965, "lr": 0.0003968831725093049, "tps": 20375, "wall": 8851.6} {"step": 2752, "train_loss": 4.03089714050293, "lr": 0.00039687962176309776, "tps": 20371, "wall": 8856.5} {"step": 2753, "train_loss": 4.089290618896484, "lr": 0.0003968760690131887, "tps": 20367, "wall": 8861.5} {"step": 2754, "train_loss": 4.188794136047363, "lr": 0.000396872514259618, "tps": 20363, "wall": 8866.4} {"step": 2755, "train_loss": 4.091802597045898, "lr": 0.00039686895750242585, "tps": 20359, "wall": 8871.4} {"step": 2756, "train_loss": 4.033349514007568, "lr": 0.0003968653987416526, "tps": 20355, "wall": 8876.4} {"step": 2757, "train_loss": 4.048573017120361, "lr": 0.00039686183797733854, "tps": 20351, "wall": 8881.4} {"step": 2758, "train_loss": 4.0248870849609375, "lr": 0.000396858275209524, "tps": 20347, "wall": 8886.3} {"step": 2759, "train_loss": 4.112856388092041, "lr": 0.0003968547104382494, "tps": 20343, "wall": 8891.3} {"step": 2760, "train_loss": 4.023221015930176, "lr": 0.000396851143663555, "tps": 20339, "wall": 8896.3} {"step": 2761, "train_loss": 4.130871295928955, "lr": 0.00039684757488548126, "tps": 20335, "wall": 8901.3} {"step": 2762, "train_loss": 3.979839324951172, "lr": 0.00039684400410406874, "tps": 20331, "wall": 8906.3} {"step": 2763, "train_loss": 4.046543598175049, "lr": 0.0003968404313193577, "tps": 20327, "wall": 8911.3} {"step": 2764, "train_loss": 4.06415319442749, "lr": 0.00039683685653138864, "tps": 20323, "wall": 8916.3} {"step": 2765, "train_loss": 4.0005083084106445, "lr": 0.00039683327974020217, "tps": 20319, "wall": 8921.3} {"step": 2766, "train_loss": 4.085564613342285, "lr": 0.0003968297009458387, "tps": 20314, "wall": 8926.3} {"step": 2767, "train_loss": 4.0598368644714355, "lr": 0.0003968261201483389, "tps": 20310, "wall": 8931.4} {"step": 2768, "train_loss": 4.029268264770508, "lr": 0.0003968225373477432, "tps": 20306, "wall": 8936.4} {"step": 2769, "train_loss": 4.1094231605529785, "lr": 0.0003968189525440921, "tps": 20302, "wall": 8941.4} {"step": 2770, "train_loss": 4.060445785522461, "lr": 0.0003968153657374265, "tps": 20298, "wall": 8946.5} {"step": 2771, "train_loss": 3.9189364910125732, "lr": 0.0003968117769277868, "tps": 20294, "wall": 8951.5} {"step": 2772, "train_loss": 3.973763942718506, "lr": 0.00039680818611521375, "tps": 20290, "wall": 8956.5} {"step": 2773, "train_loss": 4.114893913269043, "lr": 0.00039680459329974804, "tps": 20286, "wall": 8961.7} {"step": 2774, "train_loss": 3.987306594848633, "lr": 0.0003968009984814303, "tps": 20281, "wall": 8966.8} {"step": 2775, "train_loss": 4.069343090057373, "lr": 0.0003967974016603012, "tps": 20277, "wall": 8972.0} {"step": 2776, "train_loss": 3.966001033782959, "lr": 0.00039679380283640174, "tps": 20273, "wall": 8977.1} {"step": 2777, "train_loss": 4.027435779571533, "lr": 0.0003967902020097724, "tps": 20269, "wall": 8982.1} {"step": 2778, "train_loss": 4.026635646820068, "lr": 0.0003967865991804541, "tps": 20264, "wall": 8987.2} {"step": 2779, "train_loss": 3.9860472679138184, "lr": 0.00039678299434848765, "tps": 20260, "wall": 8992.3} {"step": 2780, "train_loss": 3.9193289279937744, "lr": 0.00039677938751391385, "tps": 20256, "wall": 8997.4} {"step": 2781, "train_loss": 4.106559753417969, "lr": 0.00039677577867677365, "tps": 20252, "wall": 9002.4} {"step": 2782, "train_loss": 4.0439019203186035, "lr": 0.0003967721678371078, "tps": 20248, "wall": 9007.4} {"step": 2783, "train_loss": 4.145766258239746, "lr": 0.0003967685549949573, "tps": 20244, "wall": 9012.5} {"step": 2784, "train_loss": 4.085299968719482, "lr": 0.0003967649401503631, "tps": 20240, "wall": 9017.5} {"step": 2785, "train_loss": 4.065550327301025, "lr": 0.000396761323303366, "tps": 20236, "wall": 9022.7} {"step": 2786, "train_loss": 3.8896102905273438, "lr": 0.00039675770445400714, "tps": 20231, "wall": 9027.8} {"step": 2787, "train_loss": 4.117079734802246, "lr": 0.0003967540836023274, "tps": 20227, "wall": 9032.9} {"step": 2788, "train_loss": 4.06960391998291, "lr": 0.00039675046074836787, "tps": 20223, "wall": 9037.9} {"step": 2789, "train_loss": 4.130481719970703, "lr": 0.00039674683589216957, "tps": 20219, "wall": 9043.1} {"step": 2790, "train_loss": 4.006527423858643, "lr": 0.00039674320903377344, "tps": 20215, "wall": 9048.1} {"step": 2791, "train_loss": 4.115267753601074, "lr": 0.00039673958017322073, "tps": 20211, "wall": 9053.2} {"step": 2792, "train_loss": 4.0442795753479, "lr": 0.00039673594931055253, "tps": 20207, "wall": 9058.3} {"step": 2793, "train_loss": 3.988090991973877, "lr": 0.00039673231644580994, "tps": 20203, "wall": 9063.3} {"step": 2794, "train_loss": 4.042503356933594, "lr": 0.0003967286815790341, "tps": 20199, "wall": 9068.4} {"step": 2795, "train_loss": 4.143531799316406, "lr": 0.0003967250447102662, "tps": 20195, "wall": 9073.4} {"step": 2796, "train_loss": 3.9969472885131836, "lr": 0.00039672140583954735, "tps": 20191, "wall": 9078.5} {"step": 2797, "train_loss": 4.019280910491943, "lr": 0.0003967177649669189, "tps": 20187, "wall": 9083.5} {"step": 2798, "train_loss": 3.932133197784424, "lr": 0.0003967141220924221, "tps": 20182, "wall": 9088.6} {"step": 2799, "train_loss": 3.958923101425171, "lr": 0.00039671047721609817, "tps": 20178, "wall": 9093.7} {"step": 2800, "train_loss": 3.9715473651885986, "lr": 0.00039670683033798834, "tps": 20175, "wall": 9098.7} {"step": 2801, "train_loss": 4.003340721130371, "lr": 0.00039670318145813404, "tps": 20171, "wall": 9103.7} {"step": 2802, "train_loss": 4.056759357452393, "lr": 0.00039669953057657647, "tps": 20167, "wall": 9108.8} {"step": 2803, "train_loss": 3.968018054962158, "lr": 0.00039669587769335704, "tps": 20162, "wall": 9114.1} {"step": 2804, "train_loss": 4.116983413696289, "lr": 0.00039669222280851727, "tps": 20158, "wall": 9119.2} {"step": 2805, "train_loss": 3.9848904609680176, "lr": 0.0003966885659220983, "tps": 20154, "wall": 9124.3} {"step": 2806, "train_loss": 4.111847877502441, "lr": 0.0003966849070341418, "tps": 20150, "wall": 9129.4} {"step": 2807, "train_loss": 4.11598014831543, "lr": 0.00039668124614468907, "tps": 20146, "wall": 9134.5} {"step": 2808, "train_loss": 3.976900577545166, "lr": 0.00039667758325378165, "tps": 20141, "wall": 9139.7} {"step": 2809, "train_loss": 4.005825042724609, "lr": 0.00039667391836146094, "tps": 20137, "wall": 9144.8} {"step": 2810, "train_loss": 3.997913360595703, "lr": 0.00039667025146776855, "tps": 20133, "wall": 9150.0} {"step": 2811, "train_loss": 4.186008930206299, "lr": 0.000396666582572746, "tps": 20129, "wall": 9155.1} {"step": 2812, "train_loss": 4.058632850646973, "lr": 0.00039666291167643497, "tps": 20125, "wall": 9160.1} {"step": 2813, "train_loss": 3.966657876968384, "lr": 0.00039665923877887677, "tps": 20121, "wall": 9165.2} {"step": 2814, "train_loss": 3.9695091247558594, "lr": 0.0003966555638801132, "tps": 20117, "wall": 9170.2} {"step": 2815, "train_loss": 4.042957305908203, "lr": 0.00039665188698018584, "tps": 20113, "wall": 9175.3} {"step": 2816, "train_loss": 4.096163749694824, "lr": 0.0003966482080791364, "tps": 20109, "wall": 9180.4} {"step": 2817, "train_loss": 4.096490859985352, "lr": 0.0003966445271770064, "tps": 20105, "wall": 9185.4} {"step": 2818, "train_loss": 4.105997562408447, "lr": 0.0003966408442738377, "tps": 20101, "wall": 9190.6} {"step": 2819, "train_loss": 3.9967293739318848, "lr": 0.000396637159369672, "tps": 20097, "wall": 9195.6} {"step": 2820, "train_loss": 4.122483253479004, "lr": 0.00039663347246455096, "tps": 20093, "wall": 9200.7} {"step": 2821, "train_loss": 4.082848072052002, "lr": 0.00039662978355851637, "tps": 20089, "wall": 9205.7} {"step": 2822, "train_loss": 4.032491683959961, "lr": 0.00039662609265161004, "tps": 20085, "wall": 9210.9} {"step": 2823, "train_loss": 4.008533477783203, "lr": 0.0003966223997438738, "tps": 20081, "wall": 9216.1} {"step": 2824, "train_loss": 3.99185848236084, "lr": 0.00039661870483534943, "tps": 20077, "wall": 9221.2} {"step": 2825, "train_loss": 4.01675271987915, "lr": 0.0003966150079260788, "tps": 20073, "wall": 9226.2} {"step": 2826, "train_loss": 4.074446201324463, "lr": 0.0003966113090161039, "tps": 20069, "wall": 9231.3} {"step": 2827, "train_loss": 3.9860572814941406, "lr": 0.0003966076081054665, "tps": 20065, "wall": 9236.5} {"step": 2828, "train_loss": 3.9312593936920166, "lr": 0.00039660390519420847, "tps": 20061, "wall": 9241.6} {"step": 2829, "train_loss": 4.029815196990967, "lr": 0.00039660020028237195, "tps": 20057, "wall": 9246.9} {"step": 2830, "train_loss": 4.047301769256592, "lr": 0.00039659649336999875, "tps": 20052, "wall": 9252.1} {"step": 2831, "train_loss": 3.9538755416870117, "lr": 0.00039659278445713095, "tps": 20049, "wall": 9257.1} {"step": 2832, "train_loss": 4.037803649902344, "lr": 0.0003965890735438105, "tps": 20045, "wall": 9262.1} {"step": 2833, "train_loss": 4.115605354309082, "lr": 0.00039658536063007954, "tps": 20041, "wall": 9267.2} {"step": 2834, "train_loss": 4.108041763305664, "lr": 0.00039658164571598, "tps": 20037, "wall": 9272.1} {"step": 2835, "train_loss": 4.081705093383789, "lr": 0.00039657792880155407, "tps": 20034, "wall": 9277.1} {"step": 2836, "train_loss": 4.072104454040527, "lr": 0.00039657420988684376, "tps": 20030, "wall": 9282.1} {"step": 2837, "train_loss": 4.02387809753418, "lr": 0.0003965704889718913, "tps": 20026, "wall": 9287.1} {"step": 2838, "train_loss": 4.074963569641113, "lr": 0.00039656676605673877, "tps": 20023, "wall": 9292.1} {"step": 2839, "train_loss": 3.9943838119506836, "lr": 0.0003965630411414283, "tps": 20019, "wall": 9297.1} {"step": 2840, "train_loss": 3.9517693519592285, "lr": 0.00039655931422600226, "tps": 20015, "wall": 9302.1} {"step": 2841, "train_loss": 4.083695411682129, "lr": 0.0003965555853105027, "tps": 20012, "wall": 9307.1} {"step": 2842, "train_loss": 4.102719783782959, "lr": 0.0003965518543949719, "tps": 20008, "wall": 9312.0} {"step": 2843, "train_loss": 4.062747478485107, "lr": 0.0003965481214794521, "tps": 20004, "wall": 9317.0} {"step": 2844, "train_loss": 3.9507408142089844, "lr": 0.0003965443865639857, "tps": 20001, "wall": 9322.0} {"step": 2845, "train_loss": 4.115976810455322, "lr": 0.00039654064964861493, "tps": 19997, "wall": 9327.0} {"step": 2846, "train_loss": 4.100612640380859, "lr": 0.00039653691073338217, "tps": 19993, "wall": 9332.0} {"step": 2847, "train_loss": 4.020260810852051, "lr": 0.00039653316981832967, "tps": 19990, "wall": 9337.0} {"step": 2848, "train_loss": 4.025568962097168, "lr": 0.0003965294269034999, "tps": 19986, "wall": 9342.0} {"step": 2849, "train_loss": 3.9817452430725098, "lr": 0.00039652568198893516, "tps": 19982, "wall": 9347.0} {"step": 2850, "train_loss": 4.018677234649658, "lr": 0.0003965219350746781, "tps": 19978, "wall": 9352.1} {"step": 2851, "train_loss": 4.078397274017334, "lr": 0.0003965181861607709, "tps": 19975, "wall": 9357.1} {"step": 2852, "train_loss": 3.9808595180511475, "lr": 0.00039651443524725614, "tps": 19971, "wall": 9362.1} {"step": 2853, "train_loss": 4.046599388122559, "lr": 0.00039651068233417634, "tps": 19967, "wall": 9367.1} {"step": 2854, "train_loss": 3.9459328651428223, "lr": 0.000396506927421574, "tps": 19964, "wall": 9372.1} {"step": 2855, "train_loss": 4.084236145019531, "lr": 0.0003965031705094916, "tps": 19960, "wall": 9377.1} {"step": 2856, "train_loss": 4.088543891906738, "lr": 0.00039649941159797177, "tps": 19956, "wall": 9382.1} {"step": 2857, "train_loss": 3.9072189331054688, "lr": 0.000396495650687057, "tps": 19953, "wall": 9387.1} {"step": 2858, "train_loss": 3.9585208892822266, "lr": 0.0003964918877767899, "tps": 19949, "wall": 9392.1} {"step": 2859, "train_loss": 4.09077787399292, "lr": 0.0003964881228672132, "tps": 19945, "wall": 9397.1} {"step": 2860, "train_loss": 3.931493043899536, "lr": 0.00039648435595836956, "tps": 19942, "wall": 9402.1} {"step": 2861, "train_loss": 4.093856334686279, "lr": 0.00039648058705030154, "tps": 19938, "wall": 9407.1} {"step": 2862, "train_loss": 4.019756317138672, "lr": 0.00039647681614305195, "tps": 19934, "wall": 9412.2} {"step": 2863, "train_loss": 4.0178680419921875, "lr": 0.0003964730432366634, "tps": 19931, "wall": 9417.2} {"step": 2864, "train_loss": 4.0241827964782715, "lr": 0.0003964692683311786, "tps": 19926, "wall": 9422.5} {"step": 2865, "train_loss": 4.016561508178711, "lr": 0.00039646549142664046, "tps": 19922, "wall": 9427.8} {"step": 2866, "train_loss": 3.930361747741699, "lr": 0.00039646171252309166, "tps": 19918, "wall": 9433.1} {"step": 2867, "train_loss": 3.954681873321533, "lr": 0.00039645793162057497, "tps": 19914, "wall": 9438.3} {"step": 2868, "train_loss": 4.0725932121276855, "lr": 0.0003964541487191334, "tps": 19910, "wall": 9443.6} {"step": 2869, "train_loss": 3.949490547180176, "lr": 0.0003964503638188096, "tps": 19905, "wall": 9448.9} {"step": 2870, "train_loss": 4.070936679840088, "lr": 0.0003964465769196466, "tps": 19901, "wall": 9454.2} {"step": 2871, "train_loss": 4.022280693054199, "lr": 0.0003964427880216872, "tps": 19897, "wall": 9459.5} {"step": 2872, "train_loss": 3.952150821685791, "lr": 0.0003964389971249743, "tps": 19893, "wall": 9464.7} {"step": 2873, "train_loss": 3.9573731422424316, "lr": 0.00039643520422955096, "tps": 19889, "wall": 9470.0} {"step": 2874, "train_loss": 3.9195399284362793, "lr": 0.00039643140933546004, "tps": 19884, "wall": 9475.3} {"step": 2875, "train_loss": 4.097381114959717, "lr": 0.0003964276124427446, "tps": 19880, "wall": 9480.5} {"step": 2876, "train_loss": 3.9083871841430664, "lr": 0.00039642381355144764, "tps": 19877, "wall": 9485.5} {"step": 2877, "train_loss": 4.078124046325684, "lr": 0.0003964200126616122, "tps": 19873, "wall": 9490.5} {"step": 2878, "train_loss": 4.099825859069824, "lr": 0.0003964162097732813, "tps": 19870, "wall": 9495.5} {"step": 2879, "train_loss": 4.045320987701416, "lr": 0.00039641240488649793, "tps": 19866, "wall": 9500.5} {"step": 2880, "train_loss": 4.0463643074035645, "lr": 0.0003964085980013054, "tps": 19863, "wall": 9505.5} {"step": 2881, "train_loss": 4.114964485168457, "lr": 0.0003964047891177467, "tps": 19859, "wall": 9510.5} {"step": 2882, "train_loss": 3.991241931915283, "lr": 0.00039640097823586497, "tps": 19856, "wall": 9515.4} {"step": 2883, "train_loss": 4.0406646728515625, "lr": 0.00039639716535570346, "tps": 19852, "wall": 9520.4} {"step": 2884, "train_loss": 4.02249813079834, "lr": 0.00039639335047730526, "tps": 19849, "wall": 9525.4} {"step": 2885, "train_loss": 4.176736831665039, "lr": 0.0003963895336007137, "tps": 19845, "wall": 9530.3} {"step": 2886, "train_loss": 4.041242599487305, "lr": 0.00039638571472597195, "tps": 19842, "wall": 9535.3} {"step": 2887, "train_loss": 4.042850494384766, "lr": 0.00039638189385312326, "tps": 19838, "wall": 9540.3} {"step": 2888, "train_loss": 4.084381580352783, "lr": 0.00039637807098221096, "tps": 19835, "wall": 9545.3} {"step": 2889, "train_loss": 4.027762413024902, "lr": 0.0003963742461132783, "tps": 19831, "wall": 9550.2} {"step": 2890, "train_loss": 4.013782024383545, "lr": 0.0003963704192463687, "tps": 19828, "wall": 9555.2} {"step": 2891, "train_loss": 3.9610507488250732, "lr": 0.0003963665903815254, "tps": 19825, "wall": 9560.2} {"step": 2892, "train_loss": 4.041385650634766, "lr": 0.0003963627595187918, "tps": 19821, "wall": 9565.1} {"step": 2893, "train_loss": 4.035074710845947, "lr": 0.00039635892665821135, "tps": 19818, "wall": 9570.1} {"step": 2894, "train_loss": 4.060301303863525, "lr": 0.0003963550917998275, "tps": 19814, "wall": 9575.0} {"step": 2895, "train_loss": 4.037818431854248, "lr": 0.0003963512549436835, "tps": 19811, "wall": 9580.0} {"step": 2896, "train_loss": 4.135414123535156, "lr": 0.00039634741608982304, "tps": 19807, "wall": 9585.0} {"step": 2897, "train_loss": 4.005922317504883, "lr": 0.00039634357523828947, "tps": 19804, "wall": 9590.0} {"step": 2898, "train_loss": 3.9558496475219727, "lr": 0.00039633973238912634, "tps": 19800, "wall": 9595.0} {"step": 2899, "train_loss": 4.126834392547607, "lr": 0.0003963358875423772, "tps": 19797, "wall": 9599.9} {"step": 2900, "train_loss": 4.050032615661621, "lr": 0.0003963320406980856, "tps": 19794, "wall": 9604.9} {"step": 2901, "train_loss": 3.912724018096924, "lr": 0.000396328191856295, "tps": 19790, "wall": 9609.8} {"step": 2902, "train_loss": 4.00093936920166, "lr": 0.0003963243410170492, "tps": 19787, "wall": 9614.8} {"step": 2903, "train_loss": 4.096070766448975, "lr": 0.00039632048818039175, "tps": 19783, "wall": 9619.8} {"step": 2904, "train_loss": 3.9926276206970215, "lr": 0.0003963166333463662, "tps": 19780, "wall": 9624.7} {"step": 2905, "train_loss": 4.035971641540527, "lr": 0.00039631277651501636, "tps": 19777, "wall": 9629.7} {"step": 2906, "train_loss": 3.9711315631866455, "lr": 0.0003963089176863858, "tps": 19773, "wall": 9634.6} {"step": 2907, "train_loss": 4.014208793640137, "lr": 0.00039630505686051825, "tps": 19770, "wall": 9639.6} {"step": 2908, "train_loss": 4.010710716247559, "lr": 0.00039630119403745754, "tps": 19766, "wall": 9644.6} {"step": 2909, "train_loss": 4.097019672393799, "lr": 0.00039629732921724737, "tps": 19763, "wall": 9649.5} {"step": 2910, "train_loss": 4.013275623321533, "lr": 0.0003962934623999315, "tps": 19760, "wall": 9654.5} {"step": 2911, "train_loss": 3.897878408432007, "lr": 0.0003962895935855538, "tps": 19756, "wall": 9659.5} {"step": 2912, "train_loss": 3.9910459518432617, "lr": 0.000396285722774158, "tps": 19753, "wall": 9664.5} {"step": 2913, "train_loss": 4.073771953582764, "lr": 0.0003962818499657879, "tps": 19749, "wall": 9669.5} {"step": 2914, "train_loss": 3.99346923828125, "lr": 0.00039627797516048757, "tps": 19746, "wall": 9674.5} {"step": 2915, "train_loss": 4.041207313537598, "lr": 0.0003962740983583008, "tps": 19743, "wall": 9679.4} {"step": 2916, "train_loss": 3.9302124977111816, "lr": 0.0003962702195592714, "tps": 19739, "wall": 9684.4} {"step": 2917, "train_loss": 3.99703049659729, "lr": 0.00039626633876344356, "tps": 19736, "wall": 9689.4} {"step": 2918, "train_loss": 3.977095365524292, "lr": 0.0003962624559708611, "tps": 19733, "wall": 9694.3} {"step": 2919, "train_loss": 3.8906068801879883, "lr": 0.00039625857118156794, "tps": 19729, "wall": 9699.3} {"step": 2920, "train_loss": 3.9948320388793945, "lr": 0.00039625468439560813, "tps": 19726, "wall": 9704.2} {"step": 2921, "train_loss": 4.007579803466797, "lr": 0.0003962507956130258, "tps": 19723, "wall": 9709.2} {"step": 2922, "train_loss": 4.043657302856445, "lr": 0.00039624690483386484, "tps": 19719, "wall": 9714.3} {"step": 2923, "train_loss": 4.0213303565979, "lr": 0.00039624301205816947, "tps": 19716, "wall": 9719.2} {"step": 2924, "train_loss": 3.9442996978759766, "lr": 0.00039623911728598366, "tps": 19713, "wall": 9724.2} {"step": 2925, "train_loss": 3.8652946949005127, "lr": 0.0003962352205173516, "tps": 19709, "wall": 9729.1} {"step": 2926, "train_loss": 3.9243061542510986, "lr": 0.0003962313217523175, "tps": 19706, "wall": 9734.1} {"step": 2927, "train_loss": 4.020493984222412, "lr": 0.0003962274209909254, "tps": 19703, "wall": 9739.1} {"step": 2928, "train_loss": 4.016326904296875, "lr": 0.00039622351823321954, "tps": 19699, "wall": 9744.0} {"step": 2929, "train_loss": 4.030320167541504, "lr": 0.00039621961347924414, "tps": 19696, "wall": 9749.0} {"step": 2930, "train_loss": 4.050085544586182, "lr": 0.00039621570672904345, "tps": 19693, "wall": 9753.9} {"step": 2931, "train_loss": 3.9910473823547363, "lr": 0.0003962117979826617, "tps": 19689, "wall": 9758.9} {"step": 2932, "train_loss": 3.9436287879943848, "lr": 0.00039620788724014315, "tps": 19686, "wall": 9763.8} {"step": 2933, "train_loss": 4.025299549102783, "lr": 0.0003962039745015321, "tps": 19683, "wall": 9768.8} {"step": 2934, "train_loss": 4.110861301422119, "lr": 0.0003962000597668729, "tps": 19679, "wall": 9773.8} {"step": 2935, "train_loss": 4.061698913574219, "lr": 0.0003961961430362099, "tps": 19676, "wall": 9778.8} {"step": 2936, "train_loss": 4.018675804138184, "lr": 0.00039619222430958747, "tps": 19673, "wall": 9783.7} {"step": 2937, "train_loss": 4.055974960327148, "lr": 0.00039618830358704993, "tps": 19670, "wall": 9788.7} {"step": 2938, "train_loss": 4.044171333312988, "lr": 0.00039618438086864186, "tps": 19666, "wall": 9793.6} {"step": 2939, "train_loss": 4.053878307342529, "lr": 0.00039618045615440753, "tps": 19663, "wall": 9798.6} {"step": 2940, "train_loss": 4.061960220336914, "lr": 0.0003961765294443915, "tps": 19660, "wall": 9803.5} {"step": 2941, "train_loss": 3.9307849407196045, "lr": 0.0003961726007386382, "tps": 19657, "wall": 9808.5} {"step": 2942, "train_loss": 3.9807238578796387, "lr": 0.00039616867003719214, "tps": 19653, "wall": 9813.4} {"step": 2943, "train_loss": 3.9917151927948, "lr": 0.00039616473734009784, "tps": 19650, "wall": 9818.4} {"step": 2944, "train_loss": 3.94413685798645, "lr": 0.0003961608026473999, "tps": 19647, "wall": 9823.4} {"step": 2945, "train_loss": 3.950863838195801, "lr": 0.0003961568659591428, "tps": 19644, "wall": 9828.3} {"step": 2946, "train_loss": 3.990994453430176, "lr": 0.0003961529272753712, "tps": 19640, "wall": 9833.3} {"step": 2947, "train_loss": 3.9582090377807617, "lr": 0.0003961489865961298, "tps": 19637, "wall": 9838.3} {"step": 2948, "train_loss": 4.032408714294434, "lr": 0.000396145043921463, "tps": 19634, "wall": 9843.2} {"step": 2949, "train_loss": 4.014595031738281, "lr": 0.00039614109925141576, "tps": 19631, "wall": 9848.2} {"step": 2950, "train_loss": 4.0647125244140625, "lr": 0.0003961371525860326, "tps": 19627, "wall": 9853.1} {"step": 2951, "train_loss": 3.975280284881592, "lr": 0.0003961332039253582, "tps": 19624, "wall": 9858.1} {"step": 2952, "train_loss": 4.046900749206543, "lr": 0.0003961292532694373, "tps": 19621, "wall": 9863.0} {"step": 2953, "train_loss": 3.897045135498047, "lr": 0.00039612530061831474, "tps": 19618, "wall": 9868.0} {"step": 2954, "train_loss": 3.9577903747558594, "lr": 0.00039612134597203524, "tps": 19615, "wall": 9873.0} {"step": 2955, "train_loss": 3.915191650390625, "lr": 0.00039611738933064365, "tps": 19611, "wall": 9877.9} {"step": 2956, "train_loss": 3.952733039855957, "lr": 0.00039611343069418466, "tps": 19608, "wall": 9882.9} {"step": 2957, "train_loss": 3.960296869277954, "lr": 0.0003961094700627033, "tps": 19605, "wall": 9887.8} {"step": 2958, "train_loss": 4.019873142242432, "lr": 0.00039610550743624423, "tps": 19602, "wall": 9892.9} {"step": 2959, "train_loss": 3.9714674949645996, "lr": 0.0003961015428148525, "tps": 19598, "wall": 9897.8} {"step": 2960, "train_loss": 3.9833145141601562, "lr": 0.000396097576198573, "tps": 19595, "wall": 9902.7} {"step": 2961, "train_loss": 3.9897308349609375, "lr": 0.00039609360758745054, "tps": 19592, "wall": 9907.8} {"step": 2962, "train_loss": 4.091950416564941, "lr": 0.0003960896369815302, "tps": 19589, "wall": 9912.8} {"step": 2963, "train_loss": 3.9559473991394043, "lr": 0.00039608566438085693, "tps": 19586, "wall": 9917.7} {"step": 2964, "train_loss": 3.9658589363098145, "lr": 0.00039608168978547576, "tps": 19582, "wall": 9922.7} {"step": 2965, "train_loss": 3.9761931896209717, "lr": 0.00039607771319543164, "tps": 19579, "wall": 9927.6} {"step": 2966, "train_loss": 4.00921630859375, "lr": 0.00039607373461076966, "tps": 19576, "wall": 9932.6} {"step": 2967, "train_loss": 3.9951701164245605, "lr": 0.00039606975403153494, "tps": 19573, "wall": 9937.5} {"step": 2968, "train_loss": 3.8799707889556885, "lr": 0.00039606577145777247, "tps": 19570, "wall": 9942.5} {"step": 2969, "train_loss": 3.950227975845337, "lr": 0.00039606178688952746, "tps": 19567, "wall": 9947.4} {"step": 2970, "train_loss": 3.899026870727539, "lr": 0.00039605780032684495, "tps": 19563, "wall": 9952.4} {"step": 2971, "train_loss": 4.07706880569458, "lr": 0.00039605381176977016, "tps": 19560, "wall": 9957.4} {"step": 2972, "train_loss": 3.929563283920288, "lr": 0.0003960498212183483, "tps": 19557, "wall": 9962.3} {"step": 2973, "train_loss": 4.099765300750732, "lr": 0.0003960458286726246, "tps": 19554, "wall": 9967.3} {"step": 2974, "train_loss": 3.9743285179138184, "lr": 0.0003960418341326441, "tps": 19551, "wall": 9972.2} {"step": 2975, "train_loss": 3.995162010192871, "lr": 0.00039603783759845226, "tps": 19548, "wall": 9977.2} {"step": 2976, "train_loss": 3.9996871948242188, "lr": 0.0003960338390700943, "tps": 19544, "wall": 9982.1} {"step": 2977, "train_loss": 3.9057116508483887, "lr": 0.0003960298385476154, "tps": 19541, "wall": 9987.1} {"step": 2978, "train_loss": 4.073807716369629, "lr": 0.00039602583603106094, "tps": 19538, "wall": 9992.0} {"step": 2979, "train_loss": 3.9407927989959717, "lr": 0.0003960218315204764, "tps": 19535, "wall": 9997.0} {"step": 2980, "train_loss": 4.012510776519775, "lr": 0.00039601782501590696, "tps": 19532, "wall": 10001.9} {"step": 2981, "train_loss": 3.9245080947875977, "lr": 0.00039601381651739815, "tps": 19529, "wall": 10006.9} {"step": 2982, "train_loss": 4.039052963256836, "lr": 0.00039600980602499524, "tps": 19526, "wall": 10011.9} {"step": 2983, "train_loss": 3.9676833152770996, "lr": 0.0003960057935387437, "tps": 19523, "wall": 10016.8} {"step": 2984, "train_loss": 3.9569807052612305, "lr": 0.000396001779058689, "tps": 19520, "wall": 10021.8} {"step": 2985, "train_loss": 3.9655632972717285, "lr": 0.0003959977625848767, "tps": 19516, "wall": 10026.7} {"step": 2986, "train_loss": 4.062266826629639, "lr": 0.0003959937441173522, "tps": 19513, "wall": 10031.7} {"step": 2987, "train_loss": 4.075193405151367, "lr": 0.000395989723656161, "tps": 19510, "wall": 10036.7} {"step": 2988, "train_loss": 4.082204341888428, "lr": 0.0003959857012013488, "tps": 19507, "wall": 10041.6} {"step": 2989, "train_loss": 4.049567699432373, "lr": 0.00039598167675296096, "tps": 19504, "wall": 10046.6} {"step": 2990, "train_loss": 3.924766778945923, "lr": 0.00039597765031104324, "tps": 19501, "wall": 10051.5} {"step": 2991, "train_loss": 4.01870059967041, "lr": 0.0003959736218756411, "tps": 19498, "wall": 10056.5} {"step": 2992, "train_loss": 3.9633517265319824, "lr": 0.00039596959144680026, "tps": 19495, "wall": 10061.4} {"step": 2993, "train_loss": 4.039804935455322, "lr": 0.0003959655590245664, "tps": 19492, "wall": 10066.4} {"step": 2994, "train_loss": 3.97190523147583, "lr": 0.00039596152460898517, "tps": 19489, "wall": 10071.3} {"step": 2995, "train_loss": 3.9377617835998535, "lr": 0.00039595748820010226, "tps": 19485, "wall": 10076.4} {"step": 2996, "train_loss": 4.054714679718018, "lr": 0.00039595344979796336, "tps": 19482, "wall": 10081.3} {"step": 2997, "train_loss": 3.9137015342712402, "lr": 0.0003959494094026143, "tps": 19479, "wall": 10086.3} {"step": 2998, "train_loss": 4.12202262878418, "lr": 0.0003959453670141008, "tps": 19476, "wall": 10091.3} {"step": 2999, "train_loss": 4.030705451965332, "lr": 0.0003959413226324687, "tps": 19473, "wall": 10096.2} {"step": 3000, "train_loss": 4.044322490692139, "lr": 0.0003959372762577638, "tps": 19470, "wall": 10101.3, "val_loss_monitor": 3.9998098617932447} {"step": 3001, "train_loss": 3.9022278785705566, "lr": 0.0003959332278900318, "tps": 19374, "wall": 10154.4} {"step": 3002, "train_loss": 3.9491772651672363, "lr": 0.00039592917752931877, "tps": 19371, "wall": 10159.4} {"step": 3003, "train_loss": 3.912604808807373, "lr": 0.0003959251251756705, "tps": 19368, "wall": 10164.4} {"step": 3004, "train_loss": 4.022930145263672, "lr": 0.00039592107082913285, "tps": 19365, "wall": 10169.3} {"step": 3005, "train_loss": 3.926271915435791, "lr": 0.00039591701448975187, "tps": 19362, "wall": 10174.3} {"step": 3006, "train_loss": 4.074603080749512, "lr": 0.0003959129561575733, "tps": 19359, "wall": 10179.3} {"step": 3007, "train_loss": 4.064314842224121, "lr": 0.00039590889583264335, "tps": 19356, "wall": 10184.2} {"step": 3008, "train_loss": 4.01746129989624, "lr": 0.0003959048335150079, "tps": 19353, "wall": 10189.2} {"step": 3009, "train_loss": 3.9681572914123535, "lr": 0.000395900769204713, "tps": 19350, "wall": 10194.3} {"step": 3010, "train_loss": 3.924126148223877, "lr": 0.0003958967029018046, "tps": 19347, "wall": 10199.3} {"step": 3011, "train_loss": 4.020236015319824, "lr": 0.0003958926346063288, "tps": 19344, "wall": 10204.3} {"step": 3012, "train_loss": 3.8239967823028564, "lr": 0.0003958885643183318, "tps": 19341, "wall": 10209.2} {"step": 3013, "train_loss": 4.034412384033203, "lr": 0.00039588449203785967, "tps": 19338, "wall": 10214.2} {"step": 3014, "train_loss": 3.979462146759033, "lr": 0.0003958804177649584, "tps": 19335, "wall": 10219.2} {"step": 3015, "train_loss": 3.90427565574646, "lr": 0.0003958763414996743, "tps": 19332, "wall": 10224.2} {"step": 3016, "train_loss": 3.8812665939331055, "lr": 0.0003958722632420535, "tps": 19329, "wall": 10229.3} {"step": 3017, "train_loss": 3.9341769218444824, "lr": 0.0003958681829921421, "tps": 19326, "wall": 10234.2} {"step": 3018, "train_loss": 3.9037349224090576, "lr": 0.00039586410074998654, "tps": 19323, "wall": 10239.2} {"step": 3019, "train_loss": 3.980360507965088, "lr": 0.0003958600165156328, "tps": 19320, "wall": 10244.2} {"step": 3020, "train_loss": 4.020113468170166, "lr": 0.00039585593028912744, "tps": 19317, "wall": 10249.1} {"step": 3021, "train_loss": 4.107637882232666, "lr": 0.00039585184207051647, "tps": 19314, "wall": 10254.1} {"step": 3022, "train_loss": 3.990920066833496, "lr": 0.0003958477518598463, "tps": 19311, "wall": 10259.1} {"step": 3023, "train_loss": 4.097112655639648, "lr": 0.00039584365965716336, "tps": 19308, "wall": 10264.1} {"step": 3024, "train_loss": 3.9563121795654297, "lr": 0.00039583956546251393, "tps": 19305, "wall": 10269.1} {"step": 3025, "train_loss": 3.9944651126861572, "lr": 0.0003958354692759443, "tps": 19302, "wall": 10274.0} {"step": 3026, "train_loss": 4.026609897613525, "lr": 0.00039583137109750106, "tps": 19299, "wall": 10279.0} {"step": 3027, "train_loss": 3.961238384246826, "lr": 0.0003958272709272305, "tps": 19296, "wall": 10284.0} {"step": 3028, "train_loss": 3.952116012573242, "lr": 0.0003958231687651791, "tps": 19293, "wall": 10288.9} {"step": 3029, "train_loss": 3.9731838703155518, "lr": 0.00039581906461139333, "tps": 19290, "wall": 10293.9} {"step": 3030, "train_loss": 3.9725067615509033, "lr": 0.00039581495846591967, "tps": 19287, "wall": 10298.9} {"step": 3031, "train_loss": 3.978015899658203, "lr": 0.0003958108503288046, "tps": 19284, "wall": 10303.8} {"step": 3032, "train_loss": 4.095431804656982, "lr": 0.0003958067402000948, "tps": 19281, "wall": 10308.8} {"step": 3033, "train_loss": 3.989809513092041, "lr": 0.00039580262807983673, "tps": 19278, "wall": 10313.8} {"step": 3034, "train_loss": 3.9612369537353516, "lr": 0.00039579851396807697, "tps": 19275, "wall": 10318.8} {"step": 3035, "train_loss": 3.992584228515625, "lr": 0.0003957943978648621, "tps": 19272, "wall": 10323.8} {"step": 3036, "train_loss": 4.023238182067871, "lr": 0.00039579027977023874, "tps": 19269, "wall": 10328.7} {"step": 3037, "train_loss": 3.9126088619232178, "lr": 0.0003957861596842537, "tps": 19266, "wall": 10333.7} {"step": 3038, "train_loss": 3.99440336227417, "lr": 0.0003957820376069534, "tps": 19264, "wall": 10338.6} {"step": 3039, "train_loss": 4.003018379211426, "lr": 0.0003957779135383848, "tps": 19261, "wall": 10343.6} {"step": 3040, "train_loss": 3.990432024002075, "lr": 0.0003957737874785944, "tps": 19258, "wall": 10348.6} {"step": 3041, "train_loss": 4.023116111755371, "lr": 0.0003957696594276291, "tps": 19255, "wall": 10353.5} {"step": 3042, "train_loss": 3.9159276485443115, "lr": 0.0003957655293855355, "tps": 19252, "wall": 10358.5} {"step": 3043, "train_loss": 3.9789299964904785, "lr": 0.00039576139735236055, "tps": 19249, "wall": 10363.4} {"step": 3044, "train_loss": 3.878085136413574, "lr": 0.0003957572633281509, "tps": 19246, "wall": 10368.4} {"step": 3045, "train_loss": 4.027951717376709, "lr": 0.00039575312731295357, "tps": 19243, "wall": 10373.4} {"step": 3046, "train_loss": 3.983912944793701, "lr": 0.0003957489893068152, "tps": 19240, "wall": 10378.4} {"step": 3047, "train_loss": 3.942775249481201, "lr": 0.00039574484930978283, "tps": 19237, "wall": 10383.4} {"step": 3048, "train_loss": 3.9353551864624023, "lr": 0.0003957407073219033, "tps": 19235, "wall": 10388.3} {"step": 3049, "train_loss": 4.01697301864624, "lr": 0.0003957365633432235, "tps": 19232, "wall": 10393.3} {"step": 3050, "train_loss": 3.9841670989990234, "lr": 0.00039573241737379046, "tps": 19229, "wall": 10398.3} {"step": 3051, "train_loss": 4.108656406402588, "lr": 0.000395728269413651, "tps": 19226, "wall": 10403.2} {"step": 3052, "train_loss": 3.97402286529541, "lr": 0.00039572411946285223, "tps": 19223, "wall": 10408.2} {"step": 3053, "train_loss": 3.9663174152374268, "lr": 0.00039571996752144116, "tps": 19220, "wall": 10413.1} {"step": 3054, "train_loss": 4.022403717041016, "lr": 0.0003957158135894647, "tps": 19217, "wall": 10418.1} {"step": 3055, "train_loss": 3.978501796722412, "lr": 0.0003957116576669702, "tps": 19214, "wall": 10423.0} {"step": 3056, "train_loss": 4.016330718994141, "lr": 0.00039570749975400437, "tps": 19212, "wall": 10428.0} {"step": 3057, "train_loss": 3.8597917556762695, "lr": 0.0003957033398506145, "tps": 19209, "wall": 10433.0} {"step": 3058, "train_loss": 3.9355902671813965, "lr": 0.0003956991779568477, "tps": 19206, "wall": 10437.9} {"step": 3059, "train_loss": 4.078261852264404, "lr": 0.00039569501407275116, "tps": 19203, "wall": 10442.9} {"step": 3060, "train_loss": 3.934722423553467, "lr": 0.0003956908481983719, "tps": 19200, "wall": 10447.8} {"step": 3061, "train_loss": 4.046703815460205, "lr": 0.0003956866803337573, "tps": 19197, "wall": 10452.8} {"step": 3062, "train_loss": 3.8641159534454346, "lr": 0.0003956825104789544, "tps": 19194, "wall": 10457.8} {"step": 3063, "train_loss": 3.985430955886841, "lr": 0.0003956783386340106, "tps": 19192, "wall": 10462.7} {"step": 3064, "train_loss": 4.020411491394043, "lr": 0.000395674164798973, "tps": 19189, "wall": 10467.7} {"step": 3065, "train_loss": 3.9033029079437256, "lr": 0.00039566998897388897, "tps": 19186, "wall": 10472.7} {"step": 3066, "train_loss": 4.025549411773682, "lr": 0.00039566581115880583, "tps": 19183, "wall": 10477.6} {"step": 3067, "train_loss": 4.016595363616943, "lr": 0.0003956616313537709, "tps": 19180, "wall": 10482.6} {"step": 3068, "train_loss": 4.064723014831543, "lr": 0.0003956574495588315, "tps": 19177, "wall": 10487.6} {"step": 3069, "train_loss": 3.943565845489502, "lr": 0.00039565326577403493, "tps": 19175, "wall": 10492.6} {"step": 3070, "train_loss": 4.032164573669434, "lr": 0.00039564907999942877, "tps": 19172, "wall": 10497.5} {"step": 3071, "train_loss": 4.061458110809326, "lr": 0.00039564489223506026, "tps": 19169, "wall": 10502.5} {"step": 3072, "train_loss": 3.9533448219299316, "lr": 0.0003956407024809769, "tps": 19166, "wall": 10507.4} {"step": 3073, "train_loss": 4.005331039428711, "lr": 0.00039563651073722616, "tps": 19163, "wall": 10512.4} {"step": 3074, "train_loss": 4.055492877960205, "lr": 0.00039563231700385555, "tps": 19161, "wall": 10517.3} {"step": 3075, "train_loss": 3.965416431427002, "lr": 0.0003956281212809126, "tps": 19158, "wall": 10522.2} {"step": 3076, "train_loss": 3.971097469329834, "lr": 0.0003956239235684447, "tps": 19155, "wall": 10527.2} {"step": 3077, "train_loss": 3.9210762977600098, "lr": 0.00039561972386649956, "tps": 19152, "wall": 10532.2} {"step": 3078, "train_loss": 4.115189552307129, "lr": 0.00039561552217512463, "tps": 19149, "wall": 10537.1} {"step": 3079, "train_loss": 3.978853702545166, "lr": 0.0003956113184943676, "tps": 19147, "wall": 10542.1} {"step": 3080, "train_loss": 3.96323299407959, "lr": 0.0003956071128242761, "tps": 19144, "wall": 10547.0} {"step": 3081, "train_loss": 4.029781818389893, "lr": 0.0003956029051648976, "tps": 19141, "wall": 10552.1} {"step": 3082, "train_loss": 3.940669059753418, "lr": 0.00039559869551628, "tps": 19138, "wall": 10557.1} {"step": 3083, "train_loss": 3.95369553565979, "lr": 0.0003955944838784708, "tps": 19135, "wall": 10562.0} {"step": 3084, "train_loss": 4.028532028198242, "lr": 0.00039559027025151786, "tps": 19133, "wall": 10566.9} {"step": 3085, "train_loss": 3.9706063270568848, "lr": 0.00039558605463546885, "tps": 19130, "wall": 10571.9} {"step": 3086, "train_loss": 3.9632012844085693, "lr": 0.00039558183703037144, "tps": 19127, "wall": 10576.8} {"step": 3087, "train_loss": 3.865417003631592, "lr": 0.00039557761743627353, "tps": 19124, "wall": 10581.8} {"step": 3088, "train_loss": 4.051373481750488, "lr": 0.00039557339585322284, "tps": 19122, "wall": 10586.7} {"step": 3089, "train_loss": 4.046409606933594, "lr": 0.0003955691722812672, "tps": 19119, "wall": 10591.7} {"step": 3090, "train_loss": 3.972705125808716, "lr": 0.0003955649467204546, "tps": 19116, "wall": 10596.6} {"step": 3091, "train_loss": 3.9593617916107178, "lr": 0.00039556071917083263, "tps": 19113, "wall": 10601.6} {"step": 3092, "train_loss": 4.0850629806518555, "lr": 0.0003955564896324494, "tps": 19111, "wall": 10606.5} {"step": 3093, "train_loss": 3.9546077251434326, "lr": 0.0003955522581053528, "tps": 19108, "wall": 10611.5} {"step": 3094, "train_loss": 4.002862453460693, "lr": 0.0003955480245895907, "tps": 19105, "wall": 10616.4} {"step": 3095, "train_loss": 4.050102710723877, "lr": 0.00039554378908521106, "tps": 19102, "wall": 10621.4} {"step": 3096, "train_loss": 3.9695026874542236, "lr": 0.00039553955159226187, "tps": 19100, "wall": 10626.3} {"step": 3097, "train_loss": 3.9650588035583496, "lr": 0.0003955353121107912, "tps": 19097, "wall": 10631.3} {"step": 3098, "train_loss": 4.059099197387695, "lr": 0.0003955310706408469, "tps": 19094, "wall": 10636.2} {"step": 3099, "train_loss": 3.8974459171295166, "lr": 0.0003955268271824773, "tps": 19092, "wall": 10641.2} {"step": 3100, "train_loss": 3.960806131362915, "lr": 0.00039552258173573016, "tps": 19089, "wall": 10646.1} {"step": 3101, "train_loss": 3.967899799346924, "lr": 0.0003955183343006538, "tps": 19086, "wall": 10651.0} {"step": 3102, "train_loss": 3.9931108951568604, "lr": 0.00039551408487729624, "tps": 19083, "wall": 10656.0} {"step": 3103, "train_loss": 3.9812521934509277, "lr": 0.00039550983346570563, "tps": 19081, "wall": 10660.9} {"step": 3104, "train_loss": 3.9467904567718506, "lr": 0.0003955055800659301, "tps": 19078, "wall": 10665.9} {"step": 3105, "train_loss": 4.001926898956299, "lr": 0.0003955013246780179, "tps": 19075, "wall": 10670.8} {"step": 3106, "train_loss": 3.9583539962768555, "lr": 0.0003954970673020172, "tps": 19073, "wall": 10675.8} {"step": 3107, "train_loss": 3.874453067779541, "lr": 0.00039549280793797623, "tps": 19070, "wall": 10680.8} {"step": 3108, "train_loss": 3.8878698348999023, "lr": 0.0003954885465859432, "tps": 19067, "wall": 10685.7} {"step": 3109, "train_loss": 4.023602485656738, "lr": 0.0003954842832459665, "tps": 19064, "wall": 10690.7} {"step": 3110, "train_loss": 4.00429105758667, "lr": 0.0003954800179180943, "tps": 19062, "wall": 10695.6} {"step": 3111, "train_loss": 3.908149480819702, "lr": 0.0003954757506023749, "tps": 19059, "wall": 10700.6} {"step": 3112, "train_loss": 3.9819693565368652, "lr": 0.0003954714812988568, "tps": 19056, "wall": 10705.5} {"step": 3113, "train_loss": 4.00736665725708, "lr": 0.0003954672100075882, "tps": 19054, "wall": 10710.5} {"step": 3114, "train_loss": 3.9321184158325195, "lr": 0.00039546293672861754, "tps": 19051, "wall": 10715.4} {"step": 3115, "train_loss": 4.028239727020264, "lr": 0.0003954586614619933, "tps": 19048, "wall": 10720.4} {"step": 3116, "train_loss": 3.9059009552001953, "lr": 0.00039545438420776386, "tps": 19046, "wall": 10725.3} {"step": 3117, "train_loss": 3.971470594406128, "lr": 0.00039545010496597763, "tps": 19043, "wall": 10730.3} {"step": 3118, "train_loss": 4.114142417907715, "lr": 0.0003954458237366831, "tps": 19040, "wall": 10735.3} {"step": 3119, "train_loss": 3.9249510765075684, "lr": 0.0003954415405199288, "tps": 19037, "wall": 10740.2} {"step": 3120, "train_loss": 3.999994993209839, "lr": 0.00039543725531576327, "tps": 19035, "wall": 10745.2} {"step": 3121, "train_loss": 3.9813990592956543, "lr": 0.000395432968124235, "tps": 19032, "wall": 10750.1} {"step": 3122, "train_loss": 3.8615286350250244, "lr": 0.00039542867894539255, "tps": 19029, "wall": 10755.1} {"step": 3123, "train_loss": 3.95510196685791, "lr": 0.0003954243877792846, "tps": 19027, "wall": 10760.0} {"step": 3124, "train_loss": 3.9600167274475098, "lr": 0.00039542009462595963, "tps": 19024, "wall": 10765.0} {"step": 3125, "train_loss": 3.979935884475708, "lr": 0.00039541579948546636, "tps": 19021, "wall": 10770.0} {"step": 3126, "train_loss": 3.9673190116882324, "lr": 0.0003954115023578534, "tps": 19019, "wall": 10774.9} {"step": 3127, "train_loss": 3.963939666748047, "lr": 0.0003954072032431696, "tps": 19016, "wall": 10779.9} {"step": 3128, "train_loss": 3.986672878265381, "lr": 0.0003954029021414633, "tps": 19013, "wall": 10784.8} {"step": 3129, "train_loss": 3.940232753753662, "lr": 0.00039539859905278355, "tps": 19011, "wall": 10789.8} {"step": 3130, "train_loss": 4.021617889404297, "lr": 0.000395394293977179, "tps": 19008, "wall": 10794.8} {"step": 3131, "train_loss": 4.019092559814453, "lr": 0.00039538998691469835, "tps": 19005, "wall": 10799.7} {"step": 3132, "train_loss": 3.973452568054199, "lr": 0.0003953856778653904, "tps": 19003, "wall": 10804.7} {"step": 3133, "train_loss": 3.867791175842285, "lr": 0.00039538136682930406, "tps": 19000, "wall": 10809.6} {"step": 3134, "train_loss": 3.9554505348205566, "lr": 0.0003953770538064881, "tps": 18998, "wall": 10814.6} {"step": 3135, "train_loss": 3.983187198638916, "lr": 0.00039537273879699137, "tps": 18995, "wall": 10819.5} {"step": 3136, "train_loss": 3.967040538787842, "lr": 0.0003953684218008628, "tps": 18992, "wall": 10824.4} {"step": 3137, "train_loss": 4.083669662475586, "lr": 0.00039536410281815123, "tps": 18990, "wall": 10829.4} {"step": 3138, "train_loss": 4.060785293579102, "lr": 0.0003953597818489056, "tps": 18987, "wall": 10834.3} {"step": 3139, "train_loss": 4.015509605407715, "lr": 0.00039535545889317494, "tps": 18984, "wall": 10839.3} {"step": 3140, "train_loss": 3.9196524620056152, "lr": 0.0003953511339510081, "tps": 18982, "wall": 10844.2} {"step": 3141, "train_loss": 3.8795056343078613, "lr": 0.00039534680702245416, "tps": 18979, "wall": 10849.2} {"step": 3142, "train_loss": 3.9494857788085938, "lr": 0.0003953424781075621, "tps": 18976, "wall": 10854.2} {"step": 3143, "train_loss": 3.9159183502197266, "lr": 0.00039533814720638094, "tps": 18974, "wall": 10859.1} {"step": 3144, "train_loss": 4.032013416290283, "lr": 0.00039533381431895975, "tps": 18971, "wall": 10864.1} {"step": 3145, "train_loss": 3.954308032989502, "lr": 0.0003953294794453477, "tps": 18969, "wall": 10869.1} {"step": 3146, "train_loss": 3.9983129501342773, "lr": 0.0003953251425855937, "tps": 18966, "wall": 10874.1} {"step": 3147, "train_loss": 4.116816997528076, "lr": 0.0003953208037397471, "tps": 18963, "wall": 10879.0} {"step": 3148, "train_loss": 4.010399341583252, "lr": 0.00039531646290785695, "tps": 18961, "wall": 10883.9} {"step": 3149, "train_loss": 3.952241897583008, "lr": 0.0003953121200899724, "tps": 18958, "wall": 10888.9} {"step": 3150, "train_loss": 3.963326930999756, "lr": 0.0003953077752861427, "tps": 18956, "wall": 10893.8} {"step": 3151, "train_loss": 3.883603811264038, "lr": 0.00039530342849641696, "tps": 18953, "wall": 10898.8} {"step": 3152, "train_loss": 3.994476318359375, "lr": 0.00039529907972084456, "tps": 18950, "wall": 10903.7} {"step": 3153, "train_loss": 3.9721055030822754, "lr": 0.0003952947289594747, "tps": 18948, "wall": 10908.7} {"step": 3154, "train_loss": 4.044678688049316, "lr": 0.00039529037621235664, "tps": 18945, "wall": 10913.7} {"step": 3155, "train_loss": 3.9540185928344727, "lr": 0.00039528602147953973, "tps": 18942, "wall": 10918.6} {"step": 3156, "train_loss": 3.992236375808716, "lr": 0.00039528166476107327, "tps": 18940, "wall": 10923.6} {"step": 3157, "train_loss": 3.989716053009033, "lr": 0.0003952773060570066, "tps": 18937, "wall": 10928.6} {"step": 3158, "train_loss": 3.8953349590301514, "lr": 0.0003952729453673892, "tps": 18935, "wall": 10933.6} {"step": 3159, "train_loss": 3.9612245559692383, "lr": 0.0003952685826922704, "tps": 18932, "wall": 10938.5} {"step": 3160, "train_loss": 3.9533512592315674, "lr": 0.0003952642180316995, "tps": 18930, "wall": 10943.4} {"step": 3161, "train_loss": 4.031001567840576, "lr": 0.00039525985138572615, "tps": 18927, "wall": 10948.4} {"step": 3162, "train_loss": 3.9385948181152344, "lr": 0.0003952554827543997, "tps": 18924, "wall": 10953.3} {"step": 3163, "train_loss": 3.972513198852539, "lr": 0.00039525111213776967, "tps": 18922, "wall": 10958.3} {"step": 3164, "train_loss": 3.9525375366210938, "lr": 0.0003952467395358856, "tps": 18919, "wall": 10963.2} {"step": 3165, "train_loss": 3.962371349334717, "lr": 0.0003952423649487969, "tps": 18917, "wall": 10968.2} {"step": 3166, "train_loss": 3.9965081214904785, "lr": 0.00039523798837655323, "tps": 18914, "wall": 10973.2} {"step": 3167, "train_loss": 3.883251190185547, "lr": 0.0003952336098192042, "tps": 18911, "wall": 10978.2} {"step": 3168, "train_loss": 3.930410146713257, "lr": 0.00039522922927679924, "tps": 18909, "wall": 10983.1} {"step": 3169, "train_loss": 3.910971164703369, "lr": 0.0003952248467493882, "tps": 18906, "wall": 10988.1} {"step": 3170, "train_loss": 3.920980453491211, "lr": 0.00039522046223702063, "tps": 18904, "wall": 10993.1} {"step": 3171, "train_loss": 4.024012088775635, "lr": 0.0003952160757397461, "tps": 18901, "wall": 10998.0} {"step": 3172, "train_loss": 3.976016044616699, "lr": 0.00039521168725761445, "tps": 18898, "wall": 11003.0} {"step": 3173, "train_loss": 3.9281527996063232, "lr": 0.0003952072967906753, "tps": 18896, "wall": 11008.0} {"step": 3174, "train_loss": 4.046811103820801, "lr": 0.0003952029043389784, "tps": 18893, "wall": 11013.0} {"step": 3175, "train_loss": 3.910943031311035, "lr": 0.0003951985099025736, "tps": 18891, "wall": 11017.9} {"step": 3176, "train_loss": 3.993204355239868, "lr": 0.00039519411348151045, "tps": 18888, "wall": 11022.9} {"step": 3177, "train_loss": 4.006094455718994, "lr": 0.00039518971507583904, "tps": 18886, "wall": 11027.8} {"step": 3178, "train_loss": 3.926161289215088, "lr": 0.000395185314685609, "tps": 18883, "wall": 11032.8} {"step": 3179, "train_loss": 3.9836063385009766, "lr": 0.00039518091231087026, "tps": 18881, "wall": 11037.8} {"step": 3180, "train_loss": 3.967928886413574, "lr": 0.0003951765079516727, "tps": 18878, "wall": 11042.8} {"step": 3181, "train_loss": 3.9345850944519043, "lr": 0.0003951721016080661, "tps": 18875, "wall": 11047.7} {"step": 3182, "train_loss": 3.9645018577575684, "lr": 0.00039516769328010057, "tps": 18873, "wall": 11052.7} {"step": 3183, "train_loss": 3.9111409187316895, "lr": 0.0003951632829678258, "tps": 18870, "wall": 11057.6} {"step": 3184, "train_loss": 3.9852771759033203, "lr": 0.00039515887067129195, "tps": 18868, "wall": 11062.6} {"step": 3185, "train_loss": 3.987661600112915, "lr": 0.000395154456390549, "tps": 18865, "wall": 11067.5} {"step": 3186, "train_loss": 3.9775755405426025, "lr": 0.0003951500401256468, "tps": 18863, "wall": 11072.5} {"step": 3187, "train_loss": 3.8749842643737793, "lr": 0.0003951456218766355, "tps": 18860, "wall": 11077.4} {"step": 3188, "train_loss": 3.940080165863037, "lr": 0.00039514120164356513, "tps": 18858, "wall": 11082.4} {"step": 3189, "train_loss": 4.02153205871582, "lr": 0.0003951367794264857, "tps": 18855, "wall": 11087.3} {"step": 3190, "train_loss": 3.9587578773498535, "lr": 0.0003951323552254474, "tps": 18853, "wall": 11092.4} {"step": 3191, "train_loss": 3.9559154510498047, "lr": 0.00039512792904050035, "tps": 18850, "wall": 11097.3} {"step": 3192, "train_loss": 3.9888224601745605, "lr": 0.0003951235008716946, "tps": 18848, "wall": 11102.3} {"step": 3193, "train_loss": 3.993164539337158, "lr": 0.00039511907071908037, "tps": 18845, "wall": 11107.2} {"step": 3194, "train_loss": 3.9929513931274414, "lr": 0.0003951146385827078, "tps": 18843, "wall": 11112.2} {"step": 3195, "train_loss": 3.9157397747039795, "lr": 0.0003951102044626271, "tps": 18840, "wall": 11117.2} {"step": 3196, "train_loss": 3.9393908977508545, "lr": 0.0003951057683588886, "tps": 18838, "wall": 11122.1} {"step": 3197, "train_loss": 4.021627426147461, "lr": 0.0003951013302715425, "tps": 18835, "wall": 11127.1} {"step": 3198, "train_loss": 3.912374496459961, "lr": 0.000395096890200639, "tps": 18833, "wall": 11132.0} {"step": 3199, "train_loss": 4.019939422607422, "lr": 0.00039509244814622845, "tps": 18830, "wall": 11137.0} {"step": 3200, "train_loss": 3.900785446166992, "lr": 0.00039508800410836126, "tps": 18828, "wall": 11141.9} {"step": 3201, "train_loss": 3.986265182495117, "lr": 0.0003950835580870876, "tps": 18825, "wall": 11146.9} {"step": 3202, "train_loss": 4.020657539367676, "lr": 0.0003950791100824579, "tps": 18822, "wall": 11151.9} {"step": 3203, "train_loss": 3.989126443862915, "lr": 0.0003950746600945227, "tps": 18820, "wall": 11156.9} {"step": 3204, "train_loss": 3.9668595790863037, "lr": 0.0003950702081233322, "tps": 18817, "wall": 11161.8} {"step": 3205, "train_loss": 3.9730138778686523, "lr": 0.0003950657541689369, "tps": 18815, "wall": 11166.8} {"step": 3206, "train_loss": 3.963794231414795, "lr": 0.0003950612982313873, "tps": 18813, "wall": 11171.7} {"step": 3207, "train_loss": 3.9548795223236084, "lr": 0.0003950568403107338, "tps": 18810, "wall": 11176.7} {"step": 3208, "train_loss": 3.9153504371643066, "lr": 0.00039505238040702696, "tps": 18808, "wall": 11181.6} {"step": 3209, "train_loss": 3.9398179054260254, "lr": 0.00039504791852031725, "tps": 18805, "wall": 11186.6} {"step": 3210, "train_loss": 3.9472198486328125, "lr": 0.0003950434546506553, "tps": 18803, "wall": 11191.6} {"step": 3211, "train_loss": 3.8953857421875, "lr": 0.0003950389887980916, "tps": 18800, "wall": 11196.5} {"step": 3212, "train_loss": 3.974411964416504, "lr": 0.0003950345209626768, "tps": 18798, "wall": 11201.5} {"step": 3213, "train_loss": 4.0169172286987305, "lr": 0.0003950300511444615, "tps": 18795, "wall": 11206.5} {"step": 3214, "train_loss": 3.9013049602508545, "lr": 0.00039502557934349627, "tps": 18793, "wall": 11211.4} {"step": 3215, "train_loss": 3.956231117248535, "lr": 0.0003950211055598318, "tps": 18790, "wall": 11216.4} {"step": 3216, "train_loss": 3.999147415161133, "lr": 0.00039501662979351876, "tps": 18788, "wall": 11221.4} {"step": 3217, "train_loss": 3.9316368103027344, "lr": 0.0003950121520446079, "tps": 18785, "wall": 11226.3} {"step": 3218, "train_loss": 3.977355480194092, "lr": 0.0003950076723131499, "tps": 18783, "wall": 11231.3} {"step": 3219, "train_loss": 3.884315252304077, "lr": 0.0003950031905991955, "tps": 18780, "wall": 11236.2} {"step": 3220, "train_loss": 3.923893451690674, "lr": 0.0003949987069027955, "tps": 18778, "wall": 11241.2} {"step": 3221, "train_loss": 4.0179243087768555, "lr": 0.0003949942212240007, "tps": 18775, "wall": 11246.2} {"step": 3222, "train_loss": 3.894434928894043, "lr": 0.0003949897335628619, "tps": 18773, "wall": 11251.1} {"step": 3223, "train_loss": 3.781468629837036, "lr": 0.00039498524391943, "tps": 18771, "wall": 11256.0} {"step": 3224, "train_loss": 3.8840463161468506, "lr": 0.0003949807522937557, "tps": 18768, "wall": 11261.0} {"step": 3225, "train_loss": 3.915872097015381, "lr": 0.00039497625868589, "tps": 18766, "wall": 11265.9} {"step": 3226, "train_loss": 3.9901556968688965, "lr": 0.0003949717630958837, "tps": 18763, "wall": 11270.9} {"step": 3227, "train_loss": 3.890289068222046, "lr": 0.0003949672655237879, "tps": 18761, "wall": 11275.9} {"step": 3228, "train_loss": 4.116067886352539, "lr": 0.0003949627659696534, "tps": 18758, "wall": 11280.8} {"step": 3229, "train_loss": 3.909426212310791, "lr": 0.0003949582644335312, "tps": 18756, "wall": 11285.8} {"step": 3230, "train_loss": 3.9242160320281982, "lr": 0.0003949537609154724, "tps": 18754, "wall": 11290.7} {"step": 3231, "train_loss": 3.9024975299835205, "lr": 0.00039494925541552783, "tps": 18751, "wall": 11295.6} {"step": 3232, "train_loss": 3.8641438484191895, "lr": 0.0003949447479337487, "tps": 18749, "wall": 11300.6} {"step": 3233, "train_loss": 3.784482955932617, "lr": 0.000394940238470186, "tps": 18746, "wall": 11305.5} {"step": 3234, "train_loss": 3.994861125946045, "lr": 0.0003949357270248908, "tps": 18744, "wall": 11310.5} {"step": 3235, "train_loss": 3.974400281906128, "lr": 0.0003949312135979142, "tps": 18742, "wall": 11315.4} {"step": 3236, "train_loss": 3.9194798469543457, "lr": 0.0003949266981893074, "tps": 18739, "wall": 11320.4} {"step": 3237, "train_loss": 4.041353225708008, "lr": 0.0003949221807991214, "tps": 18737, "wall": 11325.4} {"step": 3238, "train_loss": 4.010782241821289, "lr": 0.00039491766142740764, "tps": 18734, "wall": 11330.3} {"step": 3239, "train_loss": 3.998141288757324, "lr": 0.00039491314007421703, "tps": 18732, "wall": 11335.3} {"step": 3240, "train_loss": 4.0198845863342285, "lr": 0.0003949086167396009, "tps": 18729, "wall": 11340.3} {"step": 3241, "train_loss": 3.9352500438690186, "lr": 0.00039490409142361056, "tps": 18727, "wall": 11345.2} {"step": 3242, "train_loss": 3.9630627632141113, "lr": 0.00039489956412629715, "tps": 18725, "wall": 11350.2} {"step": 3243, "train_loss": 4.042231559753418, "lr": 0.00039489503484771204, "tps": 18722, "wall": 11355.1} {"step": 3244, "train_loss": 3.994770050048828, "lr": 0.0003948905035879065, "tps": 18720, "wall": 11360.1} {"step": 3245, "train_loss": 3.9010729789733887, "lr": 0.00039488597034693186, "tps": 18717, "wall": 11365.0} {"step": 3246, "train_loss": 3.938406467437744, "lr": 0.00039488143512483956, "tps": 18715, "wall": 11370.0} {"step": 3247, "train_loss": 4.0002055168151855, "lr": 0.0003948768979216808, "tps": 18713, "wall": 11374.9} {"step": 3248, "train_loss": 3.9308319091796875, "lr": 0.00039487235873750714, "tps": 18710, "wall": 11379.9} {"step": 3249, "train_loss": 3.958110809326172, "lr": 0.00039486781757236997, "tps": 18708, "wall": 11384.8} {"step": 3250, "train_loss": 3.885176420211792, "lr": 0.0003948632744263206, "tps": 18706, "wall": 11389.8} {"step": 3251, "train_loss": 3.9920897483825684, "lr": 0.00039485872929941073, "tps": 18703, "wall": 11394.8} {"step": 3252, "train_loss": 3.7901902198791504, "lr": 0.0003948541821916917, "tps": 18701, "wall": 11399.8} {"step": 3253, "train_loss": 3.893737316131592, "lr": 0.00039484963310321494, "tps": 18698, "wall": 11404.7} {"step": 3254, "train_loss": 4.027071952819824, "lr": 0.0003948450820340321, "tps": 18696, "wall": 11409.7} {"step": 3255, "train_loss": 4.026960372924805, "lr": 0.0003948405289841947, "tps": 18694, "wall": 11414.6} {"step": 3256, "train_loss": 3.987332820892334, "lr": 0.00039483597395375435, "tps": 18691, "wall": 11419.5} {"step": 3257, "train_loss": 3.854670524597168, "lr": 0.00039483141694276265, "tps": 18689, "wall": 11424.5} {"step": 3258, "train_loss": 4.0110650062561035, "lr": 0.00039482685795127126, "tps": 18687, "wall": 11429.4} {"step": 3259, "train_loss": 3.940732002258301, "lr": 0.00039482229697933167, "tps": 18684, "wall": 11434.4} {"step": 3260, "train_loss": 3.820099115371704, "lr": 0.00039481773402699565, "tps": 18682, "wall": 11439.3} {"step": 3261, "train_loss": 3.913649320602417, "lr": 0.00039481316909431493, "tps": 18679, "wall": 11444.3} {"step": 3262, "train_loss": 3.9472320079803467, "lr": 0.0003948086021813411, "tps": 18677, "wall": 11449.2} {"step": 3263, "train_loss": 3.954867362976074, "lr": 0.000394804033288126, "tps": 18675, "wall": 11454.2} {"step": 3264, "train_loss": 4.03193998336792, "lr": 0.0003947994624147214, "tps": 18672, "wall": 11459.1} {"step": 3265, "train_loss": 3.948737859725952, "lr": 0.000394794889561179, "tps": 18670, "wall": 11464.1} {"step": 3266, "train_loss": 3.920217514038086, "lr": 0.0003947903147275506, "tps": 18668, "wall": 11469.0} {"step": 3267, "train_loss": 3.9364559650421143, "lr": 0.0003947857379138881, "tps": 18665, "wall": 11474.0} {"step": 3268, "train_loss": 3.991342067718506, "lr": 0.0003947811591202434, "tps": 18663, "wall": 11478.9} {"step": 3269, "train_loss": 3.9309844970703125, "lr": 0.0003947765783466681, "tps": 18661, "wall": 11483.9} {"step": 3270, "train_loss": 4.030022621154785, "lr": 0.0003947719955932143, "tps": 18658, "wall": 11488.8} {"step": 3271, "train_loss": 4.005052089691162, "lr": 0.00039476741085993393, "tps": 18656, "wall": 11493.8} {"step": 3272, "train_loss": 3.9153356552124023, "lr": 0.0003947628241468789, "tps": 18654, "wall": 11498.7} {"step": 3273, "train_loss": 3.9657788276672363, "lr": 0.0003947582354541011, "tps": 18651, "wall": 11503.7} {"step": 3274, "train_loss": 3.9729037284851074, "lr": 0.0003947536447816525, "tps": 18649, "wall": 11508.7} {"step": 3275, "train_loss": 3.8673596382141113, "lr": 0.0003947490521295852, "tps": 18646, "wall": 11513.7} {"step": 3276, "train_loss": 3.8577117919921875, "lr": 0.00039474445749795124, "tps": 18644, "wall": 11518.6} {"step": 3277, "train_loss": 3.9767110347747803, "lr": 0.00039473986088680256, "tps": 18642, "wall": 11523.6} {"step": 3278, "train_loss": 3.8571314811706543, "lr": 0.0003947352622961913, "tps": 18640, "wall": 11528.6} {"step": 3279, "train_loss": 3.986604928970337, "lr": 0.00039473066172616956, "tps": 18637, "wall": 11533.6} {"step": 3280, "train_loss": 3.9311585426330566, "lr": 0.0003947260591767894, "tps": 18635, "wall": 11538.5} {"step": 3281, "train_loss": 3.883021354675293, "lr": 0.00039472145464810297, "tps": 18632, "wall": 11543.5} {"step": 3282, "train_loss": 3.9730913639068604, "lr": 0.00039471684814016246, "tps": 18630, "wall": 11548.4} {"step": 3283, "train_loss": 3.9299890995025635, "lr": 0.00039471223965302006, "tps": 18628, "wall": 11553.4} {"step": 3284, "train_loss": 3.909862995147705, "lr": 0.00039470762918672795, "tps": 18626, "wall": 11558.3} {"step": 3285, "train_loss": 4.006918907165527, "lr": 0.00039470301674133834, "tps": 18623, "wall": 11563.3} {"step": 3286, "train_loss": 3.9347095489501953, "lr": 0.00039469840231690355, "tps": 18621, "wall": 11568.3} {"step": 3287, "train_loss": 3.907759189605713, "lr": 0.00039469378591347573, "tps": 18618, "wall": 11573.3} {"step": 3288, "train_loss": 3.9825258255004883, "lr": 0.0003946891675311074, "tps": 18616, "wall": 11578.2} {"step": 3289, "train_loss": 3.8899788856506348, "lr": 0.00039468454716985057, "tps": 18614, "wall": 11583.2} {"step": 3290, "train_loss": 3.8318586349487305, "lr": 0.0003946799248297578, "tps": 18612, "wall": 11588.1} {"step": 3291, "train_loss": 3.8732666969299316, "lr": 0.00039467530051088146, "tps": 18609, "wall": 11593.1} {"step": 3292, "train_loss": 3.9807848930358887, "lr": 0.0003946706742132738, "tps": 18607, "wall": 11598.0} {"step": 3293, "train_loss": 3.913428544998169, "lr": 0.00039466604593698724, "tps": 18605, "wall": 11603.0} {"step": 3294, "train_loss": 3.9402520656585693, "lr": 0.00039466141568207435, "tps": 18602, "wall": 11607.9} {"step": 3295, "train_loss": 3.968733787536621, "lr": 0.0003946567834485875, "tps": 18600, "wall": 11612.9} {"step": 3296, "train_loss": 3.9071993827819824, "lr": 0.0003946521492365791, "tps": 18598, "wall": 11617.9} {"step": 3297, "train_loss": 3.944566011428833, "lr": 0.00039464751304610173, "tps": 18595, "wall": 11622.8} {"step": 3298, "train_loss": 3.957629919052124, "lr": 0.0003946428748772079, "tps": 18593, "wall": 11627.8} {"step": 3299, "train_loss": 3.9498679637908936, "lr": 0.0003946382347299501, "tps": 18591, "wall": 11632.8} {"step": 3300, "train_loss": 3.976688861846924, "lr": 0.00039463359260438096, "tps": 18588, "wall": 11637.8} {"step": 3301, "train_loss": 3.90008282661438, "lr": 0.000394628948500553, "tps": 18586, "wall": 11642.7} {"step": 3302, "train_loss": 3.8776726722717285, "lr": 0.00039462430241851893, "tps": 18584, "wall": 11647.7} {"step": 3303, "train_loss": 3.9680709838867188, "lr": 0.0003946196543583312, "tps": 18582, "wall": 11652.6} {"step": 3304, "train_loss": 3.891880750656128, "lr": 0.0003946150043200427, "tps": 18579, "wall": 11657.6} {"step": 3305, "train_loss": 3.994314432144165, "lr": 0.0003946103523037059, "tps": 18577, "wall": 11662.5} {"step": 3306, "train_loss": 3.971836566925049, "lr": 0.0003946056983093736, "tps": 18575, "wall": 11667.5} {"step": 3307, "train_loss": 3.9530534744262695, "lr": 0.0003946010423370986, "tps": 18573, "wall": 11672.5} {"step": 3308, "train_loss": 3.891927480697632, "lr": 0.00039459638438693346, "tps": 18570, "wall": 11677.4} {"step": 3309, "train_loss": 4.039183139801025, "lr": 0.000394591724458931, "tps": 18568, "wall": 11682.4} {"step": 3310, "train_loss": 3.921482563018799, "lr": 0.0003945870625531441, "tps": 18566, "wall": 11687.4} {"step": 3311, "train_loss": 3.9178786277770996, "lr": 0.0003945823986696255, "tps": 18563, "wall": 11692.4} {"step": 3312, "train_loss": 3.887180805206299, "lr": 0.000394577732808428, "tps": 18561, "wall": 11697.3} {"step": 3313, "train_loss": 3.916654109954834, "lr": 0.0003945730649696045, "tps": 18559, "wall": 11702.3} {"step": 3314, "train_loss": 3.9501476287841797, "lr": 0.00039456839515320793, "tps": 18557, "wall": 11707.2} {"step": 3315, "train_loss": 3.9905970096588135, "lr": 0.00039456372335929115, "tps": 18554, "wall": 11712.2} {"step": 3316, "train_loss": 3.99886155128479, "lr": 0.000394559049587907, "tps": 18552, "wall": 11717.2} {"step": 3317, "train_loss": 3.891507387161255, "lr": 0.00039455437383910857, "tps": 18550, "wall": 11722.1} {"step": 3318, "train_loss": 3.9888525009155273, "lr": 0.00039454969611294865, "tps": 18548, "wall": 11727.1} {"step": 3319, "train_loss": 3.9811925888061523, "lr": 0.00039454501640948043, "tps": 18545, "wall": 11732.0} {"step": 3320, "train_loss": 3.84867525100708, "lr": 0.00039454033472875673, "tps": 18543, "wall": 11737.0} {"step": 3321, "train_loss": 3.9126458168029785, "lr": 0.00039453565107083077, "tps": 18541, "wall": 11742.0} {"step": 3322, "train_loss": 3.9876108169555664, "lr": 0.0003945309654357554, "tps": 18538, "wall": 11746.9} {"step": 3323, "train_loss": 3.925839424133301, "lr": 0.00039452627782358393, "tps": 18536, "wall": 11751.9} {"step": 3324, "train_loss": 3.99440598487854, "lr": 0.00039452158823436925, "tps": 18534, "wall": 11756.9} {"step": 3325, "train_loss": 3.9147729873657227, "lr": 0.00039451689666816466, "tps": 18532, "wall": 11761.9} {"step": 3326, "train_loss": 3.994046688079834, "lr": 0.00039451220312502317, "tps": 18529, "wall": 11766.9} {"step": 3327, "train_loss": 3.874114990234375, "lr": 0.000394507507604998, "tps": 18527, "wall": 11771.8} {"step": 3328, "train_loss": 3.9527978897094727, "lr": 0.0003945028101081424, "tps": 18525, "wall": 11776.8} {"step": 3329, "train_loss": 3.9914824962615967, "lr": 0.00039449811063450944, "tps": 18523, "wall": 11781.7} {"step": 3330, "train_loss": 3.8894505500793457, "lr": 0.0003944934091841525, "tps": 18520, "wall": 11786.7} {"step": 3331, "train_loss": 3.927173137664795, "lr": 0.00039448870575712475, "tps": 18518, "wall": 11791.7} {"step": 3332, "train_loss": 3.9281396865844727, "lr": 0.0003944840003534795, "tps": 18516, "wall": 11796.6} {"step": 3333, "train_loss": 3.918119192123413, "lr": 0.00039447929297327004, "tps": 18514, "wall": 11801.6} {"step": 3334, "train_loss": 3.8892273902893066, "lr": 0.00039447458361654975, "tps": 18511, "wall": 11806.5} {"step": 3335, "train_loss": 3.8346457481384277, "lr": 0.00039446987228337194, "tps": 18509, "wall": 11811.5} {"step": 3336, "train_loss": 3.90399169921875, "lr": 0.00039446515897379, "tps": 18507, "wall": 11816.5} {"step": 3337, "train_loss": 3.936154842376709, "lr": 0.00039446044368785725, "tps": 18505, "wall": 11821.5} {"step": 3338, "train_loss": 3.91586971282959, "lr": 0.00039445572642562716, "tps": 18502, "wall": 11826.5} {"step": 3339, "train_loss": 3.982104778289795, "lr": 0.00039445100718715314, "tps": 18500, "wall": 11831.5} {"step": 3340, "train_loss": 3.9631192684173584, "lr": 0.0003944462859724887, "tps": 18498, "wall": 11836.5} {"step": 3341, "train_loss": 3.834460735321045, "lr": 0.00039444156278168734, "tps": 18496, "wall": 11841.4} {"step": 3342, "train_loss": 3.9013936519622803, "lr": 0.00039443683761480246, "tps": 18493, "wall": 11846.4} {"step": 3343, "train_loss": 3.9173145294189453, "lr": 0.0003944321104718877, "tps": 18491, "wall": 11851.4} {"step": 3344, "train_loss": 4.005398750305176, "lr": 0.0003944273813529965, "tps": 18489, "wall": 11856.3} {"step": 3345, "train_loss": 3.9857285022735596, "lr": 0.00039442265025818254, "tps": 18487, "wall": 11861.3} {"step": 3346, "train_loss": 3.971616268157959, "lr": 0.0003944179171874994, "tps": 18485, "wall": 11866.3} {"step": 3347, "train_loss": 3.852404832839966, "lr": 0.00039441318214100056, "tps": 18482, "wall": 11871.3} {"step": 3348, "train_loss": 3.954866647720337, "lr": 0.0003944084451187398, "tps": 18480, "wall": 11876.3} {"step": 3349, "train_loss": 3.941495418548584, "lr": 0.00039440370612077067, "tps": 18478, "wall": 11881.3} {"step": 3350, "train_loss": 3.962068796157837, "lr": 0.000394398965147147, "tps": 18475, "wall": 11886.3} {"step": 3351, "train_loss": 3.891205310821533, "lr": 0.0003943942221979224, "tps": 18473, "wall": 11891.3} {"step": 3352, "train_loss": 3.9517316818237305, "lr": 0.0003943894772731506, "tps": 18471, "wall": 11896.3} {"step": 3353, "train_loss": 3.8470470905303955, "lr": 0.0003943847303728854, "tps": 18469, "wall": 11901.3} {"step": 3354, "train_loss": 3.9442222118377686, "lr": 0.0003943799814971805, "tps": 18467, "wall": 11906.2} {"step": 3355, "train_loss": 3.948988914489746, "lr": 0.00039437523064608977, "tps": 18464, "wall": 11911.2} {"step": 3356, "train_loss": 3.920452117919922, "lr": 0.00039437047781966703, "tps": 18462, "wall": 11916.2} {"step": 3357, "train_loss": 3.852357864379883, "lr": 0.000394365723017966, "tps": 18460, "wall": 11921.1} {"step": 3358, "train_loss": 3.954138994216919, "lr": 0.00039436096624104064, "tps": 18458, "wall": 11926.1} {"step": 3359, "train_loss": 3.8641648292541504, "lr": 0.00039435620748894487, "tps": 18456, "wall": 11931.1} {"step": 3360, "train_loss": 4.072003364562988, "lr": 0.0003943514467617325, "tps": 18453, "wall": 11936.1} {"step": 3361, "train_loss": 3.825976848602295, "lr": 0.0003943466840594575, "tps": 18451, "wall": 11941.0} {"step": 3362, "train_loss": 3.879998207092285, "lr": 0.0003943419193821739, "tps": 18449, "wall": 11946.0} {"step": 3363, "train_loss": 3.842845916748047, "lr": 0.0003943371527299356, "tps": 18447, "wall": 11951.0} {"step": 3364, "train_loss": 3.946526288986206, "lr": 0.00039433238410279656, "tps": 18445, "wall": 11956.0} {"step": 3365, "train_loss": 3.9351916313171387, "lr": 0.0003943276135008108, "tps": 18442, "wall": 11961.0} {"step": 3366, "train_loss": 3.900035858154297, "lr": 0.0003943228409240325, "tps": 18440, "wall": 11965.9} {"step": 3367, "train_loss": 4.031930446624756, "lr": 0.0003943180663725156, "tps": 18438, "wall": 11970.9} {"step": 3368, "train_loss": 3.9453110694885254, "lr": 0.0003943132898463142, "tps": 18436, "wall": 11975.9} {"step": 3369, "train_loss": 3.852410078048706, "lr": 0.00039430851134548246, "tps": 18434, "wall": 11980.8} {"step": 3370, "train_loss": 3.8669261932373047, "lr": 0.00039430373087007435, "tps": 18431, "wall": 11985.8} {"step": 3371, "train_loss": 4.004523754119873, "lr": 0.00039429894842014424, "tps": 18429, "wall": 11990.8} {"step": 3372, "train_loss": 3.9814841747283936, "lr": 0.00039429416399574624, "tps": 18427, "wall": 11995.8} {"step": 3373, "train_loss": 4.039546012878418, "lr": 0.0003942893775969345, "tps": 18425, "wall": 12000.7} {"step": 3374, "train_loss": 3.8668227195739746, "lr": 0.0003942845892237632, "tps": 18423, "wall": 12005.7} {"step": 3375, "train_loss": 3.9843618869781494, "lr": 0.00039427979887628667, "tps": 18421, "wall": 12010.6} {"step": 3376, "train_loss": 3.8394105434417725, "lr": 0.0003942750065545592, "tps": 18418, "wall": 12015.6} {"step": 3377, "train_loss": 3.972459077835083, "lr": 0.000394270212258635, "tps": 18416, "wall": 12020.6} {"step": 3378, "train_loss": 3.9464802742004395, "lr": 0.0003942654159885684, "tps": 18414, "wall": 12025.6} {"step": 3379, "train_loss": 3.882577896118164, "lr": 0.0003942606177444138, "tps": 18412, "wall": 12030.5} {"step": 3380, "train_loss": 3.9550108909606934, "lr": 0.00039425581752622536, "tps": 18410, "wall": 12035.5} {"step": 3381, "train_loss": 4.000140190124512, "lr": 0.00039425101533405773, "tps": 18408, "wall": 12040.4} {"step": 3382, "train_loss": 4.014590740203857, "lr": 0.0003942462111679651, "tps": 18406, "wall": 12045.4} {"step": 3383, "train_loss": 3.9297263622283936, "lr": 0.00039424140502800195, "tps": 18403, "wall": 12050.4} {"step": 3384, "train_loss": 3.9735333919525146, "lr": 0.00039423659691422276, "tps": 18401, "wall": 12055.4} {"step": 3385, "train_loss": 4.004814147949219, "lr": 0.00039423178682668203, "tps": 18399, "wall": 12060.4} {"step": 3386, "train_loss": 3.972513437271118, "lr": 0.00039422697476543413, "tps": 18397, "wall": 12065.3} {"step": 3387, "train_loss": 3.894303321838379, "lr": 0.0003942221607305336, "tps": 18395, "wall": 12070.3} {"step": 3388, "train_loss": 3.910829544067383, "lr": 0.00039421734472203513, "tps": 18392, "wall": 12075.4} {"step": 3389, "train_loss": 3.857534885406494, "lr": 0.00039421252673999305, "tps": 18390, "wall": 12080.3} {"step": 3390, "train_loss": 3.938863515853882, "lr": 0.000394207706784462, "tps": 18388, "wall": 12085.3} {"step": 3391, "train_loss": 3.971585273742676, "lr": 0.0003942028848554967, "tps": 18386, "wall": 12090.3} {"step": 3392, "train_loss": 4.085994243621826, "lr": 0.0003941980609531517, "tps": 18384, "wall": 12095.2} {"step": 3393, "train_loss": 3.9255523681640625, "lr": 0.00039419323507748166, "tps": 18382, "wall": 12100.2} {"step": 3394, "train_loss": 3.8154749870300293, "lr": 0.0003941884072285412, "tps": 18380, "wall": 12105.1} {"step": 3395, "train_loss": 4.019410133361816, "lr": 0.00039418357740638506, "tps": 18378, "wall": 12110.1} {"step": 3396, "train_loss": 3.8822364807128906, "lr": 0.0003941787456110679, "tps": 18375, "wall": 12115.1} {"step": 3397, "train_loss": 3.9248743057250977, "lr": 0.0003941739118426445, "tps": 18373, "wall": 12120.1} {"step": 3398, "train_loss": 3.88403058052063, "lr": 0.0003941690761011696, "tps": 18371, "wall": 12125.1} {"step": 3399, "train_loss": 3.815786838531494, "lr": 0.000394164238386698, "tps": 18369, "wall": 12130.1} {"step": 3400, "train_loss": 3.8658664226531982, "lr": 0.00039415939869928446, "tps": 18367, "wall": 12135.1} {"step": 3401, "train_loss": 4.030089378356934, "lr": 0.0003941545570389838, "tps": 18365, "wall": 12140.0} {"step": 3402, "train_loss": 3.9496755599975586, "lr": 0.00039414971340585105, "tps": 18363, "wall": 12145.0} {"step": 3403, "train_loss": 3.9526772499084473, "lr": 0.0003941448677999407, "tps": 18360, "wall": 12150.0} {"step": 3404, "train_loss": 3.9203433990478516, "lr": 0.000394140020221308, "tps": 18358, "wall": 12155.0} {"step": 3405, "train_loss": 4.030834674835205, "lr": 0.00039413517067000774, "tps": 18356, "wall": 12159.9} {"step": 3406, "train_loss": 3.851555824279785, "lr": 0.00039413031914609483, "tps": 18354, "wall": 12164.9} {"step": 3407, "train_loss": 3.944523572921753, "lr": 0.00039412546564962416, "tps": 18352, "wall": 12169.9} {"step": 3408, "train_loss": 3.9876623153686523, "lr": 0.0003941206101806509, "tps": 18350, "wall": 12174.9} {"step": 3409, "train_loss": 3.9545609951019287, "lr": 0.00039411575273922995, "tps": 18348, "wall": 12179.9} {"step": 3410, "train_loss": 3.900137424468994, "lr": 0.0003941108933254163, "tps": 18345, "wall": 12184.9} {"step": 3411, "train_loss": 3.936997890472412, "lr": 0.000394106031939265, "tps": 18343, "wall": 12189.8} {"step": 3412, "train_loss": 3.8264999389648438, "lr": 0.0003941011685808312, "tps": 18341, "wall": 12194.8} {"step": 3413, "train_loss": 3.7939202785491943, "lr": 0.0003940963032501699, "tps": 18339, "wall": 12199.8} {"step": 3414, "train_loss": 3.888894557952881, "lr": 0.0003940914359473363, "tps": 18337, "wall": 12204.8} {"step": 3415, "train_loss": 4.0494232177734375, "lr": 0.0003940865666723855, "tps": 18335, "wall": 12209.7} {"step": 3416, "train_loss": 3.976874351501465, "lr": 0.00039408169542537257, "tps": 18333, "wall": 12214.7} {"step": 3417, "train_loss": 3.9286117553710938, "lr": 0.0003940768222063529, "tps": 18331, "wall": 12219.7} {"step": 3418, "train_loss": 3.9547178745269775, "lr": 0.0003940719470153815, "tps": 18329, "wall": 12224.7} {"step": 3419, "train_loss": 3.8383803367614746, "lr": 0.00039406706985251365, "tps": 18327, "wall": 12229.6} {"step": 3420, "train_loss": 3.8727939128875732, "lr": 0.00039406219071780465, "tps": 18324, "wall": 12234.6} {"step": 3421, "train_loss": 3.8769848346710205, "lr": 0.00039405730961130975, "tps": 18322, "wall": 12239.6} {"step": 3422, "train_loss": 3.9901223182678223, "lr": 0.0003940524265330842, "tps": 18320, "wall": 12244.6} {"step": 3423, "train_loss": 4.071376323699951, "lr": 0.0003940475414831834, "tps": 18318, "wall": 12249.5} {"step": 3424, "train_loss": 3.9815664291381836, "lr": 0.00039404265446166254, "tps": 18316, "wall": 12254.5} {"step": 3425, "train_loss": 3.8831026554107666, "lr": 0.0003940377654685771, "tps": 18314, "wall": 12259.5} {"step": 3426, "train_loss": 3.8783023357391357, "lr": 0.00039403287450398246, "tps": 18312, "wall": 12264.4} {"step": 3427, "train_loss": 4.015000343322754, "lr": 0.000394027981567934, "tps": 18310, "wall": 12269.4} {"step": 3428, "train_loss": 3.958016872406006, "lr": 0.0003940230866604872, "tps": 18308, "wall": 12274.3} {"step": 3429, "train_loss": 3.8959078788757324, "lr": 0.0003940181897816974, "tps": 18306, "wall": 12279.3} {"step": 3430, "train_loss": 3.8589138984680176, "lr": 0.00039401329093162013, "tps": 18304, "wall": 12284.2} {"step": 3431, "train_loss": 3.933926582336426, "lr": 0.0003940083901103109, "tps": 18302, "wall": 12289.2} {"step": 3432, "train_loss": 3.884456157684326, "lr": 0.00039400348731782523, "tps": 18300, "wall": 12294.2} {"step": 3433, "train_loss": 3.9475622177124023, "lr": 0.00039399858255421863, "tps": 18298, "wall": 12299.2} {"step": 3434, "train_loss": 3.893756866455078, "lr": 0.0003939936758195466, "tps": 18295, "wall": 12304.1} {"step": 3435, "train_loss": 3.949824333190918, "lr": 0.00039398876711386495, "tps": 18293, "wall": 12309.1} {"step": 3436, "train_loss": 3.8317384719848633, "lr": 0.00039398385643722906, "tps": 18291, "wall": 12314.1} {"step": 3437, "train_loss": 3.952864170074463, "lr": 0.00039397894378969463, "tps": 18289, "wall": 12319.0} {"step": 3438, "train_loss": 3.977766513824463, "lr": 0.0003939740291713173, "tps": 18287, "wall": 12324.0} {"step": 3439, "train_loss": 3.953728675842285, "lr": 0.0003939691125821527, "tps": 18285, "wall": 12328.9} {"step": 3440, "train_loss": 3.862856864929199, "lr": 0.0003939641940222567, "tps": 18283, "wall": 12333.9} {"step": 3441, "train_loss": 3.950526714324951, "lr": 0.0003939592734916848, "tps": 18281, "wall": 12338.9} {"step": 3442, "train_loss": 3.9088950157165527, "lr": 0.00039395435099049287, "tps": 18279, "wall": 12343.8} {"step": 3443, "train_loss": 3.9470343589782715, "lr": 0.00039394942651873666, "tps": 18277, "wall": 12348.8} {"step": 3444, "train_loss": 4.008951663970947, "lr": 0.00039394450007647195, "tps": 18275, "wall": 12353.8} {"step": 3445, "train_loss": 3.8644607067108154, "lr": 0.0003939395716637545, "tps": 18273, "wall": 12358.8} {"step": 3446, "train_loss": 3.9436416625976562, "lr": 0.0003939346412806402, "tps": 18271, "wall": 12363.8} {"step": 3447, "train_loss": 3.9478402137756348, "lr": 0.00039392970892718486, "tps": 18269, "wall": 12368.7} {"step": 3448, "train_loss": 3.9403181076049805, "lr": 0.00039392477460344435, "tps": 18267, "wall": 12373.7} {"step": 3449, "train_loss": 4.00478458404541, "lr": 0.00039391983830947463, "tps": 18265, "wall": 12378.6} {"step": 3450, "train_loss": 3.8335323333740234, "lr": 0.00039391490004533154, "tps": 18263, "wall": 12383.6} {"step": 3451, "train_loss": 3.9534201622009277, "lr": 0.000393909959811071, "tps": 18261, "wall": 12388.6} {"step": 3452, "train_loss": 3.8810007572174072, "lr": 0.0003939050176067491, "tps": 18259, "wall": 12393.5} {"step": 3453, "train_loss": 3.8981258869171143, "lr": 0.00039390007343242174, "tps": 18257, "wall": 12398.5} {"step": 3454, "train_loss": 3.950517177581787, "lr": 0.000393895127288145, "tps": 18255, "wall": 12403.4} {"step": 3455, "train_loss": 3.8715243339538574, "lr": 0.00039389017917397474, "tps": 18253, "wall": 12408.4} {"step": 3456, "train_loss": 3.918522357940674, "lr": 0.00039388522908996717, "tps": 18251, "wall": 12413.4} {"step": 3457, "train_loss": 3.8870999813079834, "lr": 0.00039388027703617833, "tps": 18249, "wall": 12418.4} {"step": 3458, "train_loss": 3.9879748821258545, "lr": 0.0003938753230126643, "tps": 18247, "wall": 12423.3} {"step": 3459, "train_loss": 4.004575252532959, "lr": 0.0003938703670194812, "tps": 18245, "wall": 12428.3} {"step": 3460, "train_loss": 3.8586487770080566, "lr": 0.00039386540905668514, "tps": 18242, "wall": 12433.3} {"step": 3461, "train_loss": 3.91215443611145, "lr": 0.0003938604491243324, "tps": 18240, "wall": 12438.3} {"step": 3462, "train_loss": 3.898672103881836, "lr": 0.000393855487222479, "tps": 18238, "wall": 12443.2} {"step": 3463, "train_loss": 3.8257150650024414, "lr": 0.0003938505233511813, "tps": 18236, "wall": 12448.2} {"step": 3464, "train_loss": 3.9820265769958496, "lr": 0.00039384555751049543, "tps": 18234, "wall": 12453.2} {"step": 3465, "train_loss": 3.9750313758850098, "lr": 0.0003938405897004777, "tps": 18232, "wall": 12458.1} {"step": 3466, "train_loss": 3.891533374786377, "lr": 0.00039383561992118436, "tps": 18230, "wall": 12463.1} {"step": 3467, "train_loss": 3.894580841064453, "lr": 0.0003938306481726717, "tps": 18228, "wall": 12468.0} {"step": 3468, "train_loss": 3.9340929985046387, "lr": 0.0003938256744549961, "tps": 18226, "wall": 12473.1} {"step": 3469, "train_loss": 3.988996982574463, "lr": 0.0003938206987682138, "tps": 18224, "wall": 12478.1} {"step": 3470, "train_loss": 4.021566390991211, "lr": 0.0003938157211123812, "tps": 18222, "wall": 12483.0} {"step": 3471, "train_loss": 3.9880542755126953, "lr": 0.0003938107414875548, "tps": 18220, "wall": 12488.0} {"step": 3472, "train_loss": 4.044501304626465, "lr": 0.0003938057598937908, "tps": 18218, "wall": 12493.0} {"step": 3473, "train_loss": 3.895899534225464, "lr": 0.00039380077633114583, "tps": 18216, "wall": 12498.0} {"step": 3474, "train_loss": 3.9474830627441406, "lr": 0.0003937957907996763, "tps": 18214, "wall": 12503.0} {"step": 3475, "train_loss": 3.9369583129882812, "lr": 0.00039379080329943856, "tps": 18212, "wall": 12507.9} {"step": 3476, "train_loss": 3.919475555419922, "lr": 0.00039378581383048923, "tps": 18210, "wall": 12513.0} {"step": 3477, "train_loss": 3.961392879486084, "lr": 0.0003937808223928848, "tps": 18208, "wall": 12517.9} {"step": 3478, "train_loss": 3.9775846004486084, "lr": 0.00039377582898668183, "tps": 18206, "wall": 12522.9} {"step": 3479, "train_loss": 3.9340896606445312, "lr": 0.00039377083361193685, "tps": 18204, "wall": 12527.9} {"step": 3480, "train_loss": 3.863128662109375, "lr": 0.00039376583626870643, "tps": 18202, "wall": 12532.9} {"step": 3481, "train_loss": 3.969942569732666, "lr": 0.00039376083695704734, "tps": 18200, "wall": 12537.9} {"step": 3482, "train_loss": 3.9389920234680176, "lr": 0.000393755835677016, "tps": 18198, "wall": 12542.8} {"step": 3483, "train_loss": 3.88004732131958, "lr": 0.00039375083242866913, "tps": 18196, "wall": 12547.8} {"step": 3484, "train_loss": 3.789172410964966, "lr": 0.0003937458272120635, "tps": 18194, "wall": 12552.8} {"step": 3485, "train_loss": 3.9497976303100586, "lr": 0.00039374082002725563, "tps": 18192, "wall": 12557.8} {"step": 3486, "train_loss": 3.963064432144165, "lr": 0.0003937358108743024, "tps": 18190, "wall": 12562.7} {"step": 3487, "train_loss": 3.897739887237549, "lr": 0.0003937307997532606, "tps": 18188, "wall": 12567.7} {"step": 3488, "train_loss": 4.000636100769043, "lr": 0.00039372578666418685, "tps": 18186, "wall": 12572.7} {"step": 3489, "train_loss": 3.8383734226226807, "lr": 0.0003937207716071379, "tps": 18184, "wall": 12577.7} {"step": 3490, "train_loss": 3.790865182876587, "lr": 0.0003937157545821708, "tps": 18182, "wall": 12582.6} {"step": 3491, "train_loss": 3.9026472568511963, "lr": 0.00039371073558934207, "tps": 18180, "wall": 12587.6} {"step": 3492, "train_loss": 3.8684234619140625, "lr": 0.00039370571462870886, "tps": 18178, "wall": 12592.6} {"step": 3493, "train_loss": 3.906688690185547, "lr": 0.0003937006917003279, "tps": 18176, "wall": 12597.5} {"step": 3494, "train_loss": 3.9323489665985107, "lr": 0.000393695666804256, "tps": 18174, "wall": 12602.5} {"step": 3495, "train_loss": 3.873373508453369, "lr": 0.0003936906399405503, "tps": 18172, "wall": 12607.5} {"step": 3496, "train_loss": 3.854400157928467, "lr": 0.0003936856111092676, "tps": 18170, "wall": 12612.4} {"step": 3497, "train_loss": 3.868227958679199, "lr": 0.00039368058031046487, "tps": 18168, "wall": 12617.4} {"step": 3498, "train_loss": 3.9472405910491943, "lr": 0.0003936755475441992, "tps": 18166, "wall": 12622.4} {"step": 3499, "train_loss": 3.8927314281463623, "lr": 0.00039367051281052754, "tps": 18165, "wall": 12627.3} {"step": 3500, "train_loss": 3.919501304626465, "lr": 0.0003936654761095069, "tps": 18163, "wall": 12632.3} {"step": 3501, "train_loss": 3.8540830612182617, "lr": 0.0003936604374411943, "tps": 18160, "wall": 12637.4} {"step": 3502, "train_loss": 3.9512171745300293, "lr": 0.00039365539680564685, "tps": 18158, "wall": 12642.4} {"step": 3503, "train_loss": 3.931540012359619, "lr": 0.0003936503542029217, "tps": 18157, "wall": 12647.3} {"step": 3504, "train_loss": 3.9309396743774414, "lr": 0.000393645309633076, "tps": 18155, "wall": 12652.4} {"step": 3505, "train_loss": 3.945216655731201, "lr": 0.00039364026309616677, "tps": 18153, "wall": 12657.3} {"step": 3506, "train_loss": 3.957934856414795, "lr": 0.00039363521459225123, "tps": 18151, "wall": 12662.3} {"step": 3507, "train_loss": 3.9335343837738037, "lr": 0.00039363016412138663, "tps": 18149, "wall": 12667.3} {"step": 3508, "train_loss": 3.816037654876709, "lr": 0.00039362511168363016, "tps": 18147, "wall": 12672.2} {"step": 3509, "train_loss": 4.018100261688232, "lr": 0.00039362005727903906, "tps": 18145, "wall": 12677.2} {"step": 3510, "train_loss": 3.9278483390808105, "lr": 0.00039361500090767047, "tps": 18143, "wall": 12682.2} {"step": 3511, "train_loss": 3.89727783203125, "lr": 0.0003936099425695818, "tps": 18141, "wall": 12687.1} {"step": 3512, "train_loss": 3.9838762283325195, "lr": 0.00039360488226483024, "tps": 18139, "wall": 12692.1} {"step": 3513, "train_loss": 3.891185998916626, "lr": 0.00039359981999347325, "tps": 18137, "wall": 12697.1} {"step": 3514, "train_loss": 3.813157320022583, "lr": 0.00039359475575556814, "tps": 18135, "wall": 12702.0} {"step": 3515, "train_loss": 3.9219601154327393, "lr": 0.0003935896895511722, "tps": 18133, "wall": 12707.0} {"step": 3516, "train_loss": 3.922632932662964, "lr": 0.00039358462138034284, "tps": 18131, "wall": 12712.0} {"step": 3517, "train_loss": 3.8812785148620605, "lr": 0.00039357955124313753, "tps": 18129, "wall": 12717.0} {"step": 3518, "train_loss": 3.8807930946350098, "lr": 0.00039357447913961367, "tps": 18127, "wall": 12721.9} {"step": 3519, "train_loss": 3.9833884239196777, "lr": 0.0003935694050698287, "tps": 18125, "wall": 12726.9} {"step": 3520, "train_loss": 3.862877368927002, "lr": 0.00039356432903384016, "tps": 18124, "wall": 12731.9} {"step": 3521, "train_loss": 3.8973541259765625, "lr": 0.00039355925103170555, "tps": 18122, "wall": 12736.8} {"step": 3522, "train_loss": 3.922394275665283, "lr": 0.00039355417106348223, "tps": 18120, "wall": 12741.8} {"step": 3523, "train_loss": 3.9537057876586914, "lr": 0.00039354908912922796, "tps": 18118, "wall": 12746.8} {"step": 3524, "train_loss": 3.953510284423828, "lr": 0.0003935440052290002, "tps": 18116, "wall": 12751.7} {"step": 3525, "train_loss": 3.9321706295013428, "lr": 0.00039353891936285654, "tps": 18114, "wall": 12756.7} {"step": 3526, "train_loss": 3.9111475944519043, "lr": 0.0003935338315308547, "tps": 18112, "wall": 12761.7} {"step": 3527, "train_loss": 3.943307399749756, "lr": 0.0003935287417330521, "tps": 18110, "wall": 12766.6} {"step": 3528, "train_loss": 3.9833309650421143, "lr": 0.0003935236499695066, "tps": 18108, "wall": 12771.6} {"step": 3529, "train_loss": 3.8395652770996094, "lr": 0.0003935185562402758, "tps": 18106, "wall": 12776.6} {"step": 3530, "train_loss": 3.9431679248809814, "lr": 0.00039351346054541735, "tps": 18104, "wall": 12781.6} {"step": 3531, "train_loss": 3.943880081176758, "lr": 0.00039350836288498913, "tps": 18102, "wall": 12786.5} {"step": 3532, "train_loss": 3.9074649810791016, "lr": 0.00039350326325904875, "tps": 18100, "wall": 12791.5} {"step": 3533, "train_loss": 3.8083338737487793, "lr": 0.00039349816166765403, "tps": 18098, "wall": 12796.5} {"step": 3534, "train_loss": 3.90946888923645, "lr": 0.00039349305811086266, "tps": 18097, "wall": 12801.5} {"step": 3535, "train_loss": 3.887702703475952, "lr": 0.00039348795258873265, "tps": 18095, "wall": 12806.5} {"step": 3536, "train_loss": 3.931753158569336, "lr": 0.0003934828451013216, "tps": 18093, "wall": 12811.5} {"step": 3537, "train_loss": 3.971306324005127, "lr": 0.0003934777356486877, "tps": 18091, "wall": 12816.4} {"step": 3538, "train_loss": 3.951880931854248, "lr": 0.0003934726242308884, "tps": 18089, "wall": 12821.4} {"step": 3539, "train_loss": 3.865356922149658, "lr": 0.00039346751084798196, "tps": 18087, "wall": 12826.4} {"step": 3540, "train_loss": 3.910834312438965, "lr": 0.0003934623955000262, "tps": 18085, "wall": 12831.3} {"step": 3541, "train_loss": 3.7915143966674805, "lr": 0.000393457278187079, "tps": 18083, "wall": 12836.4} {"step": 3542, "train_loss": 3.8967456817626953, "lr": 0.0003934521589091983, "tps": 18081, "wall": 12841.3} {"step": 3543, "train_loss": 4.001552581787109, "lr": 0.00039344703766644223, "tps": 18079, "wall": 12846.3} {"step": 3544, "train_loss": 3.9922475814819336, "lr": 0.0003934419144588687, "tps": 18077, "wall": 12851.3} {"step": 3545, "train_loss": 4.024895668029785, "lr": 0.0003934367892865358, "tps": 18075, "wall": 12856.4} {"step": 3546, "train_loss": 3.8370144367218018, "lr": 0.0003934316621495016, "tps": 18074, "wall": 12861.3} {"step": 3547, "train_loss": 3.977684259414673, "lr": 0.00039342653304782414, "tps": 18072, "wall": 12866.3} {"step": 3548, "train_loss": 3.837697982788086, "lr": 0.0003934214019815615, "tps": 18070, "wall": 12871.2} {"step": 3549, "train_loss": 3.9794466495513916, "lr": 0.0003934162689507718, "tps": 18068, "wall": 12876.2} {"step": 3550, "train_loss": 3.9187731742858887, "lr": 0.00039341113395551327, "tps": 18066, "wall": 12881.1} {"step": 3551, "train_loss": 3.8152763843536377, "lr": 0.00039340599699584406, "tps": 18064, "wall": 12886.1} {"step": 3552, "train_loss": 3.9702248573303223, "lr": 0.0003934008580718223, "tps": 18062, "wall": 12891.1} {"step": 3553, "train_loss": 3.883991003036499, "lr": 0.00039339571718350626, "tps": 18060, "wall": 12896.1} {"step": 3554, "train_loss": 3.9702939987182617, "lr": 0.0003933905743309541, "tps": 18059, "wall": 12901.1} {"step": 3555, "train_loss": 3.9526543617248535, "lr": 0.0003933854295142242, "tps": 18057, "wall": 12906.0} {"step": 3556, "train_loss": 3.866842269897461, "lr": 0.0003933802827333748, "tps": 18055, "wall": 12911.0} {"step": 3557, "train_loss": 3.887979507446289, "lr": 0.00039337513398846405, "tps": 18053, "wall": 12915.9} {"step": 3558, "train_loss": 3.871729850769043, "lr": 0.0003933699832795505, "tps": 18051, "wall": 12920.9} {"step": 3559, "train_loss": 3.8276724815368652, "lr": 0.00039336483060669236, "tps": 18049, "wall": 12925.9} {"step": 3560, "train_loss": 3.8608810901641846, "lr": 0.0003933596759699481, "tps": 18047, "wall": 12930.8} {"step": 3561, "train_loss": 3.902402400970459, "lr": 0.000393354519369376, "tps": 18045, "wall": 12935.8} {"step": 3562, "train_loss": 3.9797439575195312, "lr": 0.0003933493608050345, "tps": 18044, "wall": 12940.8} {"step": 3563, "train_loss": 3.887563705444336, "lr": 0.00039334420027698207, "tps": 18042, "wall": 12945.8} {"step": 3564, "train_loss": 3.907241106033325, "lr": 0.0003933390377852773, "tps": 18040, "wall": 12950.7} {"step": 3565, "train_loss": 3.92022705078125, "lr": 0.00039333387332997837, "tps": 18038, "wall": 12955.7} {"step": 3566, "train_loss": 3.9422082901000977, "lr": 0.00039332870691114396, "tps": 18036, "wall": 12960.7} {"step": 3567, "train_loss": 3.9235358238220215, "lr": 0.00039332353852883264, "tps": 18034, "wall": 12965.7} {"step": 3568, "train_loss": 3.975511312484741, "lr": 0.0003933183681831029, "tps": 18032, "wall": 12970.6} {"step": 3569, "train_loss": 3.925790786743164, "lr": 0.00039331319587401325, "tps": 18030, "wall": 12975.7} {"step": 3570, "train_loss": 3.881310224533081, "lr": 0.00039330802160162244, "tps": 18029, "wall": 12980.7} {"step": 3571, "train_loss": 3.9284520149230957, "lr": 0.0003933028453659889, "tps": 18027, "wall": 12985.6} {"step": 3572, "train_loss": 3.873654365539551, "lr": 0.00039329766716717136, "tps": 18025, "wall": 12990.6} {"step": 3573, "train_loss": 4.015933990478516, "lr": 0.0003932924870052285, "tps": 18023, "wall": 12995.6} {"step": 3574, "train_loss": 3.9128570556640625, "lr": 0.0003932873048802189, "tps": 18021, "wall": 13000.5} {"step": 3575, "train_loss": 3.9091286659240723, "lr": 0.00039328212079220144, "tps": 18019, "wall": 13005.5} {"step": 3576, "train_loss": 3.852356195449829, "lr": 0.00039327693474123474, "tps": 18017, "wall": 13010.5} {"step": 3577, "train_loss": 3.876189708709717, "lr": 0.0003932717467273775, "tps": 18016, "wall": 13015.5} {"step": 3578, "train_loss": 3.8631367683410645, "lr": 0.00039326655675068855, "tps": 18014, "wall": 13020.4} {"step": 3579, "train_loss": 3.8807904720306396, "lr": 0.00039326136481122664, "tps": 18012, "wall": 13025.4} {"step": 3580, "train_loss": 3.8573999404907227, "lr": 0.0003932561709090506, "tps": 18010, "wall": 13030.4} {"step": 3581, "train_loss": 3.914947032928467, "lr": 0.00039325097504421935, "tps": 18008, "wall": 13035.3} {"step": 3582, "train_loss": 3.9604320526123047, "lr": 0.00039324577721679165, "tps": 18006, "wall": 13040.3} {"step": 3583, "train_loss": 3.950608253479004, "lr": 0.00039324057742682646, "tps": 18005, "wall": 13045.3} {"step": 3584, "train_loss": 3.91163969039917, "lr": 0.00039323537567438263, "tps": 18003, "wall": 13050.2} {"step": 3585, "train_loss": 3.876283884048462, "lr": 0.00039323017195951905, "tps": 18001, "wall": 13055.2} {"step": 3586, "train_loss": 3.9236085414886475, "lr": 0.0003932249662822947, "tps": 17999, "wall": 13060.2} {"step": 3587, "train_loss": 3.828700542449951, "lr": 0.00039321975864276855, "tps": 17997, "wall": 13065.2} {"step": 3588, "train_loss": 3.891329288482666, "lr": 0.00039321454904099964, "tps": 17995, "wall": 13070.1} {"step": 3589, "train_loss": 3.8767452239990234, "lr": 0.00039320933747704695, "tps": 17993, "wall": 13075.2} {"step": 3590, "train_loss": 4.001420497894287, "lr": 0.0003932041239509695, "tps": 17992, "wall": 13080.1} {"step": 3591, "train_loss": 3.92649507522583, "lr": 0.0003931989084628264, "tps": 17990, "wall": 13085.1} {"step": 3592, "train_loss": 3.83231258392334, "lr": 0.00039319369101267667, "tps": 17988, "wall": 13090.0} {"step": 3593, "train_loss": 3.962207317352295, "lr": 0.00039318847160057943, "tps": 17986, "wall": 13095.0} {"step": 3594, "train_loss": 3.8837623596191406, "lr": 0.0003931832502265938, "tps": 17984, "wall": 13099.9} {"step": 3595, "train_loss": 3.778027057647705, "lr": 0.000393178026890779, "tps": 17983, "wall": 13104.9} {"step": 3596, "train_loss": 3.902512788772583, "lr": 0.0003931728015931941, "tps": 17981, "wall": 13109.9} {"step": 3597, "train_loss": 3.997633457183838, "lr": 0.0003931675743338983, "tps": 17979, "wall": 13114.8} {"step": 3598, "train_loss": 4.001363277435303, "lr": 0.0003931623451129509, "tps": 17977, "wall": 13119.8} {"step": 3599, "train_loss": 3.9191622734069824, "lr": 0.00039315711393041105, "tps": 17975, "wall": 13124.7} {"step": 3600, "train_loss": 3.960968017578125, "lr": 0.0003931518807863381, "tps": 17974, "wall": 13129.7} {"step": 3601, "train_loss": 3.9172821044921875, "lr": 0.0003931466456807913, "tps": 17972, "wall": 13134.7} {"step": 3602, "train_loss": 3.8922858238220215, "lr": 0.00039314140861382985, "tps": 17970, "wall": 13139.7} {"step": 3603, "train_loss": 3.8443591594696045, "lr": 0.0003931361695855132, "tps": 17968, "wall": 13144.7} {"step": 3604, "train_loss": 3.9652912616729736, "lr": 0.0003931309285959006, "tps": 17966, "wall": 13149.6} {"step": 3605, "train_loss": 3.9444377422332764, "lr": 0.0003931256856450515, "tps": 17965, "wall": 13154.6} {"step": 3606, "train_loss": 3.9564666748046875, "lr": 0.0003931204407330253, "tps": 17963, "wall": 13159.6} {"step": 3607, "train_loss": 3.932126998901367, "lr": 0.00039311519385988136, "tps": 17961, "wall": 13164.5} {"step": 3608, "train_loss": 3.99151349067688, "lr": 0.0003931099450256791, "tps": 17959, "wall": 13169.5} {"step": 3609, "train_loss": 3.835228681564331, "lr": 0.0003931046942304781, "tps": 17957, "wall": 13174.4} {"step": 3610, "train_loss": 3.824492931365967, "lr": 0.0003930994414743377, "tps": 17956, "wall": 13179.4} {"step": 3611, "train_loss": 3.889345645904541, "lr": 0.0003930941867573175, "tps": 17954, "wall": 13184.4} {"step": 3612, "train_loss": 3.8445138931274414, "lr": 0.00039308893007947696, "tps": 17952, "wall": 13189.3} {"step": 3613, "train_loss": 3.9463934898376465, "lr": 0.0003930836714408757, "tps": 17950, "wall": 13194.4} {"step": 3614, "train_loss": 3.962522029876709, "lr": 0.00039307841084157316, "tps": 17948, "wall": 13199.3} {"step": 3615, "train_loss": 3.8762454986572266, "lr": 0.0003930731482816291, "tps": 17947, "wall": 13204.3} {"step": 3616, "train_loss": 3.8397457599639893, "lr": 0.000393067883761103, "tps": 17945, "wall": 13209.2} {"step": 3617, "train_loss": 3.826876163482666, "lr": 0.00039306261728005456, "tps": 17943, "wall": 13214.2} {"step": 3618, "train_loss": 3.900045871734619, "lr": 0.00039305734883854354, "tps": 17941, "wall": 13219.2} {"step": 3619, "train_loss": 3.9714741706848145, "lr": 0.00039305207843662933, "tps": 17939, "wall": 13224.1} {"step": 3620, "train_loss": 4.024166584014893, "lr": 0.0003930468060743719, "tps": 17938, "wall": 13229.1} {"step": 3621, "train_loss": 3.8830130100250244, "lr": 0.00039304153175183094, "tps": 17936, "wall": 13234.0} {"step": 3622, "train_loss": 3.8627607822418213, "lr": 0.000393036255469066, "tps": 17934, "wall": 13239.0} {"step": 3623, "train_loss": 3.8720269203186035, "lr": 0.00039303097722613714, "tps": 17932, "wall": 13244.0} {"step": 3624, "train_loss": 3.8017518520355225, "lr": 0.000393025697023104, "tps": 17931, "wall": 13248.9} {"step": 3625, "train_loss": 3.9046435356140137, "lr": 0.0003930204148600264, "tps": 17929, "wall": 13253.9} {"step": 3626, "train_loss": 3.7958474159240723, "lr": 0.00039301513073696404, "tps": 17927, "wall": 13258.9} {"step": 3627, "train_loss": 3.8754844665527344, "lr": 0.00039300984465397707, "tps": 17925, "wall": 13263.9} {"step": 3628, "train_loss": 3.912109613418579, "lr": 0.00039300455661112516, "tps": 17923, "wall": 13268.8} {"step": 3629, "train_loss": 3.9366044998168945, "lr": 0.0003929992666084683, "tps": 17922, "wall": 13273.8} {"step": 3630, "train_loss": 3.8420276641845703, "lr": 0.00039299397464606634, "tps": 17920, "wall": 13278.7} {"step": 3631, "train_loss": 3.898805618286133, "lr": 0.00039298868072397934, "tps": 17918, "wall": 13283.7} {"step": 3632, "train_loss": 3.8954927921295166, "lr": 0.00039298338484226717, "tps": 17916, "wall": 13288.7} {"step": 3633, "train_loss": 3.8141932487487793, "lr": 0.0003929780870009898, "tps": 17915, "wall": 13293.6} {"step": 3634, "train_loss": 3.8172945976257324, "lr": 0.0003929727872002074, "tps": 17913, "wall": 13298.6} {"step": 3635, "train_loss": 3.9509048461914062, "lr": 0.0003929674854399799, "tps": 17911, "wall": 13303.6} {"step": 3636, "train_loss": 3.7712132930755615, "lr": 0.00039296218172036733, "tps": 17909, "wall": 13308.5} {"step": 3637, "train_loss": 3.9239883422851562, "lr": 0.0003929568760414298, "tps": 17908, "wall": 13313.5} {"step": 3638, "train_loss": 3.8553056716918945, "lr": 0.0003929515684032275, "tps": 17906, "wall": 13318.5} {"step": 3639, "train_loss": 3.9894587993621826, "lr": 0.0003929462588058204, "tps": 17904, "wall": 13323.4} {"step": 3640, "train_loss": 3.8353404998779297, "lr": 0.00039294094724926876, "tps": 17902, "wall": 13328.4} {"step": 3641, "train_loss": 3.9440717697143555, "lr": 0.00039293563373363265, "tps": 17901, "wall": 13333.4} {"step": 3642, "train_loss": 3.775904417037964, "lr": 0.0003929303182589724, "tps": 17899, "wall": 13338.3} {"step": 3643, "train_loss": 3.816129684448242, "lr": 0.0003929250008253481, "tps": 17897, "wall": 13343.3} {"step": 3644, "train_loss": 3.9240074157714844, "lr": 0.0003929196814328201, "tps": 17895, "wall": 13348.3} {"step": 3645, "train_loss": 3.8831865787506104, "lr": 0.0003929143600814485, "tps": 17894, "wall": 13353.2} {"step": 3646, "train_loss": 3.809521198272705, "lr": 0.00039290903677129373, "tps": 17892, "wall": 13358.2} {"step": 3647, "train_loss": 3.8878421783447266, "lr": 0.00039290371150241607, "tps": 17890, "wall": 13363.2} {"step": 3648, "train_loss": 3.79361629486084, "lr": 0.0003928983842748758, "tps": 17888, "wall": 13368.1} {"step": 3649, "train_loss": 3.898106575012207, "lr": 0.0003928930550887332, "tps": 17887, "wall": 13373.2} {"step": 3650, "train_loss": 3.9117989540100098, "lr": 0.0003928877239440488, "tps": 17885, "wall": 13378.1} {"step": 3651, "train_loss": 4.002474784851074, "lr": 0.0003928823908408828, "tps": 17883, "wall": 13383.1} {"step": 3652, "train_loss": 3.8685684204101562, "lr": 0.00039287705577929587, "tps": 17881, "wall": 13388.0} {"step": 3653, "train_loss": 3.8221333026885986, "lr": 0.00039287171875934825, "tps": 17880, "wall": 13393.0} {"step": 3654, "train_loss": 3.928098201751709, "lr": 0.0003928663797811004, "tps": 17878, "wall": 13398.0} {"step": 3655, "train_loss": 3.846346855163574, "lr": 0.0003928610388446129, "tps": 17876, "wall": 13402.9} {"step": 3656, "train_loss": 3.8438706398010254, "lr": 0.0003928556959499462, "tps": 17874, "wall": 13407.9} {"step": 3657, "train_loss": 3.861388921737671, "lr": 0.0003928503510971608, "tps": 17873, "wall": 13412.8} {"step": 3658, "train_loss": 3.9894089698791504, "lr": 0.0003928450042863173, "tps": 17871, "wall": 13417.8} {"step": 3659, "train_loss": 3.861660957336426, "lr": 0.0003928396555174762, "tps": 17869, "wall": 13422.8} {"step": 3660, "train_loss": 3.8357748985290527, "lr": 0.00039283430479069816, "tps": 17867, "wall": 13427.8} {"step": 3661, "train_loss": 3.8804731369018555, "lr": 0.0003928289521060437, "tps": 17866, "wall": 13432.8} {"step": 3662, "train_loss": 3.905164957046509, "lr": 0.00039282359746357367, "tps": 17864, "wall": 13437.8} {"step": 3663, "train_loss": 3.851778268814087, "lr": 0.00039281824086334844, "tps": 17862, "wall": 13442.7} {"step": 3664, "train_loss": 3.8038170337677, "lr": 0.0003928128823054289, "tps": 17861, "wall": 13447.7} {"step": 3665, "train_loss": 3.8769826889038086, "lr": 0.0003928075217898756, "tps": 17859, "wall": 13452.6} {"step": 3666, "train_loss": 3.9334473609924316, "lr": 0.0003928021593167494, "tps": 17857, "wall": 13457.6} {"step": 3667, "train_loss": 3.9528393745422363, "lr": 0.00039279679488611103, "tps": 17855, "wall": 13462.6} {"step": 3668, "train_loss": 3.9304990768432617, "lr": 0.0003927914284980212, "tps": 17854, "wall": 13467.5} {"step": 3669, "train_loss": 3.7939085960388184, "lr": 0.00039278606015254067, "tps": 17852, "wall": 13472.5} {"step": 3670, "train_loss": 3.860610008239746, "lr": 0.0003927806898497303, "tps": 17850, "wall": 13477.4} {"step": 3671, "train_loss": 3.9587903022766113, "lr": 0.000392775317589651, "tps": 17849, "wall": 13482.4} {"step": 3672, "train_loss": 3.9624385833740234, "lr": 0.0003927699433723635, "tps": 17847, "wall": 13487.4} {"step": 3673, "train_loss": 3.9559481143951416, "lr": 0.00039276456719792874, "tps": 17845, "wall": 13492.4} {"step": 3674, "train_loss": 4.030264854431152, "lr": 0.00039275918906640767, "tps": 17843, "wall": 13497.3} {"step": 3675, "train_loss": 3.9129629135131836, "lr": 0.00039275380897786107, "tps": 17842, "wall": 13502.3} {"step": 3676, "train_loss": 3.8682942390441895, "lr": 0.00039274842693235004, "tps": 17840, "wall": 13507.2} {"step": 3677, "train_loss": 3.8985719680786133, "lr": 0.00039274304292993546, "tps": 17838, "wall": 13512.2} {"step": 3678, "train_loss": 3.806602716445923, "lr": 0.00039273765697067837, "tps": 17837, "wall": 13517.2} {"step": 3679, "train_loss": 3.902900457382202, "lr": 0.00039273226905463975, "tps": 17835, "wall": 13522.1} {"step": 3680, "train_loss": 3.8755173683166504, "lr": 0.0003927268791818806, "tps": 17833, "wall": 13527.1} {"step": 3681, "train_loss": 3.9543938636779785, "lr": 0.00039272148735246205, "tps": 17832, "wall": 13532.0} {"step": 3682, "train_loss": 3.941621780395508, "lr": 0.00039271609356644516, "tps": 17830, "wall": 13537.0} {"step": 3683, "train_loss": 3.8930654525756836, "lr": 0.00039271069782389096, "tps": 17828, "wall": 13541.9} {"step": 3684, "train_loss": 3.9667317867279053, "lr": 0.0003927053001248607, "tps": 17826, "wall": 13546.9} {"step": 3685, "train_loss": 3.884272575378418, "lr": 0.0003926999004694154, "tps": 17825, "wall": 13551.9} {"step": 3686, "train_loss": 3.883617401123047, "lr": 0.00039269449885761637, "tps": 17823, "wall": 13556.9} {"step": 3687, "train_loss": 3.7862064838409424, "lr": 0.0003926890952895247, "tps": 17821, "wall": 13561.8} {"step": 3688, "train_loss": 3.972459316253662, "lr": 0.00039268368976520156, "tps": 17820, "wall": 13566.8} {"step": 3689, "train_loss": 3.8936004638671875, "lr": 0.00039267828228470823, "tps": 17818, "wall": 13571.7} {"step": 3690, "train_loss": 4.015218257904053, "lr": 0.00039267287284810596, "tps": 17816, "wall": 13576.7} {"step": 3691, "train_loss": 3.945098400115967, "lr": 0.0003926674614554561, "tps": 17815, "wall": 13581.7} {"step": 3692, "train_loss": 4.01741886138916, "lr": 0.0003926620481068199, "tps": 17813, "wall": 13586.6} {"step": 3693, "train_loss": 3.929537296295166, "lr": 0.0003926566328022587, "tps": 17811, "wall": 13591.6} {"step": 3694, "train_loss": 3.8857483863830566, "lr": 0.0003926512155418338, "tps": 17810, "wall": 13596.5} {"step": 3695, "train_loss": 3.950629472732544, "lr": 0.00039264579632560654, "tps": 17808, "wall": 13601.5} {"step": 3696, "train_loss": 3.968716621398926, "lr": 0.0003926403751536384, "tps": 17806, "wall": 13606.5} {"step": 3697, "train_loss": 3.7847437858581543, "lr": 0.00039263495202599075, "tps": 17804, "wall": 13611.5} {"step": 3698, "train_loss": 3.870750904083252, "lr": 0.000392629526942725, "tps": 17803, "wall": 13616.5} {"step": 3699, "train_loss": 3.8978018760681152, "lr": 0.00039262409990390264, "tps": 17801, "wall": 13621.5} {"step": 3700, "train_loss": 3.9073758125305176, "lr": 0.00039261867090958517, "tps": 17799, "wall": 13626.4} {"step": 3701, "train_loss": 3.8514130115509033, "lr": 0.00039261323995983406, "tps": 17798, "wall": 13631.4} {"step": 3702, "train_loss": 3.899709939956665, "lr": 0.00039260780705471077, "tps": 17796, "wall": 13636.4} {"step": 3703, "train_loss": 3.84708833694458, "lr": 0.00039260237219427695, "tps": 17794, "wall": 13641.3} {"step": 3704, "train_loss": 3.9190456867218018, "lr": 0.0003925969353785941, "tps": 17793, "wall": 13646.3} {"step": 3705, "train_loss": 3.900812864303589, "lr": 0.0003925914966077238, "tps": 17791, "wall": 13651.2} {"step": 3706, "train_loss": 3.77408766746521, "lr": 0.0003925860558817278, "tps": 17789, "wall": 13656.2} {"step": 3707, "train_loss": 3.9838624000549316, "lr": 0.0003925806132006675, "tps": 17788, "wall": 13661.2} {"step": 3708, "train_loss": 3.8499348163604736, "lr": 0.0003925751685646047, "tps": 17786, "wall": 13666.2} {"step": 3709, "train_loss": 3.8624157905578613, "lr": 0.00039256972197360113, "tps": 17784, "wall": 13671.1} {"step": 3710, "train_loss": 3.8633570671081543, "lr": 0.0003925642734277184, "tps": 17783, "wall": 13676.2} {"step": 3711, "train_loss": 3.935556173324585, "lr": 0.00039255882292701813, "tps": 17781, "wall": 13681.1} {"step": 3712, "train_loss": 3.917236089706421, "lr": 0.0003925533704715623, "tps": 17779, "wall": 13686.1} {"step": 3713, "train_loss": 3.9200973510742188, "lr": 0.0003925479160614125, "tps": 17778, "wall": 13691.1} {"step": 3714, "train_loss": 3.8968844413757324, "lr": 0.0003925424596966306, "tps": 17776, "wall": 13696.0} {"step": 3715, "train_loss": 3.7920572757720947, "lr": 0.0003925370013772784, "tps": 17774, "wall": 13701.0} {"step": 3716, "train_loss": 3.903286933898926, "lr": 0.00039253154110341766, "tps": 17773, "wall": 13706.0} {"step": 3717, "train_loss": 3.9864747524261475, "lr": 0.0003925260788751103, "tps": 17771, "wall": 13710.9} {"step": 3718, "train_loss": 3.9226276874542236, "lr": 0.00039252061469241816, "tps": 17769, "wall": 13715.9} {"step": 3719, "train_loss": 3.8096096515655518, "lr": 0.00039251514855540324, "tps": 17768, "wall": 13720.9} {"step": 3720, "train_loss": 3.9133548736572266, "lr": 0.00039250968046412735, "tps": 17766, "wall": 13725.8} {"step": 3721, "train_loss": 3.8065285682678223, "lr": 0.0003925042104186524, "tps": 17764, "wall": 13730.8} {"step": 3722, "train_loss": 3.833378553390503, "lr": 0.0003924987384190405, "tps": 17763, "wall": 13735.8} {"step": 3723, "train_loss": 3.933864116668701, "lr": 0.00039249326446535353, "tps": 17761, "wall": 13740.8} {"step": 3724, "train_loss": 3.8873744010925293, "lr": 0.00039248778855765354, "tps": 17759, "wall": 13745.7} {"step": 3725, "train_loss": 3.9157843589782715, "lr": 0.0003924823106960026, "tps": 17758, "wall": 13750.7} {"step": 3726, "train_loss": 3.8413593769073486, "lr": 0.00039247683088046263, "tps": 17756, "wall": 13755.7} {"step": 3727, "train_loss": 3.8914613723754883, "lr": 0.0003924713491110958, "tps": 17754, "wall": 13760.6} {"step": 3728, "train_loss": 3.872584342956543, "lr": 0.00039246586538796424, "tps": 17753, "wall": 13765.6} {"step": 3729, "train_loss": 3.8450050354003906, "lr": 0.00039246037971113, "tps": 17751, "wall": 13770.5} {"step": 3730, "train_loss": 3.860218048095703, "lr": 0.00039245489208065526, "tps": 17749, "wall": 13775.5} {"step": 3731, "train_loss": 3.9532127380371094, "lr": 0.00039244940249660214, "tps": 17748, "wall": 13780.5} {"step": 3732, "train_loss": 3.9269206523895264, "lr": 0.0003924439109590329, "tps": 17746, "wall": 13785.5} {"step": 3733, "train_loss": 3.9128847122192383, "lr": 0.0003924384174680097, "tps": 17745, "wall": 13790.4} {"step": 3734, "train_loss": 3.867358922958374, "lr": 0.00039243292202359475, "tps": 17743, "wall": 13795.4} {"step": 3735, "train_loss": 3.9029459953308105, "lr": 0.00039242742462585037, "tps": 17741, "wall": 13800.4} {"step": 3736, "train_loss": 3.8868443965911865, "lr": 0.00039242192527483874, "tps": 17740, "wall": 13805.4} {"step": 3737, "train_loss": 3.8758392333984375, "lr": 0.00039241642397062226, "tps": 17738, "wall": 13810.3} {"step": 3738, "train_loss": 3.799976348876953, "lr": 0.00039241092071326327, "tps": 17736, "wall": 13815.4} {"step": 3739, "train_loss": 3.8033814430236816, "lr": 0.0003924054155028239, "tps": 17735, "wall": 13820.4} {"step": 3740, "train_loss": 3.901475191116333, "lr": 0.0003923999083393667, "tps": 17733, "wall": 13825.3} {"step": 3741, "train_loss": 3.979853868484497, "lr": 0.000392394399222954, "tps": 17731, "wall": 13830.3} {"step": 3742, "train_loss": 3.9089508056640625, "lr": 0.00039238888815364836, "tps": 17730, "wall": 13835.2} {"step": 3743, "train_loss": 3.851008415222168, "lr": 0.00039238337513151195, "tps": 17728, "wall": 13840.2} {"step": 3744, "train_loss": 3.913114547729492, "lr": 0.00039237786015660736, "tps": 17726, "wall": 13845.2} {"step": 3745, "train_loss": 3.854548454284668, "lr": 0.000392372343228997, "tps": 17725, "wall": 13850.1} {"step": 3746, "train_loss": 3.9428577423095703, "lr": 0.0003923668243487434, "tps": 17723, "wall": 13855.2} {"step": 3747, "train_loss": 3.8646085262298584, "lr": 0.00039236130351590916, "tps": 17722, "wall": 13860.1} {"step": 3748, "train_loss": 3.887113094329834, "lr": 0.0003923557807305567, "tps": 17720, "wall": 13865.1} {"step": 3749, "train_loss": 3.8196561336517334, "lr": 0.00039235025599274867, "tps": 17718, "wall": 13870.0} {"step": 3750, "train_loss": 3.79364275932312, "lr": 0.0003923447293025476, "tps": 17717, "wall": 13875.0} {"step": 3751, "train_loss": 3.8550467491149902, "lr": 0.0003923392006600162, "tps": 17715, "wall": 13880.0} {"step": 3752, "train_loss": 3.8624374866485596, "lr": 0.0003923336700652168, "tps": 17713, "wall": 13884.9} {"step": 3753, "train_loss": 3.8481616973876953, "lr": 0.0003923281375182124, "tps": 17712, "wall": 13889.9} {"step": 3754, "train_loss": 3.794480800628662, "lr": 0.0003923226030190656, "tps": 17710, "wall": 13894.9} {"step": 3755, "train_loss": 3.9017536640167236, "lr": 0.00039231706656783896, "tps": 17709, "wall": 13899.8} {"step": 3756, "train_loss": 3.941189765930176, "lr": 0.0003923115281645953, "tps": 17707, "wall": 13904.8} {"step": 3757, "train_loss": 3.7827725410461426, "lr": 0.00039230598780939723, "tps": 17705, "wall": 13909.8} {"step": 3758, "train_loss": 3.9321374893188477, "lr": 0.0003923004455023076, "tps": 17704, "wall": 13914.8} {"step": 3759, "train_loss": 3.870551824569702, "lr": 0.00039229490124338933, "tps": 17702, "wall": 13919.8} {"step": 3760, "train_loss": 3.837006092071533, "lr": 0.000392289355032705, "tps": 17700, "wall": 13924.7} {"step": 3761, "train_loss": 3.9230008125305176, "lr": 0.00039228380687031763, "tps": 17699, "wall": 13929.7} {"step": 3762, "train_loss": 3.916874408721924, "lr": 0.00039227825675628987, "tps": 17697, "wall": 13934.6} {"step": 3763, "train_loss": 3.7962822914123535, "lr": 0.00039227270469068475, "tps": 17696, "wall": 13939.6} {"step": 3764, "train_loss": 3.876532554626465, "lr": 0.0003922671506735651, "tps": 17694, "wall": 13944.6} {"step": 3765, "train_loss": 3.8720147609710693, "lr": 0.0003922615947049939, "tps": 17692, "wall": 13949.5} {"step": 3766, "train_loss": 3.8772830963134766, "lr": 0.000392256036785034, "tps": 17691, "wall": 13954.5} {"step": 3767, "train_loss": 3.9117355346679688, "lr": 0.00039225047691374837, "tps": 17689, "wall": 13959.5} {"step": 3768, "train_loss": 3.8712027072906494, "lr": 0.00039224491509120006, "tps": 17688, "wall": 13964.5} {"step": 3769, "train_loss": 3.869211435317993, "lr": 0.000392239351317452, "tps": 17686, "wall": 13969.4} {"step": 3770, "train_loss": 3.81581974029541, "lr": 0.00039223378559256726, "tps": 17684, "wall": 13974.5} {"step": 3771, "train_loss": 4.004430294036865, "lr": 0.00039222821791660886, "tps": 17683, "wall": 13979.4} {"step": 3772, "train_loss": 3.8172121047973633, "lr": 0.0003922226482896399, "tps": 17681, "wall": 13984.4} {"step": 3773, "train_loss": 3.774496555328369, "lr": 0.0003922170767117235, "tps": 17680, "wall": 13989.3} {"step": 3774, "train_loss": 3.8284268379211426, "lr": 0.0003922115031829227, "tps": 17678, "wall": 13994.3} {"step": 3775, "train_loss": 3.815664768218994, "lr": 0.0003922059277033007, "tps": 17676, "wall": 13999.3} {"step": 3776, "train_loss": 3.8265676498413086, "lr": 0.0003922003502729206, "tps": 17675, "wall": 14004.2} {"step": 3777, "train_loss": 3.901569366455078, "lr": 0.0003921947708918457, "tps": 17673, "wall": 14009.2} {"step": 3778, "train_loss": 3.9599037170410156, "lr": 0.000392189189560139, "tps": 17672, "wall": 14014.2} {"step": 3779, "train_loss": 3.8980274200439453, "lr": 0.0003921836062778639, "tps": 17670, "wall": 14019.1} {"step": 3780, "train_loss": 3.7997350692749023, "lr": 0.0003921780210450836, "tps": 17668, "wall": 14024.1} {"step": 3781, "train_loss": 3.9249794483184814, "lr": 0.00039217243386186135, "tps": 17667, "wall": 14029.1} {"step": 3782, "train_loss": 3.9253382682800293, "lr": 0.0003921668447282605, "tps": 17665, "wall": 14034.1} {"step": 3783, "train_loss": 3.7501320838928223, "lr": 0.0003921612536443442, "tps": 17664, "wall": 14039.0} {"step": 3784, "train_loss": 3.960920810699463, "lr": 0.00039215566061017603, "tps": 17662, "wall": 14044.0} {"step": 3785, "train_loss": 3.9133291244506836, "lr": 0.00039215006562581914, "tps": 17661, "wall": 14049.0} {"step": 3786, "train_loss": 4.0058274269104, "lr": 0.0003921444686913371, "tps": 17659, "wall": 14053.9} {"step": 3787, "train_loss": 3.8170158863067627, "lr": 0.00039213886980679315, "tps": 17657, "wall": 14058.9} {"step": 3788, "train_loss": 3.9862804412841797, "lr": 0.00039213326897225074, "tps": 17656, "wall": 14063.9} {"step": 3789, "train_loss": 3.9510135650634766, "lr": 0.00039212766618777333, "tps": 17654, "wall": 14068.8} {"step": 3790, "train_loss": 3.7716517448425293, "lr": 0.0003921220614534245, "tps": 17653, "wall": 14073.8} {"step": 3791, "train_loss": 3.7628421783447266, "lr": 0.00039211645476926757, "tps": 17651, "wall": 14078.7} {"step": 3792, "train_loss": 3.9046335220336914, "lr": 0.00039211084613536613, "tps": 17650, "wall": 14083.7} {"step": 3793, "train_loss": 3.9105489253997803, "lr": 0.00039210523555178377, "tps": 17648, "wall": 14088.7} {"step": 3794, "train_loss": 3.87518572807312, "lr": 0.0003920996230185839, "tps": 17646, "wall": 14093.7} {"step": 3795, "train_loss": 3.8354859352111816, "lr": 0.00039209400853583025, "tps": 17645, "wall": 14098.6} {"step": 3796, "train_loss": 3.9144163131713867, "lr": 0.0003920883921035864, "tps": 17643, "wall": 14103.6} {"step": 3797, "train_loss": 3.8145432472229004, "lr": 0.00039208277372191583, "tps": 17642, "wall": 14108.6} {"step": 3798, "train_loss": 3.8235931396484375, "lr": 0.00039207715339088236, "tps": 17640, "wall": 14113.5} {"step": 3799, "train_loss": 3.8662943840026855, "lr": 0.00039207153111054955, "tps": 17639, "wall": 14118.5} {"step": 3800, "train_loss": 3.8827648162841797, "lr": 0.0003920659068809812, "tps": 17637, "wall": 14123.5} {"step": 3801, "train_loss": 3.8302364349365234, "lr": 0.00039206028070224087, "tps": 17635, "wall": 14128.4} {"step": 3802, "train_loss": 3.8227059841156006, "lr": 0.00039205465257439244, "tps": 17634, "wall": 14133.4} {"step": 3803, "train_loss": 3.8051280975341797, "lr": 0.0003920490224974995, "tps": 17632, "wall": 14138.3} {"step": 3804, "train_loss": 3.8402204513549805, "lr": 0.000392043390471626, "tps": 17631, "wall": 14143.3} {"step": 3805, "train_loss": 3.9847381114959717, "lr": 0.0003920377564968357, "tps": 17629, "wall": 14148.2} {"step": 3806, "train_loss": 3.77006196975708, "lr": 0.00039203212057319233, "tps": 17628, "wall": 14153.3} {"step": 3807, "train_loss": 3.929340362548828, "lr": 0.00039202648270075975, "tps": 17626, "wall": 14158.2} {"step": 3808, "train_loss": 3.746293067932129, "lr": 0.000392020842879602, "tps": 17625, "wall": 14163.2} {"step": 3809, "train_loss": 3.912416934967041, "lr": 0.0003920152011097827, "tps": 17623, "wall": 14168.1} {"step": 3810, "train_loss": 3.9168596267700195, "lr": 0.000392009557391366, "tps": 17621, "wall": 14173.1} {"step": 3811, "train_loss": 3.8405466079711914, "lr": 0.0003920039117244156, "tps": 17620, "wall": 14178.2} {"step": 3812, "train_loss": 3.8642420768737793, "lr": 0.00039199826410899564, "tps": 17618, "wall": 14183.1} {"step": 3813, "train_loss": 3.9321556091308594, "lr": 0.0003919926145451701, "tps": 17617, "wall": 14188.1} {"step": 3814, "train_loss": 3.9939098358154297, "lr": 0.0003919869630330029, "tps": 17615, "wall": 14193.0} {"step": 3815, "train_loss": 3.784533977508545, "lr": 0.00039198130957255803, "tps": 17614, "wall": 14198.0} {"step": 3816, "train_loss": 3.9027557373046875, "lr": 0.0003919756541638996, "tps": 17612, "wall": 14203.0} {"step": 3817, "train_loss": 3.829789876937866, "lr": 0.00039196999680709166, "tps": 17611, "wall": 14207.9} {"step": 3818, "train_loss": 3.8669676780700684, "lr": 0.0003919643375021983, "tps": 17609, "wall": 14213.0} {"step": 3819, "train_loss": 3.905076026916504, "lr": 0.00039195867624928365, "tps": 17607, "wall": 14217.9} {"step": 3820, "train_loss": 3.8118715286254883, "lr": 0.0003919530130484118, "tps": 17606, "wall": 14222.8} {"step": 3821, "train_loss": 4.021792888641357, "lr": 0.0003919473478996469, "tps": 17604, "wall": 14227.8} {"step": 3822, "train_loss": 3.8909425735473633, "lr": 0.0003919416808030531, "tps": 17603, "wall": 14232.7} {"step": 3823, "train_loss": 3.924471139907837, "lr": 0.00039193601175869467, "tps": 17601, "wall": 14237.7} {"step": 3824, "train_loss": 3.8652358055114746, "lr": 0.0003919303407666358, "tps": 17599, "wall": 14243.1} {"step": 3825, "train_loss": 3.760000705718994, "lr": 0.0003919246678269407, "tps": 17598, "wall": 14248.1} {"step": 3826, "train_loss": 3.922833204269409, "lr": 0.0003919189929396737, "tps": 17596, "wall": 14253.2} {"step": 3827, "train_loss": 3.86663818359375, "lr": 0.000391913316104899, "tps": 17595, "wall": 14258.1} {"step": 3828, "train_loss": 3.860391855239868, "lr": 0.000391907637322681, "tps": 17593, "wall": 14263.1} {"step": 3829, "train_loss": 3.919877052307129, "lr": 0.00039190195659308404, "tps": 17591, "wall": 14268.1} {"step": 3830, "train_loss": 3.8658602237701416, "lr": 0.0003918962739161723, "tps": 17590, "wall": 14273.1} {"step": 3831, "train_loss": 3.9187393188476562, "lr": 0.00039189058929201036, "tps": 17588, "wall": 14278.1} {"step": 3832, "train_loss": 3.884340286254883, "lr": 0.00039188490272066244, "tps": 17587, "wall": 14283.0} {"step": 3833, "train_loss": 3.7978029251098633, "lr": 0.0003918792142021932, "tps": 17585, "wall": 14288.0} {"step": 3834, "train_loss": 3.878748893737793, "lr": 0.00039187352373666677, "tps": 17584, "wall": 14293.0} {"step": 3835, "train_loss": 3.953338623046875, "lr": 0.0003918678313241478, "tps": 17582, "wall": 14298.0} {"step": 3836, "train_loss": 3.946770191192627, "lr": 0.00039186213696470074, "tps": 17581, "wall": 14303.0} {"step": 3837, "train_loss": 3.865224838256836, "lr": 0.0003918564406583901, "tps": 17579, "wall": 14307.9} {"step": 3838, "train_loss": 3.8715155124664307, "lr": 0.00039185074240528044, "tps": 17578, "wall": 14312.9} {"step": 3839, "train_loss": 3.897486686706543, "lr": 0.00039184504220543624, "tps": 17576, "wall": 14317.8} {"step": 3840, "train_loss": 3.8722083568573, "lr": 0.0003918393400589221, "tps": 17575, "wall": 14322.8} {"step": 3841, "train_loss": 3.856583595275879, "lr": 0.0003918336359658026, "tps": 17573, "wall": 14327.7} {"step": 3842, "train_loss": 3.9959638118743896, "lr": 0.0003918279299261424, "tps": 17571, "wall": 14332.8} {"step": 3843, "train_loss": 3.8258423805236816, "lr": 0.00039182222194000614, "tps": 17570, "wall": 14337.7} {"step": 3844, "train_loss": 3.8414149284362793, "lr": 0.00039181651200745837, "tps": 17568, "wall": 14342.7} {"step": 3845, "train_loss": 3.8671321868896484, "lr": 0.00039181080012856397, "tps": 17567, "wall": 14347.6} {"step": 3846, "train_loss": 3.8853416442871094, "lr": 0.00039180508630338746, "tps": 17565, "wall": 14352.6} {"step": 3847, "train_loss": 3.8769278526306152, "lr": 0.00039179937053199367, "tps": 17564, "wall": 14357.6} {"step": 3848, "train_loss": 3.87545108795166, "lr": 0.0003917936528144473, "tps": 17562, "wall": 14362.6} {"step": 3849, "train_loss": 3.9196066856384277, "lr": 0.0003917879331508131, "tps": 17561, "wall": 14367.5} {"step": 3850, "train_loss": 3.8190200328826904, "lr": 0.00039178221154115593, "tps": 17559, "wall": 14372.5} {"step": 3851, "train_loss": 3.8661344051361084, "lr": 0.00039177648798554063, "tps": 17558, "wall": 14377.4} {"step": 3852, "train_loss": 3.863677740097046, "lr": 0.00039177076248403186, "tps": 17556, "wall": 14382.4} {"step": 3853, "train_loss": 3.8384435176849365, "lr": 0.00039176503503669466, "tps": 17555, "wall": 14387.4} {"step": 3854, "train_loss": 3.835988759994507, "lr": 0.0003917593056435939, "tps": 17553, "wall": 14392.5} {"step": 3855, "train_loss": 3.8606436252593994, "lr": 0.00039175357430479437, "tps": 17552, "wall": 14397.4} {"step": 3856, "train_loss": 3.836796522140503, "lr": 0.0003917478410203611, "tps": 17550, "wall": 14402.4} {"step": 3857, "train_loss": 3.810133934020996, "lr": 0.000391742105790359, "tps": 17549, "wall": 14407.3} {"step": 3858, "train_loss": 3.8378419876098633, "lr": 0.00039173636861485306, "tps": 17547, "wall": 14412.3} {"step": 3859, "train_loss": 3.8380086421966553, "lr": 0.0003917306294939082, "tps": 17546, "wall": 14417.3} {"step": 3860, "train_loss": 3.8284544944763184, "lr": 0.00039172488842758945, "tps": 17544, "wall": 14422.3} {"step": 3861, "train_loss": 3.9009475708007812, "lr": 0.00039171914541596194, "tps": 17543, "wall": 14427.2} {"step": 3862, "train_loss": 3.898437023162842, "lr": 0.0003917134004590906, "tps": 17541, "wall": 14432.2} {"step": 3863, "train_loss": 3.7942497730255127, "lr": 0.0003917076535570406, "tps": 17540, "wall": 14437.2} {"step": 3864, "train_loss": 3.8652029037475586, "lr": 0.000391701904709877, "tps": 17538, "wall": 14442.1} {"step": 3865, "train_loss": 3.8310153484344482, "lr": 0.0003916961539176649, "tps": 17537, "wall": 14447.1} {"step": 3866, "train_loss": 3.8486263751983643, "lr": 0.0003916904011804696, "tps": 17535, "wall": 14452.1} {"step": 3867, "train_loss": 3.911396026611328, "lr": 0.00039168464649835604, "tps": 17534, "wall": 14457.1} {"step": 3868, "train_loss": 3.9196598529815674, "lr": 0.00039167888987138953, "tps": 17532, "wall": 14462.1} {"step": 3869, "train_loss": 3.7959351539611816, "lr": 0.0003916731312996353, "tps": 17531, "wall": 14467.0} {"step": 3870, "train_loss": 3.8317313194274902, "lr": 0.0003916673707831585, "tps": 17529, "wall": 14472.0} {"step": 3871, "train_loss": 3.828625202178955, "lr": 0.0003916616083220245, "tps": 17528, "wall": 14477.0} {"step": 3872, "train_loss": 3.9345290660858154, "lr": 0.0003916558439162985, "tps": 17526, "wall": 14481.9} {"step": 3873, "train_loss": 3.8455424308776855, "lr": 0.00039165007756604577, "tps": 17525, "wall": 14486.9} {"step": 3874, "train_loss": 3.921865463256836, "lr": 0.0003916443092713317, "tps": 17523, "wall": 14491.9} {"step": 3875, "train_loss": 3.838578224182129, "lr": 0.0003916385390322216, "tps": 17522, "wall": 14496.8} {"step": 3876, "train_loss": 3.7934303283691406, "lr": 0.00039163276684878087, "tps": 17520, "wall": 14501.8} {"step": 3877, "train_loss": 3.839404582977295, "lr": 0.00039162699272107484, "tps": 17519, "wall": 14506.8} {"step": 3878, "train_loss": 3.864558219909668, "lr": 0.00039162121664916897, "tps": 17517, "wall": 14511.7} {"step": 3879, "train_loss": 3.945312261581421, "lr": 0.0003916154386331287, "tps": 17516, "wall": 14516.7} {"step": 3880, "train_loss": 3.8147566318511963, "lr": 0.0003916096586730194, "tps": 17514, "wall": 14521.7} {"step": 3881, "train_loss": 3.8723983764648438, "lr": 0.00039160387676890663, "tps": 17513, "wall": 14526.7} {"step": 3882, "train_loss": 4.007495880126953, "lr": 0.00039159809292085585, "tps": 17511, "wall": 14531.6} {"step": 3883, "train_loss": 3.89986515045166, "lr": 0.0003915923071289326, "tps": 17510, "wall": 14536.6} {"step": 3884, "train_loss": 3.8983657360076904, "lr": 0.00039158651939320247, "tps": 17508, "wall": 14541.6} {"step": 3885, "train_loss": 3.860797166824341, "lr": 0.0003915807297137309, "tps": 17507, "wall": 14546.5} {"step": 3886, "train_loss": 3.8174524307250977, "lr": 0.00039157493809058357, "tps": 17505, "wall": 14551.5} {"step": 3887, "train_loss": 3.8476810455322266, "lr": 0.000391569144523826, "tps": 17504, "wall": 14556.5} {"step": 3888, "train_loss": 3.8766303062438965, "lr": 0.0003915633490135239, "tps": 17503, "wall": 14561.4} {"step": 3889, "train_loss": 3.903590679168701, "lr": 0.0003915575515597429, "tps": 17501, "wall": 14566.4} {"step": 3890, "train_loss": 3.828692674636841, "lr": 0.00039155175216254874, "tps": 17500, "wall": 14571.3} {"step": 3891, "train_loss": 3.8210253715515137, "lr": 0.000391545950822007, "tps": 17498, "wall": 14576.3} {"step": 3892, "train_loss": 3.9085805416107178, "lr": 0.0003915401475381835, "tps": 17497, "wall": 14581.3} {"step": 3893, "train_loss": 3.9013278484344482, "lr": 0.00039153434231114386, "tps": 17495, "wall": 14586.3} {"step": 3894, "train_loss": 3.8794572353363037, "lr": 0.00039152853514095394, "tps": 17494, "wall": 14591.2} {"step": 3895, "train_loss": 3.8303730487823486, "lr": 0.0003915227260276795, "tps": 17492, "wall": 14596.2} {"step": 3896, "train_loss": 3.8288891315460205, "lr": 0.0003915169149713863, "tps": 17491, "wall": 14601.2} {"step": 3897, "train_loss": 3.874819755554199, "lr": 0.00039151110197214024, "tps": 17489, "wall": 14606.2} {"step": 3898, "train_loss": 3.899305582046509, "lr": 0.00039150528703000713, "tps": 17488, "wall": 14611.1} {"step": 3899, "train_loss": 3.84182071685791, "lr": 0.00039149947014505284, "tps": 17486, "wall": 14616.1} {"step": 3900, "train_loss": 3.9123647212982178, "lr": 0.00039149365131734335, "tps": 17485, "wall": 14621.1} {"step": 3901, "train_loss": 3.882784128189087, "lr": 0.0003914878305469444, "tps": 17484, "wall": 14626.0} {"step": 3902, "train_loss": 3.8789308071136475, "lr": 0.00039148200783392206, "tps": 17482, "wall": 14631.0} {"step": 3903, "train_loss": 3.847041130065918, "lr": 0.0003914761831783423, "tps": 17481, "wall": 14636.0} {"step": 3904, "train_loss": 3.9022274017333984, "lr": 0.000391470356580271, "tps": 17479, "wall": 14641.0} {"step": 3905, "train_loss": 3.8568267822265625, "lr": 0.0003914645280397743, "tps": 17478, "wall": 14645.9} {"step": 3906, "train_loss": 3.7936549186706543, "lr": 0.00039145869755691806, "tps": 17476, "wall": 14650.9} {"step": 3907, "train_loss": 3.897209405899048, "lr": 0.00039145286513176845, "tps": 17475, "wall": 14655.9} {"step": 3908, "train_loss": 3.852125644683838, "lr": 0.00039144703076439153, "tps": 17473, "wall": 14660.8} {"step": 3909, "train_loss": 3.7370851039886475, "lr": 0.0003914411944548534, "tps": 17472, "wall": 14665.8} {"step": 3910, "train_loss": 3.9232373237609863, "lr": 0.00039143535620322006, "tps": 17470, "wall": 14670.7} {"step": 3911, "train_loss": 3.793276786804199, "lr": 0.0003914295160095578, "tps": 17469, "wall": 14675.7} {"step": 3912, "train_loss": 3.823499917984009, "lr": 0.0003914236738739327, "tps": 17468, "wall": 14680.7} {"step": 3913, "train_loss": 4.018215179443359, "lr": 0.00039141782979641086, "tps": 17466, "wall": 14685.6} {"step": 3914, "train_loss": 3.8420839309692383, "lr": 0.00039141198377705866, "tps": 17465, "wall": 14690.6} {"step": 3915, "train_loss": 3.8263673782348633, "lr": 0.0003914061358159423, "tps": 17463, "wall": 14695.6} {"step": 3916, "train_loss": 3.824695348739624, "lr": 0.0003914002859131278, "tps": 17462, "wall": 14700.5} {"step": 3917, "train_loss": 3.8858566284179688, "lr": 0.00039139443406868165, "tps": 17460, "wall": 14705.5} {"step": 3918, "train_loss": 3.877920150756836, "lr": 0.0003913885802826701, "tps": 17459, "wall": 14710.5} {"step": 3919, "train_loss": 3.780742645263672, "lr": 0.0003913827245551595, "tps": 17457, "wall": 14715.4} {"step": 3920, "train_loss": 3.848989486694336, "lr": 0.000391376866886216, "tps": 17456, "wall": 14720.4} {"step": 3921, "train_loss": 3.7531981468200684, "lr": 0.00039137100727590617, "tps": 17455, "wall": 14725.3} {"step": 3922, "train_loss": 3.9455785751342773, "lr": 0.00039136514572429625, "tps": 17453, "wall": 14730.3} {"step": 3923, "train_loss": 3.848703384399414, "lr": 0.0003913592822314527, "tps": 17452, "wall": 14735.2} {"step": 3924, "train_loss": 3.8941433429718018, "lr": 0.000391353416797442, "tps": 17450, "wall": 14740.2} {"step": 3925, "train_loss": 3.770514488220215, "lr": 0.0003913475494223304, "tps": 17449, "wall": 14745.1} {"step": 3926, "train_loss": 3.881453275680542, "lr": 0.00039134168010618455, "tps": 17448, "wall": 14750.1} {"step": 3927, "train_loss": 3.861959457397461, "lr": 0.00039133580884907087, "tps": 17446, "wall": 14755.1} {"step": 3928, "train_loss": 3.9091875553131104, "lr": 0.00039132993565105587, "tps": 17445, "wall": 14760.1} {"step": 3929, "train_loss": 3.94996976852417, "lr": 0.00039132406051220616, "tps": 17443, "wall": 14765.0} {"step": 3930, "train_loss": 3.8783297538757324, "lr": 0.0003913181834325881, "tps": 17442, "wall": 14770.0} {"step": 3931, "train_loss": 3.867154359817505, "lr": 0.00039131230441226856, "tps": 17440, "wall": 14775.0} {"step": 3932, "train_loss": 3.8421382904052734, "lr": 0.00039130642345131385, "tps": 17439, "wall": 14780.0} {"step": 3933, "train_loss": 3.9000234603881836, "lr": 0.0003913005405497907, "tps": 17437, "wall": 14784.9} {"step": 3934, "train_loss": 3.869157314300537, "lr": 0.0003912946557077658, "tps": 17436, "wall": 14789.9} {"step": 3935, "train_loss": 3.808948516845703, "lr": 0.00039128876892530575, "tps": 17435, "wall": 14794.8} {"step": 3936, "train_loss": 3.8140687942504883, "lr": 0.00039128288020247727, "tps": 17433, "wall": 14799.8} {"step": 3937, "train_loss": 3.8423571586608887, "lr": 0.0003912769895393471, "tps": 17432, "wall": 14804.8} {"step": 3938, "train_loss": 3.8615357875823975, "lr": 0.00039127109693598187, "tps": 17430, "wall": 14809.7} {"step": 3939, "train_loss": 3.8532984256744385, "lr": 0.00039126520239244836, "tps": 17429, "wall": 14814.7} {"step": 3940, "train_loss": 3.8908498287200928, "lr": 0.00039125930590881345, "tps": 17427, "wall": 14819.7} {"step": 3941, "train_loss": 3.8399550914764404, "lr": 0.0003912534074851438, "tps": 17426, "wall": 14824.6} {"step": 3942, "train_loss": 3.8623757362365723, "lr": 0.0003912475071215063, "tps": 17425, "wall": 14829.6} {"step": 3943, "train_loss": 3.7803542613983154, "lr": 0.00039124160481796775, "tps": 17423, "wall": 14834.6} {"step": 3944, "train_loss": 3.9123353958129883, "lr": 0.0003912357005745951, "tps": 17422, "wall": 14839.6} {"step": 3945, "train_loss": 3.8381247520446777, "lr": 0.0003912297943914551, "tps": 17420, "wall": 14844.5} {"step": 3946, "train_loss": 3.9323184490203857, "lr": 0.0003912238862686148, "tps": 17419, "wall": 14849.5} {"step": 3947, "train_loss": 3.842496871948242, "lr": 0.00039121797620614095, "tps": 17418, "wall": 14854.5} {"step": 3948, "train_loss": 3.75321626663208, "lr": 0.00039121206420410074, "tps": 17416, "wall": 14859.4} {"step": 3949, "train_loss": 3.8487038612365723, "lr": 0.0003912061502625609, "tps": 17415, "wall": 14864.4} {"step": 3950, "train_loss": 3.8560266494750977, "lr": 0.00039120023438158865, "tps": 17413, "wall": 14869.3} {"step": 3951, "train_loss": 3.8537204265594482, "lr": 0.0003911943165612507, "tps": 17412, "wall": 14874.3} {"step": 3952, "train_loss": 3.858599901199341, "lr": 0.0003911883968016144, "tps": 17411, "wall": 14879.3} {"step": 3953, "train_loss": 3.8797664642333984, "lr": 0.00039118247510274665, "tps": 17409, "wall": 14884.3} {"step": 3954, "train_loss": 3.9065089225769043, "lr": 0.0003911765514647145, "tps": 17408, "wall": 14889.2} {"step": 3955, "train_loss": 3.808973550796509, "lr": 0.0003911706258875853, "tps": 17406, "wall": 14894.2} {"step": 3956, "train_loss": 3.8220856189727783, "lr": 0.0003911646983714258, "tps": 17405, "wall": 14899.2} {"step": 3957, "train_loss": 3.7909388542175293, "lr": 0.00039115876891630336, "tps": 17403, "wall": 14904.1} {"step": 3958, "train_loss": 3.808717727661133, "lr": 0.0003911528375222852, "tps": 17402, "wall": 14909.1} {"step": 3959, "train_loss": 3.908679246902466, "lr": 0.0003911469041894384, "tps": 17401, "wall": 14914.1} {"step": 3960, "train_loss": 3.872387647628784, "lr": 0.0003911409689178302, "tps": 17399, "wall": 14919.0} {"step": 3961, "train_loss": 3.971160650253296, "lr": 0.00039113503170752785, "tps": 17398, "wall": 14924.0} {"step": 3962, "train_loss": 3.853813409805298, "lr": 0.00039112909255859863, "tps": 17397, "wall": 14928.9} {"step": 3963, "train_loss": 3.8319242000579834, "lr": 0.0003911231514711098, "tps": 17395, "wall": 14934.0} {"step": 3964, "train_loss": 3.884793758392334, "lr": 0.00039111720844512863, "tps": 17394, "wall": 14938.9} {"step": 3965, "train_loss": 3.8458499908447266, "lr": 0.0003911112634807224, "tps": 17392, "wall": 14943.9} {"step": 3966, "train_loss": 3.840998649597168, "lr": 0.00039110531657795855, "tps": 17391, "wall": 14948.9} {"step": 3967, "train_loss": 3.805136203765869, "lr": 0.0003910993677369045, "tps": 17390, "wall": 14953.8} {"step": 3968, "train_loss": 3.868515968322754, "lr": 0.00039109341695762746, "tps": 17388, "wall": 14958.8} {"step": 3969, "train_loss": 3.7514452934265137, "lr": 0.00039108746424019504, "tps": 17387, "wall": 14963.7} {"step": 3970, "train_loss": 3.869821548461914, "lr": 0.00039108150958467447, "tps": 17385, "wall": 14968.7} {"step": 3971, "train_loss": 3.8670926094055176, "lr": 0.00039107555299113336, "tps": 17384, "wall": 14973.7} {"step": 3972, "train_loss": 3.9790868759155273, "lr": 0.00039106959445963914, "tps": 17383, "wall": 14978.6} {"step": 3973, "train_loss": 3.747364044189453, "lr": 0.00039106363399025925, "tps": 17381, "wall": 14983.6} {"step": 3974, "train_loss": 3.814882278442383, "lr": 0.00039105767158306124, "tps": 17380, "wall": 14988.5} {"step": 3975, "train_loss": 3.991234064102173, "lr": 0.0003910517072381128, "tps": 17378, "wall": 14993.6} {"step": 3976, "train_loss": 3.799124240875244, "lr": 0.00039104574095548124, "tps": 17377, "wall": 14998.5} {"step": 3977, "train_loss": 3.8997960090637207, "lr": 0.00039103977273523434, "tps": 17376, "wall": 15003.5} {"step": 3978, "train_loss": 3.8181376457214355, "lr": 0.00039103380257743956, "tps": 17374, "wall": 15008.5} {"step": 3979, "train_loss": 3.762460708618164, "lr": 0.0003910278304821647, "tps": 17373, "wall": 15013.4} {"step": 3980, "train_loss": 3.874453544616699, "lr": 0.0003910218564494773, "tps": 17371, "wall": 15018.4} {"step": 3981, "train_loss": 3.941500425338745, "lr": 0.00039101588047944503, "tps": 17370, "wall": 15023.3} {"step": 3982, "train_loss": 3.9318015575408936, "lr": 0.0003910099025721357, "tps": 17369, "wall": 15028.3} {"step": 3983, "train_loss": 3.8239755630493164, "lr": 0.0003910039227276168, "tps": 17367, "wall": 15033.3} {"step": 3984, "train_loss": 3.8386802673339844, "lr": 0.0003909979409459563, "tps": 17366, "wall": 15038.3} {"step": 3985, "train_loss": 3.8155243396759033, "lr": 0.00039099195722722184, "tps": 17365, "wall": 15043.2} {"step": 3986, "train_loss": 3.9454054832458496, "lr": 0.0003909859715714813, "tps": 17363, "wall": 15048.3} {"step": 3987, "train_loss": 3.8596391677856445, "lr": 0.00039097998397880237, "tps": 17362, "wall": 15053.3} {"step": 3988, "train_loss": 3.883268117904663, "lr": 0.000390973994449253, "tps": 17360, "wall": 15058.3} {"step": 3989, "train_loss": 3.87144136428833, "lr": 0.00039096800298290093, "tps": 17359, "wall": 15063.3} {"step": 3990, "train_loss": 3.8272862434387207, "lr": 0.000390962009579814, "tps": 17357, "wall": 15068.3} {"step": 3991, "train_loss": 3.8938143253326416, "lr": 0.0003909560142400603, "tps": 17356, "wall": 15073.3} {"step": 3992, "train_loss": 3.9095828533172607, "lr": 0.0003909500169637075, "tps": 17355, "wall": 15078.3} {"step": 3993, "train_loss": 3.917904853820801, "lr": 0.0003909440177508237, "tps": 17353, "wall": 15083.3} {"step": 3994, "train_loss": 3.8110151290893555, "lr": 0.0003909380166014769, "tps": 17352, "wall": 15088.3} {"step": 3995, "train_loss": 3.839503288269043, "lr": 0.0003909320135157349, "tps": 17350, "wall": 15093.3} {"step": 3996, "train_loss": 3.77984619140625, "lr": 0.00039092600849366583, "tps": 17349, "wall": 15098.3} {"step": 3997, "train_loss": 3.7827036380767822, "lr": 0.0003909200015353377, "tps": 17348, "wall": 15103.3} {"step": 3998, "train_loss": 3.7740283012390137, "lr": 0.00039091399264081856, "tps": 17346, "wall": 15108.3} {"step": 3999, "train_loss": 3.835236072540283, "lr": 0.00039090798181017647, "tps": 17345, "wall": 15113.4} {"step": 4000, "train_loss": 3.8698058128356934, "lr": 0.0003909019690434795, "tps": 17343, "wall": 15118.4, "val_loss_monitor": 3.857974221298858} {"step": 4001, "train_loss": 3.8251380920410156, "lr": 0.0003908959543407957, "tps": 17286, "wall": 15171.9} {"step": 4002, "train_loss": 3.8347420692443848, "lr": 0.0003908899377021934, "tps": 17285, "wall": 15177.0} {"step": 4003, "train_loss": 3.7805309295654297, "lr": 0.0003908839191277406, "tps": 17284, "wall": 15182.0} {"step": 4004, "train_loss": 3.727365493774414, "lr": 0.0003908778986175056, "tps": 17282, "wall": 15187.0} {"step": 4005, "train_loss": 3.8243417739868164, "lr": 0.0003908718761715564, "tps": 17281, "wall": 15192.1} {"step": 4006, "train_loss": 3.8437371253967285, "lr": 0.0003908658517899614, "tps": 17279, "wall": 15197.1} {"step": 4007, "train_loss": 3.8822741508483887, "lr": 0.0003908598254727888, "tps": 17278, "wall": 15202.1} {"step": 4008, "train_loss": 3.7490010261535645, "lr": 0.0003908537972201068, "tps": 17277, "wall": 15207.1} {"step": 4009, "train_loss": 3.9038705825805664, "lr": 0.0003908477670319837, "tps": 17275, "wall": 15212.1} {"step": 4010, "train_loss": 3.83620023727417, "lr": 0.00039084173490848797, "tps": 17274, "wall": 15217.1} {"step": 4011, "train_loss": 3.774930238723755, "lr": 0.0003908357008496877, "tps": 17272, "wall": 15222.1} {"step": 4012, "train_loss": 3.804685592651367, "lr": 0.00039082966485565147, "tps": 17271, "wall": 15227.1} {"step": 4013, "train_loss": 3.8419713973999023, "lr": 0.0003908236269264476, "tps": 17270, "wall": 15232.1} {"step": 4014, "train_loss": 3.829214572906494, "lr": 0.0003908175870621443, "tps": 17268, "wall": 15237.2} {"step": 4015, "train_loss": 3.8242545127868652, "lr": 0.00039081154526281024, "tps": 17267, "wall": 15242.3} {"step": 4016, "train_loss": 3.7916228771209717, "lr": 0.00039080550152851374, "tps": 17265, "wall": 15247.3} {"step": 4017, "train_loss": 3.854997158050537, "lr": 0.0003907994558593232, "tps": 17264, "wall": 15252.3} {"step": 4018, "train_loss": 3.9009900093078613, "lr": 0.0003907934082553073, "tps": 17263, "wall": 15257.3} {"step": 4019, "train_loss": 3.8210103511810303, "lr": 0.0003907873587165343, "tps": 17261, "wall": 15262.3} {"step": 4020, "train_loss": 3.8037619590759277, "lr": 0.000390781307243073, "tps": 17260, "wall": 15267.3} {"step": 4021, "train_loss": 3.9632010459899902, "lr": 0.0003907752538349917, "tps": 17259, "wall": 15272.3} {"step": 4022, "train_loss": 3.9174704551696777, "lr": 0.00039076919849235917, "tps": 17257, "wall": 15277.3} {"step": 4023, "train_loss": 3.799210548400879, "lr": 0.00039076314121524384, "tps": 17256, "wall": 15282.3} {"step": 4024, "train_loss": 3.8869543075561523, "lr": 0.00039075708200371446, "tps": 17255, "wall": 15287.3} {"step": 4025, "train_loss": 3.809570074081421, "lr": 0.00039075102085783965, "tps": 17253, "wall": 15292.3} {"step": 4026, "train_loss": 3.849011182785034, "lr": 0.00039074495777768794, "tps": 17252, "wall": 15297.3} {"step": 4027, "train_loss": 3.8755617141723633, "lr": 0.00039073889276332823, "tps": 17250, "wall": 15302.3} {"step": 4028, "train_loss": 3.828819751739502, "lr": 0.000390732825814829, "tps": 17249, "wall": 15307.3} {"step": 4029, "train_loss": 3.713529586791992, "lr": 0.0003907267569322591, "tps": 17248, "wall": 15312.3} {"step": 4030, "train_loss": 3.8044614791870117, "lr": 0.0003907206861156873, "tps": 17246, "wall": 15317.3} {"step": 4031, "train_loss": 3.8463826179504395, "lr": 0.00039071461336518233, "tps": 17245, "wall": 15322.3} {"step": 4032, "train_loss": 3.792870283126831, "lr": 0.000390708538680813, "tps": 17244, "wall": 15327.3} {"step": 4033, "train_loss": 3.80972957611084, "lr": 0.0003907024620626481, "tps": 17242, "wall": 15332.4} {"step": 4034, "train_loss": 3.9619131088256836, "lr": 0.0003906963835107564, "tps": 17241, "wall": 15337.4} {"step": 4035, "train_loss": 3.861994743347168, "lr": 0.0003906903030252069, "tps": 17240, "wall": 15342.4} {"step": 4036, "train_loss": 3.8282060623168945, "lr": 0.0003906842206060684, "tps": 17238, "wall": 15347.3} {"step": 4037, "train_loss": 3.8385720252990723, "lr": 0.0003906781362534098, "tps": 17237, "wall": 15352.4} {"step": 4038, "train_loss": 3.811025619506836, "lr": 0.0003906720499673001, "tps": 17236, "wall": 15357.3} {"step": 4039, "train_loss": 3.778836488723755, "lr": 0.00039066596174780813, "tps": 17234, "wall": 15362.3} {"step": 4040, "train_loss": 3.9272563457489014, "lr": 0.0003906598715950029, "tps": 17233, "wall": 15367.2} {"step": 4041, "train_loss": 3.911998748779297, "lr": 0.00039065377950895345, "tps": 17232, "wall": 15372.2} {"step": 4042, "train_loss": 3.9003190994262695, "lr": 0.0003906476854897287, "tps": 17230, "wall": 15377.1} {"step": 4043, "train_loss": 3.8151676654815674, "lr": 0.0003906415895373978, "tps": 17229, "wall": 15382.1} {"step": 4044, "train_loss": 3.8864829540252686, "lr": 0.0003906354916520297, "tps": 17228, "wall": 15387.0} {"step": 4045, "train_loss": 3.8613154888153076, "lr": 0.00039062939183369356, "tps": 17227, "wall": 15392.0} {"step": 4046, "train_loss": 3.739851474761963, "lr": 0.0003906232900824584, "tps": 17225, "wall": 15396.9} {"step": 4047, "train_loss": 3.7789368629455566, "lr": 0.0003906171863983934, "tps": 17224, "wall": 15401.9} {"step": 4048, "train_loss": 3.872833728790283, "lr": 0.00039061108078156765, "tps": 17223, "wall": 15406.9} {"step": 4049, "train_loss": 3.778437614440918, "lr": 0.0003906049732320504, "tps": 17221, "wall": 15411.8} {"step": 4050, "train_loss": 3.8596997261047363, "lr": 0.00039059886374991076, "tps": 17220, "wall": 15416.9} {"step": 4051, "train_loss": 3.888364791870117, "lr": 0.000390592752335218, "tps": 17219, "wall": 15421.8} {"step": 4052, "train_loss": 3.79667329788208, "lr": 0.00039058663898804125, "tps": 17217, "wall": 15426.8} {"step": 4053, "train_loss": 3.867478370666504, "lr": 0.00039058052370844983, "tps": 17216, "wall": 15431.7} {"step": 4054, "train_loss": 3.9197311401367188, "lr": 0.0003905744064965131, "tps": 17215, "wall": 15436.7} {"step": 4055, "train_loss": 3.8072636127471924, "lr": 0.00039056828735230015, "tps": 17214, "wall": 15441.7} {"step": 4056, "train_loss": 3.8553497791290283, "lr": 0.00039056216627588044, "tps": 17212, "wall": 15446.6} {"step": 4057, "train_loss": 3.827470064163208, "lr": 0.0003905560432673233, "tps": 17211, "wall": 15451.6} {"step": 4058, "train_loss": 3.817157745361328, "lr": 0.0003905499183266981, "tps": 17210, "wall": 15456.5} {"step": 4059, "train_loss": 3.968372106552124, "lr": 0.00039054379145407413, "tps": 17208, "wall": 15461.5} {"step": 4060, "train_loss": 3.7989089488983154, "lr": 0.0003905376626495209, "tps": 17207, "wall": 15466.4} {"step": 4061, "train_loss": 3.8074464797973633, "lr": 0.0003905315319131078, "tps": 17206, "wall": 15471.4} {"step": 4062, "train_loss": 3.8649377822875977, "lr": 0.0003905253992449043, "tps": 17205, "wall": 15476.4} {"step": 4063, "train_loss": 3.893101453781128, "lr": 0.0003905192646449799, "tps": 17203, "wall": 15481.3} {"step": 4064, "train_loss": 3.7882933616638184, "lr": 0.00039051312811340394, "tps": 17202, "wall": 15486.3} {"step": 4065, "train_loss": 3.8364405632019043, "lr": 0.0003905069896502461, "tps": 17201, "wall": 15491.3} {"step": 4066, "train_loss": 3.789435386657715, "lr": 0.0003905008492555758, "tps": 17200, "wall": 15496.2} {"step": 4067, "train_loss": 3.852736473083496, "lr": 0.00039049470692946274, "tps": 17198, "wall": 15501.2} {"step": 4068, "train_loss": 3.924276828765869, "lr": 0.0003904885626719764, "tps": 17197, "wall": 15506.2} {"step": 4069, "train_loss": 3.8108973503112793, "lr": 0.00039048241648318636, "tps": 17196, "wall": 15511.1} {"step": 4070, "train_loss": 3.7707204818725586, "lr": 0.00039047626836316227, "tps": 17194, "wall": 15516.1} {"step": 4071, "train_loss": 3.8595776557922363, "lr": 0.00039047011831197385, "tps": 17193, "wall": 15521.1} {"step": 4072, "train_loss": 3.933236598968506, "lr": 0.00039046396632969066, "tps": 17192, "wall": 15526.1} {"step": 4073, "train_loss": 3.8443143367767334, "lr": 0.00039045781241638246, "tps": 17190, "wall": 15531.1} {"step": 4074, "train_loss": 3.7551889419555664, "lr": 0.00039045165657211893, "tps": 17189, "wall": 15536.1} {"step": 4075, "train_loss": 3.7691915035247803, "lr": 0.0003904454987969698, "tps": 17188, "wall": 15541.1} {"step": 4076, "train_loss": 3.894014596939087, "lr": 0.0003904393390910048, "tps": 17187, "wall": 15546.0} {"step": 4077, "train_loss": 3.8600664138793945, "lr": 0.00039043317745429386, "tps": 17185, "wall": 15551.0} {"step": 4078, "train_loss": 3.8485758304595947, "lr": 0.0003904270138869066, "tps": 17184, "wall": 15555.9} {"step": 4079, "train_loss": 3.871936559677124, "lr": 0.00039042084838891293, "tps": 17183, "wall": 15560.9} {"step": 4080, "train_loss": 3.7996749877929688, "lr": 0.00039041468096038265, "tps": 17182, "wall": 15565.8} {"step": 4081, "train_loss": 3.8061323165893555, "lr": 0.0003904085116013856, "tps": 17180, "wall": 15570.8} {"step": 4082, "train_loss": 3.8906922340393066, "lr": 0.0003904023403119918, "tps": 17179, "wall": 15575.8} {"step": 4083, "train_loss": 3.821533203125, "lr": 0.000390396167092271, "tps": 17178, "wall": 15580.7} {"step": 4084, "train_loss": 3.780128240585327, "lr": 0.0003903899919422932, "tps": 17176, "wall": 15585.7} {"step": 4085, "train_loss": 3.986670732498169, "lr": 0.0003903838148621284, "tps": 17175, "wall": 15590.7} {"step": 4086, "train_loss": 3.74596905708313, "lr": 0.00039037763585184656, "tps": 17174, "wall": 15595.7} {"step": 4087, "train_loss": 3.8564836978912354, "lr": 0.00039037145491151756, "tps": 17173, "wall": 15600.7} {"step": 4088, "train_loss": 3.8810601234436035, "lr": 0.0003903652720412115, "tps": 17171, "wall": 15605.6} {"step": 4089, "train_loss": 3.849081516265869, "lr": 0.0003903590872409985, "tps": 17170, "wall": 15610.6} {"step": 4090, "train_loss": 3.7883005142211914, "lr": 0.0003903529005109485, "tps": 17169, "wall": 15615.5} {"step": 4091, "train_loss": 3.929797410964966, "lr": 0.00039034671185113166, "tps": 17168, "wall": 15620.5} {"step": 4092, "train_loss": 3.816962480545044, "lr": 0.000390340521261618, "tps": 17166, "wall": 15625.5} {"step": 4093, "train_loss": 3.906115770339966, "lr": 0.00039033432874247773, "tps": 17165, "wall": 15630.5} {"step": 4094, "train_loss": 3.812805652618408, "lr": 0.0003903281342937809, "tps": 17164, "wall": 15635.4} {"step": 4095, "train_loss": 3.8636603355407715, "lr": 0.00039032193791559784, "tps": 17162, "wall": 15640.4} {"step": 4096, "train_loss": 4.0148844718933105, "lr": 0.00039031573960799867, "tps": 17161, "wall": 15645.4} {"step": 4097, "train_loss": 3.9247729778289795, "lr": 0.0003903095393710535, "tps": 17160, "wall": 15650.3} {"step": 4098, "train_loss": 3.8025054931640625, "lr": 0.0003903033372048327, "tps": 17159, "wall": 15655.3} {"step": 4099, "train_loss": 3.780427932739258, "lr": 0.0003902971331094065, "tps": 17157, "wall": 15660.3} {"step": 4100, "train_loss": 3.8448486328125, "lr": 0.0003902909270848451, "tps": 17156, "wall": 15665.2} {"step": 4101, "train_loss": 3.845426559448242, "lr": 0.00039028471913121895, "tps": 17155, "wall": 15670.2} {"step": 4102, "train_loss": 3.8104519844055176, "lr": 0.0003902785092485982, "tps": 17154, "wall": 15675.2} {"step": 4103, "train_loss": 3.8367786407470703, "lr": 0.00039027229743705333, "tps": 17152, "wall": 15680.2} {"step": 4104, "train_loss": 3.7727389335632324, "lr": 0.0003902660836966547, "tps": 17151, "wall": 15685.1} {"step": 4105, "train_loss": 3.7976608276367188, "lr": 0.0003902598680274726, "tps": 17150, "wall": 15690.1} {"step": 4106, "train_loss": 3.812023639678955, "lr": 0.0003902536504295775, "tps": 17149, "wall": 15695.0} {"step": 4107, "train_loss": 3.8046250343322754, "lr": 0.0003902474309030399, "tps": 17147, "wall": 15700.0} {"step": 4108, "train_loss": 3.7652015686035156, "lr": 0.00039024120944793013, "tps": 17146, "wall": 15705.0} {"step": 4109, "train_loss": 3.8408846855163574, "lr": 0.0003902349860643188, "tps": 17145, "wall": 15709.9} {"step": 4110, "train_loss": 3.908626079559326, "lr": 0.00039022876075227634, "tps": 17144, "wall": 15714.9} {"step": 4111, "train_loss": 3.87935209274292, "lr": 0.00039022253351187315, "tps": 17142, "wall": 15719.9} {"step": 4112, "train_loss": 3.803664207458496, "lr": 0.00039021630434318, "tps": 17141, "wall": 15724.9} {"step": 4113, "train_loss": 3.748432159423828, "lr": 0.00039021007324626733, "tps": 17140, "wall": 15729.9} {"step": 4114, "train_loss": 3.758547782897949, "lr": 0.00039020384022120575, "tps": 17139, "wall": 15734.8} {"step": 4115, "train_loss": 3.842684030532837, "lr": 0.0003901976052680658, "tps": 17137, "wall": 15739.8} {"step": 4116, "train_loss": 3.8606066703796387, "lr": 0.0003901913683869182, "tps": 17136, "wall": 15744.8} {"step": 4117, "train_loss": 3.802081346511841, "lr": 0.0003901851295778336, "tps": 17135, "wall": 15749.7} {"step": 4118, "train_loss": 3.8879897594451904, "lr": 0.0003901788888408826, "tps": 17134, "wall": 15754.7} {"step": 4119, "train_loss": 3.731196880340576, "lr": 0.00039017264617613597, "tps": 17132, "wall": 15759.7} {"step": 4120, "train_loss": 3.7266857624053955, "lr": 0.00039016640158366444, "tps": 17131, "wall": 15764.6} {"step": 4121, "train_loss": 3.7750444412231445, "lr": 0.00039016015506353863, "tps": 17130, "wall": 15769.6} {"step": 4122, "train_loss": 3.9251608848571777, "lr": 0.00039015390661582936, "tps": 17129, "wall": 15774.6} {"step": 4123, "train_loss": 3.823054790496826, "lr": 0.0003901476562406075, "tps": 17127, "wall": 15779.6} {"step": 4124, "train_loss": 3.8853161334991455, "lr": 0.00039014140393794374, "tps": 17126, "wall": 15784.6} {"step": 4125, "train_loss": 3.774466037750244, "lr": 0.000390135149707909, "tps": 17125, "wall": 15789.5} {"step": 4126, "train_loss": 3.914961099624634, "lr": 0.0003901288935505741, "tps": 17124, "wall": 15794.5} {"step": 4127, "train_loss": 3.8485915660858154, "lr": 0.0003901226354660098, "tps": 17122, "wall": 15799.5} {"step": 4128, "train_loss": 3.9516983032226562, "lr": 0.0003901163754542871, "tps": 17121, "wall": 15804.4} {"step": 4129, "train_loss": 3.8864965438842773, "lr": 0.00039011011351547696, "tps": 17120, "wall": 15809.4} {"step": 4130, "train_loss": 3.904873847961426, "lr": 0.00039010384964965027, "tps": 17119, "wall": 15814.4} {"step": 4131, "train_loss": 3.9311461448669434, "lr": 0.00039009758385687783, "tps": 17117, "wall": 15819.3} {"step": 4132, "train_loss": 3.7998228073120117, "lr": 0.0003900913161372309, "tps": 17116, "wall": 15824.3} {"step": 4133, "train_loss": 3.8430371284484863, "lr": 0.0003900850464907802, "tps": 17115, "wall": 15829.3} {"step": 4134, "train_loss": 3.791123628616333, "lr": 0.000390078774917597, "tps": 17114, "wall": 15834.3} {"step": 4135, "train_loss": 3.8455870151519775, "lr": 0.00039007250141775225, "tps": 17112, "wall": 15839.2} {"step": 4136, "train_loss": 3.924428939819336, "lr": 0.00039006622599131697, "tps": 17111, "wall": 15844.2} {"step": 4137, "train_loss": 3.900189161300659, "lr": 0.0003900599486383622, "tps": 17110, "wall": 15849.2} {"step": 4138, "train_loss": 3.83066463470459, "lr": 0.0003900536693589592, "tps": 17109, "wall": 15854.1} {"step": 4139, "train_loss": 3.874277114868164, "lr": 0.00039004738815317906, "tps": 17108, "wall": 15859.1} {"step": 4140, "train_loss": 3.8852434158325195, "lr": 0.0003900411050210929, "tps": 17106, "wall": 15864.1} {"step": 4141, "train_loss": 3.756434440612793, "lr": 0.0003900348199627719, "tps": 17105, "wall": 15869.0} {"step": 4142, "train_loss": 3.8124725818634033, "lr": 0.00039002853297828726, "tps": 17104, "wall": 15874.0} {"step": 4143, "train_loss": 3.9062747955322266, "lr": 0.0003900222440677102, "tps": 17103, "wall": 15879.0} {"step": 4144, "train_loss": 3.7749133110046387, "lr": 0.00039001595323111195, "tps": 17101, "wall": 15883.9} {"step": 4145, "train_loss": 3.8637990951538086, "lr": 0.00039000966046856376, "tps": 17100, "wall": 15888.9} {"step": 4146, "train_loss": 3.8372392654418945, "lr": 0.00039000336578013696, "tps": 17099, "wall": 15893.9} {"step": 4147, "train_loss": 3.8494439125061035, "lr": 0.0003899970691659029, "tps": 17098, "wall": 15898.9} {"step": 4148, "train_loss": 3.9418163299560547, "lr": 0.00038999077062593275, "tps": 17097, "wall": 15903.8} {"step": 4149, "train_loss": 3.803828716278076, "lr": 0.000389984470160298, "tps": 17095, "wall": 15908.8} {"step": 4150, "train_loss": 3.8130979537963867, "lr": 0.00038997816776906993, "tps": 17094, "wall": 15913.8} {"step": 4151, "train_loss": 3.7247684001922607, "lr": 0.00038997186345232003, "tps": 17093, "wall": 15918.7} {"step": 4152, "train_loss": 3.733477830886841, "lr": 0.00038996555721011966, "tps": 17092, "wall": 15923.7} {"step": 4153, "train_loss": 3.8474888801574707, "lr": 0.0003899592490425402, "tps": 17090, "wall": 15928.7} {"step": 4154, "train_loss": 3.8193159103393555, "lr": 0.00038995293894965327, "tps": 17089, "wall": 15933.7} {"step": 4155, "train_loss": 3.835101366043091, "lr": 0.0003899466269315302, "tps": 17088, "wall": 15938.6} {"step": 4156, "train_loss": 3.8697590827941895, "lr": 0.00038994031298824255, "tps": 17087, "wall": 15943.6} {"step": 4157, "train_loss": 3.7524890899658203, "lr": 0.00038993399711986185, "tps": 17086, "wall": 15948.5} {"step": 4158, "train_loss": 3.9324941635131836, "lr": 0.00038992767932645965, "tps": 17084, "wall": 15953.6} {"step": 4159, "train_loss": 3.9061107635498047, "lr": 0.00038992135960810745, "tps": 17083, "wall": 15958.6} {"step": 4160, "train_loss": 3.9459891319274902, "lr": 0.00038991503796487697, "tps": 17082, "wall": 15963.5} {"step": 4161, "train_loss": 3.730691909790039, "lr": 0.0003899087143968397, "tps": 17081, "wall": 15968.5} {"step": 4162, "train_loss": 3.941312789916992, "lr": 0.00038990238890406734, "tps": 17080, "wall": 15973.4} {"step": 4163, "train_loss": 3.9970059394836426, "lr": 0.00038989606148663147, "tps": 17078, "wall": 15978.4} {"step": 4164, "train_loss": 3.873724937438965, "lr": 0.00038988973214460393, "tps": 17077, "wall": 15983.4} {"step": 4165, "train_loss": 3.882624864578247, "lr": 0.0003898834008780562, "tps": 17076, "wall": 15988.3} {"step": 4166, "train_loss": 3.820744276046753, "lr": 0.0003898770676870602, "tps": 17075, "wall": 15993.3} {"step": 4167, "train_loss": 3.8134262561798096, "lr": 0.00038987073257168756, "tps": 17073, "wall": 15998.3} {"step": 4168, "train_loss": 3.8391056060791016, "lr": 0.0003898643955320101, "tps": 17072, "wall": 16003.2} {"step": 4169, "train_loss": 3.8585410118103027, "lr": 0.0003898580565680995, "tps": 17071, "wall": 16008.2} {"step": 4170, "train_loss": 3.8830814361572266, "lr": 0.0003898517156800277, "tps": 17070, "wall": 16013.3} {"step": 4171, "train_loss": 3.761220932006836, "lr": 0.0003898453728678665, "tps": 17069, "wall": 16018.2} {"step": 4172, "train_loss": 3.8073267936706543, "lr": 0.0003898390281316877, "tps": 17067, "wall": 16023.2} {"step": 4173, "train_loss": 3.882718086242676, "lr": 0.00038983268147156316, "tps": 17066, "wall": 16028.1} {"step": 4174, "train_loss": 3.792367696762085, "lr": 0.00038982633288756486, "tps": 17065, "wall": 16033.1} {"step": 4175, "train_loss": 3.9074716567993164, "lr": 0.0003898199823797647, "tps": 17064, "wall": 16038.1} {"step": 4176, "train_loss": 3.831265449523926, "lr": 0.00038981362994823456, "tps": 17063, "wall": 16043.1} {"step": 4177, "train_loss": 3.836775302886963, "lr": 0.0003898072755930464, "tps": 17061, "wall": 16048.0} {"step": 4178, "train_loss": 3.8667216300964355, "lr": 0.0003898009193142723, "tps": 17060, "wall": 16053.0} {"step": 4179, "train_loss": 3.841948986053467, "lr": 0.00038979456111198414, "tps": 17059, "wall": 16058.0} {"step": 4180, "train_loss": 3.8786725997924805, "lr": 0.0003897882009862541, "tps": 17058, "wall": 16062.9} {"step": 4181, "train_loss": 3.8472540378570557, "lr": 0.000389781838937154, "tps": 17057, "wall": 16067.9} {"step": 4182, "train_loss": 3.7190229892730713, "lr": 0.00038977547496475614, "tps": 17055, "wall": 16073.0} {"step": 4183, "train_loss": 3.802943229675293, "lr": 0.0003897691090691325, "tps": 17054, "wall": 16077.9} {"step": 4184, "train_loss": 3.854005813598633, "lr": 0.0003897627412503552, "tps": 17053, "wall": 16082.9} {"step": 4185, "train_loss": 3.875272035598755, "lr": 0.00038975637150849633, "tps": 17052, "wall": 16087.8} {"step": 4186, "train_loss": 3.872954845428467, "lr": 0.0003897499998436282, "tps": 17051, "wall": 16092.8} {"step": 4187, "train_loss": 3.86421799659729, "lr": 0.0003897436262558229, "tps": 17049, "wall": 16097.8} {"step": 4188, "train_loss": 3.7412662506103516, "lr": 0.0003897372507451525, "tps": 17048, "wall": 16102.8} {"step": 4189, "train_loss": 3.8437325954437256, "lr": 0.0003897308733116894, "tps": 17047, "wall": 16107.7} {"step": 4190, "train_loss": 3.793851375579834, "lr": 0.00038972449395550577, "tps": 17046, "wall": 16112.7} {"step": 4191, "train_loss": 3.8875744342803955, "lr": 0.00038971811267667387, "tps": 17045, "wall": 16117.7} {"step": 4192, "train_loss": 3.811100482940674, "lr": 0.00038971172947526605, "tps": 17043, "wall": 16122.7} {"step": 4193, "train_loss": 3.8041369915008545, "lr": 0.00038970534435135457, "tps": 17042, "wall": 16127.7} {"step": 4194, "train_loss": 3.7453577518463135, "lr": 0.0003896989573050118, "tps": 17041, "wall": 16132.7} {"step": 4195, "train_loss": 3.77140212059021, "lr": 0.00038969256833631, "tps": 17040, "wall": 16137.7} {"step": 4196, "train_loss": 3.8870792388916016, "lr": 0.00038968617744532166, "tps": 17038, "wall": 16142.7} {"step": 4197, "train_loss": 3.9273529052734375, "lr": 0.000389679784632119, "tps": 17037, "wall": 16147.6} {"step": 4198, "train_loss": 3.8754420280456543, "lr": 0.00038967338989677475, "tps": 17036, "wall": 16152.6} {"step": 4199, "train_loss": 3.7657828330993652, "lr": 0.00038966699323936103, "tps": 17035, "wall": 16157.5} {"step": 4200, "train_loss": 3.801265239715576, "lr": 0.00038966059465995047, "tps": 17034, "wall": 16162.5} {"step": 4201, "train_loss": 3.7655811309814453, "lr": 0.00038965419415861553, "tps": 17033, "wall": 16167.5} {"step": 4202, "train_loss": 3.859898090362549, "lr": 0.0003896477917354287, "tps": 17031, "wall": 16172.4} {"step": 4203, "train_loss": 3.7489523887634277, "lr": 0.0003896413873904624, "tps": 17030, "wall": 16177.4} {"step": 4204, "train_loss": 3.7972257137298584, "lr": 0.00038963498112378945, "tps": 17029, "wall": 16182.3} {"step": 4205, "train_loss": 3.8804640769958496, "lr": 0.0003896285729354822, "tps": 17028, "wall": 16187.3} {"step": 4206, "train_loss": 3.8819236755371094, "lr": 0.0003896221628256133, "tps": 17027, "wall": 16192.3} {"step": 4207, "train_loss": 3.85140323638916, "lr": 0.0003896157507942553, "tps": 17025, "wall": 16197.3} {"step": 4208, "train_loss": 3.8484091758728027, "lr": 0.0003896093368414809, "tps": 17024, "wall": 16202.3} {"step": 4209, "train_loss": 3.8113455772399902, "lr": 0.0003896029209673628, "tps": 17023, "wall": 16207.3} {"step": 4210, "train_loss": 3.7609262466430664, "lr": 0.0003895965031719737, "tps": 17022, "wall": 16212.3} {"step": 4211, "train_loss": 3.881810426712036, "lr": 0.00038959008345538614, "tps": 17021, "wall": 16217.2} {"step": 4212, "train_loss": 3.850735664367676, "lr": 0.00038958366181767297, "tps": 17020, "wall": 16222.2} {"step": 4213, "train_loss": 3.714876651763916, "lr": 0.0003895772382589069, "tps": 17018, "wall": 16227.2} {"step": 4214, "train_loss": 3.8954176902770996, "lr": 0.0003895708127791607, "tps": 17017, "wall": 16232.1} {"step": 4215, "train_loss": 3.781404972076416, "lr": 0.0003895643853785072, "tps": 17016, "wall": 16237.1} {"step": 4216, "train_loss": 3.7972493171691895, "lr": 0.0003895579560570192, "tps": 17015, "wall": 16242.1} {"step": 4217, "train_loss": 3.9416561126708984, "lr": 0.00038955152481476936, "tps": 17014, "wall": 16247.0} {"step": 4218, "train_loss": 3.7447121143341064, "lr": 0.0003895450916518308, "tps": 17013, "wall": 16252.0} {"step": 4219, "train_loss": 3.830775737762451, "lr": 0.0003895386565682762, "tps": 17011, "wall": 16257.0} {"step": 4220, "train_loss": 3.830296277999878, "lr": 0.0003895322195641785, "tps": 17010, "wall": 16262.0} {"step": 4221, "train_loss": 3.8803763389587402, "lr": 0.0003895257806396108, "tps": 17009, "wall": 16266.9} {"step": 4222, "train_loss": 3.907576084136963, "lr": 0.0003895193397946457, "tps": 17008, "wall": 16271.9} {"step": 4223, "train_loss": 3.8416364192962646, "lr": 0.00038951289702935646, "tps": 17007, "wall": 16276.9} {"step": 4224, "train_loss": 3.876452922821045, "lr": 0.0003895064523438159, "tps": 17006, "wall": 16281.9} {"step": 4225, "train_loss": 3.770669937133789, "lr": 0.0003895000057380971, "tps": 17004, "wall": 16286.8} {"step": 4226, "train_loss": 3.8079981803894043, "lr": 0.00038949355721227305, "tps": 17003, "wall": 16291.8} {"step": 4227, "train_loss": 3.8011927604675293, "lr": 0.0003894871067664169, "tps": 17002, "wall": 16296.7} {"step": 4228, "train_loss": 3.8037161827087402, "lr": 0.0003894806544006015, "tps": 17001, "wall": 16301.7} {"step": 4229, "train_loss": 3.9492592811584473, "lr": 0.00038947420011490013, "tps": 17000, "wall": 16306.7} {"step": 4230, "train_loss": 3.849827289581299, "lr": 0.0003894677439093859, "tps": 16999, "wall": 16311.7} {"step": 4231, "train_loss": 3.7501330375671387, "lr": 0.00038946128578413184, "tps": 16997, "wall": 16316.7} {"step": 4232, "train_loss": 3.819056987762451, "lr": 0.00038945482573921124, "tps": 16996, "wall": 16321.6} {"step": 4233, "train_loss": 3.8460075855255127, "lr": 0.00038944836377469714, "tps": 16995, "wall": 16326.6} {"step": 4234, "train_loss": 3.8626770973205566, "lr": 0.00038944189989066283, "tps": 16994, "wall": 16331.5} {"step": 4235, "train_loss": 3.8687777519226074, "lr": 0.00038943543408718155, "tps": 16993, "wall": 16336.5} {"step": 4236, "train_loss": 3.810710906982422, "lr": 0.0003894289663643264, "tps": 16992, "wall": 16341.5} {"step": 4237, "train_loss": 3.8513340950012207, "lr": 0.00038942249672217083, "tps": 16990, "wall": 16346.5} {"step": 4238, "train_loss": 3.963927745819092, "lr": 0.00038941602516078796, "tps": 16989, "wall": 16351.4} {"step": 4239, "train_loss": 3.8109116554260254, "lr": 0.00038940955168025135, "tps": 16988, "wall": 16356.4} {"step": 4240, "train_loss": 3.877290725708008, "lr": 0.00038940307628063407, "tps": 16987, "wall": 16361.4} {"step": 4241, "train_loss": 3.735065460205078, "lr": 0.00038939659896200957, "tps": 16986, "wall": 16366.3} {"step": 4242, "train_loss": 3.7668299674987793, "lr": 0.0003893901197244513, "tps": 16985, "wall": 16371.3} {"step": 4243, "train_loss": 3.819976806640625, "lr": 0.0003893836385680325, "tps": 16983, "wall": 16376.4} {"step": 4244, "train_loss": 3.826578140258789, "lr": 0.0003893771554928268, "tps": 16982, "wall": 16381.3} {"step": 4245, "train_loss": 3.785454273223877, "lr": 0.0003893706704989074, "tps": 16981, "wall": 16386.3} {"step": 4246, "train_loss": 3.6973490715026855, "lr": 0.00038936418358634795, "tps": 16980, "wall": 16391.3} {"step": 4247, "train_loss": 3.7478580474853516, "lr": 0.00038935769475522184, "tps": 16979, "wall": 16396.2} {"step": 4248, "train_loss": 3.7715678215026855, "lr": 0.00038935120400560263, "tps": 16978, "wall": 16401.2} {"step": 4249, "train_loss": 3.7919368743896484, "lr": 0.0003893447113375638, "tps": 16977, "wall": 16406.2} {"step": 4250, "train_loss": 3.822065830230713, "lr": 0.0003893382167511789, "tps": 16975, "wall": 16411.2} {"step": 4251, "train_loss": 3.799475908279419, "lr": 0.0003893317202465215, "tps": 16974, "wall": 16416.2} {"step": 4252, "train_loss": 3.759758710861206, "lr": 0.0003893252218236653, "tps": 16973, "wall": 16421.1} {"step": 4253, "train_loss": 3.797269105911255, "lr": 0.00038931872148268375, "tps": 16972, "wall": 16426.1} {"step": 4254, "train_loss": 3.978788137435913, "lr": 0.0003893122192236506, "tps": 16971, "wall": 16431.1} {"step": 4255, "train_loss": 3.87796950340271, "lr": 0.00038930571504663947, "tps": 16970, "wall": 16436.1} {"step": 4256, "train_loss": 3.770681381225586, "lr": 0.000389299208951724, "tps": 16968, "wall": 16441.1} {"step": 4257, "train_loss": 3.81699800491333, "lr": 0.00038929270093897804, "tps": 16967, "wall": 16446.0} {"step": 4258, "train_loss": 3.8493080139160156, "lr": 0.00038928619100847507, "tps": 16966, "wall": 16451.0} {"step": 4259, "train_loss": 3.8223953247070312, "lr": 0.00038927967916028907, "tps": 16965, "wall": 16456.0} {"step": 4260, "train_loss": 3.858844518661499, "lr": 0.0003892731653944936, "tps": 16964, "wall": 16461.0} {"step": 4261, "train_loss": 3.759286403656006, "lr": 0.0003892666497111627, "tps": 16963, "wall": 16465.9} {"step": 4262, "train_loss": 3.936018466949463, "lr": 0.00038926013211036995, "tps": 16962, "wall": 16470.9} {"step": 4263, "train_loss": 3.8635194301605225, "lr": 0.00038925361259218926, "tps": 16960, "wall": 16475.9} {"step": 4264, "train_loss": 3.790529727935791, "lr": 0.0003892470911566945, "tps": 16959, "wall": 16480.8} {"step": 4265, "train_loss": 3.898914337158203, "lr": 0.0003892405678039595, "tps": 16958, "wall": 16485.8} {"step": 4266, "train_loss": 3.8889706134796143, "lr": 0.0003892340425340583, "tps": 16957, "wall": 16490.8} {"step": 4267, "train_loss": 3.8224902153015137, "lr": 0.0003892275153470646, "tps": 16956, "wall": 16495.8} {"step": 4268, "train_loss": 3.80016827583313, "lr": 0.00038922098624305247, "tps": 16955, "wall": 16500.7} {"step": 4269, "train_loss": 3.91235089302063, "lr": 0.0003892144552220959, "tps": 16954, "wall": 16505.7} {"step": 4270, "train_loss": 3.849034547805786, "lr": 0.0003892079222842688, "tps": 16952, "wall": 16510.6} {"step": 4271, "train_loss": 3.8485798835754395, "lr": 0.00038920138742964516, "tps": 16951, "wall": 16515.6} {"step": 4272, "train_loss": 3.758504629135132, "lr": 0.00038919485065829916, "tps": 16950, "wall": 16520.5} {"step": 4273, "train_loss": 3.8226139545440674, "lr": 0.0003891883119703046, "tps": 16949, "wall": 16525.5} {"step": 4274, "train_loss": 3.8221588134765625, "lr": 0.00038918177136573577, "tps": 16948, "wall": 16530.5} {"step": 4275, "train_loss": 3.8272852897644043, "lr": 0.0003891752288446667, "tps": 16947, "wall": 16535.4} {"step": 4276, "train_loss": 3.8463940620422363, "lr": 0.00038916868440717146, "tps": 16946, "wall": 16540.4} {"step": 4277, "train_loss": 3.797274112701416, "lr": 0.0003891621380533242, "tps": 16945, "wall": 16545.4} {"step": 4278, "train_loss": 3.798673391342163, "lr": 0.0003891555897831991, "tps": 16943, "wall": 16550.4} {"step": 4279, "train_loss": 3.8142614364624023, "lr": 0.00038914903959687036, "tps": 16942, "wall": 16555.4} {"step": 4280, "train_loss": 3.843475341796875, "lr": 0.00038914248749441206, "tps": 16941, "wall": 16560.4} {"step": 4281, "train_loss": 3.8553683757781982, "lr": 0.0003891359334758986, "tps": 16940, "wall": 16565.4} {"step": 4282, "train_loss": 3.709500789642334, "lr": 0.00038912937754140406, "tps": 16939, "wall": 16570.3} {"step": 4283, "train_loss": 3.8402652740478516, "lr": 0.00038912281969100284, "tps": 16938, "wall": 16575.3} {"step": 4284, "train_loss": 3.8093178272247314, "lr": 0.00038911625992476916, "tps": 16937, "wall": 16580.3} {"step": 4285, "train_loss": 3.9179365634918213, "lr": 0.0003891096982427773, "tps": 16935, "wall": 16585.2} {"step": 4286, "train_loss": 3.833908796310425, "lr": 0.0003891031346451017, "tps": 16934, "wall": 16590.2} {"step": 4287, "train_loss": 3.884098529815674, "lr": 0.0003890965691318166, "tps": 16933, "wall": 16595.2} {"step": 4288, "train_loss": 3.7906296253204346, "lr": 0.0003890900017029964, "tps": 16932, "wall": 16600.1} {"step": 4289, "train_loss": 3.8038904666900635, "lr": 0.00038908343235871554, "tps": 16931, "wall": 16605.1} {"step": 4290, "train_loss": 3.9111669063568115, "lr": 0.0003890768610990484, "tps": 16930, "wall": 16610.0} {"step": 4291, "train_loss": 3.780488967895508, "lr": 0.00038907028792406945, "tps": 16929, "wall": 16615.1} {"step": 4292, "train_loss": 3.9623241424560547, "lr": 0.00038906371283385313, "tps": 16928, "wall": 16620.0} {"step": 4293, "train_loss": 3.7750563621520996, "lr": 0.00038905713582847385, "tps": 16927, "wall": 16625.0} {"step": 4294, "train_loss": 3.8001060485839844, "lr": 0.0003890505569080063, "tps": 16925, "wall": 16629.9} {"step": 4295, "train_loss": 3.7645931243896484, "lr": 0.00038904397607252483, "tps": 16924, "wall": 16634.9} {"step": 4296, "train_loss": 3.7325096130371094, "lr": 0.00038903739332210406, "tps": 16923, "wall": 16639.9} {"step": 4297, "train_loss": 3.8253204822540283, "lr": 0.0003890308086568186, "tps": 16922, "wall": 16644.9} {"step": 4298, "train_loss": 3.835998773574829, "lr": 0.0003890242220767429, "tps": 16921, "wall": 16649.8} {"step": 4299, "train_loss": 3.827988862991333, "lr": 0.00038901763358195173, "tps": 16920, "wall": 16654.8} {"step": 4300, "train_loss": 3.7114925384521484, "lr": 0.0003890110431725197, "tps": 16919, "wall": 16659.7} {"step": 4301, "train_loss": 3.734126091003418, "lr": 0.0003890044508485214, "tps": 16918, "wall": 16664.7} {"step": 4302, "train_loss": 3.816019058227539, "lr": 0.00038899785661003147, "tps": 16917, "wall": 16669.6} {"step": 4303, "train_loss": 3.7767205238342285, "lr": 0.0003889912604571247, "tps": 16915, "wall": 16674.6} {"step": 4304, "train_loss": 3.8043508529663086, "lr": 0.0003889846623898759, "tps": 16914, "wall": 16679.6} {"step": 4305, "train_loss": 3.8305087089538574, "lr": 0.0003889780624083596, "tps": 16913, "wall": 16684.6} {"step": 4306, "train_loss": 3.7795426845550537, "lr": 0.0003889714605126507, "tps": 16912, "wall": 16689.5} {"step": 4307, "train_loss": 3.720139980316162, "lr": 0.00038896485670282397, "tps": 16911, "wall": 16694.5} {"step": 4308, "train_loss": 3.8790030479431152, "lr": 0.00038895825097895416, "tps": 16910, "wall": 16699.5} {"step": 4309, "train_loss": 3.8239784240722656, "lr": 0.0003889516433411162, "tps": 16909, "wall": 16704.5} {"step": 4310, "train_loss": 3.831204652786255, "lr": 0.00038894503378938483, "tps": 16908, "wall": 16709.5} {"step": 4311, "train_loss": 3.987759590148926, "lr": 0.000388938422323835, "tps": 16906, "wall": 16714.5} {"step": 4312, "train_loss": 3.7568063735961914, "lr": 0.00038893180894454153, "tps": 16905, "wall": 16719.5} {"step": 4313, "train_loss": 3.8102238178253174, "lr": 0.00038892519365157945, "tps": 16904, "wall": 16724.5} {"step": 4314, "train_loss": 3.8655872344970703, "lr": 0.00038891857644502364, "tps": 16903, "wall": 16729.5} {"step": 4315, "train_loss": 3.8076353073120117, "lr": 0.00038891195732494905, "tps": 16902, "wall": 16734.6} {"step": 4316, "train_loss": 3.822725296020508, "lr": 0.0003889053362914306, "tps": 16901, "wall": 16739.6} {"step": 4317, "train_loss": 3.769195079803467, "lr": 0.00038889871334454347, "tps": 16900, "wall": 16744.6} {"step": 4318, "train_loss": 3.812936782836914, "lr": 0.0003888920884843625, "tps": 16898, "wall": 16749.7} {"step": 4319, "train_loss": 3.773350954055786, "lr": 0.00038888546171096287, "tps": 16897, "wall": 16754.6} {"step": 4320, "train_loss": 3.970203399658203, "lr": 0.00038887883302441957, "tps": 16896, "wall": 16759.6} {"step": 4321, "train_loss": 3.896306037902832, "lr": 0.0003888722024248078, "tps": 16895, "wall": 16764.8} {"step": 4322, "train_loss": 3.82440185546875, "lr": 0.00038886556991220246, "tps": 16894, "wall": 16769.8} {"step": 4323, "train_loss": 3.742871046066284, "lr": 0.0003888589354866788, "tps": 16893, "wall": 16774.8} {"step": 4324, "train_loss": 3.860964775085449, "lr": 0.00038885229914831205, "tps": 16891, "wall": 16779.8} {"step": 4325, "train_loss": 3.890613555908203, "lr": 0.0003888456608971773, "tps": 16890, "wall": 16784.8} {"step": 4326, "train_loss": 3.8217198848724365, "lr": 0.00038883902073334975, "tps": 16889, "wall": 16789.9} {"step": 4327, "train_loss": 3.762258291244507, "lr": 0.0003888323786569047, "tps": 16888, "wall": 16795.0} {"step": 4328, "train_loss": 3.9000186920166016, "lr": 0.00038882573466791725, "tps": 16887, "wall": 16799.9} {"step": 4329, "train_loss": 3.806241035461426, "lr": 0.0003888190887664628, "tps": 16886, "wall": 16804.9} {"step": 4330, "train_loss": 3.8493027687072754, "lr": 0.00038881244095261653, "tps": 16885, "wall": 16809.9} {"step": 4331, "train_loss": 3.80814790725708, "lr": 0.00038880579122645386, "tps": 16883, "wall": 16814.9} {"step": 4332, "train_loss": 3.8261985778808594, "lr": 0.00038879913958805, "tps": 16882, "wall": 16819.9} {"step": 4333, "train_loss": 3.761464834213257, "lr": 0.0003887924860374804, "tps": 16881, "wall": 16825.0} {"step": 4334, "train_loss": 3.8223299980163574, "lr": 0.0003887858305748204, "tps": 16880, "wall": 16830.0} {"step": 4335, "train_loss": 3.879412889480591, "lr": 0.0003887791732001453, "tps": 16879, "wall": 16835.0} {"step": 4336, "train_loss": 3.8317432403564453, "lr": 0.00038877251391353067, "tps": 16878, "wall": 16840.0} {"step": 4337, "train_loss": 3.7728676795959473, "lr": 0.0003887658527150518, "tps": 16877, "wall": 16845.0} {"step": 4338, "train_loss": 3.9087207317352295, "lr": 0.00038875918960478426, "tps": 16875, "wall": 16850.0} {"step": 4339, "train_loss": 3.814531087875366, "lr": 0.00038875252458280354, "tps": 16874, "wall": 16855.1} {"step": 4340, "train_loss": 3.7699942588806152, "lr": 0.00038874585764918503, "tps": 16873, "wall": 16860.1} {"step": 4341, "train_loss": 3.8342084884643555, "lr": 0.00038873918880400437, "tps": 16872, "wall": 16865.2} {"step": 4342, "train_loss": 3.8478243350982666, "lr": 0.000388732518047337, "tps": 16871, "wall": 16870.2} {"step": 4343, "train_loss": 3.7760913372039795, "lr": 0.0003887258453792585, "tps": 16870, "wall": 16875.2} {"step": 4344, "train_loss": 3.918205976486206, "lr": 0.0003887191707998445, "tps": 16869, "wall": 16880.2} {"step": 4345, "train_loss": 3.863792896270752, "lr": 0.00038871249430917073, "tps": 16868, "wall": 16885.2} {"step": 4346, "train_loss": 3.7390897274017334, "lr": 0.00038870581590731267, "tps": 16866, "wall": 16890.2} {"step": 4347, "train_loss": 3.8450093269348145, "lr": 0.0003886991355943459, "tps": 16865, "wall": 16895.2} {"step": 4348, "train_loss": 3.792372703552246, "lr": 0.00038869245337034625, "tps": 16864, "wall": 16900.2} {"step": 4349, "train_loss": 3.8009591102600098, "lr": 0.00038868576923538936, "tps": 16863, "wall": 16905.2} {"step": 4350, "train_loss": 3.854952573776245, "lr": 0.00038867908318955096, "tps": 16862, "wall": 16910.3} {"step": 4351, "train_loss": 3.9585628509521484, "lr": 0.00038867239523290674, "tps": 16861, "wall": 16915.3} {"step": 4352, "train_loss": 3.832578659057617, "lr": 0.00038866570536553254, "tps": 16860, "wall": 16920.3} {"step": 4353, "train_loss": 3.803058624267578, "lr": 0.0003886590135875041, "tps": 16859, "wall": 16925.3} {"step": 4354, "train_loss": 3.853633403778076, "lr": 0.0003886523198988972, "tps": 16857, "wall": 16930.3} {"step": 4355, "train_loss": 3.842780590057373, "lr": 0.00038864562429978777, "tps": 16856, "wall": 16935.3} {"step": 4356, "train_loss": 3.7869608402252197, "lr": 0.0003886389267902515, "tps": 16855, "wall": 16940.3} {"step": 4357, "train_loss": 3.7112655639648438, "lr": 0.0003886322273703644, "tps": 16854, "wall": 16945.3} {"step": 4358, "train_loss": 3.9488227367401123, "lr": 0.00038862552604020226, "tps": 16853, "wall": 16950.3} {"step": 4359, "train_loss": 3.7413368225097656, "lr": 0.00038861882279984104, "tps": 16852, "wall": 16955.3} {"step": 4360, "train_loss": 3.819056510925293, "lr": 0.0003886121176493567, "tps": 16851, "wall": 16960.4} {"step": 4361, "train_loss": 3.824270725250244, "lr": 0.00038860541058882524, "tps": 16850, "wall": 16965.4} {"step": 4362, "train_loss": 3.8174848556518555, "lr": 0.0003885987016183225, "tps": 16848, "wall": 16970.4} {"step": 4363, "train_loss": 3.831059455871582, "lr": 0.00038859199073792446, "tps": 16847, "wall": 16975.5} {"step": 4364, "train_loss": 3.8190793991088867, "lr": 0.0003885852779477073, "tps": 16846, "wall": 16980.5} {"step": 4365, "train_loss": 3.7017579078674316, "lr": 0.000388578563247747, "tps": 16845, "wall": 16985.5} {"step": 4366, "train_loss": 3.7763524055480957, "lr": 0.0003885718466381197, "tps": 16844, "wall": 16990.5} {"step": 4367, "train_loss": 3.762234687805176, "lr": 0.00038856512811890123, "tps": 16843, "wall": 16995.5} {"step": 4368, "train_loss": 3.7861170768737793, "lr": 0.000388558407690168, "tps": 16842, "wall": 17000.5} {"step": 4369, "train_loss": 3.7793145179748535, "lr": 0.0003885516853519959, "tps": 16841, "wall": 17005.5} {"step": 4370, "train_loss": 3.8699288368225098, "lr": 0.0003885449611044613, "tps": 16840, "wall": 17010.5} {"step": 4371, "train_loss": 3.822110414505005, "lr": 0.0003885382349476402, "tps": 16838, "wall": 17015.5} {"step": 4372, "train_loss": 3.8018651008605957, "lr": 0.0003885315068816089, "tps": 16837, "wall": 17020.6} {"step": 4373, "train_loss": 3.8316521644592285, "lr": 0.00038852477690644354, "tps": 16836, "wall": 17025.6} {"step": 4374, "train_loss": 3.848912239074707, "lr": 0.0003885180450222204, "tps": 16835, "wall": 17030.6} {"step": 4375, "train_loss": 3.7918543815612793, "lr": 0.0003885113112290157, "tps": 16834, "wall": 17035.7} {"step": 4376, "train_loss": 3.802680253982544, "lr": 0.0003885045755269058, "tps": 16833, "wall": 17040.7} {"step": 4377, "train_loss": 3.8486809730529785, "lr": 0.0003884978379159669, "tps": 16832, "wall": 17045.7} {"step": 4378, "train_loss": 3.8408641815185547, "lr": 0.0003884910983962755, "tps": 16831, "wall": 17050.7} {"step": 4379, "train_loss": 3.7401084899902344, "lr": 0.0003884843569679077, "tps": 16829, "wall": 17055.7} {"step": 4380, "train_loss": 3.7170872688293457, "lr": 0.0003884776136309399, "tps": 16828, "wall": 17060.7} {"step": 4381, "train_loss": 3.7604944705963135, "lr": 0.00038847086838544875, "tps": 16827, "wall": 17065.7} {"step": 4382, "train_loss": 3.80100417137146, "lr": 0.00038846412123151044, "tps": 16826, "wall": 17070.7} {"step": 4383, "train_loss": 3.793151378631592, "lr": 0.0003884573721692015, "tps": 16825, "wall": 17075.7} {"step": 4384, "train_loss": 3.915822982788086, "lr": 0.00038845062119859824, "tps": 16824, "wall": 17080.8} {"step": 4385, "train_loss": 3.803232192993164, "lr": 0.0003884438683197773, "tps": 16823, "wall": 17085.8} {"step": 4386, "train_loss": 3.753757953643799, "lr": 0.00038843711353281503, "tps": 16822, "wall": 17090.8} {"step": 4387, "train_loss": 3.739743709564209, "lr": 0.00038843035683778804, "tps": 16821, "wall": 17095.9} {"step": 4388, "train_loss": 3.9173433780670166, "lr": 0.00038842359823477296, "tps": 16820, "wall": 17100.9} {"step": 4389, "train_loss": 3.7565958499908447, "lr": 0.0003884168377238461, "tps": 16818, "wall": 17105.9} {"step": 4390, "train_loss": 3.9065816402435303, "lr": 0.00038841007530508433, "tps": 16817, "wall": 17110.9} {"step": 4391, "train_loss": 3.8231122493743896, "lr": 0.000388403310978564, "tps": 16816, "wall": 17115.9} {"step": 4392, "train_loss": 3.784575939178467, "lr": 0.000388396544744362, "tps": 16815, "wall": 17120.9} {"step": 4393, "train_loss": 3.84904146194458, "lr": 0.00038838977660255467, "tps": 16814, "wall": 17125.9} {"step": 4394, "train_loss": 3.710577964782715, "lr": 0.0003883830065532189, "tps": 16813, "wall": 17130.9} {"step": 4395, "train_loss": 3.7910099029541016, "lr": 0.0003883762345964314, "tps": 16812, "wall": 17135.9} {"step": 4396, "train_loss": 3.8621110916137695, "lr": 0.0003883694607322687, "tps": 16811, "wall": 17140.9} {"step": 4397, "train_loss": 3.827579975128174, "lr": 0.0003883626849608076, "tps": 16810, "wall": 17145.9} {"step": 4398, "train_loss": 3.7970030307769775, "lr": 0.00038835590728212503, "tps": 16809, "wall": 17150.9} {"step": 4399, "train_loss": 3.7831225395202637, "lr": 0.00038834912769629756, "tps": 16808, "wall": 17156.0} {"step": 4400, "train_loss": 3.8126821517944336, "lr": 0.0003883423462034021, "tps": 16806, "wall": 17161.0} {"step": 4401, "train_loss": 3.843384265899658, "lr": 0.0003883355628035154, "tps": 16805, "wall": 17166.0} {"step": 4402, "train_loss": 3.865894317626953, "lr": 0.0003883287774967143, "tps": 16804, "wall": 17171.0} {"step": 4403, "train_loss": 3.8294460773468018, "lr": 0.0003883219902830758, "tps": 16803, "wall": 17175.9} {"step": 4404, "train_loss": 3.7867603302001953, "lr": 0.00038831520116267666, "tps": 16802, "wall": 17181.0} {"step": 4405, "train_loss": 3.832144021987915, "lr": 0.0003883084101355938, "tps": 16801, "wall": 17186.0} {"step": 4406, "train_loss": 3.8557920455932617, "lr": 0.0003883016172019042, "tps": 16800, "wall": 17191.0} {"step": 4407, "train_loss": 3.8558220863342285, "lr": 0.0003882948223616847, "tps": 16799, "wall": 17196.0} {"step": 4408, "train_loss": 3.7305779457092285, "lr": 0.00038828802561501237, "tps": 16798, "wall": 17201.1} {"step": 4409, "train_loss": 3.8054862022399902, "lr": 0.00038828122696196423, "tps": 16797, "wall": 17206.1} {"step": 4410, "train_loss": 3.783912181854248, "lr": 0.00038827442640261724, "tps": 16796, "wall": 17211.1} {"step": 4411, "train_loss": 3.777057409286499, "lr": 0.00038826762393704843, "tps": 16794, "wall": 17216.2} {"step": 4412, "train_loss": 3.893568515777588, "lr": 0.00038826081956533484, "tps": 16793, "wall": 17221.2} {"step": 4413, "train_loss": 3.8590188026428223, "lr": 0.00038825401328755355, "tps": 16792, "wall": 17226.2} {"step": 4414, "train_loss": 3.8635354042053223, "lr": 0.0003882472051037818, "tps": 16791, "wall": 17231.1} {"step": 4415, "train_loss": 3.7594401836395264, "lr": 0.0003882403950140965, "tps": 16790, "wall": 17236.2} {"step": 4416, "train_loss": 3.7397475242614746, "lr": 0.000388233583018575, "tps": 16789, "wall": 17241.2} {"step": 4417, "train_loss": 3.8076136112213135, "lr": 0.00038822676911729435, "tps": 16788, "wall": 17246.2} {"step": 4418, "train_loss": 3.888122797012329, "lr": 0.0003882199533103317, "tps": 16787, "wall": 17251.2} {"step": 4419, "train_loss": 3.7283740043640137, "lr": 0.0003882131355977644, "tps": 16786, "wall": 17256.2} {"step": 4420, "train_loss": 3.8076729774475098, "lr": 0.0003882063159796695, "tps": 16785, "wall": 17261.1} {"step": 4421, "train_loss": 3.8277463912963867, "lr": 0.00038819949445612447, "tps": 16784, "wall": 17266.1} {"step": 4422, "train_loss": 3.734257459640503, "lr": 0.0003881926710272064, "tps": 16782, "wall": 17271.7} {"step": 4423, "train_loss": 3.8346774578094482, "lr": 0.00038818584569299267, "tps": 16781, "wall": 17277.1} {"step": 4424, "train_loss": 3.9797441959381104, "lr": 0.00038817901845356056, "tps": 16779, "wall": 17282.4} {"step": 4425, "train_loss": 3.713149070739746, "lr": 0.00038817218930898743, "tps": 16778, "wall": 17287.7} {"step": 4426, "train_loss": 3.685117244720459, "lr": 0.0003881653582593507, "tps": 16777, "wall": 17293.0} {"step": 4427, "train_loss": 3.838498830795288, "lr": 0.0003881585253047276, "tps": 16775, "wall": 17298.4} {"step": 4428, "train_loss": 3.780609607696533, "lr": 0.0003881516904451957, "tps": 16774, "wall": 17303.7} {"step": 4429, "train_loss": 3.7812955379486084, "lr": 0.00038814485368083234, "tps": 16773, "wall": 17308.9} {"step": 4430, "train_loss": 3.8277173042297363, "lr": 0.000388138015011715, "tps": 16771, "wall": 17314.1} {"step": 4431, "train_loss": 3.7322707176208496, "lr": 0.0003881311744379211, "tps": 16770, "wall": 17319.4} {"step": 4432, "train_loss": 3.772768497467041, "lr": 0.00038812433195952817, "tps": 16769, "wall": 17324.7} {"step": 4433, "train_loss": 3.821671485900879, "lr": 0.0003881174875766137, "tps": 16767, "wall": 17329.9} {"step": 4434, "train_loss": 3.7893314361572266, "lr": 0.0003881106412892552, "tps": 16766, "wall": 17335.2} {"step": 4435, "train_loss": 3.778569221496582, "lr": 0.0003881037930975303, "tps": 16765, "wall": 17340.5} {"step": 4436, "train_loss": 3.8965976238250732, "lr": 0.0003880969430015166, "tps": 16763, "wall": 17345.8} {"step": 4437, "train_loss": 3.800525665283203, "lr": 0.0003880900910012915, "tps": 16762, "wall": 17351.0} {"step": 4438, "train_loss": 3.766977310180664, "lr": 0.00038808323709693286, "tps": 16761, "wall": 17356.3} {"step": 4439, "train_loss": 3.8558788299560547, "lr": 0.0003880763812885182, "tps": 16759, "wall": 17361.7} {"step": 4440, "train_loss": 3.670203685760498, "lr": 0.0003880695235761252, "tps": 16758, "wall": 17366.7} {"step": 4441, "train_loss": 3.8372318744659424, "lr": 0.0003880626639598315, "tps": 16757, "wall": 17371.7} {"step": 4442, "train_loss": 3.7829060554504395, "lr": 0.00038805580243971493, "tps": 16756, "wall": 17376.7} {"step": 4443, "train_loss": 3.7421412467956543, "lr": 0.000388048939015853, "tps": 16755, "wall": 17381.7} {"step": 4444, "train_loss": 3.7557497024536133, "lr": 0.0003880420736883238, "tps": 16754, "wall": 17386.7} {"step": 4445, "train_loss": 3.8133139610290527, "lr": 0.00038803520645720475, "tps": 16753, "wall": 17391.7} {"step": 4446, "train_loss": 3.789670944213867, "lr": 0.00038802833732257385, "tps": 16752, "wall": 17396.8} {"step": 4447, "train_loss": 3.8114216327667236, "lr": 0.0003880214662845088, "tps": 16751, "wall": 17401.8} {"step": 4448, "train_loss": 3.8543541431427, "lr": 0.0003880145933430875, "tps": 16750, "wall": 17406.8} {"step": 4449, "train_loss": 3.789191246032715, "lr": 0.00038800771849838785, "tps": 16749, "wall": 17411.8} {"step": 4450, "train_loss": 3.791929244995117, "lr": 0.0003880008417504876, "tps": 16748, "wall": 17416.8} {"step": 4451, "train_loss": 3.8092284202575684, "lr": 0.00038799396309946487, "tps": 16747, "wall": 17421.9} {"step": 4452, "train_loss": 3.7698731422424316, "lr": 0.0003879870825453973, "tps": 16745, "wall": 17427.0} {"step": 4453, "train_loss": 3.773813247680664, "lr": 0.000387980200088363, "tps": 16744, "wall": 17432.0} {"step": 4454, "train_loss": 3.821810483932495, "lr": 0.00038797331572843993, "tps": 16743, "wall": 17437.0} {"step": 4455, "train_loss": 3.7665696144104004, "lr": 0.000387966429465706, "tps": 16742, "wall": 17442.0} {"step": 4456, "train_loss": 3.8801841735839844, "lr": 0.00038795954130023934, "tps": 16741, "wall": 17447.3} {"step": 4457, "train_loss": 3.807774066925049, "lr": 0.0003879526512321179, "tps": 16740, "wall": 17452.3} {"step": 4458, "train_loss": 3.726134777069092, "lr": 0.0003879457592614197, "tps": 16739, "wall": 17457.3} {"step": 4459, "train_loss": 3.8470115661621094, "lr": 0.0003879388653882229, "tps": 16738, "wall": 17462.3} {"step": 4460, "train_loss": 3.7406482696533203, "lr": 0.0003879319696126055, "tps": 16737, "wall": 17467.3} {"step": 4461, "train_loss": 3.853044033050537, "lr": 0.00038792507193464564, "tps": 16736, "wall": 17472.3} {"step": 4462, "train_loss": 3.8184289932250977, "lr": 0.0003879181723544216, "tps": 16735, "wall": 17477.3} {"step": 4463, "train_loss": 3.7510721683502197, "lr": 0.00038791127087201135, "tps": 16734, "wall": 17482.3} {"step": 4464, "train_loss": 3.8106746673583984, "lr": 0.0003879043674874931, "tps": 16732, "wall": 17487.5} {"step": 4465, "train_loss": 3.767000675201416, "lr": 0.00038789746220094516, "tps": 16731, "wall": 17492.5} {"step": 4466, "train_loss": 3.7807419300079346, "lr": 0.0003878905550124456, "tps": 16730, "wall": 17497.5} {"step": 4467, "train_loss": 3.869962215423584, "lr": 0.0003878836459220728, "tps": 16729, "wall": 17502.5} {"step": 4468, "train_loss": 3.828887939453125, "lr": 0.00038787673492990496, "tps": 16728, "wall": 17507.7} {"step": 4469, "train_loss": 3.8175976276397705, "lr": 0.00038786982203602047, "tps": 16727, "wall": 17512.8} {"step": 4470, "train_loss": 3.9053287506103516, "lr": 0.00038786290724049746, "tps": 16726, "wall": 17517.8} {"step": 4471, "train_loss": 3.788407802581787, "lr": 0.0003878559905434144, "tps": 16725, "wall": 17522.8} {"step": 4472, "train_loss": 3.900578498840332, "lr": 0.00038784907194484955, "tps": 16724, "wall": 17527.8} {"step": 4473, "train_loss": 3.82513427734375, "lr": 0.0003878421514448813, "tps": 16723, "wall": 17532.8} {"step": 4474, "train_loss": 3.893721103668213, "lr": 0.0003878352290435882, "tps": 16722, "wall": 17537.8} {"step": 4475, "train_loss": 3.7575178146362305, "lr": 0.0003878283047410485, "tps": 16721, "wall": 17542.8} {"step": 4476, "train_loss": 3.8715105056762695, "lr": 0.0003878213785373407, "tps": 16720, "wall": 17547.8} {"step": 4477, "train_loss": 3.7660508155822754, "lr": 0.00038781445043254315, "tps": 16718, "wall": 17553.1} {"step": 4478, "train_loss": 3.867875576019287, "lr": 0.00038780752042673447, "tps": 16717, "wall": 17558.4} {"step": 4479, "train_loss": 3.804014205932617, "lr": 0.00038780058851999315, "tps": 16716, "wall": 17563.6} {"step": 4480, "train_loss": 3.8815689086914062, "lr": 0.0003877936547123977, "tps": 16715, "wall": 17568.9} {"step": 4481, "train_loss": 3.830796480178833, "lr": 0.00038778671900402666, "tps": 16713, "wall": 17574.2} {"step": 4482, "train_loss": 3.886026382446289, "lr": 0.00038777978139495855, "tps": 16712, "wall": 17579.4} {"step": 4483, "train_loss": 3.8680365085601807, "lr": 0.000387772841885272, "tps": 16711, "wall": 17584.7} {"step": 4484, "train_loss": 3.7707624435424805, "lr": 0.00038776590047504564, "tps": 16710, "wall": 17590.0} {"step": 4485, "train_loss": 3.7618260383605957, "lr": 0.0003877589571643581, "tps": 16708, "wall": 17595.2} {"step": 4486, "train_loss": 3.7896203994750977, "lr": 0.00038775201195328797, "tps": 16707, "wall": 17600.5} {"step": 4487, "train_loss": 3.8178718090057373, "lr": 0.000387745064841914, "tps": 16706, "wall": 17605.8} {"step": 4488, "train_loss": 3.756582021713257, "lr": 0.0003877381158303149, "tps": 16704, "wall": 17611.1} {"step": 4489, "train_loss": 3.796109199523926, "lr": 0.00038773116491856924, "tps": 16703, "wall": 17616.4} {"step": 4490, "train_loss": 3.6839957237243652, "lr": 0.000387724212106756, "tps": 16702, "wall": 17621.7} {"step": 4491, "train_loss": 3.8032450675964355, "lr": 0.0003877172573949537, "tps": 16700, "wall": 17627.0} {"step": 4492, "train_loss": 3.857729196548462, "lr": 0.0003877103007832413, "tps": 16699, "wall": 17632.3} {"step": 4493, "train_loss": 3.978102207183838, "lr": 0.0003877033422716975, "tps": 16698, "wall": 17637.7} {"step": 4494, "train_loss": 3.8553996086120605, "lr": 0.00038769638186040125, "tps": 16696, "wall": 17643.0} {"step": 4495, "train_loss": 3.8011741638183594, "lr": 0.0003876894195494312, "tps": 16695, "wall": 17648.3} {"step": 4496, "train_loss": 3.7949700355529785, "lr": 0.0003876824553388664, "tps": 16694, "wall": 17653.6} {"step": 4497, "train_loss": 3.6482760906219482, "lr": 0.00038767548922878566, "tps": 16693, "wall": 17658.8} {"step": 4498, "train_loss": 3.8562917709350586, "lr": 0.00038766852121926786, "tps": 16691, "wall": 17664.1} {"step": 4499, "train_loss": 3.7024810314178467, "lr": 0.00038766155131039206, "tps": 16690, "wall": 17669.1} {"step": 4500, "train_loss": 3.8505640029907227, "lr": 0.0003876545795022371, "tps": 16689, "wall": 17674.1} {"step": 4501, "train_loss": 3.83905029296875, "lr": 0.000387647605794882, "tps": 16688, "wall": 17679.3} {"step": 4502, "train_loss": 3.793726921081543, "lr": 0.00038764063018840577, "tps": 16687, "wall": 17684.3} {"step": 4503, "train_loss": 3.8314013481140137, "lr": 0.00038763365268288736, "tps": 16686, "wall": 17689.3} {"step": 4504, "train_loss": 3.7907817363739014, "lr": 0.0003876266732784059, "tps": 16685, "wall": 17694.3} {"step": 4505, "train_loss": 3.696500778198242, "lr": 0.00038761969197504044, "tps": 16684, "wall": 17699.3} {"step": 4506, "train_loss": 3.7900822162628174, "lr": 0.00038761270877287, "tps": 16683, "wall": 17704.2} {"step": 4507, "train_loss": 3.917954921722412, "lr": 0.0003876057236719737, "tps": 16682, "wall": 17709.2} {"step": 4508, "train_loss": 3.71311092376709, "lr": 0.00038759873667243075, "tps": 16681, "wall": 17714.2} {"step": 4509, "train_loss": 3.753892183303833, "lr": 0.00038759174777432023, "tps": 16680, "wall": 17719.1} {"step": 4510, "train_loss": 3.717726230621338, "lr": 0.00038758475697772134, "tps": 16679, "wall": 17724.1} {"step": 4511, "train_loss": 3.7025370597839355, "lr": 0.00038757776428271324, "tps": 16678, "wall": 17729.1} {"step": 4512, "train_loss": 3.736711025238037, "lr": 0.0003875707696893752, "tps": 16677, "wall": 17734.0} {"step": 4513, "train_loss": 3.8065185546875, "lr": 0.00038756377319778634, "tps": 16676, "wall": 17739.0} {"step": 4514, "train_loss": 3.836209297180176, "lr": 0.000387556774808026, "tps": 16675, "wall": 17744.0} {"step": 4515, "train_loss": 3.7784829139709473, "lr": 0.0003875497745201735, "tps": 16674, "wall": 17748.9} {"step": 4516, "train_loss": 3.806894063949585, "lr": 0.0003875427723343081, "tps": 16673, "wall": 17753.9} {"step": 4517, "train_loss": 3.736043930053711, "lr": 0.00038753576825050905, "tps": 16672, "wall": 17758.9} {"step": 4518, "train_loss": 3.832602024078369, "lr": 0.0003875287622688558, "tps": 16671, "wall": 17763.8} {"step": 4519, "train_loss": 3.8371386528015137, "lr": 0.00038752175438942765, "tps": 16670, "wall": 17768.8} {"step": 4520, "train_loss": 3.772226572036743, "lr": 0.000387514744612304, "tps": 16669, "wall": 17773.8} {"step": 4521, "train_loss": 3.801377773284912, "lr": 0.00038750773293756425, "tps": 16669, "wall": 17778.7} {"step": 4522, "train_loss": 3.803645372390747, "lr": 0.00038750071936528786, "tps": 16668, "wall": 17783.6} {"step": 4523, "train_loss": 3.8442440032958984, "lr": 0.00038749370389555424, "tps": 16667, "wall": 17788.6} {"step": 4524, "train_loss": 3.870967388153076, "lr": 0.00038748668652844296, "tps": 16666, "wall": 17793.6} {"step": 4525, "train_loss": 3.800821304321289, "lr": 0.00038747966726403334, "tps": 16665, "wall": 17798.5} {"step": 4526, "train_loss": 3.8213651180267334, "lr": 0.000387472646102405, "tps": 16664, "wall": 17803.5} {"step": 4527, "train_loss": 3.7570226192474365, "lr": 0.0003874656230436375, "tps": 16663, "wall": 17808.4} {"step": 4528, "train_loss": 3.955148935317993, "lr": 0.00038745859808781037, "tps": 16662, "wall": 17813.5} {"step": 4529, "train_loss": 3.8257102966308594, "lr": 0.0003874515712350031, "tps": 16661, "wall": 17818.4} {"step": 4530, "train_loss": 3.7756669521331787, "lr": 0.0003874445424852954, "tps": 16660, "wall": 17823.3} {"step": 4531, "train_loss": 3.687504768371582, "lr": 0.0003874375118387669, "tps": 16659, "wall": 17828.3} {"step": 4532, "train_loss": 3.8350276947021484, "lr": 0.00038743047929549725, "tps": 16658, "wall": 17833.3} {"step": 4533, "train_loss": 3.6850950717926025, "lr": 0.00038742344485556603, "tps": 16657, "wall": 17838.2} {"step": 4534, "train_loss": 3.74520206451416, "lr": 0.00038741640851905297, "tps": 16656, "wall": 17843.2} {"step": 4535, "train_loss": 3.6908717155456543, "lr": 0.0003874093702860378, "tps": 16655, "wall": 17848.1} {"step": 4536, "train_loss": 3.7653515338897705, "lr": 0.00038740233015660015, "tps": 16654, "wall": 17853.1} {"step": 4537, "train_loss": 3.825230121612549, "lr": 0.0003873952881308199, "tps": 16653, "wall": 17858.0} {"step": 4538, "train_loss": 3.8635478019714355, "lr": 0.00038738824420877675, "tps": 16652, "wall": 17863.0} {"step": 4539, "train_loss": 3.839477062225342, "lr": 0.0003873811983905506, "tps": 16651, "wall": 17867.9} {"step": 4540, "train_loss": 3.9219279289245605, "lr": 0.0003873741506762211, "tps": 16650, "wall": 17873.0} {"step": 4541, "train_loss": 3.8956313133239746, "lr": 0.00038736710106586814, "tps": 16649, "wall": 17877.9} {"step": 4542, "train_loss": 3.8047738075256348, "lr": 0.0003873600495595716, "tps": 16648, "wall": 17882.9} {"step": 4543, "train_loss": 3.8228273391723633, "lr": 0.00038735299615741143, "tps": 16647, "wall": 17887.8} {"step": 4544, "train_loss": 3.7802584171295166, "lr": 0.00038734594085946747, "tps": 16646, "wall": 17892.8} {"step": 4545, "train_loss": 3.728060483932495, "lr": 0.0003873388836658196, "tps": 16645, "wall": 17897.8} {"step": 4546, "train_loss": 3.7560126781463623, "lr": 0.00038733182457654776, "tps": 16645, "wall": 17902.8} {"step": 4547, "train_loss": 3.7890994548797607, "lr": 0.00038732476359173203, "tps": 16644, "wall": 17907.7} {"step": 4548, "train_loss": 3.604712724685669, "lr": 0.00038731770071145233, "tps": 16643, "wall": 17912.7} {"step": 4549, "train_loss": 3.791266918182373, "lr": 0.0003873106359357886, "tps": 16642, "wall": 17917.7} {"step": 4550, "train_loss": 3.6549112796783447, "lr": 0.000387303569264821, "tps": 16641, "wall": 17922.6} {"step": 4551, "train_loss": 3.8856656551361084, "lr": 0.0003872965006986295, "tps": 16640, "wall": 17927.6} {"step": 4552, "train_loss": 3.788613796234131, "lr": 0.00038728943023729417, "tps": 16639, "wall": 17932.6} {"step": 4553, "train_loss": 3.7620558738708496, "lr": 0.00038728235788089514, "tps": 16638, "wall": 17937.5} {"step": 4554, "train_loss": 3.802178382873535, "lr": 0.00038727528362951253, "tps": 16637, "wall": 17942.5} {"step": 4555, "train_loss": 3.821713924407959, "lr": 0.0003872682074832264, "tps": 16636, "wall": 17947.5} {"step": 4556, "train_loss": 3.750821590423584, "lr": 0.00038726112944211704, "tps": 16635, "wall": 17952.4} {"step": 4557, "train_loss": 3.7634410858154297, "lr": 0.0003872540495062645, "tps": 16634, "wall": 17957.4} {"step": 4558, "train_loss": 3.760385751724243, "lr": 0.00038724696767574905, "tps": 16633, "wall": 17962.4} {"step": 4559, "train_loss": 3.8300931453704834, "lr": 0.0003872398839506509, "tps": 16632, "wall": 17967.3} {"step": 4560, "train_loss": 3.7832586765289307, "lr": 0.0003872327983310503, "tps": 16631, "wall": 17972.3} {"step": 4561, "train_loss": 3.864480972290039, "lr": 0.0003872257108170275, "tps": 16630, "wall": 17977.3} {"step": 4562, "train_loss": 3.8072190284729004, "lr": 0.00038721862140866285, "tps": 16629, "wall": 17982.2} {"step": 4563, "train_loss": 3.8136441707611084, "lr": 0.00038721153010603664, "tps": 16628, "wall": 17987.2} {"step": 4564, "train_loss": 3.8272297382354736, "lr": 0.0003872044369092291, "tps": 16627, "wall": 17992.2} {"step": 4565, "train_loss": 3.7273237705230713, "lr": 0.0003871973418183206, "tps": 16626, "wall": 17997.2} {"step": 4566, "train_loss": 3.813965320587158, "lr": 0.00038719024483339166, "tps": 16625, "wall": 18002.2} {"step": 4567, "train_loss": 3.7388839721679688, "lr": 0.00038718314595452254, "tps": 16624, "wall": 18007.2} {"step": 4568, "train_loss": 3.7350993156433105, "lr": 0.00038717604518179367, "tps": 16624, "wall": 18012.1} {"step": 4569, "train_loss": 3.893394947052002, "lr": 0.0003871689425152856, "tps": 16623, "wall": 18017.1} {"step": 4570, "train_loss": 3.7256429195404053, "lr": 0.00038716183795507866, "tps": 16622, "wall": 18022.1} {"step": 4571, "train_loss": 3.769130229949951, "lr": 0.00038715473150125336, "tps": 16621, "wall": 18027.0} {"step": 4572, "train_loss": 3.8028769493103027, "lr": 0.00038714762315389026, "tps": 16620, "wall": 18032.0} {"step": 4573, "train_loss": 3.765460968017578, "lr": 0.00038714051291306983, "tps": 16619, "wall": 18037.0} {"step": 4574, "train_loss": 3.7086143493652344, "lr": 0.0003871334007788726, "tps": 16618, "wall": 18041.9} {"step": 4575, "train_loss": 3.8764820098876953, "lr": 0.0003871262867513792, "tps": 16617, "wall": 18046.9} {"step": 4576, "train_loss": 3.754629373550415, "lr": 0.00038711917083067014, "tps": 16616, "wall": 18051.9} {"step": 4577, "train_loss": 3.7233047485351562, "lr": 0.0003871120530168261, "tps": 16615, "wall": 18056.9} {"step": 4578, "train_loss": 3.747030258178711, "lr": 0.0003871049333099277, "tps": 16614, "wall": 18061.9} {"step": 4579, "train_loss": 3.8678126335144043, "lr": 0.00038709781171005555, "tps": 16613, "wall": 18066.8} {"step": 4580, "train_loss": 3.738797187805176, "lr": 0.0003870906882172903, "tps": 16612, "wall": 18071.8} {"step": 4581, "train_loss": 3.7606687545776367, "lr": 0.0003870835628317128, "tps": 16611, "wall": 18076.7} {"step": 4582, "train_loss": 3.781752586364746, "lr": 0.0003870764355534036, "tps": 16610, "wall": 18081.7} {"step": 4583, "train_loss": 3.6708202362060547, "lr": 0.0003870693063824435, "tps": 16609, "wall": 18086.7} {"step": 4584, "train_loss": 3.797757148742676, "lr": 0.0003870621753189132, "tps": 16608, "wall": 18091.7} {"step": 4585, "train_loss": 3.756760597229004, "lr": 0.0003870550423628937, "tps": 16607, "wall": 18096.6} {"step": 4586, "train_loss": 3.735455274581909, "lr": 0.00038704790751446555, "tps": 16607, "wall": 18101.6} {"step": 4587, "train_loss": 3.7951016426086426, "lr": 0.0003870407707737097, "tps": 16606, "wall": 18106.5} {"step": 4588, "train_loss": 3.7308740615844727, "lr": 0.00038703363214070686, "tps": 16605, "wall": 18111.5} {"step": 4589, "train_loss": 3.847062587738037, "lr": 0.0003870264916155381, "tps": 16604, "wall": 18116.5} {"step": 4590, "train_loss": 3.7137861251831055, "lr": 0.00038701934919828417, "tps": 16603, "wall": 18121.5} {"step": 4591, "train_loss": 3.77400803565979, "lr": 0.000387012204889026, "tps": 16602, "wall": 18126.5} {"step": 4592, "train_loss": 3.857440948486328, "lr": 0.0003870050586878445, "tps": 16601, "wall": 18131.5} {"step": 4593, "train_loss": 3.7708818912506104, "lr": 0.00038699791059482083, "tps": 16600, "wall": 18136.4} {"step": 4594, "train_loss": 3.8585567474365234, "lr": 0.0003869907606100356, "tps": 16599, "wall": 18141.3} {"step": 4595, "train_loss": 3.8025903701782227, "lr": 0.0003869836087335701, "tps": 16598, "wall": 18146.3} {"step": 4596, "train_loss": 3.7962422370910645, "lr": 0.0003869764549655053, "tps": 16597, "wall": 18151.3} {"step": 4597, "train_loss": 3.8119635581970215, "lr": 0.00038696929930592203, "tps": 16596, "wall": 18156.2} {"step": 4598, "train_loss": 3.7745044231414795, "lr": 0.0003869621417549016, "tps": 16595, "wall": 18161.2} {"step": 4599, "train_loss": 3.7770323753356934, "lr": 0.000386954982312525, "tps": 16594, "wall": 18166.2} {"step": 4600, "train_loss": 3.7068214416503906, "lr": 0.0003869478209788733, "tps": 16593, "wall": 18171.1} {"step": 4601, "train_loss": 3.839944362640381, "lr": 0.0003869406577540277, "tps": 16592, "wall": 18176.2} {"step": 4602, "train_loss": 3.8022947311401367, "lr": 0.0003869334926380693, "tps": 16592, "wall": 18181.2} {"step": 4603, "train_loss": 3.7387866973876953, "lr": 0.0003869263256310792, "tps": 16591, "wall": 18186.1} {"step": 4604, "train_loss": 3.820324420928955, "lr": 0.0003869191567331386, "tps": 16590, "wall": 18191.1} {"step": 4605, "train_loss": 3.7213902473449707, "lr": 0.0003869119859443289, "tps": 16589, "wall": 18196.0} {"step": 4606, "train_loss": 3.7782888412475586, "lr": 0.0003869048132647311, "tps": 16588, "wall": 18201.0} {"step": 4607, "train_loss": 3.678110361099243, "lr": 0.0003868976386944266, "tps": 16587, "wall": 18206.0} {"step": 4608, "train_loss": 3.879908561706543, "lr": 0.00038689046223349657, "tps": 16586, "wall": 18211.0} {"step": 4609, "train_loss": 3.751906633377075, "lr": 0.0003868832838820224, "tps": 16585, "wall": 18216.0} {"step": 4610, "train_loss": 3.881220817565918, "lr": 0.00038687610364008537, "tps": 16584, "wall": 18220.9} {"step": 4611, "train_loss": 3.782443046569824, "lr": 0.00038686892150776675, "tps": 16583, "wall": 18225.9} {"step": 4612, "train_loss": 3.8279590606689453, "lr": 0.00038686173748514805, "tps": 16582, "wall": 18230.9} {"step": 4613, "train_loss": 3.8236300945281982, "lr": 0.0003868545515723105, "tps": 16581, "wall": 18235.9} {"step": 4614, "train_loss": 3.7660183906555176, "lr": 0.00038684736376933557, "tps": 16580, "wall": 18240.9} {"step": 4615, "train_loss": 3.7898378372192383, "lr": 0.00038684017407630464, "tps": 16579, "wall": 18245.9} {"step": 4616, "train_loss": 3.8372859954833984, "lr": 0.00038683298249329927, "tps": 16578, "wall": 18250.8} {"step": 4617, "train_loss": 3.752547025680542, "lr": 0.0003868257890204008, "tps": 16578, "wall": 18255.8} {"step": 4618, "train_loss": 3.745100498199463, "lr": 0.00038681859365769075, "tps": 16577, "wall": 18260.7} {"step": 4619, "train_loss": 3.8134870529174805, "lr": 0.0003868113964052507, "tps": 16576, "wall": 18265.7} {"step": 4620, "train_loss": 3.854851722717285, "lr": 0.0003868041972631621, "tps": 16575, "wall": 18270.7} {"step": 4621, "train_loss": 3.636359691619873, "lr": 0.00038679699623150654, "tps": 16574, "wall": 18275.6} {"step": 4622, "train_loss": 3.773440361022949, "lr": 0.00038678979331036555, "tps": 16573, "wall": 18280.6} {"step": 4623, "train_loss": 3.717451572418213, "lr": 0.0003867825884998208, "tps": 16572, "wall": 18285.6} {"step": 4624, "train_loss": 3.863636016845703, "lr": 0.00038677538179995386, "tps": 16571, "wall": 18290.5} {"step": 4625, "train_loss": 3.7713167667388916, "lr": 0.00038676817321084634, "tps": 16570, "wall": 18295.5} {"step": 4626, "train_loss": 3.782771587371826, "lr": 0.00038676096273257995, "tps": 16569, "wall": 18300.5} {"step": 4627, "train_loss": 3.8039169311523438, "lr": 0.00038675375036523635, "tps": 16568, "wall": 18305.5} {"step": 4628, "train_loss": 3.8306941986083984, "lr": 0.0003867465361088973, "tps": 16567, "wall": 18310.4} {"step": 4629, "train_loss": 3.780092716217041, "lr": 0.0003867393199636444, "tps": 16567, "wall": 18315.4} {"step": 4630, "train_loss": 3.7042698860168457, "lr": 0.0003867321019295594, "tps": 16566, "wall": 18320.4} {"step": 4631, "train_loss": 3.8150405883789062, "lr": 0.00038672488200672424, "tps": 16565, "wall": 18325.4} {"step": 4632, "train_loss": 3.762744426727295, "lr": 0.00038671766019522056, "tps": 16564, "wall": 18330.3} {"step": 4633, "train_loss": 3.6796603202819824, "lr": 0.0003867104364951302, "tps": 16563, "wall": 18335.3} {"step": 4634, "train_loss": 3.717271089553833, "lr": 0.00038670321090653503, "tps": 16562, "wall": 18340.3} {"step": 4635, "train_loss": 3.800229072570801, "lr": 0.00038669598342951685, "tps": 16561, "wall": 18345.2} {"step": 4636, "train_loss": 3.71065092086792, "lr": 0.0003866887540641575, "tps": 16560, "wall": 18350.2} {"step": 4637, "train_loss": 3.721130132675171, "lr": 0.000386681522810539, "tps": 16559, "wall": 18355.2} {"step": 4638, "train_loss": 3.7202155590057373, "lr": 0.0003866742896687432, "tps": 16558, "wall": 18360.2} {"step": 4639, "train_loss": 3.794445514678955, "lr": 0.00038666705463885197, "tps": 16557, "wall": 18365.2} {"step": 4640, "train_loss": 3.807389259338379, "lr": 0.00038665981772094735, "tps": 16556, "wall": 18370.2} {"step": 4641, "train_loss": 3.762476682662964, "lr": 0.00038665257891511135, "tps": 16555, "wall": 18375.1} {"step": 4642, "train_loss": 3.802288293838501, "lr": 0.0003866453382214259, "tps": 16555, "wall": 18380.2} {"step": 4643, "train_loss": 3.8415348529815674, "lr": 0.0003866380956399729, "tps": 16554, "wall": 18385.1} {"step": 4644, "train_loss": 3.747610569000244, "lr": 0.00038663085117083477, "tps": 16553, "wall": 18390.1} {"step": 4645, "train_loss": 3.804534912109375, "lr": 0.00038662360481409323, "tps": 16552, "wall": 18395.1} {"step": 4646, "train_loss": 3.88900089263916, "lr": 0.0003866163565698304, "tps": 16551, "wall": 18400.1} {"step": 4647, "train_loss": 3.806521415710449, "lr": 0.0003866091064381286, "tps": 16550, "wall": 18405.1} {"step": 4648, "train_loss": 3.837449550628662, "lr": 0.00038660185441906976, "tps": 16549, "wall": 18410.0} {"step": 4649, "train_loss": 3.796802282333374, "lr": 0.0003865946005127361, "tps": 16548, "wall": 18415.1} {"step": 4650, "train_loss": 3.9176077842712402, "lr": 0.0003865873447192098, "tps": 16547, "wall": 18420.1} {"step": 4651, "train_loss": 3.8052258491516113, "lr": 0.00038658008703857305, "tps": 16546, "wall": 18425.1} {"step": 4652, "train_loss": 3.8521690368652344, "lr": 0.0003865728274709081, "tps": 16545, "wall": 18430.0} {"step": 4653, "train_loss": 3.837677240371704, "lr": 0.00038656556601629716, "tps": 16544, "wall": 18435.0} {"step": 4654, "train_loss": 3.7395811080932617, "lr": 0.0003865583026748224, "tps": 16543, "wall": 18440.0} {"step": 4655, "train_loss": 3.8975706100463867, "lr": 0.0003865510374465662, "tps": 16542, "wall": 18445.0} {"step": 4656, "train_loss": 3.811967611312866, "lr": 0.0003865437703316109, "tps": 16542, "wall": 18450.0} {"step": 4657, "train_loss": 3.76985764503479, "lr": 0.0003865365013300386, "tps": 16541, "wall": 18455.0} {"step": 4658, "train_loss": 3.7749550342559814, "lr": 0.00038652923044193196, "tps": 16540, "wall": 18459.9} {"step": 4659, "train_loss": 3.791266918182373, "lr": 0.00038652195766737316, "tps": 16539, "wall": 18464.9} {"step": 4660, "train_loss": 3.7509427070617676, "lr": 0.00038651468300644455, "tps": 16538, "wall": 18469.9} {"step": 4661, "train_loss": 3.7523233890533447, "lr": 0.00038650740645922865, "tps": 16537, "wall": 18474.9} {"step": 4662, "train_loss": 3.7242963314056396, "lr": 0.00038650012802580785, "tps": 16536, "wall": 18479.8} {"step": 4663, "train_loss": 3.7057719230651855, "lr": 0.00038649284770626456, "tps": 16535, "wall": 18484.8} {"step": 4664, "train_loss": 3.772691011428833, "lr": 0.0003864855655006813, "tps": 16534, "wall": 18489.8} {"step": 4665, "train_loss": 3.807950496673584, "lr": 0.00038647828140914056, "tps": 16533, "wall": 18494.7} {"step": 4666, "train_loss": 3.926199197769165, "lr": 0.0003864709954317249, "tps": 16533, "wall": 18499.7} {"step": 4667, "train_loss": 3.673421859741211, "lr": 0.00038646370756851667, "tps": 16532, "wall": 18504.7} {"step": 4668, "train_loss": 3.704674243927002, "lr": 0.0003864564178195986, "tps": 16531, "wall": 18509.7} {"step": 4669, "train_loss": 3.795919895172119, "lr": 0.00038644912618505326, "tps": 16530, "wall": 18514.7} {"step": 4670, "train_loss": 3.8849945068359375, "lr": 0.0003864418326649632, "tps": 16529, "wall": 18519.6} {"step": 4671, "train_loss": 3.812140703201294, "lr": 0.00038643453725941107, "tps": 16528, "wall": 18524.6} {"step": 4672, "train_loss": 3.7257285118103027, "lr": 0.0003864272399684795, "tps": 16527, "wall": 18529.6} {"step": 4673, "train_loss": 3.783088445663452, "lr": 0.00038641994079225106, "tps": 16526, "wall": 18534.6} {"step": 4674, "train_loss": 3.774995803833008, "lr": 0.0003864126397308086, "tps": 16525, "wall": 18539.5} {"step": 4675, "train_loss": 3.7459123134613037, "lr": 0.00038640533678423476, "tps": 16524, "wall": 18544.5} {"step": 4676, "train_loss": 3.803436756134033, "lr": 0.0003863980319526123, "tps": 16524, "wall": 18549.5} {"step": 4677, "train_loss": 3.9279932975769043, "lr": 0.00038639072523602387, "tps": 16523, "wall": 18554.4} {"step": 4678, "train_loss": 3.788783073425293, "lr": 0.0003863834166345523, "tps": 16522, "wall": 18559.4} {"step": 4679, "train_loss": 3.8078174591064453, "lr": 0.0003863761061482804, "tps": 16521, "wall": 18564.3} {"step": 4680, "train_loss": 3.7451910972595215, "lr": 0.000386368793777291, "tps": 16520, "wall": 18569.3} {"step": 4681, "train_loss": 3.728708505630493, "lr": 0.0003863614795216669, "tps": 16519, "wall": 18574.3} {"step": 4682, "train_loss": 3.8269054889678955, "lr": 0.0003863541633814909, "tps": 16518, "wall": 18579.2} {"step": 4683, "train_loss": 3.7245068550109863, "lr": 0.000386346845356846, "tps": 16517, "wall": 18584.2} {"step": 4684, "train_loss": 3.737459659576416, "lr": 0.000386339525447815, "tps": 16516, "wall": 18589.2} {"step": 4685, "train_loss": 3.7008185386657715, "lr": 0.0003863322036544809, "tps": 16516, "wall": 18594.2} {"step": 4686, "train_loss": 3.740111827850342, "lr": 0.00038632487997692657, "tps": 16515, "wall": 18599.1} {"step": 4687, "train_loss": 3.7238376140594482, "lr": 0.00038631755441523503, "tps": 16514, "wall": 18604.1} {"step": 4688, "train_loss": 3.701108455657959, "lr": 0.00038631022696948916, "tps": 16513, "wall": 18609.1} {"step": 4689, "train_loss": 3.7033157348632812, "lr": 0.00038630289763977207, "tps": 16512, "wall": 18614.0} {"step": 4690, "train_loss": 3.866755485534668, "lr": 0.00038629556642616675, "tps": 16511, "wall": 18619.0} {"step": 4691, "train_loss": 3.774606227874756, "lr": 0.0003862882333287563, "tps": 16510, "wall": 18623.9} {"step": 4692, "train_loss": 3.806232452392578, "lr": 0.00038628089834762374, "tps": 16509, "wall": 18628.9} {"step": 4693, "train_loss": 3.761806011199951, "lr": 0.00038627356148285215, "tps": 16508, "wall": 18633.9} {"step": 4694, "train_loss": 3.801636219024658, "lr": 0.00038626622273452464, "tps": 16508, "wall": 18638.8} {"step": 4695, "train_loss": 3.691721200942993, "lr": 0.0003862588821027244, "tps": 16507, "wall": 18643.8} {"step": 4696, "train_loss": 3.715169906616211, "lr": 0.0003862515395875346, "tps": 16506, "wall": 18648.7} {"step": 4697, "train_loss": 3.7206034660339355, "lr": 0.00038624419518903827, "tps": 16505, "wall": 18653.8} {"step": 4698, "train_loss": 3.802753448486328, "lr": 0.00038623684890731877, "tps": 16504, "wall": 18658.8} {"step": 4699, "train_loss": 3.8672289848327637, "lr": 0.0003862295007424592, "tps": 16503, "wall": 18663.7} {"step": 4700, "train_loss": 3.774174451828003, "lr": 0.00038622215069454287, "tps": 16502, "wall": 18668.7} {"step": 4701, "train_loss": 3.821449041366577, "lr": 0.00038621479876365305, "tps": 16501, "wall": 18673.7} {"step": 4702, "train_loss": 3.680420160293579, "lr": 0.0003862074449498729, "tps": 16500, "wall": 18678.6} {"step": 4703, "train_loss": 3.860351085662842, "lr": 0.0003862000892532859, "tps": 16500, "wall": 18683.6} {"step": 4704, "train_loss": 3.766702175140381, "lr": 0.00038619273167397536, "tps": 16499, "wall": 18688.5} {"step": 4705, "train_loss": 3.6325807571411133, "lr": 0.0003861853722120245, "tps": 16498, "wall": 18693.5} {"step": 4706, "train_loss": 3.7294464111328125, "lr": 0.0003861780108675167, "tps": 16497, "wall": 18698.5} {"step": 4707, "train_loss": 3.750256061553955, "lr": 0.0003861706476405355, "tps": 16496, "wall": 18703.5} {"step": 4708, "train_loss": 3.7725138664245605, "lr": 0.0003861632825311642, "tps": 16495, "wall": 18708.4} {"step": 4709, "train_loss": 3.681262254714966, "lr": 0.0003861559155394862, "tps": 16494, "wall": 18713.5} {"step": 4710, "train_loss": 3.857698440551758, "lr": 0.000386148546665585, "tps": 16493, "wall": 18718.4} {"step": 4711, "train_loss": 3.652493715286255, "lr": 0.0003861411759095441, "tps": 16493, "wall": 18723.4} {"step": 4712, "train_loss": 3.703319549560547, "lr": 0.00038613380327144696, "tps": 16492, "wall": 18728.4} {"step": 4713, "train_loss": 3.721494197845459, "lr": 0.0003861264287513771, "tps": 16491, "wall": 18733.3} {"step": 4714, "train_loss": 3.7102813720703125, "lr": 0.000386119052349418, "tps": 16490, "wall": 18738.3} {"step": 4715, "train_loss": 3.7447071075439453, "lr": 0.00038611167406565346, "tps": 16489, "wall": 18743.2} {"step": 4716, "train_loss": 3.7304794788360596, "lr": 0.0003861042939001668, "tps": 16488, "wall": 18748.2} {"step": 4717, "train_loss": 3.817352771759033, "lr": 0.0003860969118530417, "tps": 16487, "wall": 18753.2} {"step": 4718, "train_loss": 3.808377504348755, "lr": 0.0003860895279243618, "tps": 16486, "wall": 18758.1} {"step": 4719, "train_loss": 3.7402291297912598, "lr": 0.00038608214211421075, "tps": 16486, "wall": 18763.1} {"step": 4720, "train_loss": 3.7483890056610107, "lr": 0.00038607475442267215, "tps": 16485, "wall": 18768.1} {"step": 4721, "train_loss": 3.815581798553467, "lr": 0.00038606736484982985, "tps": 16484, "wall": 18773.1} {"step": 4722, "train_loss": 3.8255958557128906, "lr": 0.00038605997339576743, "tps": 16483, "wall": 18778.1} {"step": 4723, "train_loss": 3.884408950805664, "lr": 0.00038605258006056865, "tps": 16482, "wall": 18783.1} {"step": 4724, "train_loss": 3.8330204486846924, "lr": 0.00038604518484431716, "tps": 16481, "wall": 18788.0} {"step": 4725, "train_loss": 3.747993230819702, "lr": 0.000386037787747097, "tps": 16480, "wall": 18793.0} {"step": 4726, "train_loss": 3.808152437210083, "lr": 0.00038603038876899165, "tps": 16479, "wall": 18798.0} {"step": 4727, "train_loss": 3.76826548576355, "lr": 0.00038602298791008514, "tps": 16479, "wall": 18802.9} {"step": 4728, "train_loss": 3.718212366104126, "lr": 0.00038601558517046126, "tps": 16478, "wall": 18807.9} {"step": 4729, "train_loss": 3.9088568687438965, "lr": 0.00038600818055020377, "tps": 16477, "wall": 18812.8} {"step": 4730, "train_loss": 3.7567481994628906, "lr": 0.00038600077404939674, "tps": 16476, "wall": 18817.8} {"step": 4731, "train_loss": 3.9188737869262695, "lr": 0.0003859933656681239, "tps": 16475, "wall": 18822.7} {"step": 4732, "train_loss": 3.9209694862365723, "lr": 0.00038598595540646926, "tps": 16474, "wall": 18827.7} {"step": 4733, "train_loss": 3.780189037322998, "lr": 0.0003859785432645167, "tps": 16473, "wall": 18832.7} {"step": 4734, "train_loss": 3.6883323192596436, "lr": 0.00038597112924235026, "tps": 16473, "wall": 18837.7} {"step": 4735, "train_loss": 3.850471258163452, "lr": 0.0003859637133400539, "tps": 16472, "wall": 18842.6} {"step": 4736, "train_loss": 3.748488187789917, "lr": 0.0003859562955577115, "tps": 16471, "wall": 18847.6} {"step": 4737, "train_loss": 3.693319320678711, "lr": 0.0003859488758954073, "tps": 16470, "wall": 18852.5} {"step": 4738, "train_loss": 3.756906509399414, "lr": 0.0003859414543532253, "tps": 16469, "wall": 18857.5} {"step": 4739, "train_loss": 3.758262872695923, "lr": 0.0003859340309312495, "tps": 16468, "wall": 18862.4} {"step": 4740, "train_loss": 3.7352066040039062, "lr": 0.000385926605629564, "tps": 16467, "wall": 18867.4} {"step": 4741, "train_loss": 3.7165896892547607, "lr": 0.0003859191784482529, "tps": 16467, "wall": 18872.4} {"step": 4742, "train_loss": 3.7978386878967285, "lr": 0.00038591174938740034, "tps": 16466, "wall": 18877.3} {"step": 4743, "train_loss": 3.7947983741760254, "lr": 0.0003859043184470906, "tps": 16465, "wall": 18882.2} {"step": 4744, "train_loss": 3.782205581665039, "lr": 0.0003858968856274078, "tps": 16464, "wall": 18887.2} {"step": 4745, "train_loss": 3.7391505241394043, "lr": 0.000385889450928436, "tps": 16463, "wall": 18892.2} {"step": 4746, "train_loss": 3.736534833908081, "lr": 0.0003858820143502595, "tps": 16462, "wall": 18897.2} {"step": 4747, "train_loss": 3.9033658504486084, "lr": 0.0003858745758929627, "tps": 16461, "wall": 18902.1} {"step": 4748, "train_loss": 3.6776325702667236, "lr": 0.0003858671355566297, "tps": 16461, "wall": 18907.1} {"step": 4749, "train_loss": 3.7164855003356934, "lr": 0.0003858596933413447, "tps": 16460, "wall": 18912.0} {"step": 4750, "train_loss": 3.740703582763672, "lr": 0.0003858522492471922, "tps": 16459, "wall": 18917.0} {"step": 4751, "train_loss": 3.8218212127685547, "lr": 0.0003858448032742565, "tps": 16458, "wall": 18922.0} {"step": 4752, "train_loss": 3.80344557762146, "lr": 0.0003858373554226218, "tps": 16457, "wall": 18926.9} {"step": 4753, "train_loss": 3.662384510040283, "lr": 0.00038582990569237263, "tps": 16456, "wall": 18931.9} {"step": 4754, "train_loss": 3.778684616088867, "lr": 0.0003858224540835933, "tps": 16455, "wall": 18936.9} {"step": 4755, "train_loss": 3.8009841442108154, "lr": 0.0003858150005963682, "tps": 16455, "wall": 18941.8} {"step": 4756, "train_loss": 3.732445478439331, "lr": 0.0003858075452307819, "tps": 16454, "wall": 18946.8} {"step": 4757, "train_loss": 3.7787539958953857, "lr": 0.0003858000879869187, "tps": 16453, "wall": 18951.7} {"step": 4758, "train_loss": 3.759059429168701, "lr": 0.00038579262886486316, "tps": 16452, "wall": 18956.7} {"step": 4759, "train_loss": 3.7482402324676514, "lr": 0.00038578516786469966, "tps": 16451, "wall": 18961.7} {"step": 4760, "train_loss": 3.7442617416381836, "lr": 0.0003857777049865129, "tps": 16450, "wall": 18966.6} {"step": 4761, "train_loss": 3.706887722015381, "lr": 0.0003857702402303873, "tps": 16449, "wall": 18971.6} {"step": 4762, "train_loss": 3.7154150009155273, "lr": 0.0003857627735964074, "tps": 16449, "wall": 18976.5} {"step": 4763, "train_loss": 3.6782374382019043, "lr": 0.00038575530508465794, "tps": 16448, "wall": 18981.5} {"step": 4764, "train_loss": 3.7749481201171875, "lr": 0.00038574783469522334, "tps": 16447, "wall": 18986.5} {"step": 4765, "train_loss": 3.7914106845855713, "lr": 0.0003857403624281883, "tps": 16446, "wall": 18991.5} {"step": 4766, "train_loss": 3.6656603813171387, "lr": 0.0003857328882836375, "tps": 16445, "wall": 18996.4} {"step": 4767, "train_loss": 3.7263429164886475, "lr": 0.00038572541226165554, "tps": 16444, "wall": 19001.4} {"step": 4768, "train_loss": 3.8787827491760254, "lr": 0.0003857179343623272, "tps": 16444, "wall": 19006.3} {"step": 4769, "train_loss": 3.761787176132202, "lr": 0.0003857104545857371, "tps": 16443, "wall": 19011.3} {"step": 4770, "train_loss": 3.753821611404419, "lr": 0.00038570297293197, "tps": 16442, "wall": 19016.3} {"step": 4771, "train_loss": 3.730264186859131, "lr": 0.00038569548940111065, "tps": 16441, "wall": 19021.2} {"step": 4772, "train_loss": 3.61259388923645, "lr": 0.00038568800399324386, "tps": 16440, "wall": 19026.2} {"step": 4773, "train_loss": 3.7441539764404297, "lr": 0.00038568051670845435, "tps": 16439, "wall": 19031.2} {"step": 4774, "train_loss": 3.760613203048706, "lr": 0.0003856730275468271, "tps": 16438, "wall": 19036.1} {"step": 4775, "train_loss": 3.710516929626465, "lr": 0.0003856655365084467, "tps": 16438, "wall": 19041.1} {"step": 4776, "train_loss": 3.838627338409424, "lr": 0.00038565804359339825, "tps": 16437, "wall": 19046.1} {"step": 4777, "train_loss": 3.785062789916992, "lr": 0.0003856505488017665, "tps": 16436, "wall": 19051.0} {"step": 4778, "train_loss": 3.772268533706665, "lr": 0.0003856430521336363, "tps": 16435, "wall": 19056.0} {"step": 4779, "train_loss": 3.8749771118164062, "lr": 0.00038563555358909265, "tps": 16434, "wall": 19060.9} {"step": 4780, "train_loss": 3.753833770751953, "lr": 0.00038562805316822053, "tps": 16433, "wall": 19065.9} {"step": 4781, "train_loss": 3.7104177474975586, "lr": 0.00038562055087110485, "tps": 16433, "wall": 19070.9} {"step": 4782, "train_loss": 3.7921037673950195, "lr": 0.00038561304669783064, "tps": 16432, "wall": 19075.9} {"step": 4783, "train_loss": 3.7922372817993164, "lr": 0.0003856055406484828, "tps": 16431, "wall": 19080.9} {"step": 4784, "train_loss": 3.6888532638549805, "lr": 0.0003855980327231465, "tps": 16430, "wall": 19085.8} {"step": 4785, "train_loss": 3.784186601638794, "lr": 0.0003855905229219067, "tps": 16429, "wall": 19090.8} {"step": 4786, "train_loss": 3.651793956756592, "lr": 0.00038558301124484853, "tps": 16428, "wall": 19095.8} {"step": 4787, "train_loss": 3.7564947605133057, "lr": 0.00038557549769205703, "tps": 16427, "wall": 19100.8} {"step": 4788, "train_loss": 3.8552393913269043, "lr": 0.00038556798226361736, "tps": 16427, "wall": 19105.7} {"step": 4789, "train_loss": 3.7849831581115723, "lr": 0.00038556046495961455, "tps": 16426, "wall": 19110.7} {"step": 4790, "train_loss": 3.767909526824951, "lr": 0.0003855529457801339, "tps": 16425, "wall": 19115.6} {"step": 4791, "train_loss": 3.7057785987854004, "lr": 0.0003855454247252605, "tps": 16424, "wall": 19120.6} {"step": 4792, "train_loss": 3.691918134689331, "lr": 0.0003855379017950796, "tps": 16423, "wall": 19125.6} {"step": 4793, "train_loss": 3.74458909034729, "lr": 0.0003855303769896764, "tps": 16422, "wall": 19130.5} {"step": 4794, "train_loss": 3.853895664215088, "lr": 0.0003855228503091361, "tps": 16422, "wall": 19135.6} {"step": 4795, "train_loss": 3.826702833175659, "lr": 0.000385515321753544, "tps": 16421, "wall": 19140.6} {"step": 4796, "train_loss": 3.7014455795288086, "lr": 0.00038550779132298543, "tps": 16420, "wall": 19145.5} {"step": 4797, "train_loss": 3.71779727935791, "lr": 0.00038550025901754563, "tps": 16419, "wall": 19150.5} {"step": 4798, "train_loss": 3.68654727935791, "lr": 0.0003854927248373099, "tps": 16418, "wall": 19155.4} {"step": 4799, "train_loss": 3.7053465843200684, "lr": 0.00038548518878236363, "tps": 16417, "wall": 19160.4} {"step": 4800, "train_loss": 3.8056857585906982, "lr": 0.00038547765085279224, "tps": 16417, "wall": 19165.3} {"step": 4801, "train_loss": 3.7881274223327637, "lr": 0.000385470111048681, "tps": 16416, "wall": 19170.3} {"step": 4802, "train_loss": 3.746504783630371, "lr": 0.00038546256937011544, "tps": 16415, "wall": 19175.3} {"step": 4803, "train_loss": 3.732534408569336, "lr": 0.00038545502581718096, "tps": 16414, "wall": 19180.2} {"step": 4804, "train_loss": 3.764195442199707, "lr": 0.00038544748038996297, "tps": 16413, "wall": 19185.2} {"step": 4805, "train_loss": 3.6378631591796875, "lr": 0.0003854399330885469, "tps": 16412, "wall": 19190.1} {"step": 4806, "train_loss": 3.731869697570801, "lr": 0.00038543238391301846, "tps": 16412, "wall": 19195.2} {"step": 4807, "train_loss": 3.6981148719787598, "lr": 0.0003854248328634629, "tps": 16411, "wall": 19200.1} {"step": 4808, "train_loss": 3.837827682495117, "lr": 0.00038541727993996594, "tps": 16410, "wall": 19205.1} {"step": 4809, "train_loss": 3.7467799186706543, "lr": 0.00038540972514261313, "tps": 16409, "wall": 19210.1} {"step": 4810, "train_loss": 3.8178577423095703, "lr": 0.00038540216847149, "tps": 16408, "wall": 19215.0} {"step": 4811, "train_loss": 3.7621374130249023, "lr": 0.000385394609926682, "tps": 16407, "wall": 19220.0} {"step": 4812, "train_loss": 3.7918267250061035, "lr": 0.0003853870495082751, "tps": 16407, "wall": 19224.9} {"step": 4813, "train_loss": 3.787480115890503, "lr": 0.00038537948721635465, "tps": 16406, "wall": 19229.9} {"step": 4814, "train_loss": 3.7839293479919434, "lr": 0.0003853719230510064, "tps": 16405, "wall": 19234.9} {"step": 4815, "train_loss": 3.838656425476074, "lr": 0.00038536435701231616, "tps": 16404, "wall": 19239.8} {"step": 4816, "train_loss": 3.6986546516418457, "lr": 0.0003853567891003695, "tps": 16403, "wall": 19244.8} {"step": 4817, "train_loss": 3.732447624206543, "lr": 0.00038534921931525216, "tps": 16402, "wall": 19249.8} {"step": 4818, "train_loss": 3.780170202255249, "lr": 0.00038534164765705, "tps": 16402, "wall": 19254.8} {"step": 4819, "train_loss": 3.875823974609375, "lr": 0.0003853340741258486, "tps": 16401, "wall": 19259.7} {"step": 4820, "train_loss": 3.7510926723480225, "lr": 0.0003853264987217339, "tps": 16400, "wall": 19264.7} {"step": 4821, "train_loss": 3.851184606552124, "lr": 0.00038531892144479167, "tps": 16399, "wall": 19269.7} {"step": 4822, "train_loss": 3.7511520385742188, "lr": 0.0003853113422951078, "tps": 16398, "wall": 19274.7} {"step": 4823, "train_loss": 3.785588026046753, "lr": 0.00038530376127276806, "tps": 16397, "wall": 19279.7} {"step": 4824, "train_loss": 3.756518602371216, "lr": 0.0003852961783778584, "tps": 16397, "wall": 19284.6} {"step": 4825, "train_loss": 3.8374955654144287, "lr": 0.00038528859361046467, "tps": 16396, "wall": 19289.6} {"step": 4826, "train_loss": 3.801478385925293, "lr": 0.00038528100697067286, "tps": 16395, "wall": 19294.6} {"step": 4827, "train_loss": 3.66365122795105, "lr": 0.0003852734184585688, "tps": 16394, "wall": 19299.5} {"step": 4828, "train_loss": 3.847952365875244, "lr": 0.0003852658280742385, "tps": 16393, "wall": 19304.5} {"step": 4829, "train_loss": 3.903195858001709, "lr": 0.000385258235817768, "tps": 16392, "wall": 19309.5} {"step": 4830, "train_loss": 3.824662923812866, "lr": 0.0003852506416892432, "tps": 16392, "wall": 19314.5} {"step": 4831, "train_loss": 3.6662135124206543, "lr": 0.00038524304568875027, "tps": 16391, "wall": 19319.5} {"step": 4832, "train_loss": 3.782998561859131, "lr": 0.0003852354478163752, "tps": 16390, "wall": 19324.4} {"step": 4833, "train_loss": 3.7955427169799805, "lr": 0.0003852278480722039, "tps": 16389, "wall": 19329.4} {"step": 4834, "train_loss": 3.7647862434387207, "lr": 0.0003852202464563227, "tps": 16388, "wall": 19334.3} {"step": 4835, "train_loss": 3.7222752571105957, "lr": 0.00038521264296881763, "tps": 16387, "wall": 19339.3} {"step": 4836, "train_loss": 3.7503714561462402, "lr": 0.0003852050376097748, "tps": 16387, "wall": 19344.3} {"step": 4837, "train_loss": 3.7851409912109375, "lr": 0.0003851974303792803, "tps": 16386, "wall": 19349.3} {"step": 4838, "train_loss": 3.8068814277648926, "lr": 0.0003851898212774204, "tps": 16385, "wall": 19354.3} {"step": 4839, "train_loss": 3.8279058933258057, "lr": 0.00038518221030428134, "tps": 16384, "wall": 19359.2} {"step": 4840, "train_loss": 3.7945027351379395, "lr": 0.00038517459745994914, "tps": 16383, "wall": 19364.2} {"step": 4841, "train_loss": 3.748811960220337, "lr": 0.00038516698274451027, "tps": 16383, "wall": 19369.2} {"step": 4842, "train_loss": 3.821450710296631, "lr": 0.0003851593661580508, "tps": 16382, "wall": 19374.2} {"step": 4843, "train_loss": 3.7008919715881348, "lr": 0.00038515174770065717, "tps": 16381, "wall": 19379.1} {"step": 4844, "train_loss": 3.708928108215332, "lr": 0.00038514412737241554, "tps": 16380, "wall": 19384.1} {"step": 4845, "train_loss": 3.8051199913024902, "lr": 0.0003851365051734124, "tps": 16379, "wall": 19389.1} {"step": 4846, "train_loss": 3.7797977924346924, "lr": 0.00038512888110373385, "tps": 16378, "wall": 19394.0} {"step": 4847, "train_loss": 3.8443613052368164, "lr": 0.0003851212551634665, "tps": 16378, "wall": 19399.0} {"step": 4848, "train_loss": 3.7627947330474854, "lr": 0.00038511362735269667, "tps": 16377, "wall": 19404.0} {"step": 4849, "train_loss": 3.6881284713745117, "lr": 0.0003851059976715107, "tps": 16376, "wall": 19408.9} {"step": 4850, "train_loss": 3.6197011470794678, "lr": 0.000385098366119995, "tps": 16375, "wall": 19413.9} {"step": 4851, "train_loss": 3.708239793777466, "lr": 0.0003850907326982361, "tps": 16374, "wall": 19418.9} {"step": 4852, "train_loss": 3.739492654800415, "lr": 0.0003850830974063205, "tps": 16374, "wall": 19423.8} {"step": 4853, "train_loss": 3.8057661056518555, "lr": 0.0003850754602443346, "tps": 16373, "wall": 19428.8} {"step": 4854, "train_loss": 3.838869094848633, "lr": 0.00038506782121236493, "tps": 16372, "wall": 19433.8} {"step": 4855, "train_loss": 3.8480849266052246, "lr": 0.0003850601803104981, "tps": 16371, "wall": 19438.8} {"step": 4856, "train_loss": 3.787525177001953, "lr": 0.0003850525375388206, "tps": 16370, "wall": 19443.8} {"step": 4857, "train_loss": 3.844017744064331, "lr": 0.00038504489289741906, "tps": 16369, "wall": 19448.7} {"step": 4858, "train_loss": 3.7652273178100586, "lr": 0.00038503724638638, "tps": 16369, "wall": 19453.7} {"step": 4859, "train_loss": 3.7721786499023438, "lr": 0.0003850295980057901, "tps": 16368, "wall": 19458.7} {"step": 4860, "train_loss": 3.763186454772949, "lr": 0.000385021947755736, "tps": 16367, "wall": 19463.7} {"step": 4861, "train_loss": 3.7167067527770996, "lr": 0.0003850142956363043, "tps": 16366, "wall": 19468.7} {"step": 4862, "train_loss": 3.7745208740234375, "lr": 0.0003850066416475818, "tps": 16365, "wall": 19473.6} {"step": 4863, "train_loss": 3.7799768447875977, "lr": 0.0003849989857896551, "tps": 16364, "wall": 19478.6} {"step": 4864, "train_loss": 3.7362022399902344, "lr": 0.00038499132806261093, "tps": 16364, "wall": 19483.6} {"step": 4865, "train_loss": 3.716860055923462, "lr": 0.0003849836684665362, "tps": 16363, "wall": 19488.5} {"step": 4866, "train_loss": 3.7827351093292236, "lr": 0.0003849760070015174, "tps": 16362, "wall": 19493.6} {"step": 4867, "train_loss": 3.73833966255188, "lr": 0.00038496834366764156, "tps": 16361, "wall": 19498.5} {"step": 4868, "train_loss": 3.800846576690674, "lr": 0.0003849606784649954, "tps": 16360, "wall": 19503.5} {"step": 4869, "train_loss": 3.8294708728790283, "lr": 0.0003849530113936656, "tps": 16360, "wall": 19508.4} {"step": 4870, "train_loss": 3.7439422607421875, "lr": 0.0003849453424537393, "tps": 16359, "wall": 19513.4} {"step": 4871, "train_loss": 3.78432559967041, "lr": 0.0003849376716453032, "tps": 16358, "wall": 19518.4} {"step": 4872, "train_loss": 3.768972873687744, "lr": 0.00038492999896844426, "tps": 16357, "wall": 19523.4} {"step": 4873, "train_loss": 3.7811391353607178, "lr": 0.00038492232442324933, "tps": 16356, "wall": 19528.4} {"step": 4874, "train_loss": 3.7519454956054688, "lr": 0.0003849146480098054, "tps": 16356, "wall": 19533.3} {"step": 4875, "train_loss": 3.7522292137145996, "lr": 0.0003849069697281994, "tps": 16355, "wall": 19538.3} {"step": 4876, "train_loss": 3.739673137664795, "lr": 0.0003848992895785184, "tps": 16354, "wall": 19543.3} {"step": 4877, "train_loss": 3.75534725189209, "lr": 0.0003848916075608493, "tps": 16353, "wall": 19548.2} {"step": 4878, "train_loss": 3.657838821411133, "lr": 0.0003848839236752791, "tps": 16352, "wall": 19553.3} {"step": 4879, "train_loss": 3.81779146194458, "lr": 0.0003848762379218949, "tps": 16351, "wall": 19558.2} {"step": 4880, "train_loss": 3.773367404937744, "lr": 0.00038486855030078385, "tps": 16351, "wall": 19563.2} {"step": 4881, "train_loss": 3.804708957672119, "lr": 0.0003848608608120328, "tps": 16350, "wall": 19568.1} {"step": 4882, "train_loss": 3.8685407638549805, "lr": 0.0003848531694557291, "tps": 16349, "wall": 19573.1} {"step": 4883, "train_loss": 3.739985466003418, "lr": 0.0003848454762319597, "tps": 16348, "wall": 19578.1} {"step": 4884, "train_loss": 3.761700391769409, "lr": 0.00038483778114081193, "tps": 16347, "wall": 19583.0} {"step": 4885, "train_loss": 3.7486886978149414, "lr": 0.00038483008418237273, "tps": 16347, "wall": 19588.0} {"step": 4886, "train_loss": 3.722799062728882, "lr": 0.00038482238535672954, "tps": 16346, "wall": 19593.0} {"step": 4887, "train_loss": 3.6384119987487793, "lr": 0.0003848146846639694, "tps": 16345, "wall": 19597.9} {"step": 4888, "train_loss": 3.7721261978149414, "lr": 0.00038480698210417957, "tps": 16344, "wall": 19602.9} {"step": 4889, "train_loss": 3.8599376678466797, "lr": 0.0003847992776774474, "tps": 16343, "wall": 19607.9} {"step": 4890, "train_loss": 3.813228130340576, "lr": 0.00038479157138386004, "tps": 16343, "wall": 19612.9} {"step": 4891, "train_loss": 3.829596519470215, "lr": 0.00038478386322350486, "tps": 16342, "wall": 19617.9} {"step": 4892, "train_loss": 3.7949609756469727, "lr": 0.00038477615319646916, "tps": 16341, "wall": 19622.8} {"step": 4893, "train_loss": 3.7550837993621826, "lr": 0.0003847684413028403, "tps": 16340, "wall": 19627.8} {"step": 4894, "train_loss": 3.742215156555176, "lr": 0.0003847607275427056, "tps": 16339, "wall": 19632.8} {"step": 4895, "train_loss": 3.7245168685913086, "lr": 0.00038475301191615247, "tps": 16339, "wall": 19637.7} {"step": 4896, "train_loss": 3.8263368606567383, "lr": 0.00038474529442326835, "tps": 16338, "wall": 19642.7} {"step": 4897, "train_loss": 3.782029390335083, "lr": 0.0003847375750641406, "tps": 16337, "wall": 19647.7} {"step": 4898, "train_loss": 3.7292020320892334, "lr": 0.0003847298538388566, "tps": 16336, "wall": 19652.6} {"step": 4899, "train_loss": 3.7129621505737305, "lr": 0.000384722130747504, "tps": 16335, "wall": 19657.6} {"step": 4900, "train_loss": 3.7956089973449707, "lr": 0.00038471440579017016, "tps": 16335, "wall": 19662.6} {"step": 4901, "train_loss": 3.686244487762451, "lr": 0.00038470667896694263, "tps": 16334, "wall": 19667.5} {"step": 4902, "train_loss": 3.7310333251953125, "lr": 0.00038469895027790893, "tps": 16333, "wall": 19672.5} {"step": 4903, "train_loss": 3.581819772720337, "lr": 0.0003846912197231566, "tps": 16332, "wall": 19677.6} {"step": 4904, "train_loss": 3.761854410171509, "lr": 0.00038468348730277325, "tps": 16331, "wall": 19682.6} {"step": 4905, "train_loss": 3.7238056659698486, "lr": 0.0003846757530168464, "tps": 16331, "wall": 19687.6} {"step": 4906, "train_loss": 3.7787423133850098, "lr": 0.0003846680168654638, "tps": 16330, "wall": 19692.5} {"step": 4907, "train_loss": 3.7568345069885254, "lr": 0.00038466027884871294, "tps": 16329, "wall": 19697.5} {"step": 4908, "train_loss": 3.7177605628967285, "lr": 0.0003846525389666815, "tps": 16328, "wall": 19702.5} {"step": 4909, "train_loss": 3.885460376739502, "lr": 0.0003846447972194572, "tps": 16327, "wall": 19707.5} {"step": 4910, "train_loss": 3.729154348373413, "lr": 0.00038463705360712775, "tps": 16327, "wall": 19712.4} {"step": 4911, "train_loss": 3.8577122688293457, "lr": 0.00038462930812978085, "tps": 16326, "wall": 19717.4} {"step": 4912, "train_loss": 3.8009276390075684, "lr": 0.00038462156078750425, "tps": 16325, "wall": 19722.4} {"step": 4913, "train_loss": 3.7701773643493652, "lr": 0.0003846138115803857, "tps": 16324, "wall": 19727.3} {"step": 4914, "train_loss": 3.7229843139648438, "lr": 0.000384606060508513, "tps": 16323, "wall": 19732.3} {"step": 4915, "train_loss": 3.7309298515319824, "lr": 0.0003845983075719739, "tps": 16323, "wall": 19737.3} {"step": 4916, "train_loss": 3.782946825027466, "lr": 0.0003845905527708563, "tps": 16322, "wall": 19742.3} {"step": 4917, "train_loss": 3.9424729347229004, "lr": 0.00038458279610524803, "tps": 16321, "wall": 19747.3} {"step": 4918, "train_loss": 3.738191843032837, "lr": 0.0003845750375752369, "tps": 16320, "wall": 19752.2} {"step": 4919, "train_loss": 3.843050956726074, "lr": 0.0003845672771809108, "tps": 16319, "wall": 19757.2} {"step": 4920, "train_loss": 3.7443008422851562, "lr": 0.00038455951492235777, "tps": 16319, "wall": 19762.2} {"step": 4921, "train_loss": 3.833266258239746, "lr": 0.00038455175079966567, "tps": 16318, "wall": 19767.2} {"step": 4922, "train_loss": 3.837491512298584, "lr": 0.0003845439848129224, "tps": 16317, "wall": 19772.2} {"step": 4923, "train_loss": 3.767717123031616, "lr": 0.00038453621696221587, "tps": 16316, "wall": 19777.1} {"step": 4924, "train_loss": 3.6566226482391357, "lr": 0.0003845284472476343, "tps": 16316, "wall": 19782.1} {"step": 4925, "train_loss": 3.777235269546509, "lr": 0.00038452067566926556, "tps": 16315, "wall": 19787.0} {"step": 4926, "train_loss": 3.8801095485687256, "lr": 0.0003845129022271976, "tps": 16314, "wall": 19792.0} {"step": 4927, "train_loss": 3.806272029876709, "lr": 0.0003845051269215187, "tps": 16313, "wall": 19797.0} {"step": 4928, "train_loss": 3.654611110687256, "lr": 0.0003844973497523168, "tps": 16312, "wall": 19802.0} {"step": 4929, "train_loss": 3.691397190093994, "lr": 0.00038448957071968, "tps": 16312, "wall": 19807.0} {"step": 4930, "train_loss": 3.8727405071258545, "lr": 0.0003844817898236965, "tps": 16311, "wall": 19812.0} {"step": 4931, "train_loss": 3.7789306640625, "lr": 0.00038447400706445427, "tps": 16310, "wall": 19816.9} {"step": 4932, "train_loss": 3.7045230865478516, "lr": 0.00038446622244204165, "tps": 16309, "wall": 19821.9} {"step": 4933, "train_loss": 3.6811938285827637, "lr": 0.0003844584359565468, "tps": 16308, "wall": 19826.9} {"step": 4934, "train_loss": 3.788062572479248, "lr": 0.0003844506476080579, "tps": 16308, "wall": 19831.8} {"step": 4935, "train_loss": 3.671165943145752, "lr": 0.0003844428573966631, "tps": 16307, "wall": 19836.8} {"step": 4936, "train_loss": 3.8121676445007324, "lr": 0.0003844350653224508, "tps": 16306, "wall": 19841.8} {"step": 4937, "train_loss": 3.713489294052124, "lr": 0.0003844272713855091, "tps": 16305, "wall": 19846.7} {"step": 4938, "train_loss": 3.6711337566375732, "lr": 0.00038441947558592643, "tps": 16305, "wall": 19851.7} {"step": 4939, "train_loss": 3.8146119117736816, "lr": 0.000384411677923791, "tps": 16304, "wall": 19856.7} {"step": 4940, "train_loss": 3.7321412563323975, "lr": 0.00038440387839919123, "tps": 16303, "wall": 19861.7} {"step": 4941, "train_loss": 3.7737598419189453, "lr": 0.0003843960770122154, "tps": 16302, "wall": 19866.7} {"step": 4942, "train_loss": 3.628441572189331, "lr": 0.0003843882737629519, "tps": 16301, "wall": 19871.6} {"step": 4943, "train_loss": 3.704033851623535, "lr": 0.00038438046865148923, "tps": 16301, "wall": 19876.6} {"step": 4944, "train_loss": 3.7534079551696777, "lr": 0.0003843726616779156, "tps": 16300, "wall": 19881.6} {"step": 4945, "train_loss": 3.69329833984375, "lr": 0.00038436485284231965, "tps": 16299, "wall": 19886.6} {"step": 4946, "train_loss": 3.70858097076416, "lr": 0.0003843570421447897, "tps": 16298, "wall": 19891.5} {"step": 4947, "train_loss": 3.687695026397705, "lr": 0.00038434922958541435, "tps": 16297, "wall": 19896.5} {"step": 4948, "train_loss": 3.720428943634033, "lr": 0.000384341415164282, "tps": 16297, "wall": 19901.5} {"step": 4949, "train_loss": 3.7750115394592285, "lr": 0.00038433359888148124, "tps": 16296, "wall": 19906.4} {"step": 4950, "train_loss": 3.772177219390869, "lr": 0.00038432578073710054, "tps": 16295, "wall": 19911.4} {"step": 4951, "train_loss": 3.820422887802124, "lr": 0.00038431796073122847, "tps": 16294, "wall": 19916.4} {"step": 4952, "train_loss": 3.6923863887786865, "lr": 0.0003843101388639537, "tps": 16294, "wall": 19921.4} {"step": 4953, "train_loss": 3.8401880264282227, "lr": 0.0003843023151353648, "tps": 16293, "wall": 19926.3} {"step": 4954, "train_loss": 3.7158045768737793, "lr": 0.00038429448954555045, "tps": 16292, "wall": 19931.3} {"step": 4955, "train_loss": 3.794431209564209, "lr": 0.0003842866620945991, "tps": 16291, "wall": 19936.3} {"step": 4956, "train_loss": 3.7534937858581543, "lr": 0.0003842788327825996, "tps": 16290, "wall": 19941.2} {"step": 4957, "train_loss": 3.687060832977295, "lr": 0.0003842710016096406, "tps": 16290, "wall": 19946.2} {"step": 4958, "train_loss": 3.7902371883392334, "lr": 0.00038426316857581084, "tps": 16289, "wall": 19951.2} {"step": 4959, "train_loss": 3.6823713779449463, "lr": 0.00038425533368119895, "tps": 16288, "wall": 19956.2} {"step": 4960, "train_loss": 3.7299845218658447, "lr": 0.00038424749692589377, "tps": 16287, "wall": 19961.1} {"step": 4961, "train_loss": 3.646707773208618, "lr": 0.0003842396583099842, "tps": 16287, "wall": 19966.1} {"step": 4962, "train_loss": 3.653937339782715, "lr": 0.0003842318178335587, "tps": 16286, "wall": 19971.1} {"step": 4963, "train_loss": 3.7658050060272217, "lr": 0.0003842239754967064, "tps": 16285, "wall": 19976.1} {"step": 4964, "train_loss": 3.75337815284729, "lr": 0.00038421613129951596, "tps": 16284, "wall": 19981.1} {"step": 4965, "train_loss": 3.8373312950134277, "lr": 0.00038420828524207636, "tps": 16283, "wall": 19986.1} {"step": 4966, "train_loss": 3.8103530406951904, "lr": 0.00038420043732447634, "tps": 16283, "wall": 19991.0} {"step": 4967, "train_loss": 3.6362011432647705, "lr": 0.00038419258754680493, "tps": 16282, "wall": 19996.0} {"step": 4968, "train_loss": 3.672792434692383, "lr": 0.000384184735909151, "tps": 16281, "wall": 20001.0} {"step": 4969, "train_loss": 3.640153169631958, "lr": 0.00038417688241160355, "tps": 16280, "wall": 20006.0} {"step": 4970, "train_loss": 3.7787585258483887, "lr": 0.00038416902705425143, "tps": 16280, "wall": 20011.0} {"step": 4971, "train_loss": 3.748042345046997, "lr": 0.0003841611698371837, "tps": 16279, "wall": 20015.9} {"step": 4972, "train_loss": 3.7788162231445312, "lr": 0.00038415331076048937, "tps": 16278, "wall": 20020.9} {"step": 4973, "train_loss": 3.8350510597229004, "lr": 0.0003841454498242574, "tps": 16277, "wall": 20025.9} {"step": 4974, "train_loss": 3.676692485809326, "lr": 0.000384137587028577, "tps": 16276, "wall": 20030.8} {"step": 4975, "train_loss": 3.6772875785827637, "lr": 0.0003841297223735371, "tps": 16276, "wall": 20035.9} {"step": 4976, "train_loss": 3.894779682159424, "lr": 0.00038412185585922677, "tps": 16275, "wall": 20040.8} {"step": 4977, "train_loss": 3.7423832416534424, "lr": 0.0003841139874857352, "tps": 16274, "wall": 20045.8} {"step": 4978, "train_loss": 3.767573833465576, "lr": 0.0003841061172531516, "tps": 16273, "wall": 20050.8} {"step": 4979, "train_loss": 3.896864414215088, "lr": 0.0003840982451615649, "tps": 16273, "wall": 20055.7} {"step": 4980, "train_loss": 3.7334346771240234, "lr": 0.0003840903712110644, "tps": 16272, "wall": 20060.7} {"step": 4981, "train_loss": 3.6866683959960938, "lr": 0.0003840824954017394, "tps": 16271, "wall": 20065.7} {"step": 4982, "train_loss": 3.8117127418518066, "lr": 0.0003840746177336789, "tps": 16270, "wall": 20070.7} {"step": 4983, "train_loss": 3.724578380584717, "lr": 0.0003840667382069723, "tps": 16270, "wall": 20075.6} {"step": 4984, "train_loss": 3.7952823638916016, "lr": 0.00038405885682170885, "tps": 16269, "wall": 20080.6} {"step": 4985, "train_loss": 3.6801187992095947, "lr": 0.00038405097357797777, "tps": 16268, "wall": 20085.6} {"step": 4986, "train_loss": 3.802806854248047, "lr": 0.0003840430884758684, "tps": 16267, "wall": 20090.5} {"step": 4987, "train_loss": 3.6665735244750977, "lr": 0.00038403520151547, "tps": 16266, "wall": 20095.6} {"step": 4988, "train_loss": 3.762791633605957, "lr": 0.000384027312696872, "tps": 16266, "wall": 20100.5} {"step": 4989, "train_loss": 3.779900550842285, "lr": 0.00038401942202016375, "tps": 16265, "wall": 20105.5} {"step": 4990, "train_loss": 3.798389434814453, "lr": 0.0003840115294854346, "tps": 16264, "wall": 20110.5} {"step": 4991, "train_loss": 3.801452159881592, "lr": 0.0003840036350927739, "tps": 16263, "wall": 20115.4} {"step": 4992, "train_loss": 3.7386674880981445, "lr": 0.00038399573884227126, "tps": 16263, "wall": 20120.4} {"step": 4993, "train_loss": 3.6847164630889893, "lr": 0.00038398784073401596, "tps": 16262, "wall": 20125.4} {"step": 4994, "train_loss": 3.73936128616333, "lr": 0.0003839799407680975, "tps": 16261, "wall": 20130.4} {"step": 4995, "train_loss": 3.785799503326416, "lr": 0.00038397203894460546, "tps": 16260, "wall": 20135.3} {"step": 4996, "train_loss": 3.7259340286254883, "lr": 0.0003839641352636293, "tps": 16260, "wall": 20140.3} {"step": 4997, "train_loss": 3.7363100051879883, "lr": 0.0003839562297252585, "tps": 16259, "wall": 20145.3} {"step": 4998, "train_loss": 3.8046398162841797, "lr": 0.0003839483223295826, "tps": 16258, "wall": 20150.2} {"step": 4999, "train_loss": 3.777237892150879, "lr": 0.00038394041307669133, "tps": 16257, "wall": 20155.3} {"step": 5000, "train_loss": 3.6983797550201416, "lr": 0.0003839325019666742, "tps": 16257, "wall": 20160.3, "val_loss_monitor": 3.76510626974467, "val_loss_full": 3.7794146229135652} {"step": 5001, "train_loss": 3.7070789337158203, "lr": 0.0003839245889996208, "tps": 16121, "wall": 20334.3} {"step": 5002, "train_loss": 4.022380352020264, "lr": 0.0003839166741756208, "tps": 16120, "wall": 20339.3} {"step": 5003, "train_loss": 3.6235945224761963, "lr": 0.00038390875749476377, "tps": 16119, "wall": 20344.3} {"step": 5004, "train_loss": 3.804180383682251, "lr": 0.00038390083895713955, "tps": 16118, "wall": 20349.3} {"step": 5005, "train_loss": 3.740335464477539, "lr": 0.0003838929185628377, "tps": 16118, "wall": 20354.4} {"step": 5006, "train_loss": 3.7426888942718506, "lr": 0.000383884996311948, "tps": 16117, "wall": 20359.4} {"step": 5007, "train_loss": 3.681882858276367, "lr": 0.0003838770722045603, "tps": 16116, "wall": 20364.4} {"step": 5008, "train_loss": 3.755317211151123, "lr": 0.00038386914624076413, "tps": 16115, "wall": 20369.4} {"step": 5009, "train_loss": 3.842543601989746, "lr": 0.0003838612184206495, "tps": 16115, "wall": 20374.4} {"step": 5010, "train_loss": 3.7796578407287598, "lr": 0.00038385328874430605, "tps": 16114, "wall": 20379.5} {"step": 5011, "train_loss": 3.7589752674102783, "lr": 0.0003838453572118237, "tps": 16113, "wall": 20384.6} {"step": 5012, "train_loss": 3.8822498321533203, "lr": 0.0003838374238232923, "tps": 16112, "wall": 20389.7} {"step": 5013, "train_loss": 3.7079315185546875, "lr": 0.00038382948857880174, "tps": 16111, "wall": 20394.7} {"step": 5014, "train_loss": 3.7329111099243164, "lr": 0.0003838215514784418, "tps": 16111, "wall": 20399.7} {"step": 5015, "train_loss": 3.7257895469665527, "lr": 0.00038381361252230257, "tps": 16110, "wall": 20404.8} {"step": 5016, "train_loss": 3.786569118499756, "lr": 0.00038380567171047373, "tps": 16109, "wall": 20409.8} {"step": 5017, "train_loss": 3.73142671585083, "lr": 0.0003837977290430455, "tps": 16108, "wall": 20414.8} {"step": 5018, "train_loss": 3.785442590713501, "lr": 0.0003837897845201076, "tps": 16108, "wall": 20419.8} {"step": 5019, "train_loss": 3.8304319381713867, "lr": 0.00038378183814175026, "tps": 16107, "wall": 20424.8} {"step": 5020, "train_loss": 3.761117696762085, "lr": 0.00038377388990806343, "tps": 16106, "wall": 20429.8} {"step": 5021, "train_loss": 3.6762237548828125, "lr": 0.00038376593981913706, "tps": 16105, "wall": 20434.8} {"step": 5022, "train_loss": 3.7262701988220215, "lr": 0.00038375798787506125, "tps": 16105, "wall": 20439.8} {"step": 5023, "train_loss": 3.7157363891601562, "lr": 0.00038375003407592614, "tps": 16104, "wall": 20444.8} {"step": 5024, "train_loss": 3.626434564590454, "lr": 0.00038374207842182173, "tps": 16103, "wall": 20449.8} {"step": 5025, "train_loss": 3.782442092895508, "lr": 0.00038373412091283817, "tps": 16102, "wall": 20454.9} {"step": 5026, "train_loss": 3.7948851585388184, "lr": 0.00038372616154906566, "tps": 16102, "wall": 20459.9} {"step": 5027, "train_loss": 3.722223997116089, "lr": 0.0003837182003305944, "tps": 16101, "wall": 20465.0} {"step": 5028, "train_loss": 3.8227500915527344, "lr": 0.00038371023725751447, "tps": 16100, "wall": 20469.9} {"step": 5029, "train_loss": 3.8040032386779785, "lr": 0.0003837022723299161, "tps": 16099, "wall": 20474.9} {"step": 5030, "train_loss": 3.8226845264434814, "lr": 0.0003836943055478896, "tps": 16099, "wall": 20479.9} {"step": 5031, "train_loss": 3.754182815551758, "lr": 0.0003836863369115251, "tps": 16098, "wall": 20485.0} {"step": 5032, "train_loss": 3.7756645679473877, "lr": 0.00038367836642091285, "tps": 16097, "wall": 20490.0} {"step": 5033, "train_loss": 3.634669780731201, "lr": 0.0003836703940761433, "tps": 16097, "wall": 20495.0} {"step": 5034, "train_loss": 3.803567886352539, "lr": 0.00038366241987730664, "tps": 16096, "wall": 20500.0} {"step": 5035, "train_loss": 3.8288989067077637, "lr": 0.0003836544438244933, "tps": 16095, "wall": 20505.0} {"step": 5036, "train_loss": 3.748485565185547, "lr": 0.00038364646591779346, "tps": 16094, "wall": 20510.0} {"step": 5037, "train_loss": 3.760166645050049, "lr": 0.00038363848615729763, "tps": 16094, "wall": 20515.0} {"step": 5038, "train_loss": 3.7214879989624023, "lr": 0.0003836305045430962, "tps": 16093, "wall": 20520.0} {"step": 5039, "train_loss": 3.740262031555176, "lr": 0.00038362252107527957, "tps": 16092, "wall": 20525.0} {"step": 5040, "train_loss": 3.737562656402588, "lr": 0.0003836145357539382, "tps": 16091, "wall": 20530.0} {"step": 5041, "train_loss": 3.7135114669799805, "lr": 0.00038360654857916244, "tps": 16091, "wall": 20535.0} {"step": 5042, "train_loss": 3.772454023361206, "lr": 0.0003835985595510429, "tps": 16090, "wall": 20540.0} {"step": 5043, "train_loss": 3.7173309326171875, "lr": 0.00038359056866967, "tps": 16089, "wall": 20545.0} {"step": 5044, "train_loss": 3.6967427730560303, "lr": 0.00038358257593513426, "tps": 16089, "wall": 20550.0} {"step": 5045, "train_loss": 3.7568233013153076, "lr": 0.0003835745813475263, "tps": 16088, "wall": 20555.0} {"step": 5046, "train_loss": 3.7605509757995605, "lr": 0.00038356658490693664, "tps": 16087, "wall": 20559.9} {"step": 5047, "train_loss": 3.7861199378967285, "lr": 0.0003835585866134558, "tps": 16086, "wall": 20564.9} {"step": 5048, "train_loss": 3.802572727203369, "lr": 0.0003835505864671745, "tps": 16086, "wall": 20569.9} {"step": 5049, "train_loss": 3.871835231781006, "lr": 0.00038354258446818333, "tps": 16085, "wall": 20575.0} {"step": 5050, "train_loss": 3.697575092315674, "lr": 0.0003835345806165728, "tps": 16084, "wall": 20580.0} {"step": 5051, "train_loss": 3.655374765396118, "lr": 0.0003835265749124338, "tps": 16083, "wall": 20584.9} {"step": 5052, "train_loss": 3.7510826587677, "lr": 0.00038351856735585686, "tps": 16083, "wall": 20589.9} {"step": 5053, "train_loss": 3.718536853790283, "lr": 0.0003835105579469328, "tps": 16082, "wall": 20594.9} {"step": 5054, "train_loss": 3.7001655101776123, "lr": 0.0003835025466857523, "tps": 16081, "wall": 20599.9} {"step": 5055, "train_loss": 3.728698492050171, "lr": 0.000383494533572406, "tps": 16081, "wall": 20604.9} {"step": 5056, "train_loss": 3.7420365810394287, "lr": 0.0003834865186069849, "tps": 16080, "wall": 20609.9} {"step": 5057, "train_loss": 3.764585494995117, "lr": 0.0003834785017895796, "tps": 16079, "wall": 20614.9} {"step": 5058, "train_loss": 3.782728433609009, "lr": 0.000383470483120281, "tps": 16078, "wall": 20619.9} {"step": 5059, "train_loss": 3.734388828277588, "lr": 0.00038346246259917993, "tps": 16078, "wall": 20624.8} {"step": 5060, "train_loss": 3.665703773498535, "lr": 0.0003834544402263672, "tps": 16077, "wall": 20629.8} {"step": 5061, "train_loss": 3.8406500816345215, "lr": 0.00038344641600193376, "tps": 16076, "wall": 20634.8} {"step": 5062, "train_loss": 3.725616693496704, "lr": 0.0003834383899259705, "tps": 16076, "wall": 20639.8} {"step": 5063, "train_loss": 3.646538496017456, "lr": 0.00038343036199856825, "tps": 16075, "wall": 20644.8} {"step": 5064, "train_loss": 3.730825185775757, "lr": 0.0003834223322198181, "tps": 16074, "wall": 20649.8} {"step": 5065, "train_loss": 3.803081512451172, "lr": 0.0003834143005898109, "tps": 16074, "wall": 20654.8} {"step": 5066, "train_loss": 3.624439239501953, "lr": 0.00038340626710863765, "tps": 16073, "wall": 20659.8} {"step": 5067, "train_loss": 3.8129096031188965, "lr": 0.00038339823177638944, "tps": 16072, "wall": 20664.8} {"step": 5068, "train_loss": 3.6979877948760986, "lr": 0.0003833901945931571, "tps": 16071, "wall": 20669.8} {"step": 5069, "train_loss": 3.7858660221099854, "lr": 0.00038338215555903184, "tps": 16071, "wall": 20674.8} {"step": 5070, "train_loss": 3.762326955795288, "lr": 0.00038337411467410476, "tps": 16070, "wall": 20679.8} {"step": 5071, "train_loss": 3.698641300201416, "lr": 0.00038336607193846674, "tps": 16069, "wall": 20684.7} {"step": 5072, "train_loss": 3.619056463241577, "lr": 0.00038335802735220913, "tps": 16069, "wall": 20689.7} {"step": 5073, "train_loss": 3.859025716781616, "lr": 0.0003833499809154229, "tps": 16068, "wall": 20694.8} {"step": 5074, "train_loss": 3.6329469680786133, "lr": 0.00038334193262819927, "tps": 16067, "wall": 20699.8} {"step": 5075, "train_loss": 3.7830612659454346, "lr": 0.0003833338824906293, "tps": 16066, "wall": 20704.8} {"step": 5076, "train_loss": 3.733419418334961, "lr": 0.0003833258305028044, "tps": 16066, "wall": 20709.8} {"step": 5077, "train_loss": 3.7554514408111572, "lr": 0.00038331777666481557, "tps": 16065, "wall": 20714.8} {"step": 5078, "train_loss": 3.7640645503997803, "lr": 0.0003833097209767542, "tps": 16064, "wall": 20719.7} {"step": 5079, "train_loss": 3.758268356323242, "lr": 0.0003833016634387114, "tps": 16064, "wall": 20724.7} {"step": 5080, "train_loss": 3.7109861373901367, "lr": 0.00038329360405077857, "tps": 16063, "wall": 20729.7} {"step": 5081, "train_loss": 3.726840019226074, "lr": 0.0003832855428130469, "tps": 16062, "wall": 20734.7} {"step": 5082, "train_loss": 3.7775261402130127, "lr": 0.0003832774797256079, "tps": 16061, "wall": 20739.7} {"step": 5083, "train_loss": 3.7482714653015137, "lr": 0.00038326941478855273, "tps": 16061, "wall": 20744.7} {"step": 5084, "train_loss": 3.7924933433532715, "lr": 0.0003832613480019727, "tps": 16060, "wall": 20749.7} {"step": 5085, "train_loss": 3.6902096271514893, "lr": 0.00038325327936595936, "tps": 16059, "wall": 20754.7} {"step": 5086, "train_loss": 3.6534595489501953, "lr": 0.000383245208880604, "tps": 16059, "wall": 20759.7} {"step": 5087, "train_loss": 3.6882715225219727, "lr": 0.0003832371365459981, "tps": 16058, "wall": 20764.7} {"step": 5088, "train_loss": 3.6581575870513916, "lr": 0.0003832290623622331, "tps": 16057, "wall": 20769.7} {"step": 5089, "train_loss": 3.7280795574188232, "lr": 0.00038322098632940046, "tps": 16056, "wall": 20774.7} {"step": 5090, "train_loss": 3.736494541168213, "lr": 0.0003832129084475917, "tps": 16056, "wall": 20779.7} {"step": 5091, "train_loss": 3.708374500274658, "lr": 0.0003832048287168982, "tps": 16055, "wall": 20784.7} {"step": 5092, "train_loss": 3.546708583831787, "lr": 0.00038319674713741154, "tps": 16054, "wall": 20789.7} {"step": 5093, "train_loss": 3.724581718444824, "lr": 0.0003831886637092234, "tps": 16054, "wall": 20794.7} {"step": 5094, "train_loss": 3.7061171531677246, "lr": 0.0003831805784324252, "tps": 16053, "wall": 20799.7} {"step": 5095, "train_loss": 3.7006826400756836, "lr": 0.0003831724913071086, "tps": 16052, "wall": 20804.7} {"step": 5096, "train_loss": 3.7448437213897705, "lr": 0.0003831644023333652, "tps": 16051, "wall": 20809.7} {"step": 5097, "train_loss": 3.5895397663116455, "lr": 0.00038315631151128655, "tps": 16051, "wall": 20814.8} {"step": 5098, "train_loss": 3.8120439052581787, "lr": 0.0003831482188409645, "tps": 16050, "wall": 20819.8} {"step": 5099, "train_loss": 3.724390983581543, "lr": 0.0003831401243224905, "tps": 16049, "wall": 20824.8} {"step": 5100, "train_loss": 3.710275173187256, "lr": 0.00038313202795595635, "tps": 16049, "wall": 20829.8} {"step": 5101, "train_loss": 3.7072901725769043, "lr": 0.00038312392974145377, "tps": 16048, "wall": 20834.7} {"step": 5102, "train_loss": 3.840998411178589, "lr": 0.00038311582967907453, "tps": 16047, "wall": 20839.7} {"step": 5103, "train_loss": 3.706300973892212, "lr": 0.0003831077277689103, "tps": 16047, "wall": 20844.7} {"step": 5104, "train_loss": 3.7783637046813965, "lr": 0.000383099624011053, "tps": 16046, "wall": 20849.8} {"step": 5105, "train_loss": 3.711174488067627, "lr": 0.00038309151840559423, "tps": 16045, "wall": 20854.7} {"step": 5106, "train_loss": 3.7259836196899414, "lr": 0.0003830834109526259, "tps": 16044, "wall": 20859.8} {"step": 5107, "train_loss": 3.715790033340454, "lr": 0.00038307530165223994, "tps": 16044, "wall": 20864.8} {"step": 5108, "train_loss": 3.85988712310791, "lr": 0.0003830671905045281, "tps": 16043, "wall": 20869.7} {"step": 5109, "train_loss": 3.6862528324127197, "lr": 0.0003830590775095823, "tps": 16042, "wall": 20874.8} {"step": 5110, "train_loss": 3.830674171447754, "lr": 0.0003830509626674945, "tps": 16042, "wall": 20879.8} {"step": 5111, "train_loss": 3.7382874488830566, "lr": 0.0003830428459783566, "tps": 16041, "wall": 20884.8} {"step": 5112, "train_loss": 3.7640790939331055, "lr": 0.00038303472744226043, "tps": 16040, "wall": 20889.8} {"step": 5113, "train_loss": 3.7866196632385254, "lr": 0.00038302660705929814, "tps": 16039, "wall": 20894.8} {"step": 5114, "train_loss": 3.6851041316986084, "lr": 0.00038301848482956153, "tps": 16039, "wall": 20899.8} {"step": 5115, "train_loss": 3.756366729736328, "lr": 0.0003830103607531428, "tps": 16038, "wall": 20904.8} {"step": 5116, "train_loss": 3.719797134399414, "lr": 0.00038300223483013376, "tps": 16037, "wall": 20909.8} {"step": 5117, "train_loss": 3.827878475189209, "lr": 0.00038299410706062664, "tps": 16037, "wall": 20914.8} {"step": 5118, "train_loss": 3.754507064819336, "lr": 0.0003829859774447135, "tps": 16036, "wall": 20919.8} {"step": 5119, "train_loss": 3.625446319580078, "lr": 0.0003829778459824864, "tps": 16035, "wall": 20924.8} {"step": 5120, "train_loss": 3.642378091812134, "lr": 0.0003829697126740374, "tps": 16035, "wall": 20929.8} {"step": 5121, "train_loss": 3.784426212310791, "lr": 0.00038296157751945866, "tps": 16034, "wall": 20934.8} {"step": 5122, "train_loss": 3.7593278884887695, "lr": 0.0003829534405188424, "tps": 16033, "wall": 20939.8} {"step": 5123, "train_loss": 3.708770513534546, "lr": 0.00038294530167228073, "tps": 16032, "wall": 20944.8} {"step": 5124, "train_loss": 3.7667651176452637, "lr": 0.0003829371609798658, "tps": 16032, "wall": 20949.8} {"step": 5125, "train_loss": 3.736830949783325, "lr": 0.00038292901844169, "tps": 16031, "wall": 20954.8} {"step": 5126, "train_loss": 3.745100259780884, "lr": 0.00038292087405784544, "tps": 16030, "wall": 20959.8} {"step": 5127, "train_loss": 3.7521378993988037, "lr": 0.0003829127278284244, "tps": 16030, "wall": 20964.8} {"step": 5128, "train_loss": 3.7132585048675537, "lr": 0.0003829045797535191, "tps": 16029, "wall": 20969.8} {"step": 5129, "train_loss": 3.8751935958862305, "lr": 0.000382896429833222, "tps": 16028, "wall": 20974.9} {"step": 5130, "train_loss": 3.798583507537842, "lr": 0.0003828882780676253, "tps": 16027, "wall": 20979.9} {"step": 5131, "train_loss": 3.8078055381774902, "lr": 0.0003828801244568213, "tps": 16027, "wall": 20984.9} {"step": 5132, "train_loss": 3.672315835952759, "lr": 0.0003828719690009026, "tps": 16026, "wall": 20989.9} {"step": 5133, "train_loss": 3.7670063972473145, "lr": 0.0003828638116999613, "tps": 16025, "wall": 20995.0} {"step": 5134, "train_loss": 3.7644975185394287, "lr": 0.00038285565255408995, "tps": 16025, "wall": 21000.0} {"step": 5135, "train_loss": 3.7492098808288574, "lr": 0.000382847491563381, "tps": 16024, "wall": 21005.0} {"step": 5136, "train_loss": 3.8332066535949707, "lr": 0.00038283932872792677, "tps": 16023, "wall": 21009.9} {"step": 5137, "train_loss": 3.7133874893188477, "lr": 0.0003828311640478199, "tps": 16023, "wall": 21014.9} {"step": 5138, "train_loss": 3.772998809814453, "lr": 0.0003828229975231528, "tps": 16022, "wall": 21019.9} {"step": 5139, "train_loss": 3.7965195178985596, "lr": 0.0003828148291540179, "tps": 16021, "wall": 21024.9} {"step": 5140, "train_loss": 3.7397732734680176, "lr": 0.00038280665894050786, "tps": 16021, "wall": 21029.9} {"step": 5141, "train_loss": 3.8085243701934814, "lr": 0.00038279848688271514, "tps": 16020, "wall": 21034.9} {"step": 5142, "train_loss": 3.797671318054199, "lr": 0.0003827903129807324, "tps": 16019, "wall": 21039.9} {"step": 5143, "train_loss": 3.738666534423828, "lr": 0.00038278213723465216, "tps": 16018, "wall": 21044.9} {"step": 5144, "train_loss": 3.7504680156707764, "lr": 0.00038277395964456703, "tps": 16018, "wall": 21049.8} {"step": 5145, "train_loss": 3.802790880203247, "lr": 0.00038276578021056973, "tps": 16017, "wall": 21054.9} {"step": 5146, "train_loss": 3.66457462310791, "lr": 0.00038275759893275296, "tps": 16016, "wall": 21059.8} {"step": 5147, "train_loss": 3.6824698448181152, "lr": 0.00038274941581120913, "tps": 16016, "wall": 21064.8} {"step": 5148, "train_loss": 3.8313724994659424, "lr": 0.0003827412308460312, "tps": 16015, "wall": 21069.8} {"step": 5149, "train_loss": 3.6995489597320557, "lr": 0.0003827330440373118, "tps": 16014, "wall": 21074.8} {"step": 5150, "train_loss": 3.7931060791015625, "lr": 0.00038272485538514366, "tps": 16014, "wall": 21079.8} {"step": 5151, "train_loss": 3.7209291458129883, "lr": 0.0003827166648896195, "tps": 16013, "wall": 21084.8} {"step": 5152, "train_loss": 3.7197020053863525, "lr": 0.00038270847255083223, "tps": 16012, "wall": 21089.8} {"step": 5153, "train_loss": 3.6162843704223633, "lr": 0.0003827002783688746, "tps": 16012, "wall": 21094.8} {"step": 5154, "train_loss": 3.7389039993286133, "lr": 0.00038269208234383934, "tps": 16011, "wall": 21099.8} {"step": 5155, "train_loss": 3.792526960372925, "lr": 0.00038268388447581944, "tps": 16010, "wall": 21104.8} {"step": 5156, "train_loss": 3.7116024494171143, "lr": 0.00038267568476490766, "tps": 16010, "wall": 21109.8} {"step": 5157, "train_loss": 3.652543544769287, "lr": 0.0003826674832111969, "tps": 16009, "wall": 21114.8} {"step": 5158, "train_loss": 3.7864298820495605, "lr": 0.00038265927981478016, "tps": 16008, "wall": 21119.8} {"step": 5159, "train_loss": 3.832700729370117, "lr": 0.00038265107457575027, "tps": 16007, "wall": 21124.8} {"step": 5160, "train_loss": 3.792365074157715, "lr": 0.0003826428674942001, "tps": 16007, "wall": 21129.8} {"step": 5161, "train_loss": 3.7313528060913086, "lr": 0.00038263465857022285, "tps": 16006, "wall": 21134.8} {"step": 5162, "train_loss": 3.7343966960906982, "lr": 0.0003826264478039114, "tps": 16005, "wall": 21139.8} {"step": 5163, "train_loss": 3.644172430038452, "lr": 0.0003826182351953587, "tps": 16005, "wall": 21144.8} {"step": 5164, "train_loss": 3.7356033325195312, "lr": 0.0003826100207446578, "tps": 16004, "wall": 21149.8} {"step": 5165, "train_loss": 3.8079543113708496, "lr": 0.00038260180445190184, "tps": 16003, "wall": 21154.8} {"step": 5166, "train_loss": 3.6447341442108154, "lr": 0.00038259358631718385, "tps": 16003, "wall": 21159.8} {"step": 5167, "train_loss": 3.7223191261291504, "lr": 0.0003825853663405969, "tps": 16002, "wall": 21164.7} {"step": 5168, "train_loss": 3.620342969894409, "lr": 0.0003825771445222341, "tps": 16001, "wall": 21169.7} {"step": 5169, "train_loss": 3.749814510345459, "lr": 0.0003825689208621887, "tps": 16001, "wall": 21174.8} {"step": 5170, "train_loss": 3.705395221710205, "lr": 0.0003825606953605537, "tps": 16000, "wall": 21179.8} {"step": 5171, "train_loss": 3.7361152172088623, "lr": 0.0003825524680174224, "tps": 15999, "wall": 21184.8} {"step": 5172, "train_loss": 3.658842086791992, "lr": 0.00038254423883288784, "tps": 15999, "wall": 21189.8} {"step": 5173, "train_loss": 3.7524871826171875, "lr": 0.0003825360078070434, "tps": 15998, "wall": 21194.8} {"step": 5174, "train_loss": 3.724871873855591, "lr": 0.00038252777493998227, "tps": 15997, "wall": 21199.8} {"step": 5175, "train_loss": 3.7218873500823975, "lr": 0.0003825195402317977, "tps": 15997, "wall": 21204.8} {"step": 5176, "train_loss": 3.7576987743377686, "lr": 0.0003825113036825831, "tps": 15996, "wall": 21209.8} {"step": 5177, "train_loss": 3.6916401386260986, "lr": 0.0003825030652924316, "tps": 15995, "wall": 21214.8} {"step": 5178, "train_loss": 3.712948799133301, "lr": 0.0003824948250614365, "tps": 15995, "wall": 21219.8} {"step": 5179, "train_loss": 3.7245543003082275, "lr": 0.0003824865829896913, "tps": 15994, "wall": 21224.8} {"step": 5180, "train_loss": 3.7213616371154785, "lr": 0.0003824783390772893, "tps": 15993, "wall": 21229.8} {"step": 5181, "train_loss": 3.689772129058838, "lr": 0.0003824700933243239, "tps": 15992, "wall": 21234.8} {"step": 5182, "train_loss": 3.7877092361450195, "lr": 0.00038246184573088843, "tps": 15992, "wall": 21239.9} {"step": 5183, "train_loss": 3.653071880340576, "lr": 0.0003824535962970765, "tps": 15991, "wall": 21244.8} {"step": 5184, "train_loss": 3.746485710144043, "lr": 0.0003824453450229813, "tps": 15990, "wall": 21249.8} {"step": 5185, "train_loss": 3.6931586265563965, "lr": 0.0003824370919086965, "tps": 15990, "wall": 21254.8} {"step": 5186, "train_loss": 3.739943265914917, "lr": 0.00038242883695431556, "tps": 15989, "wall": 21259.9} {"step": 5187, "train_loss": 3.769636869430542, "lr": 0.0003824205801599319, "tps": 15988, "wall": 21264.8} {"step": 5188, "train_loss": 3.768704652786255, "lr": 0.00038241232152563917, "tps": 15988, "wall": 21269.9} {"step": 5189, "train_loss": 3.7291312217712402, "lr": 0.0003824040610515309, "tps": 15987, "wall": 21274.9} {"step": 5190, "train_loss": 3.764319658279419, "lr": 0.0003823957987377006, "tps": 15986, "wall": 21279.9} {"step": 5191, "train_loss": 3.6549344062805176, "lr": 0.00038238753458424193, "tps": 15986, "wall": 21284.8} {"step": 5192, "train_loss": 3.735971450805664, "lr": 0.00038237926859124844, "tps": 15985, "wall": 21289.8} {"step": 5193, "train_loss": 3.7177767753601074, "lr": 0.00038237100075881386, "tps": 15984, "wall": 21294.9} {"step": 5194, "train_loss": 3.7678332328796387, "lr": 0.0003823627310870318, "tps": 15984, "wall": 21299.9} {"step": 5195, "train_loss": 3.803523063659668, "lr": 0.0003823544595759959, "tps": 15983, "wall": 21304.9} {"step": 5196, "train_loss": 3.738973617553711, "lr": 0.00038234618622579996, "tps": 15982, "wall": 21309.9} {"step": 5197, "train_loss": 3.744643211364746, "lr": 0.0003823379110365376, "tps": 15982, "wall": 21314.9} {"step": 5198, "train_loss": 3.7296762466430664, "lr": 0.0003823296340083026, "tps": 15981, "wall": 21319.9} {"step": 5199, "train_loss": 3.8026912212371826, "lr": 0.00038232135514118873, "tps": 15980, "wall": 21324.9} {"step": 5200, "train_loss": 3.710022449493408, "lr": 0.00038231307443528976, "tps": 15980, "wall": 21329.9} {"step": 5201, "train_loss": 3.849820137023926, "lr": 0.0003823047918906995, "tps": 15979, "wall": 21334.9} {"step": 5202, "train_loss": 3.812678098678589, "lr": 0.0003822965075075118, "tps": 15978, "wall": 21339.9} {"step": 5203, "train_loss": 3.6962990760803223, "lr": 0.00038228822128582045, "tps": 15978, "wall": 21344.9} {"step": 5204, "train_loss": 3.756925582885742, "lr": 0.0003822799332257194, "tps": 15977, "wall": 21349.9} {"step": 5205, "train_loss": 3.727576732635498, "lr": 0.0003822716433273024, "tps": 15976, "wall": 21354.9} {"step": 5206, "train_loss": 3.7704970836639404, "lr": 0.0003822633515906635, "tps": 15975, "wall": 21359.9} {"step": 5207, "train_loss": 3.747469663619995, "lr": 0.0003822550580158966, "tps": 15975, "wall": 21364.9} {"step": 5208, "train_loss": 3.7075343132019043, "lr": 0.00038224676260309557, "tps": 15974, "wall": 21369.9} {"step": 5209, "train_loss": 3.792924404144287, "lr": 0.00038223846535235444, "tps": 15973, "wall": 21374.9} {"step": 5210, "train_loss": 3.7722513675689697, "lr": 0.00038223016626376724, "tps": 15973, "wall": 21379.9} {"step": 5211, "train_loss": 3.7253453731536865, "lr": 0.000382221865337428, "tps": 15972, "wall": 21384.9} {"step": 5212, "train_loss": 3.7871737480163574, "lr": 0.00038221356257343056, "tps": 15971, "wall": 21389.9} {"step": 5213, "train_loss": 3.7011606693267822, "lr": 0.00038220525797186917, "tps": 15971, "wall": 21394.9} {"step": 5214, "train_loss": 3.725832939147949, "lr": 0.00038219695153283783, "tps": 15970, "wall": 21399.9} {"step": 5215, "train_loss": 3.7420499324798584, "lr": 0.00038218864325643065, "tps": 15969, "wall": 21404.9} {"step": 5216, "train_loss": 3.7214009761810303, "lr": 0.0003821803331427418, "tps": 15969, "wall": 21409.9} {"step": 5217, "train_loss": 3.833831548690796, "lr": 0.0003821720211918652, "tps": 15968, "wall": 21415.0} {"step": 5218, "train_loss": 3.742086887359619, "lr": 0.0003821637074038953, "tps": 15967, "wall": 21419.9} {"step": 5219, "train_loss": 3.7421505451202393, "lr": 0.00038215539177892616, "tps": 15967, "wall": 21424.9} {"step": 5220, "train_loss": 3.641396999359131, "lr": 0.00038214707431705197, "tps": 15966, "wall": 21430.0} {"step": 5221, "train_loss": 3.7072417736053467, "lr": 0.0003821387550183669, "tps": 15965, "wall": 21435.0} {"step": 5222, "train_loss": 3.7720515727996826, "lr": 0.0003821304338829653, "tps": 15965, "wall": 21440.0} {"step": 5223, "train_loss": 3.7892937660217285, "lr": 0.00038212211091094133, "tps": 15964, "wall": 21445.0} {"step": 5224, "train_loss": 3.6650094985961914, "lr": 0.0003821137861023893, "tps": 15963, "wall": 21450.0} {"step": 5225, "train_loss": 3.6824440956115723, "lr": 0.00038210545945740353, "tps": 15963, "wall": 21455.0} {"step": 5226, "train_loss": 3.739307165145874, "lr": 0.0003820971309760784, "tps": 15962, "wall": 21460.0} {"step": 5227, "train_loss": 3.7867000102996826, "lr": 0.0003820888006585082, "tps": 15961, "wall": 21465.0} {"step": 5228, "train_loss": 3.7491705417633057, "lr": 0.0003820804685047873, "tps": 15961, "wall": 21470.0} {"step": 5229, "train_loss": 3.7172646522521973, "lr": 0.00038207213451501, "tps": 15960, "wall": 21475.0} {"step": 5230, "train_loss": 3.6211960315704346, "lr": 0.00038206379868927084, "tps": 15959, "wall": 21480.0} {"step": 5231, "train_loss": 3.7642312049865723, "lr": 0.0003820554610276642, "tps": 15959, "wall": 21485.0} {"step": 5232, "train_loss": 3.6688284873962402, "lr": 0.00038204712153028453, "tps": 15958, "wall": 21490.0} {"step": 5233, "train_loss": 3.7204720973968506, "lr": 0.0003820387801972263, "tps": 15957, "wall": 21495.0} {"step": 5234, "train_loss": 3.7004222869873047, "lr": 0.000382030437028584, "tps": 15957, "wall": 21500.0} {"step": 5235, "train_loss": 3.7006676197052, "lr": 0.00038202209202445217, "tps": 15956, "wall": 21505.0} {"step": 5236, "train_loss": 3.6710286140441895, "lr": 0.00038201374518492527, "tps": 15955, "wall": 21510.0} {"step": 5237, "train_loss": 3.7504498958587646, "lr": 0.00038200539651009796, "tps": 15955, "wall": 21515.0} {"step": 5238, "train_loss": 3.7731175422668457, "lr": 0.00038199704600006473, "tps": 15954, "wall": 21520.0} {"step": 5239, "train_loss": 3.712730646133423, "lr": 0.00038198869365492017, "tps": 15953, "wall": 21525.0} {"step": 5240, "train_loss": 3.7329611778259277, "lr": 0.000381980339474759, "tps": 15953, "wall": 21530.0} {"step": 5241, "train_loss": 3.8141565322875977, "lr": 0.00038197198345967567, "tps": 15952, "wall": 21535.0} {"step": 5242, "train_loss": 3.6434412002563477, "lr": 0.00038196362560976503, "tps": 15951, "wall": 21540.0} {"step": 5243, "train_loss": 3.751842975616455, "lr": 0.0003819552659251216, "tps": 15951, "wall": 21545.0} {"step": 5244, "train_loss": 3.7248082160949707, "lr": 0.0003819469044058403, "tps": 15950, "wall": 21550.0} {"step": 5245, "train_loss": 3.799403667449951, "lr": 0.0003819385410520156, "tps": 15949, "wall": 21555.0} {"step": 5246, "train_loss": 3.6462836265563965, "lr": 0.0003819301758637423, "tps": 15949, "wall": 21560.0} {"step": 5247, "train_loss": 3.775157928466797, "lr": 0.0003819218088411153, "tps": 15948, "wall": 21565.0} {"step": 5248, "train_loss": 3.714404821395874, "lr": 0.0003819134399842293, "tps": 15948, "wall": 21570.0} {"step": 5249, "train_loss": 3.6670267581939697, "lr": 0.00038190506929317903, "tps": 15947, "wall": 21575.0} {"step": 5250, "train_loss": 3.7243120670318604, "lr": 0.0003818966967680594, "tps": 15946, "wall": 21580.0} {"step": 5251, "train_loss": 3.638583183288574, "lr": 0.0003818883224089652, "tps": 15946, "wall": 21585.0} {"step": 5252, "train_loss": 3.769880771636963, "lr": 0.00038187994621599136, "tps": 15945, "wall": 21589.9} {"step": 5253, "train_loss": 3.739457607269287, "lr": 0.00038187156818923274, "tps": 15944, "wall": 21595.0} {"step": 5254, "train_loss": 3.7648627758026123, "lr": 0.00038186318832878423, "tps": 15944, "wall": 21600.0} {"step": 5255, "train_loss": 3.670656681060791, "lr": 0.0003818548066347407, "tps": 15943, "wall": 21605.0} {"step": 5256, "train_loss": 3.750483989715576, "lr": 0.00038184642310719726, "tps": 15942, "wall": 21610.0} {"step": 5257, "train_loss": 3.7292304039001465, "lr": 0.00038183803774624874, "tps": 15942, "wall": 21615.0} {"step": 5258, "train_loss": 3.705275535583496, "lr": 0.0003818296505519902, "tps": 15941, "wall": 21620.0} {"step": 5259, "train_loss": 3.7940585613250732, "lr": 0.00038182126152451663, "tps": 15940, "wall": 21625.0} {"step": 5260, "train_loss": 3.787447214126587, "lr": 0.000381812870663923, "tps": 15940, "wall": 21630.0} {"step": 5261, "train_loss": 3.7112371921539307, "lr": 0.00038180447797030447, "tps": 15939, "wall": 21635.0} {"step": 5262, "train_loss": 3.7447943687438965, "lr": 0.000381796083443756, "tps": 15938, "wall": 21640.0} {"step": 5263, "train_loss": 3.7043304443359375, "lr": 0.0003817876870843728, "tps": 15938, "wall": 21645.0} {"step": 5264, "train_loss": 3.613675594329834, "lr": 0.00038177928889224986, "tps": 15937, "wall": 21650.0} {"step": 5265, "train_loss": 3.632269859313965, "lr": 0.0003817708888674824, "tps": 15936, "wall": 21655.1} {"step": 5266, "train_loss": 3.7949299812316895, "lr": 0.0003817624870101656, "tps": 15936, "wall": 21660.1} {"step": 5267, "train_loss": 3.8301620483398438, "lr": 0.0003817540833203947, "tps": 15935, "wall": 21665.1} {"step": 5268, "train_loss": 3.6422297954559326, "lr": 0.0003817456777982646, "tps": 15934, "wall": 21670.1} {"step": 5269, "train_loss": 3.701512336730957, "lr": 0.0003817372704438708, "tps": 15934, "wall": 21675.0} {"step": 5270, "train_loss": 3.631748676300049, "lr": 0.00038172886125730843, "tps": 15933, "wall": 21680.0} {"step": 5271, "train_loss": 3.727163553237915, "lr": 0.00038172045023867284, "tps": 15932, "wall": 21685.0} {"step": 5272, "train_loss": 3.7499136924743652, "lr": 0.00038171203738805915, "tps": 15932, "wall": 21690.0} {"step": 5273, "train_loss": 3.7395710945129395, "lr": 0.0003817036227055628, "tps": 15931, "wall": 21695.0} {"step": 5274, "train_loss": 3.6971850395202637, "lr": 0.00038169520619127904, "tps": 15930, "wall": 21700.0} {"step": 5275, "train_loss": 3.7513182163238525, "lr": 0.00038168678784530327, "tps": 15930, "wall": 21705.0} {"step": 5276, "train_loss": 3.690150499343872, "lr": 0.0003816783676677307, "tps": 15929, "wall": 21710.0} {"step": 5277, "train_loss": 3.7679195404052734, "lr": 0.00038166994565865697, "tps": 15928, "wall": 21715.1} {"step": 5278, "train_loss": 3.7770063877105713, "lr": 0.00038166152181817736, "tps": 15928, "wall": 21720.0} {"step": 5279, "train_loss": 3.700911521911621, "lr": 0.0003816530961463872, "tps": 15927, "wall": 21725.0} {"step": 5280, "train_loss": 3.726421356201172, "lr": 0.0003816446686433821, "tps": 15927, "wall": 21730.0} {"step": 5281, "train_loss": 3.7503247261047363, "lr": 0.0003816362393092574, "tps": 15926, "wall": 21735.0} {"step": 5282, "train_loss": 3.7393112182617188, "lr": 0.0003816278081441086, "tps": 15925, "wall": 21740.0} {"step": 5283, "train_loss": 3.7463204860687256, "lr": 0.0003816193751480313, "tps": 15925, "wall": 21745.0} {"step": 5284, "train_loss": 3.6243319511413574, "lr": 0.000381610940321121, "tps": 15924, "wall": 21750.0} {"step": 5285, "train_loss": 3.6712725162506104, "lr": 0.00038160250366347316, "tps": 15923, "wall": 21754.9} {"step": 5286, "train_loss": 3.7379651069641113, "lr": 0.0003815940651751834, "tps": 15923, "wall": 21759.9} {"step": 5287, "train_loss": 3.8527846336364746, "lr": 0.00038158562485634737, "tps": 15922, "wall": 21764.9} {"step": 5288, "train_loss": 3.691337823867798, "lr": 0.0003815771827070607, "tps": 15921, "wall": 21769.9} {"step": 5289, "train_loss": 3.7210676670074463, "lr": 0.0003815687387274189, "tps": 15921, "wall": 21775.0} {"step": 5290, "train_loss": 3.701441764831543, "lr": 0.0003815602929175177, "tps": 15920, "wall": 21780.0} {"step": 5291, "train_loss": 3.791095018386841, "lr": 0.00038155184527745273, "tps": 15919, "wall": 21785.0} {"step": 5292, "train_loss": 3.7616636753082275, "lr": 0.00038154339580731973, "tps": 15919, "wall": 21790.0} {"step": 5293, "train_loss": 3.6549763679504395, "lr": 0.0003815349445072144, "tps": 15918, "wall": 21795.0} {"step": 5294, "train_loss": 3.707965135574341, "lr": 0.0003815264913772325, "tps": 15918, "wall": 21800.0} {"step": 5295, "train_loss": 3.78584361076355, "lr": 0.00038151803641746975, "tps": 15917, "wall": 21805.0} {"step": 5296, "train_loss": 3.8180112838745117, "lr": 0.00038150957962802194, "tps": 15916, "wall": 21809.9} {"step": 5297, "train_loss": 3.718337059020996, "lr": 0.0003815011210089849, "tps": 15916, "wall": 21814.9} {"step": 5298, "train_loss": 3.7100725173950195, "lr": 0.0003814926605604544, "tps": 15915, "wall": 21819.9} {"step": 5299, "train_loss": 3.7271924018859863, "lr": 0.0003814841982825264, "tps": 15914, "wall": 21824.9} {"step": 5300, "train_loss": 3.7232956886291504, "lr": 0.00038147573417529656, "tps": 15914, "wall": 21829.8} {"step": 5301, "train_loss": 3.785619020462036, "lr": 0.0003814672682388609, "tps": 15913, "wall": 21834.9} {"step": 5302, "train_loss": 3.8050732612609863, "lr": 0.0003814588004733153, "tps": 15912, "wall": 21839.9} {"step": 5303, "train_loss": 3.813364267349243, "lr": 0.0003814503308787556, "tps": 15912, "wall": 21844.9} {"step": 5304, "train_loss": 3.679018974304199, "lr": 0.0003814418594552779, "tps": 15911, "wall": 21849.9} {"step": 5305, "train_loss": 3.6707630157470703, "lr": 0.00038143338620297805, "tps": 15911, "wall": 21854.9} {"step": 5306, "train_loss": 3.8135862350463867, "lr": 0.00038142491112195203, "tps": 15910, "wall": 21859.8} {"step": 5307, "train_loss": 3.7149477005004883, "lr": 0.000381416434212296, "tps": 15909, "wall": 21864.8} {"step": 5308, "train_loss": 3.7696945667266846, "lr": 0.0003814079554741057, "tps": 15909, "wall": 21869.8} {"step": 5309, "train_loss": 3.7637579441070557, "lr": 0.0003813994749074775, "tps": 15908, "wall": 21874.8} {"step": 5310, "train_loss": 3.6798460483551025, "lr": 0.00038139099251250725, "tps": 15907, "wall": 21879.8} {"step": 5311, "train_loss": 3.7599010467529297, "lr": 0.0003813825082892911, "tps": 15907, "wall": 21884.7} {"step": 5312, "train_loss": 3.7232556343078613, "lr": 0.00038137402223792523, "tps": 15906, "wall": 21889.7} {"step": 5313, "train_loss": 3.7421817779541016, "lr": 0.0003813655343585056, "tps": 15906, "wall": 21894.8} {"step": 5314, "train_loss": 3.777824878692627, "lr": 0.0003813570446511286, "tps": 15905, "wall": 21899.7} {"step": 5315, "train_loss": 3.7489328384399414, "lr": 0.0003813485531158902, "tps": 15904, "wall": 21904.8} {"step": 5316, "train_loss": 3.6754279136657715, "lr": 0.00038134005975288664, "tps": 15904, "wall": 21909.8} {"step": 5317, "train_loss": 3.808291435241699, "lr": 0.00038133156456221414, "tps": 15903, "wall": 21914.8} {"step": 5318, "train_loss": 3.77339506149292, "lr": 0.00038132306754396893, "tps": 15902, "wall": 21919.8} {"step": 5319, "train_loss": 3.6799020767211914, "lr": 0.00038131456869824735, "tps": 15902, "wall": 21924.8} {"step": 5320, "train_loss": 3.7248497009277344, "lr": 0.0003813060680251456, "tps": 15901, "wall": 21929.7} {"step": 5321, "train_loss": 3.779757261276245, "lr": 0.00038129756552476, "tps": 15900, "wall": 21934.7} {"step": 5322, "train_loss": 3.7769570350646973, "lr": 0.00038128906119718685, "tps": 15900, "wall": 21939.7} {"step": 5323, "train_loss": 3.793654680252075, "lr": 0.0003812805550425225, "tps": 15899, "wall": 21944.7} {"step": 5324, "train_loss": 3.732703924179077, "lr": 0.0003812720470608632, "tps": 15899, "wall": 21949.6} {"step": 5325, "train_loss": 3.705599546432495, "lr": 0.00038126353725230554, "tps": 15898, "wall": 21954.7} {"step": 5326, "train_loss": 3.636320114135742, "lr": 0.0003812550256169458, "tps": 15897, "wall": 21959.7} {"step": 5327, "train_loss": 3.772592067718506, "lr": 0.00038124651215488026, "tps": 15897, "wall": 21964.6} {"step": 5328, "train_loss": 3.7479000091552734, "lr": 0.00038123799686620567, "tps": 15896, "wall": 21969.6} {"step": 5329, "train_loss": 3.7182741165161133, "lr": 0.0003812294797510183, "tps": 15895, "wall": 21974.6} {"step": 5330, "train_loss": 3.6321747303009033, "lr": 0.0003812209608094146, "tps": 15895, "wall": 21979.6} {"step": 5331, "train_loss": 3.7229552268981934, "lr": 0.0003812124400414911, "tps": 15894, "wall": 21984.5} {"step": 5332, "train_loss": 3.7808854579925537, "lr": 0.0003812039174473445, "tps": 15894, "wall": 21989.5} {"step": 5333, "train_loss": 3.712054491043091, "lr": 0.0003811953930270711, "tps": 15893, "wall": 21994.5} {"step": 5334, "train_loss": 3.7853844165802, "lr": 0.0003811868667807676, "tps": 15892, "wall": 21999.5} {"step": 5335, "train_loss": 3.8422751426696777, "lr": 0.00038117833870853054, "tps": 15892, "wall": 22004.5} {"step": 5336, "train_loss": 3.7998785972595215, "lr": 0.00038116980881045654, "tps": 15891, "wall": 22009.5} {"step": 5337, "train_loss": 3.6541378498077393, "lr": 0.00038116127708664224, "tps": 15890, "wall": 22014.6} {"step": 5338, "train_loss": 3.7105119228363037, "lr": 0.00038115274353718424, "tps": 15890, "wall": 22019.5} {"step": 5339, "train_loss": 3.7571938037872314, "lr": 0.00038114420816217926, "tps": 15889, "wall": 22024.5} {"step": 5340, "train_loss": 3.6888175010681152, "lr": 0.000381135670961724, "tps": 15889, "wall": 22029.5} {"step": 5341, "train_loss": 3.6558048725128174, "lr": 0.0003811271319359151, "tps": 15888, "wall": 22034.5} {"step": 5342, "train_loss": 3.708099126815796, "lr": 0.00038111859108484937, "tps": 15887, "wall": 22039.5} {"step": 5343, "train_loss": 3.6804018020629883, "lr": 0.0003811100484086235, "tps": 15887, "wall": 22044.5} {"step": 5344, "train_loss": 3.6410350799560547, "lr": 0.0003811015039073343, "tps": 15886, "wall": 22049.5} {"step": 5345, "train_loss": 3.7336535453796387, "lr": 0.0003810929575810786, "tps": 15885, "wall": 22054.5} {"step": 5346, "train_loss": 3.7103018760681152, "lr": 0.00038108440942995306, "tps": 15885, "wall": 22059.5} {"step": 5347, "train_loss": 3.668260335922241, "lr": 0.00038107585945405467, "tps": 15884, "wall": 22064.4} {"step": 5348, "train_loss": 3.5852673053741455, "lr": 0.00038106730765348024, "tps": 15884, "wall": 22069.4} {"step": 5349, "train_loss": 3.5995092391967773, "lr": 0.0003810587540283266, "tps": 15883, "wall": 22074.5} {"step": 5350, "train_loss": 3.7175440788269043, "lr": 0.0003810501985786907, "tps": 15882, "wall": 22079.5} {"step": 5351, "train_loss": 3.7411386966705322, "lr": 0.0003810416413046694, "tps": 15882, "wall": 22084.4} {"step": 5352, "train_loss": 3.7106642723083496, "lr": 0.00038103308220635974, "tps": 15881, "wall": 22089.4} {"step": 5353, "train_loss": 3.629988193511963, "lr": 0.00038102452128385857, "tps": 15880, "wall": 22094.4} {"step": 5354, "train_loss": 3.77949857711792, "lr": 0.0003810159585372629, "tps": 15880, "wall": 22099.4} {"step": 5355, "train_loss": 3.7476348876953125, "lr": 0.0003810073939666698, "tps": 15879, "wall": 22104.3} {"step": 5356, "train_loss": 3.764678478240967, "lr": 0.0003809988275721762, "tps": 15879, "wall": 22109.3} {"step": 5357, "train_loss": 3.635387420654297, "lr": 0.00038099025935387914, "tps": 15878, "wall": 22114.3} {"step": 5358, "train_loss": 3.688223361968994, "lr": 0.00038098168931187577, "tps": 15877, "wall": 22119.3} {"step": 5359, "train_loss": 3.7056374549865723, "lr": 0.00038097311744626306, "tps": 15877, "wall": 22124.3} {"step": 5360, "train_loss": 3.7577919960021973, "lr": 0.00038096454375713824, "tps": 15876, "wall": 22129.3} {"step": 5361, "train_loss": 3.8152806758880615, "lr": 0.00038095596824459826, "tps": 15875, "wall": 22134.3} {"step": 5362, "train_loss": 3.784226417541504, "lr": 0.0003809473909087404, "tps": 15875, "wall": 22139.3} {"step": 5363, "train_loss": 3.726395845413208, "lr": 0.00038093881174966184, "tps": 15874, "wall": 22144.3} {"step": 5364, "train_loss": 3.7831854820251465, "lr": 0.00038093023076745964, "tps": 15874, "wall": 22149.3} {"step": 5365, "train_loss": 3.6619508266448975, "lr": 0.0003809216479622312, "tps": 15873, "wall": 22154.3} {"step": 5366, "train_loss": 3.6007401943206787, "lr": 0.0003809130633340735, "tps": 15872, "wall": 22159.3} {"step": 5367, "train_loss": 3.6846203804016113, "lr": 0.00038090447688308396, "tps": 15872, "wall": 22164.3} {"step": 5368, "train_loss": 3.678834915161133, "lr": 0.00038089588860935983, "tps": 15871, "wall": 22169.3} {"step": 5369, "train_loss": 3.7580952644348145, "lr": 0.00038088729851299834, "tps": 15871, "wall": 22174.3} {"step": 5370, "train_loss": 3.724303722381592, "lr": 0.0003808787065940968, "tps": 15870, "wall": 22179.3} {"step": 5371, "train_loss": 3.7227132320404053, "lr": 0.00038087011285275265, "tps": 15869, "wall": 22184.2} {"step": 5372, "train_loss": 3.7103447914123535, "lr": 0.00038086151728906306, "tps": 15869, "wall": 22189.2} {"step": 5373, "train_loss": 3.765740394592285, "lr": 0.0003808529199031255, "tps": 15868, "wall": 22194.3} {"step": 5374, "train_loss": 3.636436939239502, "lr": 0.00038084432069503745, "tps": 15867, "wall": 22199.3} {"step": 5375, "train_loss": 3.601236343383789, "lr": 0.0003808357196648962, "tps": 15867, "wall": 22204.3} {"step": 5376, "train_loss": 3.7151238918304443, "lr": 0.00038082711681279916, "tps": 15866, "wall": 22209.3} {"step": 5377, "train_loss": 3.535564661026001, "lr": 0.0003808185121388439, "tps": 15866, "wall": 22214.3} {"step": 5378, "train_loss": 3.7061212062835693, "lr": 0.0003808099056431278, "tps": 15865, "wall": 22219.3} {"step": 5379, "train_loss": 3.7146260738372803, "lr": 0.00038080129732574844, "tps": 15864, "wall": 22224.3} {"step": 5380, "train_loss": 3.6363580226898193, "lr": 0.00038079268718680325, "tps": 15864, "wall": 22229.3} {"step": 5381, "train_loss": 3.7976741790771484, "lr": 0.0003807840752263898, "tps": 15863, "wall": 22234.3} {"step": 5382, "train_loss": 3.813944101333618, "lr": 0.00038077546144460564, "tps": 15862, "wall": 22239.3} {"step": 5383, "train_loss": 3.685622215270996, "lr": 0.0003807668458415484, "tps": 15862, "wall": 22244.2} {"step": 5384, "train_loss": 3.823674201965332, "lr": 0.00038075822841731553, "tps": 15861, "wall": 22249.2} {"step": 5385, "train_loss": 3.6207873821258545, "lr": 0.0003807496091720049, "tps": 15861, "wall": 22254.3} {"step": 5386, "train_loss": 3.668414831161499, "lr": 0.00038074098810571386, "tps": 15860, "wall": 22259.2} {"step": 5387, "train_loss": 3.641458034515381, "lr": 0.0003807323652185403, "tps": 15859, "wall": 22264.2} {"step": 5388, "train_loss": 3.7986323833465576, "lr": 0.00038072374051058175, "tps": 15859, "wall": 22269.2} {"step": 5389, "train_loss": 3.659498453140259, "lr": 0.00038071511398193603, "tps": 15858, "wall": 22274.2} {"step": 5390, "train_loss": 3.813997745513916, "lr": 0.0003807064856327008, "tps": 15858, "wall": 22279.2} {"step": 5391, "train_loss": 3.667552947998047, "lr": 0.0003806978554629738, "tps": 15857, "wall": 22284.1} {"step": 5392, "train_loss": 3.7388858795166016, "lr": 0.0003806892234728527, "tps": 15856, "wall": 22289.1} {"step": 5393, "train_loss": 3.587442398071289, "lr": 0.00038068058966243557, "tps": 15856, "wall": 22294.1} {"step": 5394, "train_loss": 3.679307222366333, "lr": 0.0003806719540318199, "tps": 15855, "wall": 22299.1} {"step": 5395, "train_loss": 3.7866005897521973, "lr": 0.00038066331658110367, "tps": 15855, "wall": 22304.1} {"step": 5396, "train_loss": 3.6585378646850586, "lr": 0.0003806546773103847, "tps": 15854, "wall": 22309.0} {"step": 5397, "train_loss": 3.6858768463134766, "lr": 0.0003806460362197609, "tps": 15853, "wall": 22314.1} {"step": 5398, "train_loss": 3.7822554111480713, "lr": 0.00038063739330933, "tps": 15853, "wall": 22319.1} {"step": 5399, "train_loss": 3.732616901397705, "lr": 0.0003806287485791901, "tps": 15852, "wall": 22324.1} {"step": 5400, "train_loss": 3.6971547603607178, "lr": 0.00038062010202943907, "tps": 15851, "wall": 22329.0} {"step": 5401, "train_loss": 3.734862804412842, "lr": 0.00038061145366017474, "tps": 15851, "wall": 22334.0} {"step": 5402, "train_loss": 3.7037715911865234, "lr": 0.00038060280347149524, "tps": 15850, "wall": 22339.0} {"step": 5403, "train_loss": 3.71500825881958, "lr": 0.0003805941514634985, "tps": 15850, "wall": 22344.0} {"step": 5404, "train_loss": 3.6986584663391113, "lr": 0.0003805854976362825, "tps": 15849, "wall": 22349.0} {"step": 5405, "train_loss": 3.754880666732788, "lr": 0.0003805768419899453, "tps": 15848, "wall": 22354.0} {"step": 5406, "train_loss": 3.586009979248047, "lr": 0.0003805681845245849, "tps": 15848, "wall": 22359.0} {"step": 5407, "train_loss": 3.7315545082092285, "lr": 0.00038055952524029954, "tps": 15847, "wall": 22364.0} {"step": 5408, "train_loss": 3.7876291275024414, "lr": 0.0003805508641371871, "tps": 15847, "wall": 22368.9} {"step": 5409, "train_loss": 3.661527633666992, "lr": 0.0003805422012153458, "tps": 15846, "wall": 22374.0} {"step": 5410, "train_loss": 3.7068846225738525, "lr": 0.0003805335364748738, "tps": 15845, "wall": 22379.0} {"step": 5411, "train_loss": 3.7831649780273438, "lr": 0.00038052486991586913, "tps": 15845, "wall": 22384.0} {"step": 5412, "train_loss": 3.8164844512939453, "lr": 0.0003805162015384301, "tps": 15844, "wall": 22389.0} {"step": 5413, "train_loss": 3.782212018966675, "lr": 0.0003805075313426549, "tps": 15844, "wall": 22394.0} {"step": 5414, "train_loss": 3.807164430618286, "lr": 0.0003804988593286416, "tps": 15843, "wall": 22398.9} {"step": 5415, "train_loss": 3.802927255630493, "lr": 0.0003804901854964886, "tps": 15842, "wall": 22403.9} {"step": 5416, "train_loss": 3.7686846256256104, "lr": 0.0003804815098462941, "tps": 15842, "wall": 22408.9} {"step": 5417, "train_loss": 3.8449316024780273, "lr": 0.0003804728323781564, "tps": 15841, "wall": 22413.9} {"step": 5418, "train_loss": 3.696765422821045, "lr": 0.0003804641530921737, "tps": 15841, "wall": 22418.9} {"step": 5419, "train_loss": 3.8069005012512207, "lr": 0.0003804554719884444, "tps": 15840, "wall": 22423.9} {"step": 5420, "train_loss": 3.7120847702026367, "lr": 0.0003804467890670669, "tps": 15839, "wall": 22428.9} {"step": 5421, "train_loss": 3.6543149948120117, "lr": 0.0003804381043281394, "tps": 15839, "wall": 22433.9} {"step": 5422, "train_loss": 3.884127378463745, "lr": 0.0003804294177717605, "tps": 15838, "wall": 22438.9} {"step": 5423, "train_loss": 3.6841633319854736, "lr": 0.0003804207293980284, "tps": 15838, "wall": 22443.8} {"step": 5424, "train_loss": 3.7318828105926514, "lr": 0.0003804120392070416, "tps": 15837, "wall": 22448.8} {"step": 5425, "train_loss": 3.715768814086914, "lr": 0.00038040334719889856, "tps": 15836, "wall": 22453.8} {"step": 5426, "train_loss": 3.7348060607910156, "lr": 0.0003803946533736977, "tps": 15836, "wall": 22458.8} {"step": 5427, "train_loss": 3.629281759262085, "lr": 0.00038038595773153753, "tps": 15835, "wall": 22463.8} {"step": 5428, "train_loss": 3.7630553245544434, "lr": 0.0003803772602725166, "tps": 15835, "wall": 22468.8} {"step": 5429, "train_loss": 3.7101948261260986, "lr": 0.00038036856099673335, "tps": 15834, "wall": 22473.8} {"step": 5430, "train_loss": 3.647343873977661, "lr": 0.0003803598599042864, "tps": 15833, "wall": 22478.8} {"step": 5431, "train_loss": 3.7579336166381836, "lr": 0.0003803511569952742, "tps": 15833, "wall": 22483.8} {"step": 5432, "train_loss": 3.68930721282959, "lr": 0.00038034245226979544, "tps": 15832, "wall": 22488.8} {"step": 5433, "train_loss": 3.705179214477539, "lr": 0.0003803337457279488, "tps": 15832, "wall": 22493.8} {"step": 5434, "train_loss": 3.735246181488037, "lr": 0.00038032503736983275, "tps": 15831, "wall": 22498.8} {"step": 5435, "train_loss": 3.6601216793060303, "lr": 0.00038031632719554595, "tps": 15830, "wall": 22503.8} {"step": 5436, "train_loss": 3.732884645462036, "lr": 0.0003803076152051872, "tps": 15830, "wall": 22508.8} {"step": 5437, "train_loss": 3.761756420135498, "lr": 0.00038029890139885513, "tps": 15829, "wall": 22513.7} {"step": 5438, "train_loss": 3.7852976322174072, "lr": 0.0003802901857766484, "tps": 15829, "wall": 22518.7} {"step": 5439, "train_loss": 3.7251017093658447, "lr": 0.00038028146833866575, "tps": 15828, "wall": 22523.7} {"step": 5440, "train_loss": 3.5357666015625, "lr": 0.00038027274908500596, "tps": 15827, "wall": 22528.7} {"step": 5441, "train_loss": 3.7370352745056152, "lr": 0.00038026402801576777, "tps": 15827, "wall": 22533.7} {"step": 5442, "train_loss": 3.670485496520996, "lr": 0.00038025530513105006, "tps": 15826, "wall": 22538.7} {"step": 5443, "train_loss": 3.7259411811828613, "lr": 0.00038024658043095156, "tps": 15826, "wall": 22543.7} {"step": 5444, "train_loss": 3.8055620193481445, "lr": 0.0003802378539155712, "tps": 15825, "wall": 22548.6} {"step": 5445, "train_loss": 3.7083375453948975, "lr": 0.00038022912558500767, "tps": 15824, "wall": 22553.7} {"step": 5446, "train_loss": 3.755296230316162, "lr": 0.00038022039543935993, "tps": 15824, "wall": 22558.7} {"step": 5447, "train_loss": 3.781251907348633, "lr": 0.00038021166347872696, "tps": 15823, "wall": 22563.6} {"step": 5448, "train_loss": 3.682626247406006, "lr": 0.00038020292970320754, "tps": 15823, "wall": 22568.6} {"step": 5449, "train_loss": 3.7505762577056885, "lr": 0.00038019419411290065, "tps": 15822, "wall": 22573.6} {"step": 5450, "train_loss": 3.682748317718506, "lr": 0.00038018545670790533, "tps": 15821, "wall": 22578.6} {"step": 5451, "train_loss": 3.737147331237793, "lr": 0.00038017671748832047, "tps": 15821, "wall": 22583.5} {"step": 5452, "train_loss": 3.7060904502868652, "lr": 0.00038016797645424504, "tps": 15820, "wall": 22588.5} {"step": 5453, "train_loss": 3.8249125480651855, "lr": 0.00038015923360577814, "tps": 15820, "wall": 22593.5} {"step": 5454, "train_loss": 3.6525139808654785, "lr": 0.0003801504889430187, "tps": 15819, "wall": 22598.5} {"step": 5455, "train_loss": 3.7011525630950928, "lr": 0.000380141742466066, "tps": 15819, "wall": 22603.5} {"step": 5456, "train_loss": 3.623443365097046, "lr": 0.00038013299417501893, "tps": 15818, "wall": 22608.4} {"step": 5457, "train_loss": 3.645615339279175, "lr": 0.00038012424406997654, "tps": 15817, "wall": 22613.5} {"step": 5458, "train_loss": 3.6868724822998047, "lr": 0.0003801154921510382, "tps": 15817, "wall": 22618.4} {"step": 5459, "train_loss": 3.686466932296753, "lr": 0.0003801067384183028, "tps": 15816, "wall": 22623.4} {"step": 5460, "train_loss": 3.7202725410461426, "lr": 0.00038009798287186964, "tps": 15816, "wall": 22628.4} {"step": 5461, "train_loss": 3.673753261566162, "lr": 0.0003800892255118379, "tps": 15815, "wall": 22633.4} {"step": 5462, "train_loss": 3.6994833946228027, "lr": 0.0003800804663383067, "tps": 15814, "wall": 22638.3} {"step": 5463, "train_loss": 3.712937831878662, "lr": 0.00038007170535137534, "tps": 15814, "wall": 22643.3} {"step": 5464, "train_loss": 3.690415143966675, "lr": 0.00038006294255114306, "tps": 15813, "wall": 22648.3} {"step": 5465, "train_loss": 3.7458128929138184, "lr": 0.0003800541779377091, "tps": 15813, "wall": 22653.3} {"step": 5466, "train_loss": 3.6919326782226562, "lr": 0.0003800454115111727, "tps": 15812, "wall": 22658.2} {"step": 5467, "train_loss": 3.706115245819092, "lr": 0.00038003664327163327, "tps": 15811, "wall": 22663.2} {"step": 5468, "train_loss": 3.7499191761016846, "lr": 0.0003800278732191901, "tps": 15811, "wall": 22668.2} {"step": 5469, "train_loss": 3.796440601348877, "lr": 0.0003800191013539425, "tps": 15810, "wall": 22673.3} {"step": 5470, "train_loss": 3.7033746242523193, "lr": 0.0003800103276759899, "tps": 15810, "wall": 22678.3} {"step": 5471, "train_loss": 3.5923523902893066, "lr": 0.0003800015521854316, "tps": 15809, "wall": 22683.2} {"step": 5472, "train_loss": 3.8316633701324463, "lr": 0.00037999277488236704, "tps": 15809, "wall": 22688.2} {"step": 5473, "train_loss": 3.8044631481170654, "lr": 0.0003799839957668957, "tps": 15808, "wall": 22693.2} {"step": 5474, "train_loss": 3.671027898788452, "lr": 0.00037997521483911704, "tps": 15807, "wall": 22698.2} {"step": 5475, "train_loss": 3.6814088821411133, "lr": 0.0003799664320991305, "tps": 15807, "wall": 22703.2} {"step": 5476, "train_loss": 3.759773015975952, "lr": 0.00037995764754703546, "tps": 15806, "wall": 22708.2} {"step": 5477, "train_loss": 3.6732633113861084, "lr": 0.0003799488611829316, "tps": 15806, "wall": 22713.2} {"step": 5478, "train_loss": 3.6452865600585938, "lr": 0.0003799400730069184, "tps": 15805, "wall": 22718.2} {"step": 5479, "train_loss": 3.630195379257202, "lr": 0.0003799312830190954, "tps": 15804, "wall": 22723.2} {"step": 5480, "train_loss": 3.6512680053710938, "lr": 0.00037992249121956214, "tps": 15804, "wall": 22728.2} {"step": 5481, "train_loss": 3.643052101135254, "lr": 0.0003799136976084183, "tps": 15803, "wall": 22733.2} {"step": 5482, "train_loss": 3.7501633167266846, "lr": 0.00037990490218576335, "tps": 15803, "wall": 22738.2} {"step": 5483, "train_loss": 3.6737818717956543, "lr": 0.00037989610495169714, "tps": 15802, "wall": 22743.2} {"step": 5484, "train_loss": 3.7648491859436035, "lr": 0.00037988730590631913, "tps": 15801, "wall": 22748.2} {"step": 5485, "train_loss": 3.678830623626709, "lr": 0.0003798785050497291, "tps": 15801, "wall": 22753.1} {"step": 5486, "train_loss": 3.7627310752868652, "lr": 0.0003798697023820267, "tps": 15800, "wall": 22758.1} {"step": 5487, "train_loss": 3.8104419708251953, "lr": 0.0003798608979033117, "tps": 15800, "wall": 22763.1} {"step": 5488, "train_loss": 3.7741761207580566, "lr": 0.0003798520916136837, "tps": 15799, "wall": 22768.1} {"step": 5489, "train_loss": 3.788524627685547, "lr": 0.0003798432835132426, "tps": 15798, "wall": 22773.2} {"step": 5490, "train_loss": 3.731997013092041, "lr": 0.00037983447360208817, "tps": 15798, "wall": 22778.1} {"step": 5491, "train_loss": 3.5843563079833984, "lr": 0.00037982566188032017, "tps": 15797, "wall": 22783.1} {"step": 5492, "train_loss": 3.681784152984619, "lr": 0.0003798168483480384, "tps": 15797, "wall": 22788.1} {"step": 5493, "train_loss": 3.650585651397705, "lr": 0.00037980803300534274, "tps": 15796, "wall": 22793.2} {"step": 5494, "train_loss": 3.801783561706543, "lr": 0.000379799215852333, "tps": 15796, "wall": 22798.1} {"step": 5495, "train_loss": 3.755707263946533, "lr": 0.0003797903968891092, "tps": 15795, "wall": 22803.1} {"step": 5496, "train_loss": 3.6396594047546387, "lr": 0.0003797815761157711, "tps": 15794, "wall": 22808.1} {"step": 5497, "train_loss": 3.6441400051116943, "lr": 0.0003797727535324186, "tps": 15794, "wall": 22813.1} {"step": 5498, "train_loss": 3.81762957572937, "lr": 0.00037976392913915177, "tps": 15793, "wall": 22818.1} {"step": 5499, "train_loss": 3.6947860717773438, "lr": 0.0003797551029360705, "tps": 15793, "wall": 22823.1} {"step": 5500, "train_loss": 3.7324438095092773, "lr": 0.00037974627492327477, "tps": 15792, "wall": 22828.1} {"step": 5501, "train_loss": 3.780787229537964, "lr": 0.00037973744510086453, "tps": 15791, "wall": 22833.3} {"step": 5502, "train_loss": 3.7283778190612793, "lr": 0.00037972861346893995, "tps": 15791, "wall": 22838.2} {"step": 5503, "train_loss": 3.8076276779174805, "lr": 0.000379719780027601, "tps": 15790, "wall": 22843.2} {"step": 5504, "train_loss": 3.7300708293914795, "lr": 0.00037971094477694766, "tps": 15790, "wall": 22848.2} {"step": 5505, "train_loss": 3.819878101348877, "lr": 0.0003797021077170802, "tps": 15789, "wall": 22853.2} {"step": 5506, "train_loss": 3.6748099327087402, "lr": 0.0003796932688480986, "tps": 15788, "wall": 22858.2} {"step": 5507, "train_loss": 3.7380590438842773, "lr": 0.0003796844281701029, "tps": 15788, "wall": 22863.2} {"step": 5508, "train_loss": 3.666335105895996, "lr": 0.0003796755856831935, "tps": 15787, "wall": 22868.2} {"step": 5509, "train_loss": 3.6768710613250732, "lr": 0.0003796667413874703, "tps": 15787, "wall": 22873.2} {"step": 5510, "train_loss": 3.728581428527832, "lr": 0.00037965789528303373, "tps": 15786, "wall": 22878.2} {"step": 5511, "train_loss": 3.8082966804504395, "lr": 0.0003796490473699839, "tps": 15785, "wall": 22883.3} {"step": 5512, "train_loss": 3.7710936069488525, "lr": 0.00037964019764842095, "tps": 15785, "wall": 22888.3} {"step": 5513, "train_loss": 3.698127269744873, "lr": 0.0003796313461184452, "tps": 15784, "wall": 22893.3} {"step": 5514, "train_loss": 3.727726459503174, "lr": 0.00037962249278015694, "tps": 15784, "wall": 22898.3} {"step": 5515, "train_loss": 3.7919492721557617, "lr": 0.00037961363763365643, "tps": 15783, "wall": 22903.3} {"step": 5516, "train_loss": 3.7381672859191895, "lr": 0.00037960478067904405, "tps": 15783, "wall": 22908.2} {"step": 5517, "train_loss": 3.6921770572662354, "lr": 0.00037959592191642004, "tps": 15782, "wall": 22913.3} {"step": 5518, "train_loss": 3.795274257659912, "lr": 0.00037958706134588483, "tps": 15781, "wall": 22918.3} {"step": 5519, "train_loss": 3.7070813179016113, "lr": 0.0003795781989675387, "tps": 15781, "wall": 22923.2} {"step": 5520, "train_loss": 3.6177101135253906, "lr": 0.00037956933478148217, "tps": 15780, "wall": 22928.2} {"step": 5521, "train_loss": 3.769284725189209, "lr": 0.00037956046878781556, "tps": 15780, "wall": 22933.2} {"step": 5522, "train_loss": 3.7385549545288086, "lr": 0.0003795516009866393, "tps": 15779, "wall": 22938.2} {"step": 5523, "train_loss": 3.7374744415283203, "lr": 0.00037954273137805384, "tps": 15779, "wall": 22943.1} {"step": 5524, "train_loss": 3.7191977500915527, "lr": 0.00037953385996215974, "tps": 15778, "wall": 22948.2} {"step": 5525, "train_loss": 3.7258336544036865, "lr": 0.00037952498673905744, "tps": 15777, "wall": 22953.2} {"step": 5526, "train_loss": 3.73223614692688, "lr": 0.0003795161117088475, "tps": 15777, "wall": 22958.1} {"step": 5527, "train_loss": 3.7002134323120117, "lr": 0.0003795072348716304, "tps": 15776, "wall": 22963.1} {"step": 5528, "train_loss": 3.7647171020507812, "lr": 0.0003794983562275066, "tps": 15776, "wall": 22968.1} {"step": 5529, "train_loss": 3.781446933746338, "lr": 0.0003794894757765769, "tps": 15775, "wall": 22973.1} {"step": 5530, "train_loss": 3.7003326416015625, "lr": 0.00037948059351894175, "tps": 15774, "wall": 22978.1} {"step": 5531, "train_loss": 3.727699041366577, "lr": 0.00037947170945470184, "tps": 15774, "wall": 22983.1} {"step": 5532, "train_loss": 3.7889599800109863, "lr": 0.00037946282358395777, "tps": 15773, "wall": 22988.1} {"step": 5533, "train_loss": 3.6793622970581055, "lr": 0.00037945393590681025, "tps": 15773, "wall": 22993.1} {"step": 5534, "train_loss": 3.714881658554077, "lr": 0.00037944504642335985, "tps": 15772, "wall": 22998.0} {"step": 5535, "train_loss": 3.7572319507598877, "lr": 0.0003794361551337073, "tps": 15772, "wall": 23003.0} {"step": 5536, "train_loss": 3.6363539695739746, "lr": 0.00037942726203795345, "tps": 15771, "wall": 23008.0} {"step": 5537, "train_loss": 3.6640491485595703, "lr": 0.0003794183671361989, "tps": 15771, "wall": 23013.0} {"step": 5538, "train_loss": 3.695073366165161, "lr": 0.0003794094704285445, "tps": 15770, "wall": 23018.0} {"step": 5539, "train_loss": 3.748110771179199, "lr": 0.000379400571915091, "tps": 15769, "wall": 23023.0} {"step": 5540, "train_loss": 3.758976936340332, "lr": 0.00037939167159593915, "tps": 15769, "wall": 23027.9} {"step": 5541, "train_loss": 3.720682144165039, "lr": 0.00037938276947118983, "tps": 15768, "wall": 23032.9} {"step": 5542, "train_loss": 3.7008373737335205, "lr": 0.0003793738655409439, "tps": 15768, "wall": 23038.0} {"step": 5543, "train_loss": 3.661593437194824, "lr": 0.00037936495980530217, "tps": 15767, "wall": 23042.9} {"step": 5544, "train_loss": 3.7526845932006836, "lr": 0.0003793560522643656, "tps": 15767, "wall": 23047.9} {"step": 5545, "train_loss": 3.703866481781006, "lr": 0.000379347142918235, "tps": 15766, "wall": 23052.9} {"step": 5546, "train_loss": 3.681481122970581, "lr": 0.0003793382317670114, "tps": 15765, "wall": 23057.9} {"step": 5547, "train_loss": 3.7066469192504883, "lr": 0.0003793293188107956, "tps": 15765, "wall": 23062.9} {"step": 5548, "train_loss": 3.7076780796051025, "lr": 0.0003793204040496888, "tps": 15764, "wall": 23067.9} {"step": 5549, "train_loss": 3.642456293106079, "lr": 0.0003793114874837917, "tps": 15764, "wall": 23072.9} {"step": 5550, "train_loss": 3.7369744777679443, "lr": 0.0003793025691132055, "tps": 15763, "wall": 23077.8} {"step": 5551, "train_loss": 3.7004666328430176, "lr": 0.0003792936489380312, "tps": 15763, "wall": 23082.8} {"step": 5552, "train_loss": 3.797895908355713, "lr": 0.0003792847269583698, "tps": 15762, "wall": 23087.8} {"step": 5553, "train_loss": 3.611111640930176, "lr": 0.00037927580317432245, "tps": 15761, "wall": 23092.8} {"step": 5554, "train_loss": 3.6812586784362793, "lr": 0.0003792668775859901, "tps": 15761, "wall": 23097.8} {"step": 5555, "train_loss": 3.7025227546691895, "lr": 0.000379257950193474, "tps": 15760, "wall": 23102.8} {"step": 5556, "train_loss": 3.663658618927002, "lr": 0.0003792490209968752, "tps": 15760, "wall": 23107.8} {"step": 5557, "train_loss": 3.7516918182373047, "lr": 0.0003792400899962949, "tps": 15759, "wall": 23112.7} {"step": 5558, "train_loss": 3.782595634460449, "lr": 0.0003792311571918343, "tps": 15759, "wall": 23117.7} {"step": 5559, "train_loss": 3.6583080291748047, "lr": 0.00037922222258359443, "tps": 15758, "wall": 23122.7} {"step": 5560, "train_loss": 3.7084133625030518, "lr": 0.0003792132861716767, "tps": 15757, "wall": 23127.7} {"step": 5561, "train_loss": 3.66748046875, "lr": 0.00037920434795618216, "tps": 15757, "wall": 23132.7} {"step": 5562, "train_loss": 3.639000415802002, "lr": 0.0003791954079372122, "tps": 15756, "wall": 23137.7} {"step": 5563, "train_loss": 3.7399115562438965, "lr": 0.00037918646611486805, "tps": 15756, "wall": 23142.7} {"step": 5564, "train_loss": 3.7133326530456543, "lr": 0.00037917752248925094, "tps": 15755, "wall": 23147.6} {"step": 5565, "train_loss": 3.7339088916778564, "lr": 0.00037916857706046233, "tps": 15755, "wall": 23152.6} {"step": 5566, "train_loss": 3.8307957649230957, "lr": 0.00037915962982860345, "tps": 15754, "wall": 23157.6} {"step": 5567, "train_loss": 3.712674856185913, "lr": 0.00037915068079377566, "tps": 15754, "wall": 23162.6} {"step": 5568, "train_loss": 3.7106311321258545, "lr": 0.00037914172995608033, "tps": 15753, "wall": 23167.6} {"step": 5569, "train_loss": 3.672067165374756, "lr": 0.0003791327773156189, "tps": 15752, "wall": 23172.6} {"step": 5570, "train_loss": 3.724482297897339, "lr": 0.00037912382287249273, "tps": 15752, "wall": 23177.6} {"step": 5571, "train_loss": 3.7301528453826904, "lr": 0.0003791148666268033, "tps": 15751, "wall": 23182.6} {"step": 5572, "train_loss": 3.6240170001983643, "lr": 0.00037910590857865206, "tps": 15751, "wall": 23187.5} {"step": 5573, "train_loss": 3.8043770790100098, "lr": 0.00037909694872814047, "tps": 15750, "wall": 23192.5} {"step": 5574, "train_loss": 3.673335313796997, "lr": 0.0003790879870753701, "tps": 15750, "wall": 23197.5} {"step": 5575, "train_loss": 3.6574480533599854, "lr": 0.0003790790236204423, "tps": 15749, "wall": 23202.5} {"step": 5576, "train_loss": 3.7496140003204346, "lr": 0.0003790700583634588, "tps": 15748, "wall": 23207.5} {"step": 5577, "train_loss": 3.6691179275512695, "lr": 0.00037906109130452105, "tps": 15748, "wall": 23212.5} {"step": 5578, "train_loss": 3.707468032836914, "lr": 0.0003790521224437306, "tps": 15747, "wall": 23217.5} {"step": 5579, "train_loss": 3.6852569580078125, "lr": 0.0003790431517811892, "tps": 15747, "wall": 23222.5} {"step": 5580, "train_loss": 3.8130974769592285, "lr": 0.0003790341793169983, "tps": 15746, "wall": 23227.5} {"step": 5581, "train_loss": 3.8098275661468506, "lr": 0.00037902520505125957, "tps": 15746, "wall": 23232.5} {"step": 5582, "train_loss": 3.6593003273010254, "lr": 0.0003790162289840748, "tps": 15745, "wall": 23237.5} {"step": 5583, "train_loss": 3.6611506938934326, "lr": 0.00037900725111554557, "tps": 15745, "wall": 23242.5} {"step": 5584, "train_loss": 3.711712598800659, "lr": 0.0003789982714457736, "tps": 15744, "wall": 23247.4} {"step": 5585, "train_loss": 3.7210402488708496, "lr": 0.0003789892899748606, "tps": 15743, "wall": 23252.4} {"step": 5586, "train_loss": 3.592085599899292, "lr": 0.0003789803067029083, "tps": 15743, "wall": 23257.4} {"step": 5587, "train_loss": 3.6814017295837402, "lr": 0.00037897132163001854, "tps": 15742, "wall": 23262.3} {"step": 5588, "train_loss": 3.533304214477539, "lr": 0.000378962334756293, "tps": 15742, "wall": 23267.4} {"step": 5589, "train_loss": 3.8078322410583496, "lr": 0.0003789533460818335, "tps": 15741, "wall": 23272.4} {"step": 5590, "train_loss": 3.684993267059326, "lr": 0.00037894435560674195, "tps": 15741, "wall": 23277.4} {"step": 5591, "train_loss": 3.708970785140991, "lr": 0.00037893536333112013, "tps": 15740, "wall": 23282.4} {"step": 5592, "train_loss": 3.7893757820129395, "lr": 0.0003789263692550699, "tps": 15739, "wall": 23287.4} {"step": 5593, "train_loss": 3.7347378730773926, "lr": 0.0003789173733786932, "tps": 15739, "wall": 23292.4} {"step": 5594, "train_loss": 3.6334738731384277, "lr": 0.0003789083757020919, "tps": 15738, "wall": 23297.4} {"step": 5595, "train_loss": 3.6849024295806885, "lr": 0.0003788993762253679, "tps": 15738, "wall": 23302.4} {"step": 5596, "train_loss": 3.7440378665924072, "lr": 0.00037889037494862315, "tps": 15737, "wall": 23307.4} {"step": 5597, "train_loss": 3.7001466751098633, "lr": 0.0003788813718719597, "tps": 15737, "wall": 23312.3} {"step": 5598, "train_loss": 3.649087429046631, "lr": 0.0003788723669954794, "tps": 15736, "wall": 23317.3} {"step": 5599, "train_loss": 3.613635301589966, "lr": 0.0003788633603192844, "tps": 15736, "wall": 23322.3} {"step": 5600, "train_loss": 3.67445707321167, "lr": 0.00037885435184347664, "tps": 15735, "wall": 23327.3} {"step": 5601, "train_loss": 3.7627813816070557, "lr": 0.0003788453415681581, "tps": 15734, "wall": 23332.2} {"step": 5602, "train_loss": 3.70762300491333, "lr": 0.000378836329493431, "tps": 15734, "wall": 23337.3} {"step": 5603, "train_loss": 3.7125532627105713, "lr": 0.0003788273156193974, "tps": 15733, "wall": 23342.3} {"step": 5604, "train_loss": 3.665860414505005, "lr": 0.00037881829994615933, "tps": 15733, "wall": 23347.3} {"step": 5605, "train_loss": 3.642361879348755, "lr": 0.000378809282473819, "tps": 15732, "wall": 23352.2} {"step": 5606, "train_loss": 3.773545265197754, "lr": 0.0003788002632024785, "tps": 15732, "wall": 23357.2} {"step": 5607, "train_loss": 3.723144054412842, "lr": 0.00037879124213224, "tps": 15731, "wall": 23362.2} {"step": 5608, "train_loss": 3.8096275329589844, "lr": 0.00037878221926320577, "tps": 15731, "wall": 23367.2} {"step": 5609, "train_loss": 3.6234846115112305, "lr": 0.000378773194595478, "tps": 15730, "wall": 23372.1} {"step": 5610, "train_loss": 3.6363956928253174, "lr": 0.0003787641681291588, "tps": 15730, "wall": 23377.1} {"step": 5611, "train_loss": 3.680785655975342, "lr": 0.0003787551398643506, "tps": 15729, "wall": 23382.1} {"step": 5612, "train_loss": 3.7446186542510986, "lr": 0.00037874610980115554, "tps": 15728, "wall": 23387.1} {"step": 5613, "train_loss": 3.719116687774658, "lr": 0.000378737077939676, "tps": 15728, "wall": 23392.1} {"step": 5614, "train_loss": 3.7958731651306152, "lr": 0.0003787280442800142, "tps": 15727, "wall": 23397.1} {"step": 5615, "train_loss": 3.6156558990478516, "lr": 0.00037871900882227263, "tps": 15727, "wall": 23402.1} {"step": 5616, "train_loss": 3.85788631439209, "lr": 0.0003787099715665534, "tps": 15726, "wall": 23407.1} {"step": 5617, "train_loss": 3.6839780807495117, "lr": 0.0003787009325129591, "tps": 15726, "wall": 23412.1} {"step": 5618, "train_loss": 3.723161220550537, "lr": 0.00037869189166159207, "tps": 15725, "wall": 23417.1} {"step": 5619, "train_loss": 3.7233567237854004, "lr": 0.0003786828490125547, "tps": 15725, "wall": 23422.1} {"step": 5620, "train_loss": 3.730778694152832, "lr": 0.0003786738045659494, "tps": 15724, "wall": 23427.0} {"step": 5621, "train_loss": 3.7863759994506836, "lr": 0.0003786647583218786, "tps": 15723, "wall": 23432.0} {"step": 5622, "train_loss": 3.6867167949676514, "lr": 0.0003786557102804449, "tps": 15723, "wall": 23437.0} {"step": 5623, "train_loss": 3.6316757202148438, "lr": 0.0003786466604417508, "tps": 15722, "wall": 23442.0} {"step": 5624, "train_loss": 3.743821144104004, "lr": 0.0003786376088058987, "tps": 15722, "wall": 23447.0} {"step": 5625, "train_loss": 3.731119394302368, "lr": 0.00037862855537299113, "tps": 15721, "wall": 23452.0} {"step": 5626, "train_loss": 3.7202069759368896, "lr": 0.00037861950014313076, "tps": 15721, "wall": 23457.0} {"step": 5627, "train_loss": 3.728031873703003, "lr": 0.00037861044311642006, "tps": 15720, "wall": 23462.0} {"step": 5628, "train_loss": 3.78061580657959, "lr": 0.00037860138429296177, "tps": 15720, "wall": 23467.0} {"step": 5629, "train_loss": 3.7248477935791016, "lr": 0.0003785923236728583, "tps": 15719, "wall": 23472.0} {"step": 5630, "train_loss": 3.8359227180480957, "lr": 0.00037858326125621245, "tps": 15718, "wall": 23477.0} {"step": 5631, "train_loss": 3.8396129608154297, "lr": 0.0003785741970431269, "tps": 15718, "wall": 23482.0} {"step": 5632, "train_loss": 3.8112587928771973, "lr": 0.00037856513103370416, "tps": 15717, "wall": 23487.0} {"step": 5633, "train_loss": 3.724280595779419, "lr": 0.00037855606322804715, "tps": 15717, "wall": 23492.0} {"step": 5634, "train_loss": 3.5962846279144287, "lr": 0.0003785469936262584, "tps": 15716, "wall": 23497.0} {"step": 5635, "train_loss": 3.6854844093322754, "lr": 0.0003785379222284407, "tps": 15716, "wall": 23501.9} {"step": 5636, "train_loss": 3.6505794525146484, "lr": 0.000378528849034697, "tps": 15715, "wall": 23506.9} {"step": 5637, "train_loss": 3.6966593265533447, "lr": 0.00037851977404512976, "tps": 15715, "wall": 23511.9} {"step": 5638, "train_loss": 3.7716755867004395, "lr": 0.000378510697259842, "tps": 15714, "wall": 23517.0} {"step": 5639, "train_loss": 3.7395095825195312, "lr": 0.00037850161867893653, "tps": 15713, "wall": 23522.0} {"step": 5640, "train_loss": 3.6879637241363525, "lr": 0.0003784925383025161, "tps": 15713, "wall": 23527.0} {"step": 5641, "train_loss": 3.746513843536377, "lr": 0.0003784834561306836, "tps": 15712, "wall": 23532.0} {"step": 5642, "train_loss": 3.762856960296631, "lr": 0.00037847437216354196, "tps": 15712, "wall": 23537.0} {"step": 5643, "train_loss": 3.696417808532715, "lr": 0.0003784652864011941, "tps": 15711, "wall": 23541.9} {"step": 5644, "train_loss": 3.6988773345947266, "lr": 0.0003784561988437428, "tps": 15711, "wall": 23547.0} {"step": 5645, "train_loss": 3.7839090824127197, "lr": 0.0003784471094912912, "tps": 15710, "wall": 23552.0} {"step": 5646, "train_loss": 3.681886672973633, "lr": 0.0003784380183439421, "tps": 15710, "wall": 23557.0} {"step": 5647, "train_loss": 3.812340259552002, "lr": 0.00037842892540179864, "tps": 15709, "wall": 23562.0} {"step": 5648, "train_loss": 3.6778273582458496, "lr": 0.00037841983066496374, "tps": 15708, "wall": 23566.9} {"step": 5649, "train_loss": 3.6720666885375977, "lr": 0.00037841073413354034, "tps": 15708, "wall": 23571.9} {"step": 5650, "train_loss": 3.77827787399292, "lr": 0.00037840163580763164, "tps": 15707, "wall": 23577.0} {"step": 5651, "train_loss": 3.792290687561035, "lr": 0.00037839253568734064, "tps": 15707, "wall": 23582.0} {"step": 5652, "train_loss": 3.753908157348633, "lr": 0.0003783834337727704, "tps": 15706, "wall": 23587.0} {"step": 5653, "train_loss": 3.830624580383301, "lr": 0.00037837433006402413, "tps": 15706, "wall": 23592.0} {"step": 5654, "train_loss": 3.690676212310791, "lr": 0.0003783652245612048, "tps": 15705, "wall": 23597.0} {"step": 5655, "train_loss": 3.752359390258789, "lr": 0.0003783561172644157, "tps": 15705, "wall": 23602.0} {"step": 5656, "train_loss": 3.751441478729248, "lr": 0.0003783470081737598, "tps": 15704, "wall": 23607.0} {"step": 5657, "train_loss": 3.741135597229004, "lr": 0.00037833789728934056, "tps": 15703, "wall": 23612.0} {"step": 5658, "train_loss": 3.748171329498291, "lr": 0.000378328784611261, "tps": 15703, "wall": 23617.0} {"step": 5659, "train_loss": 3.7880630493164062, "lr": 0.00037831967013962436, "tps": 15702, "wall": 23622.0} {"step": 5660, "train_loss": 3.6952459812164307, "lr": 0.00037831055387453405, "tps": 15702, "wall": 23627.0} {"step": 5661, "train_loss": 3.733266592025757, "lr": 0.0003783014358160931, "tps": 15701, "wall": 23632.0} {"step": 5662, "train_loss": 3.805617570877075, "lr": 0.000378292315964405, "tps": 15701, "wall": 23637.0} {"step": 5663, "train_loss": 3.6271812915802, "lr": 0.00037828319431957295, "tps": 15700, "wall": 23642.0} {"step": 5664, "train_loss": 3.7016689777374268, "lr": 0.0003782740708817003, "tps": 15700, "wall": 23647.0} {"step": 5665, "train_loss": 3.62603497505188, "lr": 0.0003782649456508905, "tps": 15699, "wall": 23652.0} {"step": 5666, "train_loss": 3.7480337619781494, "lr": 0.00037825581862724675, "tps": 15699, "wall": 23657.0} {"step": 5667, "train_loss": 3.7202272415161133, "lr": 0.00037824668981087254, "tps": 15698, "wall": 23662.0} {"step": 5668, "train_loss": 3.7458596229553223, "lr": 0.00037823755920187124, "tps": 15697, "wall": 23667.0} {"step": 5669, "train_loss": 3.7323851585388184, "lr": 0.00037822842680034635, "tps": 15697, "wall": 23672.0} {"step": 5670, "train_loss": 3.7742319107055664, "lr": 0.0003782192926064013, "tps": 15696, "wall": 23677.1} {"step": 5671, "train_loss": 3.75321102142334, "lr": 0.00037821015662013946, "tps": 15696, "wall": 23682.1} {"step": 5672, "train_loss": 3.7423617839813232, "lr": 0.0003782010188416645, "tps": 15695, "wall": 23687.1} {"step": 5673, "train_loss": 3.6935150623321533, "lr": 0.00037819187927107977, "tps": 15695, "wall": 23692.0} {"step": 5674, "train_loss": 3.656787872314453, "lr": 0.00037818273790848894, "tps": 15694, "wall": 23697.1} {"step": 5675, "train_loss": 3.6568374633789062, "lr": 0.00037817359475399544, "tps": 15694, "wall": 23702.1} {"step": 5676, "train_loss": 3.7050347328186035, "lr": 0.0003781644498077029, "tps": 15693, "wall": 23707.1} {"step": 5677, "train_loss": 3.783590316772461, "lr": 0.00037815530306971497, "tps": 15692, "wall": 23712.1} {"step": 5678, "train_loss": 3.6183605194091797, "lr": 0.0003781461545401352, "tps": 15692, "wall": 23717.1} {"step": 5679, "train_loss": 3.6239256858825684, "lr": 0.00037813700421906717, "tps": 15691, "wall": 23722.0} {"step": 5680, "train_loss": 3.6587977409362793, "lr": 0.00037812785210661467, "tps": 15691, "wall": 23727.1} {"step": 5681, "train_loss": 3.6214494705200195, "lr": 0.00037811869820288124, "tps": 15690, "wall": 23732.1} {"step": 5682, "train_loss": 3.680997371673584, "lr": 0.00037810954250797074, "tps": 15690, "wall": 23737.1} {"step": 5683, "train_loss": 3.781703472137451, "lr": 0.0003781003850219867, "tps": 15689, "wall": 23742.0} {"step": 5684, "train_loss": 3.802882194519043, "lr": 0.000378091225745033, "tps": 15689, "wall": 23747.0} {"step": 5685, "train_loss": 3.743253231048584, "lr": 0.0003780820646772133, "tps": 15688, "wall": 23752.0} {"step": 5686, "train_loss": 3.6720492839813232, "lr": 0.00037807290181863146, "tps": 15688, "wall": 23757.0} {"step": 5687, "train_loss": 3.718433380126953, "lr": 0.0003780637371693912, "tps": 15687, "wall": 23762.0} {"step": 5688, "train_loss": 3.7140297889709473, "lr": 0.0003780545707295964, "tps": 15687, "wall": 23767.0} {"step": 5689, "train_loss": 3.7161803245544434, "lr": 0.0003780454024993509, "tps": 15686, "wall": 23772.0} {"step": 5690, "train_loss": 3.7287092208862305, "lr": 0.0003780362324787584, "tps": 15685, "wall": 23777.0} {"step": 5691, "train_loss": 3.7752761840820312, "lr": 0.000378027060667923, "tps": 15685, "wall": 23782.0} {"step": 5692, "train_loss": 3.657968044281006, "lr": 0.00037801788706694857, "tps": 15684, "wall": 23786.9} {"step": 5693, "train_loss": 3.5825400352478027, "lr": 0.0003780087116759389, "tps": 15684, "wall": 23791.9} {"step": 5694, "train_loss": 3.6531262397766113, "lr": 0.000377999534494998, "tps": 15683, "wall": 23796.9} {"step": 5695, "train_loss": 3.7964694499969482, "lr": 0.0003779903555242299, "tps": 15683, "wall": 23801.9} {"step": 5696, "train_loss": 3.587242603302002, "lr": 0.00037798117476373836, "tps": 15682, "wall": 23806.8} {"step": 5697, "train_loss": 3.6615614891052246, "lr": 0.00037797199221362767, "tps": 15682, "wall": 23811.8} {"step": 5698, "train_loss": 3.7748403549194336, "lr": 0.00037796280787400155, "tps": 15681, "wall": 23816.9} {"step": 5699, "train_loss": 3.7278947830200195, "lr": 0.00037795362174496437, "tps": 15681, "wall": 23821.8} {"step": 5700, "train_loss": 3.748504877090454, "lr": 0.0003779444338266199, "tps": 15680, "wall": 23826.8} {"step": 5701, "train_loss": 3.6562366485595703, "lr": 0.0003779352441190724, "tps": 15680, "wall": 23831.8} {"step": 5702, "train_loss": 3.7127089500427246, "lr": 0.00037792605262242584, "tps": 15679, "wall": 23836.8} {"step": 5703, "train_loss": 3.715482711791992, "lr": 0.00037791685933678446, "tps": 15679, "wall": 23841.8} {"step": 5704, "train_loss": 3.6133060455322266, "lr": 0.0003779076642622523, "tps": 15678, "wall": 23846.7} {"step": 5705, "train_loss": 3.631382703781128, "lr": 0.0003778984673989336, "tps": 15678, "wall": 23851.7} {"step": 5706, "train_loss": 3.65108585357666, "lr": 0.0003778892687469326, "tps": 15677, "wall": 23856.7} {"step": 5707, "train_loss": 3.711113452911377, "lr": 0.00037788006830635334, "tps": 15676, "wall": 23861.7} {"step": 5708, "train_loss": 3.7292535305023193, "lr": 0.0003778708660773002, "tps": 15676, "wall": 23866.7} {"step": 5709, "train_loss": 3.6711266040802, "lr": 0.00037786166205987725, "tps": 15675, "wall": 23871.7} {"step": 5710, "train_loss": 3.779486656188965, "lr": 0.0003778524562541889, "tps": 15675, "wall": 23876.7} {"step": 5711, "train_loss": 3.602140426635742, "lr": 0.0003778432486603394, "tps": 15674, "wall": 23881.7} {"step": 5712, "train_loss": 3.680515766143799, "lr": 0.000377834039278433, "tps": 15674, "wall": 23886.7} {"step": 5713, "train_loss": 3.7265114784240723, "lr": 0.00037782482810857414, "tps": 15673, "wall": 23891.7} {"step": 5714, "train_loss": 3.668273448944092, "lr": 0.000377815615150867, "tps": 15673, "wall": 23896.6} {"step": 5715, "train_loss": 3.7526423931121826, "lr": 0.00037780640040541613, "tps": 15672, "wall": 23901.6} {"step": 5716, "train_loss": 3.748326301574707, "lr": 0.0003777971838723257, "tps": 15672, "wall": 23906.6} {"step": 5717, "train_loss": 3.6684916019439697, "lr": 0.00037778796555170037, "tps": 15671, "wall": 23911.6} {"step": 5718, "train_loss": 3.606576442718506, "lr": 0.0003777787454436443, "tps": 15671, "wall": 23916.6} {"step": 5719, "train_loss": 3.707284450531006, "lr": 0.0003777695235482621, "tps": 15670, "wall": 23921.6} {"step": 5720, "train_loss": 3.7365853786468506, "lr": 0.0003777602998656583, "tps": 15670, "wall": 23926.6} {"step": 5721, "train_loss": 3.7113490104675293, "lr": 0.0003777510743959372, "tps": 15669, "wall": 23931.5} {"step": 5722, "train_loss": 3.7048017978668213, "lr": 0.0003777418471392034, "tps": 15669, "wall": 23936.6} {"step": 5723, "train_loss": 3.777946949005127, "lr": 0.00037773261809556137, "tps": 15668, "wall": 23941.5} {"step": 5724, "train_loss": 3.7595877647399902, "lr": 0.0003777233872651158, "tps": 15667, "wall": 23946.5} {"step": 5725, "train_loss": 3.634136199951172, "lr": 0.00037771415464797116, "tps": 15667, "wall": 23951.5} {"step": 5726, "train_loss": 3.6111631393432617, "lr": 0.00037770492024423203, "tps": 15666, "wall": 23956.4} {"step": 5727, "train_loss": 3.7257018089294434, "lr": 0.000377695684054003, "tps": 15666, "wall": 23961.4} {"step": 5728, "train_loss": 3.7037806510925293, "lr": 0.00037768644607738875, "tps": 15665, "wall": 23966.5} {"step": 5729, "train_loss": 3.6727042198181152, "lr": 0.0003776772063144939, "tps": 15665, "wall": 23971.4} {"step": 5730, "train_loss": 3.7370071411132812, "lr": 0.00037766796476542314, "tps": 15664, "wall": 23976.4} {"step": 5731, "train_loss": 3.705986499786377, "lr": 0.00037765872143028114, "tps": 15664, "wall": 23981.4} {"step": 5732, "train_loss": 3.8275418281555176, "lr": 0.0003776494763091726, "tps": 15663, "wall": 23986.4} {"step": 5733, "train_loss": 3.6873576641082764, "lr": 0.0003776402294022023, "tps": 15663, "wall": 23991.3} {"step": 5734, "train_loss": 3.693129301071167, "lr": 0.00037763098070947495, "tps": 15662, "wall": 23996.4} {"step": 5735, "train_loss": 3.7783713340759277, "lr": 0.0003776217302310953, "tps": 15662, "wall": 24001.4} {"step": 5736, "train_loss": 3.7751498222351074, "lr": 0.00037761247796716817, "tps": 15661, "wall": 24006.3} {"step": 5737, "train_loss": 3.7995710372924805, "lr": 0.0003776032239177984, "tps": 15661, "wall": 24011.3} {"step": 5738, "train_loss": 3.637415885925293, "lr": 0.00037759396808309065, "tps": 15660, "wall": 24016.3} {"step": 5739, "train_loss": 3.7186267375946045, "lr": 0.00037758471046315004, "tps": 15660, "wall": 24021.2} {"step": 5740, "train_loss": 3.7088186740875244, "lr": 0.00037757545105808124, "tps": 15659, "wall": 24026.2} {"step": 5741, "train_loss": 3.8390698432922363, "lr": 0.00037756618986798925, "tps": 15659, "wall": 24031.2} {"step": 5742, "train_loss": 3.7504770755767822, "lr": 0.0003775569268929789, "tps": 15658, "wall": 24036.1} {"step": 5743, "train_loss": 3.7711617946624756, "lr": 0.0003775476621331552, "tps": 15658, "wall": 24041.1} {"step": 5744, "train_loss": 3.7038607597351074, "lr": 0.000377538395588623, "tps": 15657, "wall": 24046.1} {"step": 5745, "train_loss": 3.63673734664917, "lr": 0.00037752912725948744, "tps": 15657, "wall": 24051.1} {"step": 5746, "train_loss": 3.6567652225494385, "lr": 0.0003775198571458533, "tps": 15656, "wall": 24056.1} {"step": 5747, "train_loss": 3.5471441745758057, "lr": 0.00037751058524782574, "tps": 15656, "wall": 24061.1} {"step": 5748, "train_loss": 3.7251415252685547, "lr": 0.0003775013115655097, "tps": 15655, "wall": 24066.0} {"step": 5749, "train_loss": 3.7438652515411377, "lr": 0.00037749203609901033, "tps": 15655, "wall": 24071.0} {"step": 5750, "train_loss": 3.628689765930176, "lr": 0.00037748275884843266, "tps": 15654, "wall": 24076.0} {"step": 5751, "train_loss": 3.7293670177459717, "lr": 0.00037747347981388174, "tps": 15653, "wall": 24081.0} {"step": 5752, "train_loss": 3.7234385013580322, "lr": 0.0003774641989954628, "tps": 15653, "wall": 24086.0} {"step": 5753, "train_loss": 3.7249631881713867, "lr": 0.0003774549163932808, "tps": 15652, "wall": 24090.9} {"step": 5754, "train_loss": 3.6380558013916016, "lr": 0.000377445632007441, "tps": 15652, "wall": 24095.9} {"step": 5755, "train_loss": 3.617530584335327, "lr": 0.0003774363458380486, "tps": 15651, "wall": 24100.9} {"step": 5756, "train_loss": 3.688739538192749, "lr": 0.00037742705788520873, "tps": 15651, "wall": 24105.8} {"step": 5757, "train_loss": 3.680654525756836, "lr": 0.00037741776814902665, "tps": 15650, "wall": 24110.8} {"step": 5758, "train_loss": 3.7295122146606445, "lr": 0.0003774084766296076, "tps": 15650, "wall": 24115.9} {"step": 5759, "train_loss": 3.6400022506713867, "lr": 0.0003773991833270568, "tps": 15649, "wall": 24120.9} {"step": 5760, "train_loss": 3.7517805099487305, "lr": 0.0003773898882414795, "tps": 15649, "wall": 24125.8} {"step": 5761, "train_loss": 3.8082215785980225, "lr": 0.00037738059137298104, "tps": 15648, "wall": 24130.8} {"step": 5762, "train_loss": 3.7338714599609375, "lr": 0.0003773712927216667, "tps": 15648, "wall": 24135.8} {"step": 5763, "train_loss": 3.686556577682495, "lr": 0.00037736199228764197, "tps": 15647, "wall": 24140.8} {"step": 5764, "train_loss": 3.665513515472412, "lr": 0.00037735269007101196, "tps": 15647, "wall": 24145.7} {"step": 5765, "train_loss": 3.794703960418701, "lr": 0.00037734338607188213, "tps": 15646, "wall": 24150.7} {"step": 5766, "train_loss": 3.640838146209717, "lr": 0.00037733408029035797, "tps": 15646, "wall": 24155.7} {"step": 5767, "train_loss": 3.724445343017578, "lr": 0.00037732477272654487, "tps": 15645, "wall": 24160.7} {"step": 5768, "train_loss": 3.744493007659912, "lr": 0.00037731546338054826, "tps": 15645, "wall": 24165.7} {"step": 5769, "train_loss": 3.7763845920562744, "lr": 0.00037730615225247354, "tps": 15644, "wall": 24170.6} {"step": 5770, "train_loss": 3.731734275817871, "lr": 0.00037729683934242613, "tps": 15644, "wall": 24175.7} {"step": 5771, "train_loss": 3.6429643630981445, "lr": 0.0003772875246505117, "tps": 15643, "wall": 24180.7} {"step": 5772, "train_loss": 3.6093857288360596, "lr": 0.0003772782081768357, "tps": 15643, "wall": 24185.7} {"step": 5773, "train_loss": 3.669316530227661, "lr": 0.00037726888992150356, "tps": 15642, "wall": 24190.7} {"step": 5774, "train_loss": 3.7302868366241455, "lr": 0.000377259569884621, "tps": 15642, "wall": 24195.6} {"step": 5775, "train_loss": 3.6734495162963867, "lr": 0.00037725024806629345, "tps": 15641, "wall": 24200.6} {"step": 5776, "train_loss": 3.677485942840576, "lr": 0.00037724092446662666, "tps": 15641, "wall": 24205.6} {"step": 5777, "train_loss": 3.6379404067993164, "lr": 0.0003772315990857262, "tps": 15640, "wall": 24210.6} {"step": 5778, "train_loss": 3.696821451187134, "lr": 0.0003772222719236976, "tps": 15640, "wall": 24215.5} {"step": 5779, "train_loss": 3.73948073387146, "lr": 0.00037721294298064656, "tps": 15639, "wall": 24220.5} {"step": 5780, "train_loss": 3.5937013626098633, "lr": 0.0003772036122566789, "tps": 15639, "wall": 24225.5} {"step": 5781, "train_loss": 3.7064175605773926, "lr": 0.00037719427975190016, "tps": 15638, "wall": 24230.5} {"step": 5782, "train_loss": 3.6901447772979736, "lr": 0.0003771849454664162, "tps": 15637, "wall": 24235.5} {"step": 5783, "train_loss": 3.7512996196746826, "lr": 0.00037717560940033254, "tps": 15637, "wall": 24240.5} {"step": 5784, "train_loss": 3.9186153411865234, "lr": 0.0003771662715537552, "tps": 15636, "wall": 24245.5} {"step": 5785, "train_loss": 3.743515968322754, "lr": 0.0003771569319267897, "tps": 15636, "wall": 24250.5} {"step": 5786, "train_loss": 3.7015252113342285, "lr": 0.00037714759051954205, "tps": 15635, "wall": 24255.4} {"step": 5787, "train_loss": 3.666328191757202, "lr": 0.00037713824733211795, "tps": 15635, "wall": 24260.4} {"step": 5788, "train_loss": 3.804943323135376, "lr": 0.00037712890236462336, "tps": 15634, "wall": 24265.4} {"step": 5789, "train_loss": 3.655503273010254, "lr": 0.00037711955561716407, "tps": 15634, "wall": 24270.4} {"step": 5790, "train_loss": 3.5708823204040527, "lr": 0.0003771102070898458, "tps": 15633, "wall": 24275.4} {"step": 5791, "train_loss": 3.57145094871521, "lr": 0.0003771008567827748, "tps": 15633, "wall": 24280.4} {"step": 5792, "train_loss": 3.652857780456543, "lr": 0.0003770915046960567, "tps": 15632, "wall": 24285.3} {"step": 5793, "train_loss": 3.6544480323791504, "lr": 0.00037708215082979754, "tps": 15632, "wall": 24290.3} {"step": 5794, "train_loss": 3.5526626110076904, "lr": 0.00037707279518410324, "tps": 15631, "wall": 24295.3} {"step": 5795, "train_loss": 3.6668944358825684, "lr": 0.0003770634377590799, "tps": 15631, "wall": 24300.3} {"step": 5796, "train_loss": 3.84744930267334, "lr": 0.00037705407855483336, "tps": 15630, "wall": 24305.3} {"step": 5797, "train_loss": 3.7196455001831055, "lr": 0.0003770447175714698, "tps": 15630, "wall": 24310.3} {"step": 5798, "train_loss": 3.6531572341918945, "lr": 0.00037703535480909515, "tps": 15629, "wall": 24315.3} {"step": 5799, "train_loss": 3.714064359664917, "lr": 0.00037702599026781546, "tps": 15629, "wall": 24320.2} {"step": 5800, "train_loss": 3.6169724464416504, "lr": 0.00037701662394773694, "tps": 15628, "wall": 24325.2} {"step": 5801, "train_loss": 3.6852290630340576, "lr": 0.0003770072558489655, "tps": 15628, "wall": 24330.2} {"step": 5802, "train_loss": 3.7929394245147705, "lr": 0.00037699788597160745, "tps": 15627, "wall": 24335.2} {"step": 5803, "train_loss": 3.6067252159118652, "lr": 0.0003769885143157689, "tps": 15627, "wall": 24340.1} {"step": 5804, "train_loss": 3.702646255493164, "lr": 0.00037697914088155593, "tps": 15626, "wall": 24345.1} {"step": 5805, "train_loss": 3.694192886352539, "lr": 0.0003769697656690747, "tps": 15626, "wall": 24350.1} {"step": 5806, "train_loss": 3.6554946899414062, "lr": 0.00037696038867843153, "tps": 15625, "wall": 24355.1} {"step": 5807, "train_loss": 3.67758846282959, "lr": 0.00037695100990973253, "tps": 15625, "wall": 24360.1} {"step": 5808, "train_loss": 3.684450149536133, "lr": 0.00037694162936308405, "tps": 15624, "wall": 24365.0} {"step": 5809, "train_loss": 3.7076525688171387, "lr": 0.0003769322470385923, "tps": 15624, "wall": 24370.0} {"step": 5810, "train_loss": 3.6649744510650635, "lr": 0.00037692286293636355, "tps": 15623, "wall": 24375.0} {"step": 5811, "train_loss": 3.6648645401000977, "lr": 0.0003769134770565041, "tps": 15623, "wall": 24380.0} {"step": 5812, "train_loss": 3.776486873626709, "lr": 0.0003769040893991203, "tps": 15622, "wall": 24384.9} {"step": 5813, "train_loss": 3.7475337982177734, "lr": 0.00037689469996431856, "tps": 15622, "wall": 24389.9} {"step": 5814, "train_loss": 3.661487102508545, "lr": 0.00037688530875220504, "tps": 15621, "wall": 24394.9} {"step": 5815, "train_loss": 3.717921733856201, "lr": 0.00037687591576288635, "tps": 15621, "wall": 24399.8} {"step": 5816, "train_loss": 3.7363760471343994, "lr": 0.0003768665209964688, "tps": 15620, "wall": 24404.8} {"step": 5817, "train_loss": 3.7961010932922363, "lr": 0.0003768571244530588, "tps": 15620, "wall": 24409.8} {"step": 5818, "train_loss": 3.763343334197998, "lr": 0.0003768477261327628, "tps": 15619, "wall": 24414.9} {"step": 5819, "train_loss": 3.587392807006836, "lr": 0.0003768383260356872, "tps": 15619, "wall": 24419.8} {"step": 5820, "train_loss": 3.518258571624756, "lr": 0.0003768289241619387, "tps": 15618, "wall": 24424.8} {"step": 5821, "train_loss": 3.751467227935791, "lr": 0.00037681952051162363, "tps": 15618, "wall": 24429.7} {"step": 5822, "train_loss": 3.6315503120422363, "lr": 0.0003768101150848485, "tps": 15617, "wall": 24434.7} {"step": 5823, "train_loss": 3.7023305892944336, "lr": 0.00037680070788171987, "tps": 15617, "wall": 24439.7} {"step": 5824, "train_loss": 3.621612071990967, "lr": 0.0003767912989023444, "tps": 15616, "wall": 24444.7} {"step": 5825, "train_loss": 3.778438091278076, "lr": 0.00037678188814682857, "tps": 15616, "wall": 24449.6} {"step": 5826, "train_loss": 3.5943105220794678, "lr": 0.0003767724756152791, "tps": 15615, "wall": 24454.6} {"step": 5827, "train_loss": 3.6541872024536133, "lr": 0.0003767630613078025, "tps": 15615, "wall": 24459.5} {"step": 5828, "train_loss": 3.606034994125366, "lr": 0.0003767536452245054, "tps": 15614, "wall": 24464.5} {"step": 5829, "train_loss": 3.685426712036133, "lr": 0.00037674422736549463, "tps": 15614, "wall": 24469.5} {"step": 5830, "train_loss": 3.7174532413482666, "lr": 0.00037673480773087675, "tps": 15613, "wall": 24474.6} {"step": 5831, "train_loss": 3.6606953144073486, "lr": 0.0003767253863207585, "tps": 15613, "wall": 24479.5} {"step": 5832, "train_loss": 3.6853513717651367, "lr": 0.0003767159631352465, "tps": 15612, "wall": 24484.5} {"step": 5833, "train_loss": 3.6189966201782227, "lr": 0.0003767065381744477, "tps": 15612, "wall": 24489.4} {"step": 5834, "train_loss": 3.638134241104126, "lr": 0.0003766971114384687, "tps": 15611, "wall": 24494.4} {"step": 5835, "train_loss": 3.733339548110962, "lr": 0.00037668768292741634, "tps": 15611, "wall": 24499.5} {"step": 5836, "train_loss": 3.593022346496582, "lr": 0.00037667825264139747, "tps": 15610, "wall": 24504.4} {"step": 5837, "train_loss": 3.763242244720459, "lr": 0.0003766688205805188, "tps": 15610, "wall": 24509.4} {"step": 5838, "train_loss": 3.6905527114868164, "lr": 0.00037665938674488736, "tps": 15609, "wall": 24514.4} {"step": 5839, "train_loss": 3.5347259044647217, "lr": 0.0003766499511346099, "tps": 15609, "wall": 24519.3} {"step": 5840, "train_loss": 3.743661403656006, "lr": 0.0003766405137497933, "tps": 15608, "wall": 24524.3} {"step": 5841, "train_loss": 3.6639933586120605, "lr": 0.00037663107459054445, "tps": 15608, "wall": 24529.3} {"step": 5842, "train_loss": 3.677488088607788, "lr": 0.0003766216336569703, "tps": 15607, "wall": 24534.3} {"step": 5843, "train_loss": 3.772613525390625, "lr": 0.0003766121909491779, "tps": 15607, "wall": 24539.3} {"step": 5844, "train_loss": 3.751600980758667, "lr": 0.00037660274646727403, "tps": 15606, "wall": 24544.2} {"step": 5845, "train_loss": 3.5473625659942627, "lr": 0.00037659330021136585, "tps": 15606, "wall": 24549.2} {"step": 5846, "train_loss": 3.730134963989258, "lr": 0.00037658385218156023, "tps": 15605, "wall": 24554.2} {"step": 5847, "train_loss": 3.6453447341918945, "lr": 0.0003765744023779643, "tps": 15605, "wall": 24559.1} {"step": 5848, "train_loss": 3.675640821456909, "lr": 0.00037656495080068506, "tps": 15604, "wall": 24564.1} {"step": 5849, "train_loss": 3.6825032234191895, "lr": 0.00037655549744982964, "tps": 15604, "wall": 24569.1} {"step": 5850, "train_loss": 3.690199851989746, "lr": 0.000376546042325505, "tps": 15603, "wall": 24574.0} {"step": 5851, "train_loss": 3.6461167335510254, "lr": 0.0003765365854278183, "tps": 15603, "wall": 24579.0} {"step": 5852, "train_loss": 3.5887787342071533, "lr": 0.0003765271267568768, "tps": 15602, "wall": 24584.0} {"step": 5853, "train_loss": 3.5962767601013184, "lr": 0.0003765176663127875, "tps": 15602, "wall": 24588.9} {"step": 5854, "train_loss": 3.726775884628296, "lr": 0.0003765082040956576, "tps": 15601, "wall": 24594.0} {"step": 5855, "train_loss": 3.6921632289886475, "lr": 0.00037649874010559423, "tps": 15601, "wall": 24598.9} {"step": 5856, "train_loss": 3.8290462493896484, "lr": 0.00037648927434270473, "tps": 15600, "wall": 24603.9} {"step": 5857, "train_loss": 3.577033758163452, "lr": 0.00037647980680709627, "tps": 15600, "wall": 24608.9} {"step": 5858, "train_loss": 3.729792594909668, "lr": 0.0003764703374988761, "tps": 15599, "wall": 24613.8} {"step": 5859, "train_loss": 3.752089500427246, "lr": 0.00037646086641815143, "tps": 15599, "wall": 24618.8} {"step": 5860, "train_loss": 3.590927839279175, "lr": 0.0003764513935650296, "tps": 15598, "wall": 24623.8} {"step": 5861, "train_loss": 3.6274566650390625, "lr": 0.00037644191893961796, "tps": 15598, "wall": 24628.8} {"step": 5862, "train_loss": 3.7050983905792236, "lr": 0.0003764324425420238, "tps": 15598, "wall": 24633.7} {"step": 5863, "train_loss": 3.615063190460205, "lr": 0.0003764229643723545, "tps": 15597, "wall": 24638.7} {"step": 5864, "train_loss": 3.6612796783447266, "lr": 0.0003764134844307173, "tps": 15597, "wall": 24643.7} {"step": 5865, "train_loss": 3.6448702812194824, "lr": 0.0003764040027172198, "tps": 15596, "wall": 24648.6} {"step": 5866, "train_loss": 3.7380881309509277, "lr": 0.00037639451923196927, "tps": 15596, "wall": 24653.7} {"step": 5867, "train_loss": 3.655329465866089, "lr": 0.00037638503397507305, "tps": 15595, "wall": 24658.6} {"step": 5868, "train_loss": 3.717815399169922, "lr": 0.00037637554694663883, "tps": 15595, "wall": 24663.6} {"step": 5869, "train_loss": 3.6641926765441895, "lr": 0.0003763660581467739, "tps": 15594, "wall": 24668.6} {"step": 5870, "train_loss": 3.7469515800476074, "lr": 0.0003763565675755858, "tps": 15594, "wall": 24673.5} {"step": 5871, "train_loss": 3.7173984050750732, "lr": 0.00037634707523318206, "tps": 15593, "wall": 24678.5} {"step": 5872, "train_loss": 3.685629367828369, "lr": 0.00037633758111967026, "tps": 15593, "wall": 24683.5} {"step": 5873, "train_loss": 3.6997814178466797, "lr": 0.0003763280852351578, "tps": 15592, "wall": 24688.5} {"step": 5874, "train_loss": 3.633836269378662, "lr": 0.0003763185875797523, "tps": 15592, "wall": 24693.4} {"step": 5875, "train_loss": 3.7861433029174805, "lr": 0.00037630908815356145, "tps": 15591, "wall": 24698.4} {"step": 5876, "train_loss": 3.698991298675537, "lr": 0.0003762995869566928, "tps": 15591, "wall": 24703.4} {"step": 5877, "train_loss": 3.713352680206299, "lr": 0.00037629008398925396, "tps": 15590, "wall": 24708.3} {"step": 5878, "train_loss": 3.6124274730682373, "lr": 0.0003762805792513526, "tps": 15590, "wall": 24713.4} {"step": 5879, "train_loss": 3.6602649688720703, "lr": 0.00037627107274309634, "tps": 15589, "wall": 24718.3} {"step": 5880, "train_loss": 3.562675952911377, "lr": 0.00037626156446459293, "tps": 15589, "wall": 24723.3} {"step": 5881, "train_loss": 3.68247389793396, "lr": 0.0003762520544159501, "tps": 15588, "wall": 24728.2} {"step": 5882, "train_loss": 3.789334774017334, "lr": 0.00037624254259727553, "tps": 15588, "wall": 24733.2} {"step": 5883, "train_loss": 3.6208324432373047, "lr": 0.000376233029008677, "tps": 15587, "wall": 24738.2} {"step": 5884, "train_loss": 3.7311739921569824, "lr": 0.0003762235136502622, "tps": 15587, "wall": 24743.1} {"step": 5885, "train_loss": 3.6891369819641113, "lr": 0.00037621399652213903, "tps": 15586, "wall": 24748.1} {"step": 5886, "train_loss": 3.6824331283569336, "lr": 0.00037620447762441527, "tps": 15586, "wall": 24753.0} {"step": 5887, "train_loss": 3.7031607627868652, "lr": 0.0003761949569571987, "tps": 15585, "wall": 24758.0} {"step": 5888, "train_loss": 3.664066791534424, "lr": 0.0003761854345205972, "tps": 15585, "wall": 24763.0} {"step": 5889, "train_loss": 3.66325044631958, "lr": 0.0003761759103147187, "tps": 15584, "wall": 24767.9} {"step": 5890, "train_loss": 3.7590909004211426, "lr": 0.000376166384339671, "tps": 15584, "wall": 24772.9} {"step": 5891, "train_loss": 3.647017478942871, "lr": 0.00037615685659556205, "tps": 15583, "wall": 24778.0} {"step": 5892, "train_loss": 3.71171236038208, "lr": 0.0003761473270824998, "tps": 15583, "wall": 24782.9} {"step": 5893, "train_loss": 3.711721897125244, "lr": 0.00037613779580059217, "tps": 15582, "wall": 24787.9} {"step": 5894, "train_loss": 3.609837055206299, "lr": 0.00037612826274994717, "tps": 15582, "wall": 24792.8} {"step": 5895, "train_loss": 3.7445688247680664, "lr": 0.00037611872793067276, "tps": 15582, "wall": 24797.8} {"step": 5896, "train_loss": 3.735614776611328, "lr": 0.00037610919134287694, "tps": 15581, "wall": 24802.8} {"step": 5897, "train_loss": 3.6796610355377197, "lr": 0.00037609965298666774, "tps": 15581, "wall": 24807.7} {"step": 5898, "train_loss": 3.8269805908203125, "lr": 0.00037609011286215326, "tps": 15580, "wall": 24812.7} {"step": 5899, "train_loss": 3.6324093341827393, "lr": 0.0003760805709694415, "tps": 15580, "wall": 24817.7} {"step": 5900, "train_loss": 3.667069435119629, "lr": 0.00037607102730864066, "tps": 15579, "wall": 24822.6} {"step": 5901, "train_loss": 3.6613683700561523, "lr": 0.0003760614818798587, "tps": 15579, "wall": 24827.6} {"step": 5902, "train_loss": 3.7346479892730713, "lr": 0.00037605193468320385, "tps": 15578, "wall": 24832.5} {"step": 5903, "train_loss": 3.6730971336364746, "lr": 0.0003760423857187842, "tps": 15578, "wall": 24837.6} {"step": 5904, "train_loss": 3.6744368076324463, "lr": 0.000376032834986708, "tps": 15577, "wall": 24842.5} {"step": 5905, "train_loss": 3.7397022247314453, "lr": 0.00037602328248708344, "tps": 15577, "wall": 24847.5} {"step": 5906, "train_loss": 3.7441110610961914, "lr": 0.00037601372822001865, "tps": 15576, "wall": 24852.4} {"step": 5907, "train_loss": 3.5853679180145264, "lr": 0.0003760041721856219, "tps": 15576, "wall": 24857.4} {"step": 5908, "train_loss": 3.7232871055603027, "lr": 0.0003759946143840015, "tps": 15575, "wall": 24862.4} {"step": 5909, "train_loss": 3.6314802169799805, "lr": 0.0003759850548152656, "tps": 15575, "wall": 24867.3} {"step": 5910, "train_loss": 3.622185468673706, "lr": 0.0003759754934795226, "tps": 15574, "wall": 24872.3} {"step": 5911, "train_loss": 3.7338218688964844, "lr": 0.0003759659303768808, "tps": 15574, "wall": 24877.3} {"step": 5912, "train_loss": 3.7573184967041016, "lr": 0.0003759563655074485, "tps": 15573, "wall": 24882.2} {"step": 5913, "train_loss": 3.678110361099243, "lr": 0.00037594679887133404, "tps": 15573, "wall": 24887.2} {"step": 5914, "train_loss": 3.6708388328552246, "lr": 0.0003759372304686458, "tps": 15573, "wall": 24892.1} {"step": 5915, "train_loss": 3.6754438877105713, "lr": 0.00037592766029949213, "tps": 15572, "wall": 24897.1} {"step": 5916, "train_loss": 3.631410837173462, "lr": 0.00037591808836398154, "tps": 15572, "wall": 24902.1} {"step": 5917, "train_loss": 3.651550769805908, "lr": 0.0003759085146622224, "tps": 15571, "wall": 24907.0} {"step": 5918, "train_loss": 3.698288917541504, "lr": 0.0003758989391943232, "tps": 15571, "wall": 24912.0} {"step": 5919, "train_loss": 3.708101511001587, "lr": 0.00037588936196039234, "tps": 15570, "wall": 24917.0} {"step": 5920, "train_loss": 3.6815695762634277, "lr": 0.0003758797829605384, "tps": 15570, "wall": 24921.9} {"step": 5921, "train_loss": 3.6550168991088867, "lr": 0.0003758702021948698, "tps": 15569, "wall": 24926.9} {"step": 5922, "train_loss": 3.721311330795288, "lr": 0.00037586061966349515, "tps": 15569, "wall": 24931.9} {"step": 5923, "train_loss": 3.792541027069092, "lr": 0.00037585103536652293, "tps": 15568, "wall": 24936.8} {"step": 5924, "train_loss": 3.725341320037842, "lr": 0.00037584144930406175, "tps": 15568, "wall": 24941.8} {"step": 5925, "train_loss": 3.657790422439575, "lr": 0.00037583186147622025, "tps": 15567, "wall": 24946.8} {"step": 5926, "train_loss": 3.822511672973633, "lr": 0.00037582227188310695, "tps": 15567, "wall": 24951.7} {"step": 5927, "train_loss": 3.8355884552001953, "lr": 0.00037581268052483055, "tps": 15566, "wall": 24956.7} {"step": 5928, "train_loss": 3.744640588760376, "lr": 0.00037580308740149963, "tps": 15566, "wall": 24961.7} {"step": 5929, "train_loss": 3.804940700531006, "lr": 0.000375793492513223, "tps": 15565, "wall": 24966.7} {"step": 5930, "train_loss": 3.695103168487549, "lr": 0.00037578389586010916, "tps": 15565, "wall": 24971.6} {"step": 5931, "train_loss": 3.645158290863037, "lr": 0.000375774297442267, "tps": 15564, "wall": 24976.6} {"step": 5932, "train_loss": 3.757805347442627, "lr": 0.00037576469725980507, "tps": 15564, "wall": 24981.6} {"step": 5933, "train_loss": 3.5978846549987793, "lr": 0.0003757550953128323, "tps": 15564, "wall": 24986.5} {"step": 5934, "train_loss": 3.749131679534912, "lr": 0.00037574549160145743, "tps": 15563, "wall": 24991.4} {"step": 5935, "train_loss": 3.6709952354431152, "lr": 0.0003757358861257891, "tps": 15563, "wall": 24996.4} {"step": 5936, "train_loss": 3.6760611534118652, "lr": 0.00037572627888593626, "tps": 15562, "wall": 25001.4} {"step": 5937, "train_loss": 3.6395339965820312, "lr": 0.0003757166698820077, "tps": 15562, "wall": 25006.3} {"step": 5938, "train_loss": 3.6205179691314697, "lr": 0.00037570705911411234, "tps": 15561, "wall": 25011.3} {"step": 5939, "train_loss": 3.715139389038086, "lr": 0.00037569744658235896, "tps": 15561, "wall": 25016.3} {"step": 5940, "train_loss": 3.6442654132843018, "lr": 0.00037568783228685644, "tps": 15560, "wall": 25021.3} {"step": 5941, "train_loss": 3.678783893585205, "lr": 0.0003756782162277138, "tps": 15560, "wall": 25026.2} {"step": 5942, "train_loss": 3.6332359313964844, "lr": 0.00037566859840503983, "tps": 15559, "wall": 25031.2} {"step": 5943, "train_loss": 3.6935312747955322, "lr": 0.0003756589788189436, "tps": 15559, "wall": 25036.1} {"step": 5944, "train_loss": 3.697006940841675, "lr": 0.00037564935746953404, "tps": 15558, "wall": 25041.1} {"step": 5945, "train_loss": 3.703399658203125, "lr": 0.00037563973435692015, "tps": 15558, "wall": 25046.1} {"step": 5946, "train_loss": 3.790095090866089, "lr": 0.0003756301094812109, "tps": 15557, "wall": 25051.1} {"step": 5947, "train_loss": 3.749959945678711, "lr": 0.00037562048284251533, "tps": 15557, "wall": 25056.0} {"step": 5948, "train_loss": 3.713468313217163, "lr": 0.0003756108544409426, "tps": 15556, "wall": 25061.0} {"step": 5949, "train_loss": 3.6367530822753906, "lr": 0.0003756012242766016, "tps": 15556, "wall": 25065.9} {"step": 5950, "train_loss": 3.644582509994507, "lr": 0.0003755915923496016, "tps": 15556, "wall": 25070.9} {"step": 5951, "train_loss": 3.7086703777313232, "lr": 0.0003755819586600515, "tps": 15555, "wall": 25075.9} {"step": 5952, "train_loss": 3.4826722145080566, "lr": 0.00037557232320806065, "tps": 15555, "wall": 25080.9} {"step": 5953, "train_loss": 3.689565658569336, "lr": 0.00037556268599373807, "tps": 15554, "wall": 25085.8} {"step": 5954, "train_loss": 3.741237163543701, "lr": 0.00037555304701719297, "tps": 15554, "wall": 25090.8} {"step": 5955, "train_loss": 3.6624579429626465, "lr": 0.0003755434062785346, "tps": 15553, "wall": 25095.7} {"step": 5956, "train_loss": 3.6630396842956543, "lr": 0.00037553376377787205, "tps": 15553, "wall": 25100.7} {"step": 5957, "train_loss": 3.5630173683166504, "lr": 0.0003755241195153146, "tps": 15552, "wall": 25105.6} {"step": 5958, "train_loss": 3.640120506286621, "lr": 0.00037551447349097155, "tps": 15552, "wall": 25110.6} {"step": 5959, "train_loss": 3.6962392330169678, "lr": 0.0003755048257049521, "tps": 15551, "wall": 25115.6} {"step": 5960, "train_loss": 3.7317299842834473, "lr": 0.00037549517615736555, "tps": 15551, "wall": 25120.5} {"step": 5961, "train_loss": 3.6404638290405273, "lr": 0.00037548552484832127, "tps": 15550, "wall": 25125.5} {"step": 5962, "train_loss": 3.7567684650421143, "lr": 0.00037547587177792855, "tps": 15550, "wall": 25130.4} {"step": 5963, "train_loss": 3.712796688079834, "lr": 0.0003754662169462968, "tps": 15550, "wall": 25135.5} {"step": 5964, "train_loss": 3.669680118560791, "lr": 0.00037545656035353525, "tps": 15549, "wall": 25140.4} {"step": 5965, "train_loss": 3.7121706008911133, "lr": 0.0003754469019997534, "tps": 15549, "wall": 25145.4} {"step": 5966, "train_loss": 3.6699485778808594, "lr": 0.00037543724188506065, "tps": 15548, "wall": 25150.3} {"step": 5967, "train_loss": 3.7157766819000244, "lr": 0.00037542758000956637, "tps": 15548, "wall": 25155.3} {"step": 5968, "train_loss": 3.688821792602539, "lr": 0.00037541791637338013, "tps": 15547, "wall": 25160.2} {"step": 5969, "train_loss": 3.704500198364258, "lr": 0.0003754082509766113, "tps": 15547, "wall": 25165.2} {"step": 5970, "train_loss": 3.7086386680603027, "lr": 0.00037539858381936935, "tps": 15546, "wall": 25170.1} {"step": 5971, "train_loss": 3.672529935836792, "lr": 0.0003753889149017638, "tps": 15546, "wall": 25175.1} {"step": 5972, "train_loss": 3.737381935119629, "lr": 0.0003753792442239043, "tps": 15545, "wall": 25180.0} {"step": 5973, "train_loss": 3.731907367706299, "lr": 0.0003753695717859003, "tps": 15545, "wall": 25185.0} {"step": 5974, "train_loss": 3.65140962600708, "lr": 0.0003753598975878614, "tps": 15544, "wall": 25190.0} {"step": 5975, "train_loss": 3.673861265182495, "lr": 0.0003753502216298971, "tps": 15544, "wall": 25195.0} {"step": 5976, "train_loss": 3.639552593231201, "lr": 0.0003753405439121171, "tps": 15544, "wall": 25199.9} {"step": 5977, "train_loss": 3.5248403549194336, "lr": 0.00037533086443463113, "tps": 15543, "wall": 25204.9} {"step": 5978, "train_loss": 3.611246109008789, "lr": 0.0003753211831975486, "tps": 15543, "wall": 25209.8} {"step": 5979, "train_loss": 3.702824831008911, "lr": 0.00037531150020097935, "tps": 15542, "wall": 25214.8} {"step": 5980, "train_loss": 3.6008288860321045, "lr": 0.000375301815445033, "tps": 15542, "wall": 25219.8} {"step": 5981, "train_loss": 3.6902434825897217, "lr": 0.00037529212892981935, "tps": 15541, "wall": 25224.7} {"step": 5982, "train_loss": 3.7291457653045654, "lr": 0.000375282440655448, "tps": 15541, "wall": 25229.7} {"step": 5983, "train_loss": 3.663093090057373, "lr": 0.0003752727506220288, "tps": 15540, "wall": 25234.6} {"step": 5984, "train_loss": 3.759119987487793, "lr": 0.00037526305882967147, "tps": 15540, "wall": 25239.6} {"step": 5985, "train_loss": 3.704704761505127, "lr": 0.0003752533652784858, "tps": 15539, "wall": 25244.6} {"step": 5986, "train_loss": 3.7597274780273438, "lr": 0.00037524366996858163, "tps": 15539, "wall": 25249.5} {"step": 5987, "train_loss": 3.679438352584839, "lr": 0.0003752339729000687, "tps": 15538, "wall": 25254.5} {"step": 5988, "train_loss": 3.7603883743286133, "lr": 0.00037522427407305696, "tps": 15538, "wall": 25259.5} {"step": 5989, "train_loss": 3.6874258518218994, "lr": 0.00037521457348765625, "tps": 15538, "wall": 25264.4} {"step": 5990, "train_loss": 3.6492691040039062, "lr": 0.0003752048711439765, "tps": 15537, "wall": 25269.4} {"step": 5991, "train_loss": 3.6429104804992676, "lr": 0.0003751951670421275, "tps": 15537, "wall": 25274.4} {"step": 5992, "train_loss": 3.71649169921875, "lr": 0.00037518546118221936, "tps": 15536, "wall": 25279.3} {"step": 5993, "train_loss": 3.618497371673584, "lr": 0.0003751757535643618, "tps": 15536, "wall": 25284.3} {"step": 5994, "train_loss": 3.517700672149658, "lr": 0.00037516604418866495, "tps": 15535, "wall": 25289.3} {"step": 5995, "train_loss": 3.6260499954223633, "lr": 0.00037515633305523874, "tps": 15535, "wall": 25294.2} {"step": 5996, "train_loss": 3.774813175201416, "lr": 0.00037514662016419325, "tps": 15534, "wall": 25299.2} {"step": 5997, "train_loss": 3.771401882171631, "lr": 0.00037513690551563847, "tps": 15534, "wall": 25304.1} {"step": 5998, "train_loss": 3.6241819858551025, "lr": 0.00037512718910968435, "tps": 15533, "wall": 25309.1} {"step": 5999, "train_loss": 3.6914591789245605, "lr": 0.00037511747094644114, "tps": 15533, "wall": 25314.2} {"step": 6000, "train_loss": 3.704664945602417, "lr": 0.0003751077510260188, "tps": 15532, "wall": 25319.1, "val_loss_monitor": 3.700313885355923} {"step": 6001, "train_loss": 3.75569486618042, "lr": 0.00037509802934852733, "tps": 15503, "wall": 25372.2} {"step": 6002, "train_loss": 3.699453830718994, "lr": 0.0003750883059140771, "tps": 15502, "wall": 25377.2} {"step": 6003, "train_loss": 3.7574615478515625, "lr": 0.0003750785807227782, "tps": 15502, "wall": 25382.2} {"step": 6004, "train_loss": 3.6277008056640625, "lr": 0.0003750688537747407, "tps": 15501, "wall": 25387.2} {"step": 6005, "train_loss": 3.783630132675171, "lr": 0.0003750591250700748, "tps": 15501, "wall": 25392.1} {"step": 6006, "train_loss": 3.742826223373413, "lr": 0.0003750493946088907, "tps": 15500, "wall": 25397.1} {"step": 6007, "train_loss": 3.5863282680511475, "lr": 0.00037503966239129874, "tps": 15500, "wall": 25402.1} {"step": 6008, "train_loss": 3.6768178939819336, "lr": 0.0003750299284174091, "tps": 15499, "wall": 25407.1} {"step": 6009, "train_loss": 3.5938172340393066, "lr": 0.0003750201926873321, "tps": 15499, "wall": 25412.0} {"step": 6010, "train_loss": 3.706479787826538, "lr": 0.0003750104552011779, "tps": 15498, "wall": 25417.1} {"step": 6011, "train_loss": 3.7086501121520996, "lr": 0.00037500071595905686, "tps": 15498, "wall": 25422.0} {"step": 6012, "train_loss": 3.7773733139038086, "lr": 0.00037499097496107933, "tps": 15498, "wall": 25427.0} {"step": 6013, "train_loss": 3.701807975769043, "lr": 0.0003749812322073557, "tps": 15497, "wall": 25431.9} {"step": 6014, "train_loss": 3.6659557819366455, "lr": 0.0003749714876979963, "tps": 15497, "wall": 25437.0} {"step": 6015, "train_loss": 3.613018274307251, "lr": 0.0003749617414331114, "tps": 15496, "wall": 25441.9} {"step": 6016, "train_loss": 3.6455767154693604, "lr": 0.0003749519934128116, "tps": 15496, "wall": 25446.9} {"step": 6017, "train_loss": 3.625765323638916, "lr": 0.00037494224363720716, "tps": 15495, "wall": 25451.9} {"step": 6018, "train_loss": 3.599343776702881, "lr": 0.0003749324921064087, "tps": 15495, "wall": 25456.9} {"step": 6019, "train_loss": 3.6971235275268555, "lr": 0.00037492273882052654, "tps": 15494, "wall": 25461.8} {"step": 6020, "train_loss": 3.7286367416381836, "lr": 0.00037491298377967115, "tps": 15494, "wall": 25466.8} {"step": 6021, "train_loss": 3.6856632232666016, "lr": 0.0003749032269839532, "tps": 15493, "wall": 25471.8} {"step": 6022, "train_loss": 3.732271194458008, "lr": 0.0003748934684334831, "tps": 15493, "wall": 25476.7} {"step": 6023, "train_loss": 3.691462993621826, "lr": 0.0003748837081283714, "tps": 15493, "wall": 25481.7} {"step": 6024, "train_loss": 3.6131303310394287, "lr": 0.00037487394606872863, "tps": 15492, "wall": 25486.7} {"step": 6025, "train_loss": 3.674269914627075, "lr": 0.00037486418225466544, "tps": 15492, "wall": 25491.6} {"step": 6026, "train_loss": 3.685453176498413, "lr": 0.00037485441668629244, "tps": 15491, "wall": 25496.6} {"step": 6027, "train_loss": 3.5725882053375244, "lr": 0.0003748446493637202, "tps": 15491, "wall": 25501.6} {"step": 6028, "train_loss": 3.726262331008911, "lr": 0.00037483488028705944, "tps": 15490, "wall": 25506.6} {"step": 6029, "train_loss": 3.6993794441223145, "lr": 0.0003748251094564207, "tps": 15490, "wall": 25511.5} {"step": 6030, "train_loss": 3.6816906929016113, "lr": 0.0003748153368719149, "tps": 15489, "wall": 25516.5} {"step": 6031, "train_loss": 3.6319046020507812, "lr": 0.0003748055625336524, "tps": 15489, "wall": 25521.4} {"step": 6032, "train_loss": 3.7650508880615234, "lr": 0.0003747957864417442, "tps": 15489, "wall": 25526.4} {"step": 6033, "train_loss": 3.7269201278686523, "lr": 0.00037478600859630097, "tps": 15488, "wall": 25531.4} {"step": 6034, "train_loss": 3.6817216873168945, "lr": 0.00037477622899743343, "tps": 15488, "wall": 25536.3} {"step": 6035, "train_loss": 3.681349754333496, "lr": 0.0003747664476452524, "tps": 15487, "wall": 25541.3} {"step": 6036, "train_loss": 3.577068328857422, "lr": 0.00037475666453986873, "tps": 15487, "wall": 25546.3} {"step": 6037, "train_loss": 3.630526542663574, "lr": 0.0003747468796813931, "tps": 15486, "wall": 25551.3} {"step": 6038, "train_loss": 3.6382718086242676, "lr": 0.00037473709306993656, "tps": 15486, "wall": 25556.3} {"step": 6039, "train_loss": 3.661736249923706, "lr": 0.00037472730470560975, "tps": 15485, "wall": 25561.2} {"step": 6040, "train_loss": 3.690195083618164, "lr": 0.00037471751458852375, "tps": 15485, "wall": 25566.2} {"step": 6041, "train_loss": 3.719870090484619, "lr": 0.00037470772271878933, "tps": 15484, "wall": 25571.1} {"step": 6042, "train_loss": 3.669891357421875, "lr": 0.00037469792909651745, "tps": 15484, "wall": 25576.1} {"step": 6043, "train_loss": 3.682119607925415, "lr": 0.0003746881337218191, "tps": 15484, "wall": 25581.0} {"step": 6044, "train_loss": 3.641270399093628, "lr": 0.0003746783365948051, "tps": 15483, "wall": 25586.0} {"step": 6045, "train_loss": 3.7625555992126465, "lr": 0.0003746685377155866, "tps": 15483, "wall": 25590.9} {"step": 6046, "train_loss": 3.5823965072631836, "lr": 0.0003746587370842746, "tps": 15482, "wall": 25595.9} {"step": 6047, "train_loss": 3.6588172912597656, "lr": 0.00037464893470097997, "tps": 15482, "wall": 25600.9} {"step": 6048, "train_loss": 3.5641984939575195, "lr": 0.0003746391305658139, "tps": 15481, "wall": 25605.8} {"step": 6049, "train_loss": 3.6553049087524414, "lr": 0.0003746293246788873, "tps": 15481, "wall": 25610.8} {"step": 6050, "train_loss": 3.8405418395996094, "lr": 0.00037461951704031147, "tps": 15481, "wall": 25615.8} {"step": 6051, "train_loss": 3.632498025894165, "lr": 0.0003746097076501973, "tps": 15480, "wall": 25620.7} {"step": 6052, "train_loss": 3.7118935585021973, "lr": 0.00037459989650865603, "tps": 15480, "wall": 25625.7} {"step": 6053, "train_loss": 3.7072062492370605, "lr": 0.00037459008361579875, "tps": 15479, "wall": 25630.6} {"step": 6054, "train_loss": 3.61344313621521, "lr": 0.00037458026897173666, "tps": 15479, "wall": 25635.6} {"step": 6055, "train_loss": 3.7464041709899902, "lr": 0.00037457045257658093, "tps": 15478, "wall": 25640.5} {"step": 6056, "train_loss": 3.6575701236724854, "lr": 0.0003745606344304427, "tps": 15478, "wall": 25645.5} {"step": 6057, "train_loss": 3.7108144760131836, "lr": 0.0003745508145334333, "tps": 15478, "wall": 25650.4} {"step": 6058, "train_loss": 3.6837267875671387, "lr": 0.0003745409928856639, "tps": 15477, "wall": 25655.4} {"step": 6059, "train_loss": 3.900522232055664, "lr": 0.00037453116948724574, "tps": 15477, "wall": 25660.3} {"step": 6060, "train_loss": 3.6659202575683594, "lr": 0.0003745213443382902, "tps": 15476, "wall": 25665.2} {"step": 6061, "train_loss": 3.7126119136810303, "lr": 0.00037451151743890846, "tps": 15476, "wall": 25670.2} {"step": 6062, "train_loss": 3.7420830726623535, "lr": 0.0003745016887892119, "tps": 15475, "wall": 25675.2} {"step": 6063, "train_loss": 3.614363670349121, "lr": 0.0003744918583893118, "tps": 15475, "wall": 25680.2} {"step": 6064, "train_loss": 3.6157493591308594, "lr": 0.0003744820262393196, "tps": 15474, "wall": 25685.1} {"step": 6065, "train_loss": 3.7361345291137695, "lr": 0.0003744721923393467, "tps": 15474, "wall": 25690.1} {"step": 6066, "train_loss": 3.7318687438964844, "lr": 0.0003744623566895044, "tps": 15474, "wall": 25695.0} {"step": 6067, "train_loss": 3.7033307552337646, "lr": 0.00037445251928990415, "tps": 15473, "wall": 25700.0} {"step": 6068, "train_loss": 3.7637736797332764, "lr": 0.0003744426801406575, "tps": 15473, "wall": 25704.9} {"step": 6069, "train_loss": 3.6398725509643555, "lr": 0.00037443283924187576, "tps": 15472, "wall": 25709.9} {"step": 6070, "train_loss": 3.669675350189209, "lr": 0.00037442299659367045, "tps": 15472, "wall": 25714.8} {"step": 6071, "train_loss": 3.609949827194214, "lr": 0.00037441315219615307, "tps": 15471, "wall": 25719.8} {"step": 6072, "train_loss": 3.665825128555298, "lr": 0.0003744033060494352, "tps": 15471, "wall": 25724.7} {"step": 6073, "train_loss": 3.6689138412475586, "lr": 0.00037439345815362825, "tps": 15471, "wall": 25729.7} {"step": 6074, "train_loss": 3.689474582672119, "lr": 0.0003743836085088439, "tps": 15470, "wall": 25734.7} {"step": 6075, "train_loss": 3.6324496269226074, "lr": 0.0003743737571151936, "tps": 15470, "wall": 25739.7} {"step": 6076, "train_loss": 3.7155001163482666, "lr": 0.00037436390397278915, "tps": 15469, "wall": 25744.6} {"step": 6077, "train_loss": 3.7133476734161377, "lr": 0.000374354049081742, "tps": 15469, "wall": 25749.6} {"step": 6078, "train_loss": 3.6583456993103027, "lr": 0.00037434419244216385, "tps": 15468, "wall": 25754.5} {"step": 6079, "train_loss": 3.7053964138031006, "lr": 0.0003743343340541663, "tps": 15468, "wall": 25759.5} {"step": 6080, "train_loss": 3.6273670196533203, "lr": 0.0003743244739178611, "tps": 15468, "wall": 25764.4} {"step": 6081, "train_loss": 3.7386176586151123, "lr": 0.00037431461203335986, "tps": 15467, "wall": 25769.3} {"step": 6082, "train_loss": 3.7220308780670166, "lr": 0.0003743047484007744, "tps": 15467, "wall": 25774.3} {"step": 6083, "train_loss": 3.596820116043091, "lr": 0.00037429488302021636, "tps": 15466, "wall": 25779.3} {"step": 6084, "train_loss": 3.5438485145568848, "lr": 0.00037428501589179756, "tps": 15466, "wall": 25784.2} {"step": 6085, "train_loss": 3.763413190841675, "lr": 0.00037427514701562974, "tps": 15465, "wall": 25789.2} {"step": 6086, "train_loss": 3.7201459407806396, "lr": 0.0003742652763918248, "tps": 15465, "wall": 25794.2} {"step": 6087, "train_loss": 3.6528353691101074, "lr": 0.00037425540402049435, "tps": 15465, "wall": 25799.1} {"step": 6088, "train_loss": 3.608083486557007, "lr": 0.00037424552990175035, "tps": 15464, "wall": 25804.1} {"step": 6089, "train_loss": 3.625436782836914, "lr": 0.00037423565403570466, "tps": 15464, "wall": 25809.0} {"step": 6090, "train_loss": 3.6622979640960693, "lr": 0.0003742257764224691, "tps": 15463, "wall": 25814.0} {"step": 6091, "train_loss": 3.662339687347412, "lr": 0.0003742158970621557, "tps": 15463, "wall": 25818.9} {"step": 6092, "train_loss": 3.632852077484131, "lr": 0.00037420601595487623, "tps": 15462, "wall": 25823.9} {"step": 6093, "train_loss": 3.635429859161377, "lr": 0.00037419613310074265, "tps": 15462, "wall": 25828.8} {"step": 6094, "train_loss": 3.7230772972106934, "lr": 0.00037418624849986694, "tps": 15461, "wall": 25833.8} {"step": 6095, "train_loss": 3.633316993713379, "lr": 0.00037417636215236104, "tps": 15461, "wall": 25838.8} {"step": 6096, "train_loss": 3.7526111602783203, "lr": 0.000374166474058337, "tps": 15461, "wall": 25843.7} {"step": 6097, "train_loss": 3.6116256713867188, "lr": 0.0003741565842179068, "tps": 15460, "wall": 25848.7} {"step": 6098, "train_loss": 3.659595489501953, "lr": 0.00037414669263118245, "tps": 15460, "wall": 25853.7} {"step": 6099, "train_loss": 3.70597505569458, "lr": 0.0003741367992982761, "tps": 15459, "wall": 25858.6} {"step": 6100, "train_loss": 3.659396171569824, "lr": 0.00037412690421929966, "tps": 15459, "wall": 25863.6} {"step": 6101, "train_loss": 3.6162333488464355, "lr": 0.0003741170073943653, "tps": 15458, "wall": 25868.5} {"step": 6102, "train_loss": 3.718794107437134, "lr": 0.0003741071088235852, "tps": 15458, "wall": 25873.5} {"step": 6103, "train_loss": 3.7311041355133057, "lr": 0.00037409720850707146, "tps": 15458, "wall": 25878.4} {"step": 6104, "train_loss": 3.537014961242676, "lr": 0.00037408730644493616, "tps": 15457, "wall": 25883.4} {"step": 6105, "train_loss": 3.660787582397461, "lr": 0.0003740774026372915, "tps": 15457, "wall": 25888.3} {"step": 6106, "train_loss": 3.6486575603485107, "lr": 0.00037406749708424975, "tps": 15456, "wall": 25893.3} {"step": 6107, "train_loss": 3.624117136001587, "lr": 0.000374057589785923, "tps": 15456, "wall": 25898.3} {"step": 6108, "train_loss": 3.7505855560302734, "lr": 0.0003740476807424236, "tps": 15455, "wall": 25903.2} {"step": 6109, "train_loss": 3.735116720199585, "lr": 0.00037403776995386366, "tps": 15455, "wall": 25908.1} {"step": 6110, "train_loss": 3.7546751499176025, "lr": 0.00037402785742035556, "tps": 15455, "wall": 25913.1} {"step": 6111, "train_loss": 3.7665936946868896, "lr": 0.00037401794314201157, "tps": 15454, "wall": 25918.1} {"step": 6112, "train_loss": 3.6381497383117676, "lr": 0.000374008027118944, "tps": 15454, "wall": 25923.1} {"step": 6113, "train_loss": 3.700187921524048, "lr": 0.00037399810935126514, "tps": 15453, "wall": 25928.0} {"step": 6114, "train_loss": 3.7263169288635254, "lr": 0.00037398818983908733, "tps": 15453, "wall": 25933.0} {"step": 6115, "train_loss": 3.770608901977539, "lr": 0.00037397826858252305, "tps": 15452, "wall": 25937.9} {"step": 6116, "train_loss": 3.5801711082458496, "lr": 0.0003739683455816846, "tps": 15452, "wall": 25942.9} {"step": 6117, "train_loss": 3.679058790206909, "lr": 0.0003739584208366844, "tps": 15452, "wall": 25947.8} {"step": 6118, "train_loss": 3.654664993286133, "lr": 0.00037394849434763485, "tps": 15451, "wall": 25952.8} {"step": 6119, "train_loss": 3.650398015975952, "lr": 0.00037393856611464847, "tps": 15451, "wall": 25957.8} {"step": 6120, "train_loss": 3.633380174636841, "lr": 0.00037392863613783765, "tps": 15450, "wall": 25962.7} {"step": 6121, "train_loss": 3.6000170707702637, "lr": 0.0003739187044173149, "tps": 15450, "wall": 25967.7} {"step": 6122, "train_loss": 3.7171339988708496, "lr": 0.0003739087709531928, "tps": 15449, "wall": 25972.6} {"step": 6123, "train_loss": 3.5985569953918457, "lr": 0.00037389883574558374, "tps": 15449, "wall": 25977.6} {"step": 6124, "train_loss": 3.7213072776794434, "lr": 0.0003738888987946004, "tps": 15449, "wall": 25982.6} {"step": 6125, "train_loss": 3.634709358215332, "lr": 0.00037387896010035524, "tps": 15448, "wall": 25987.5} {"step": 6126, "train_loss": 3.5196707248687744, "lr": 0.0003738690196629609, "tps": 15448, "wall": 25992.5} {"step": 6127, "train_loss": 3.6197361946105957, "lr": 0.00037385907748253004, "tps": 15447, "wall": 25997.4} {"step": 6128, "train_loss": 3.637734889984131, "lr": 0.00037384913355917516, "tps": 15447, "wall": 26002.4} {"step": 6129, "train_loss": 3.7252426147460938, "lr": 0.00037383918789300904, "tps": 15446, "wall": 26007.4} {"step": 6130, "train_loss": 3.691107988357544, "lr": 0.0003738292404841442, "tps": 15446, "wall": 26012.3} {"step": 6131, "train_loss": 3.708334445953369, "lr": 0.00037381929133269344, "tps": 15446, "wall": 26017.3} {"step": 6132, "train_loss": 3.902078628540039, "lr": 0.00037380934043876947, "tps": 15445, "wall": 26022.2} {"step": 6133, "train_loss": 3.6339802742004395, "lr": 0.0003737993878024849, "tps": 15445, "wall": 26027.2} {"step": 6134, "train_loss": 3.715104341506958, "lr": 0.00037378943342395257, "tps": 15444, "wall": 26032.1} {"step": 6135, "train_loss": 3.5775833129882812, "lr": 0.0003737794773032852, "tps": 15444, "wall": 26037.1} {"step": 6136, "train_loss": 3.644136428833008, "lr": 0.00037376951944059566, "tps": 15444, "wall": 26042.1} {"step": 6137, "train_loss": 3.6901965141296387, "lr": 0.00037375955983599666, "tps": 15443, "wall": 26047.1} {"step": 6138, "train_loss": 3.6786959171295166, "lr": 0.00037374959848960097, "tps": 15443, "wall": 26052.0} {"step": 6139, "train_loss": 3.555981159210205, "lr": 0.00037373963540152165, "tps": 15442, "wall": 26057.0} {"step": 6140, "train_loss": 3.6700963973999023, "lr": 0.0003737296705718713, "tps": 15442, "wall": 26061.9} {"step": 6141, "train_loss": 3.659515857696533, "lr": 0.000373719704000763, "tps": 15441, "wall": 26066.9} {"step": 6142, "train_loss": 3.676813840866089, "lr": 0.0003737097356883095, "tps": 15441, "wall": 26071.9} {"step": 6143, "train_loss": 3.757052421569824, "lr": 0.00037369976563462386, "tps": 15441, "wall": 26076.8} {"step": 6144, "train_loss": 3.5091142654418945, "lr": 0.0003736897938398189, "tps": 15440, "wall": 26081.8} {"step": 6145, "train_loss": 3.8129289150238037, "lr": 0.00037367982030400774, "tps": 15440, "wall": 26086.8} {"step": 6146, "train_loss": 3.571444511413574, "lr": 0.0003736698450273032, "tps": 15439, "wall": 26091.7} {"step": 6147, "train_loss": 3.6077873706817627, "lr": 0.0003736598680098183, "tps": 15439, "wall": 26096.7} {"step": 6148, "train_loss": 3.703335762023926, "lr": 0.00037364988925166616, "tps": 15438, "wall": 26101.7} {"step": 6149, "train_loss": 3.6804065704345703, "lr": 0.00037363990875295976, "tps": 15438, "wall": 26106.7} {"step": 6150, "train_loss": 3.640774726867676, "lr": 0.0003736299265138122, "tps": 15438, "wall": 26111.6} {"step": 6151, "train_loss": 3.734438419342041, "lr": 0.00037361994253433644, "tps": 15437, "wall": 26116.6} {"step": 6152, "train_loss": 3.5899574756622314, "lr": 0.0003736099568146457, "tps": 15437, "wall": 26121.5} {"step": 6153, "train_loss": 3.750002384185791, "lr": 0.000373599969354853, "tps": 15436, "wall": 26126.5} {"step": 6154, "train_loss": 3.724893093109131, "lr": 0.00037358998015507165, "tps": 15436, "wall": 26131.4} {"step": 6155, "train_loss": 3.7287051677703857, "lr": 0.0003735799892154146, "tps": 15435, "wall": 26136.4} {"step": 6156, "train_loss": 3.6096408367156982, "lr": 0.00037356999653599514, "tps": 15435, "wall": 26141.4} {"step": 6157, "train_loss": 3.7458982467651367, "lr": 0.0003735600021169265, "tps": 15435, "wall": 26146.3} {"step": 6158, "train_loss": 3.719320297241211, "lr": 0.00037355000595832183, "tps": 15434, "wall": 26151.3} {"step": 6159, "train_loss": 3.720202922821045, "lr": 0.00037354000806029435, "tps": 15434, "wall": 26156.3} {"step": 6160, "train_loss": 3.6164917945861816, "lr": 0.0003735300084229574, "tps": 15433, "wall": 26161.3} {"step": 6161, "train_loss": 3.6106371879577637, "lr": 0.00037352000704642417, "tps": 15433, "wall": 26166.3} {"step": 6162, "train_loss": 3.6087327003479004, "lr": 0.000373510003930808, "tps": 15432, "wall": 26171.2} {"step": 6163, "train_loss": 3.5977559089660645, "lr": 0.0003734999990762222, "tps": 15432, "wall": 26176.1} {"step": 6164, "train_loss": 3.6677627563476562, "lr": 0.00037348999248278017, "tps": 15432, "wall": 26181.1} {"step": 6165, "train_loss": 3.6563165187835693, "lr": 0.00037347998415059513, "tps": 15431, "wall": 26186.0} {"step": 6166, "train_loss": 3.685093402862549, "lr": 0.00037346997407978057, "tps": 15431, "wall": 26191.0} {"step": 6167, "train_loss": 3.560962677001953, "lr": 0.0003734599622704498, "tps": 15430, "wall": 26196.0} {"step": 6168, "train_loss": 3.6829757690429688, "lr": 0.00037344994872271625, "tps": 15430, "wall": 26200.9} {"step": 6169, "train_loss": 3.5441577434539795, "lr": 0.00037343993343669343, "tps": 15430, "wall": 26205.9} {"step": 6170, "train_loss": 3.612231731414795, "lr": 0.0003734299164124947, "tps": 15429, "wall": 26210.8} {"step": 6171, "train_loss": 3.7104599475860596, "lr": 0.00037341989765023366, "tps": 15429, "wall": 26215.9} {"step": 6172, "train_loss": 3.6519875526428223, "lr": 0.0003734098771500237, "tps": 15428, "wall": 26220.8} {"step": 6173, "train_loss": 3.6585566997528076, "lr": 0.0003733998549119783, "tps": 15428, "wall": 26225.8} {"step": 6174, "train_loss": 3.6752305030822754, "lr": 0.00037338983093621107, "tps": 15427, "wall": 26230.7} {"step": 6175, "train_loss": 3.737807273864746, "lr": 0.00037337980522283553, "tps": 15427, "wall": 26235.7} {"step": 6176, "train_loss": 3.7092599868774414, "lr": 0.0003733697777719653, "tps": 15427, "wall": 26240.6} {"step": 6177, "train_loss": 3.6990342140197754, "lr": 0.00037335974858371387, "tps": 15426, "wall": 26245.6} {"step": 6178, "train_loss": 3.549835681915283, "lr": 0.00037334971765819495, "tps": 15426, "wall": 26250.6} {"step": 6179, "train_loss": 3.8090882301330566, "lr": 0.0003733396849955221, "tps": 15425, "wall": 26255.5} {"step": 6180, "train_loss": 3.681518077850342, "lr": 0.000373329650595809, "tps": 15425, "wall": 26260.5} {"step": 6181, "train_loss": 3.659783363342285, "lr": 0.00037331961445916936, "tps": 15424, "wall": 26265.4} {"step": 6182, "train_loss": 3.721219539642334, "lr": 0.00037330957658571683, "tps": 15424, "wall": 26270.4} {"step": 6183, "train_loss": 3.6492702960968018, "lr": 0.0003732995369755651, "tps": 15424, "wall": 26275.4} {"step": 6184, "train_loss": 3.6416032314300537, "lr": 0.00037328949562882787, "tps": 15423, "wall": 26280.3} {"step": 6185, "train_loss": 3.6728291511535645, "lr": 0.0003732794525456191, "tps": 15423, "wall": 26285.3} {"step": 6186, "train_loss": 3.6248323917388916, "lr": 0.00037326940772605227, "tps": 15422, "wall": 26290.2} {"step": 6187, "train_loss": 3.712071418762207, "lr": 0.0003732593611702413, "tps": 15422, "wall": 26295.2} {"step": 6188, "train_loss": 3.5959157943725586, "lr": 0.00037324931287830007, "tps": 15421, "wall": 26300.3} {"step": 6189, "train_loss": 3.628398895263672, "lr": 0.0003732392628503422, "tps": 15421, "wall": 26305.2} {"step": 6190, "train_loss": 3.6753451824188232, "lr": 0.00037322921108648183, "tps": 15421, "wall": 26310.1} {"step": 6191, "train_loss": 3.62587833404541, "lr": 0.00037321915758683257, "tps": 15420, "wall": 26315.1} {"step": 6192, "train_loss": 3.6692919731140137, "lr": 0.00037320910235150845, "tps": 15420, "wall": 26320.1} {"step": 6193, "train_loss": 3.7290706634521484, "lr": 0.00037319904538062336, "tps": 15419, "wall": 26325.0} {"step": 6194, "train_loss": 3.6183433532714844, "lr": 0.0003731889866742911, "tps": 15419, "wall": 26330.0} {"step": 6195, "train_loss": 3.6190035343170166, "lr": 0.00037317892623262575, "tps": 15419, "wall": 26335.0} {"step": 6196, "train_loss": 3.671910524368286, "lr": 0.00037316886405574124, "tps": 15418, "wall": 26339.9} {"step": 6197, "train_loss": 3.679943084716797, "lr": 0.0003731588001437515, "tps": 15418, "wall": 26344.9} {"step": 6198, "train_loss": 3.7986366748809814, "lr": 0.00037314873449677065, "tps": 15417, "wall": 26349.8} {"step": 6199, "train_loss": 3.766327381134033, "lr": 0.00037313866711491265, "tps": 15417, "wall": 26354.9} {"step": 6200, "train_loss": 3.7315235137939453, "lr": 0.0003731285979982916, "tps": 15416, "wall": 26359.8} {"step": 6201, "train_loss": 3.628922700881958, "lr": 0.0003731185271470214, "tps": 15416, "wall": 26364.8} {"step": 6202, "train_loss": 3.7221317291259766, "lr": 0.0003731084545612163, "tps": 15416, "wall": 26369.7} {"step": 6203, "train_loss": 3.557692766189575, "lr": 0.0003730983802409903, "tps": 15415, "wall": 26374.7} {"step": 6204, "train_loss": 3.6369717121124268, "lr": 0.0003730883041864576, "tps": 15415, "wall": 26379.6} {"step": 6205, "train_loss": 3.7978742122650146, "lr": 0.00037307822639773226, "tps": 15414, "wall": 26384.6} {"step": 6206, "train_loss": 3.611893653869629, "lr": 0.00037306814687492856, "tps": 15414, "wall": 26389.5} {"step": 6207, "train_loss": 3.8028342723846436, "lr": 0.0003730580656181606, "tps": 15414, "wall": 26394.6} {"step": 6208, "train_loss": 3.652862548828125, "lr": 0.00037304798262754253, "tps": 15413, "wall": 26399.5} {"step": 6209, "train_loss": 3.6574339866638184, "lr": 0.0003730378979031887, "tps": 15413, "wall": 26404.4} {"step": 6210, "train_loss": 3.6737775802612305, "lr": 0.00037302781144521333, "tps": 15412, "wall": 26409.4} {"step": 6211, "train_loss": 3.6748623847961426, "lr": 0.00037301772325373057, "tps": 15412, "wall": 26414.3} {"step": 6212, "train_loss": 3.6736178398132324, "lr": 0.0003730076333288547, "tps": 15412, "wall": 26419.3} {"step": 6213, "train_loss": 3.616067409515381, "lr": 0.0003729975416707002, "tps": 15411, "wall": 26424.2} {"step": 6214, "train_loss": 3.6523654460906982, "lr": 0.00037298744827938114, "tps": 15411, "wall": 26429.1} {"step": 6215, "train_loss": 3.7216274738311768, "lr": 0.0003729773531550121, "tps": 15410, "wall": 26434.1} {"step": 6216, "train_loss": 3.733133316040039, "lr": 0.00037296725629770727, "tps": 15410, "wall": 26439.1} {"step": 6217, "train_loss": 3.6842732429504395, "lr": 0.0003729571577075811, "tps": 15410, "wall": 26444.0} {"step": 6218, "train_loss": 3.664808511734009, "lr": 0.000372947057384748, "tps": 15409, "wall": 26449.0} {"step": 6219, "train_loss": 3.6676347255706787, "lr": 0.0003729369553293223, "tps": 15409, "wall": 26454.0} {"step": 6220, "train_loss": 3.667844772338867, "lr": 0.00037292685154141853, "tps": 15408, "wall": 26458.9} {"step": 6221, "train_loss": 3.691556930541992, "lr": 0.0003729167460211511, "tps": 15408, "wall": 26463.9} {"step": 6222, "train_loss": 3.6611649990081787, "lr": 0.00037290663876863455, "tps": 15407, "wall": 26468.8} {"step": 6223, "train_loss": 3.784891128540039, "lr": 0.0003728965297839833, "tps": 15407, "wall": 26473.8} {"step": 6224, "train_loss": 3.6794323921203613, "lr": 0.00037288641906731184, "tps": 15407, "wall": 26478.7} {"step": 6225, "train_loss": 3.5005857944488525, "lr": 0.0003728763066187348, "tps": 15406, "wall": 26483.7} {"step": 6226, "train_loss": 3.684323310852051, "lr": 0.0003728661924383667, "tps": 15406, "wall": 26488.6} {"step": 6227, "train_loss": 3.846984386444092, "lr": 0.00037285607652632203, "tps": 15405, "wall": 26493.6} {"step": 6228, "train_loss": 3.6018476486206055, "lr": 0.00037284595888271554, "tps": 15405, "wall": 26498.6} {"step": 6229, "train_loss": 3.6383705139160156, "lr": 0.0003728358395076617, "tps": 15405, "wall": 26503.5} {"step": 6230, "train_loss": 3.6213159561157227, "lr": 0.0003728257184012753, "tps": 15404, "wall": 26508.5} {"step": 6231, "train_loss": 3.5611512660980225, "lr": 0.00037281559556367073, "tps": 15404, "wall": 26513.5} {"step": 6232, "train_loss": 3.7118775844573975, "lr": 0.00037280547099496295, "tps": 15403, "wall": 26518.5} {"step": 6233, "train_loss": 3.68672513961792, "lr": 0.0003727953446952665, "tps": 15403, "wall": 26523.4} {"step": 6234, "train_loss": 3.664620876312256, "lr": 0.0003727852166646961, "tps": 15402, "wall": 26528.4} {"step": 6235, "train_loss": 3.7200329303741455, "lr": 0.0003727750869033665, "tps": 15402, "wall": 26533.3} {"step": 6236, "train_loss": 3.6608102321624756, "lr": 0.00037276495541139245, "tps": 15402, "wall": 26538.3} {"step": 6237, "train_loss": 3.6384451389312744, "lr": 0.0003727548221888888, "tps": 15401, "wall": 26543.3} {"step": 6238, "train_loss": 3.6646971702575684, "lr": 0.00037274468723597017, "tps": 15401, "wall": 26548.2} {"step": 6239, "train_loss": 3.6811556816101074, "lr": 0.00037273455055275155, "tps": 15400, "wall": 26553.2} {"step": 6240, "train_loss": 3.6536619663238525, "lr": 0.00037272441213934756, "tps": 15400, "wall": 26558.1} {"step": 6241, "train_loss": 3.6577868461608887, "lr": 0.0003727142719958732, "tps": 15400, "wall": 26563.1} {"step": 6242, "train_loss": 3.6588714122772217, "lr": 0.0003727041301224433, "tps": 15399, "wall": 26568.0} {"step": 6243, "train_loss": 3.643806219100952, "lr": 0.0003726939865191728, "tps": 15399, "wall": 26573.0} {"step": 6244, "train_loss": 3.719942569732666, "lr": 0.0003726838411861766, "tps": 15398, "wall": 26578.0} {"step": 6245, "train_loss": 3.676879405975342, "lr": 0.00037267369412356946, "tps": 15398, "wall": 26582.9} {"step": 6246, "train_loss": 3.6425981521606445, "lr": 0.0003726635453314665, "tps": 15398, "wall": 26587.9} {"step": 6247, "train_loss": 3.6731624603271484, "lr": 0.0003726533948099827, "tps": 15397, "wall": 26592.8} {"step": 6248, "train_loss": 3.7742316722869873, "lr": 0.00037264324255923293, "tps": 15397, "wall": 26597.8} {"step": 6249, "train_loss": 3.6820313930511475, "lr": 0.00037263308857933227, "tps": 15396, "wall": 26602.7} {"step": 6250, "train_loss": 3.6950812339782715, "lr": 0.00037262293287039576, "tps": 15396, "wall": 26607.6} {"step": 6251, "train_loss": 3.588355541229248, "lr": 0.00037261277543253836, "tps": 15396, "wall": 26612.6} {"step": 6252, "train_loss": 3.670740842819214, "lr": 0.0003726026162658752, "tps": 15395, "wall": 26617.6} {"step": 6253, "train_loss": 3.5777852535247803, "lr": 0.00037259245537052133, "tps": 15395, "wall": 26622.5} {"step": 6254, "train_loss": 3.6292874813079834, "lr": 0.0003725822927465918, "tps": 15394, "wall": 26627.4} {"step": 6255, "train_loss": 3.7416012287139893, "lr": 0.00037257212839420195, "tps": 15394, "wall": 26632.4} {"step": 6256, "train_loss": 3.616537094116211, "lr": 0.0003725619623134667, "tps": 15394, "wall": 26637.4} {"step": 6257, "train_loss": 3.611237049102783, "lr": 0.0003725517945045013, "tps": 15393, "wall": 26642.4} {"step": 6258, "train_loss": 3.6866421699523926, "lr": 0.0003725416249674209, "tps": 15393, "wall": 26647.4} {"step": 6259, "train_loss": 3.6129472255706787, "lr": 0.0003725314537023407, "tps": 15392, "wall": 26652.5} {"step": 6260, "train_loss": 3.7410402297973633, "lr": 0.00037252128070937605, "tps": 15392, "wall": 26657.4} {"step": 6261, "train_loss": 3.7466423511505127, "lr": 0.00037251110598864203, "tps": 15391, "wall": 26662.4} {"step": 6262, "train_loss": 3.6306450366973877, "lr": 0.0003725009295402539, "tps": 15391, "wall": 26667.3} {"step": 6263, "train_loss": 3.67366099357605, "lr": 0.00037249075136432705, "tps": 15391, "wall": 26672.3} {"step": 6264, "train_loss": 3.5638082027435303, "lr": 0.00037248057146097664, "tps": 15390, "wall": 26677.2} {"step": 6265, "train_loss": 3.7048068046569824, "lr": 0.0003724703898303181, "tps": 15390, "wall": 26682.2} {"step": 6266, "train_loss": 3.723958730697632, "lr": 0.0003724602064724668, "tps": 15389, "wall": 26687.1} {"step": 6267, "train_loss": 3.703446865081787, "lr": 0.000372450021387538, "tps": 15389, "wall": 26692.1} {"step": 6268, "train_loss": 3.624843120574951, "lr": 0.00037243983457564705, "tps": 15389, "wall": 26697.1} {"step": 6269, "train_loss": 3.610238552093506, "lr": 0.00037242964603690943, "tps": 15388, "wall": 26702.0} {"step": 6270, "train_loss": 3.652170419692993, "lr": 0.0003724194557714406, "tps": 15388, "wall": 26707.0} {"step": 6271, "train_loss": 3.6546287536621094, "lr": 0.00037240926377935587, "tps": 15387, "wall": 26711.9} {"step": 6272, "train_loss": 3.690157413482666, "lr": 0.00037239907006077075, "tps": 15387, "wall": 26716.9} {"step": 6273, "train_loss": 3.7244181632995605, "lr": 0.00037238887461580076, "tps": 15387, "wall": 26721.8} {"step": 6274, "train_loss": 3.6037867069244385, "lr": 0.0003723786774445613, "tps": 15386, "wall": 26726.8} {"step": 6275, "train_loss": 3.683501720428467, "lr": 0.000372368478547168, "tps": 15386, "wall": 26731.7} {"step": 6276, "train_loss": 3.747596263885498, "lr": 0.0003723582779237363, "tps": 15385, "wall": 26736.7} {"step": 6277, "train_loss": 3.61222505569458, "lr": 0.00037234807557438176, "tps": 15385, "wall": 26741.6} {"step": 6278, "train_loss": 3.57873272895813, "lr": 0.00037233787149922, "tps": 15385, "wall": 26746.6} {"step": 6279, "train_loss": 3.705678939819336, "lr": 0.0003723276656983666, "tps": 15384, "wall": 26751.5} {"step": 6280, "train_loss": 3.6219992637634277, "lr": 0.0003723174581719372, "tps": 15384, "wall": 26756.5} {"step": 6281, "train_loss": 3.605201482772827, "lr": 0.00037230724892004733, "tps": 15383, "wall": 26761.4} {"step": 6282, "train_loss": 3.63754940032959, "lr": 0.0003722970379428127, "tps": 15383, "wall": 26766.4} {"step": 6283, "train_loss": 3.662360668182373, "lr": 0.00037228682524034903, "tps": 15383, "wall": 26771.3} {"step": 6284, "train_loss": 3.6945033073425293, "lr": 0.000372276610812772, "tps": 15382, "wall": 26776.3} {"step": 6285, "train_loss": 3.6567187309265137, "lr": 0.0003722663946601972, "tps": 15382, "wall": 26781.2} {"step": 6286, "train_loss": 3.748201847076416, "lr": 0.0003722561767827405, "tps": 15381, "wall": 26786.2} {"step": 6287, "train_loss": 3.654097318649292, "lr": 0.0003722459571805175, "tps": 15381, "wall": 26791.1} {"step": 6288, "train_loss": 3.827139377593994, "lr": 0.0003722357358536442, "tps": 15381, "wall": 26796.1} {"step": 6289, "train_loss": 3.667541742324829, "lr": 0.0003722255128022361, "tps": 15380, "wall": 26801.0} {"step": 6290, "train_loss": 3.6650397777557373, "lr": 0.00037221528802640927, "tps": 15380, "wall": 26806.0} {"step": 6291, "train_loss": 3.7052719593048096, "lr": 0.00037220506152627937, "tps": 15380, "wall": 26810.9} {"step": 6292, "train_loss": 3.656968355178833, "lr": 0.0003721948333019623, "tps": 15379, "wall": 26815.9} {"step": 6293, "train_loss": 3.6301498413085938, "lr": 0.00037218460335357393, "tps": 15379, "wall": 26820.9} {"step": 6294, "train_loss": 3.6540327072143555, "lr": 0.0003721743716812302, "tps": 15378, "wall": 26825.8} {"step": 6295, "train_loss": 3.597372055053711, "lr": 0.0003721641382850469, "tps": 15378, "wall": 26830.7} {"step": 6296, "train_loss": 3.6551403999328613, "lr": 0.00037215390316514, "tps": 15378, "wall": 26835.7} {"step": 6297, "train_loss": 3.661311626434326, "lr": 0.0003721436663216255, "tps": 15377, "wall": 26840.6} {"step": 6298, "train_loss": 3.622330665588379, "lr": 0.00037213342775461924, "tps": 15377, "wall": 26845.6} {"step": 6299, "train_loss": 3.6999990940093994, "lr": 0.00037212318746423736, "tps": 15376, "wall": 26850.5} {"step": 6300, "train_loss": 3.6515026092529297, "lr": 0.00037211294545059576, "tps": 15376, "wall": 26855.5} {"step": 6301, "train_loss": 3.6274070739746094, "lr": 0.00037210270171381045, "tps": 15376, "wall": 26860.4} {"step": 6302, "train_loss": 3.68546199798584, "lr": 0.00037209245625399756, "tps": 15375, "wall": 26865.3} {"step": 6303, "train_loss": 3.709589958190918, "lr": 0.000372082209071273, "tps": 15375, "wall": 26870.3} {"step": 6304, "train_loss": 3.6594901084899902, "lr": 0.000372071960165753, "tps": 15374, "wall": 26875.3} {"step": 6305, "train_loss": 3.72450590133667, "lr": 0.0003720617095375537, "tps": 15374, "wall": 26880.2} {"step": 6306, "train_loss": 3.832288980484009, "lr": 0.000372051457186791, "tps": 15374, "wall": 26885.2} {"step": 6307, "train_loss": 3.594130039215088, "lr": 0.0003720412031135812, "tps": 15373, "wall": 26890.1} {"step": 6308, "train_loss": 3.7639122009277344, "lr": 0.00037203094731804045, "tps": 15373, "wall": 26895.1} {"step": 6309, "train_loss": 3.6683526039123535, "lr": 0.0003720206898002849, "tps": 15372, "wall": 26900.0} {"step": 6310, "train_loss": 3.7284669876098633, "lr": 0.00037201043056043077, "tps": 15372, "wall": 26905.0} {"step": 6311, "train_loss": 3.6960620880126953, "lr": 0.0003720001695985942, "tps": 15372, "wall": 26910.0} {"step": 6312, "train_loss": 3.6829779148101807, "lr": 0.0003719899069148915, "tps": 15371, "wall": 26914.9} {"step": 6313, "train_loss": 3.700395345687866, "lr": 0.000371979642509439, "tps": 15371, "wall": 26919.9} {"step": 6314, "train_loss": 3.6490769386291504, "lr": 0.0003719693763823528, "tps": 15370, "wall": 26924.8} {"step": 6315, "train_loss": 3.5895700454711914, "lr": 0.0003719591085337493, "tps": 15370, "wall": 26929.8} {"step": 6316, "train_loss": 3.6660356521606445, "lr": 0.0003719488389637448, "tps": 15370, "wall": 26934.8} {"step": 6317, "train_loss": 3.624993324279785, "lr": 0.00037193856767245563, "tps": 15369, "wall": 26939.7} {"step": 6318, "train_loss": 3.612597942352295, "lr": 0.00037192829465999816, "tps": 15369, "wall": 26944.7} {"step": 6319, "train_loss": 3.645566463470459, "lr": 0.00037191801992648873, "tps": 15368, "wall": 26949.6} {"step": 6320, "train_loss": 3.586221218109131, "lr": 0.0003719077434720438, "tps": 15368, "wall": 26954.5} {"step": 6321, "train_loss": 3.680757522583008, "lr": 0.00037189746529677967, "tps": 15368, "wall": 26959.5} {"step": 6322, "train_loss": 3.549283981323242, "lr": 0.00037188718540081286, "tps": 15367, "wall": 26964.4} {"step": 6323, "train_loss": 3.6901350021362305, "lr": 0.0003718769037842598, "tps": 15367, "wall": 26969.3} {"step": 6324, "train_loss": 3.716902732849121, "lr": 0.000371866620447237, "tps": 15367, "wall": 26974.3} {"step": 6325, "train_loss": 3.6174654960632324, "lr": 0.0003718563353898608, "tps": 15366, "wall": 26979.3} {"step": 6326, "train_loss": 3.611283779144287, "lr": 0.00037184604861224786, "tps": 15366, "wall": 26984.2} {"step": 6327, "train_loss": 3.5911407470703125, "lr": 0.0003718357601145148, "tps": 15365, "wall": 26989.1} {"step": 6328, "train_loss": 3.7019033432006836, "lr": 0.0003718254698967779, "tps": 15365, "wall": 26994.1} {"step": 6329, "train_loss": 3.5413405895233154, "lr": 0.0003718151779591538, "tps": 15365, "wall": 26999.0} {"step": 6330, "train_loss": 3.666700601577759, "lr": 0.0003718048843017593, "tps": 15364, "wall": 27004.0} {"step": 6331, "train_loss": 3.700164318084717, "lr": 0.0003717945889247108, "tps": 15364, "wall": 27008.9} {"step": 6332, "train_loss": 3.7779784202575684, "lr": 0.00037178429182812493, "tps": 15363, "wall": 27013.8} {"step": 6333, "train_loss": 3.720259189605713, "lr": 0.00037177399301211844, "tps": 15363, "wall": 27018.8} {"step": 6334, "train_loss": 3.692779541015625, "lr": 0.000371763692476808, "tps": 15363, "wall": 27023.7} {"step": 6335, "train_loss": 3.6504523754119873, "lr": 0.0003717533902223102, "tps": 15362, "wall": 27028.7} {"step": 6336, "train_loss": 3.6339168548583984, "lr": 0.00037174308624874177, "tps": 15362, "wall": 27033.6} {"step": 6337, "train_loss": 3.64021897315979, "lr": 0.00037173278055621943, "tps": 15362, "wall": 27038.6} {"step": 6338, "train_loss": 3.720884323120117, "lr": 0.00037172247314486, "tps": 15361, "wall": 27043.5} {"step": 6339, "train_loss": 3.651982069015503, "lr": 0.0003717121640147801, "tps": 15361, "wall": 27048.4} {"step": 6340, "train_loss": 3.6402249336242676, "lr": 0.0003717018531660967, "tps": 15360, "wall": 27053.4} {"step": 6341, "train_loss": 3.638821601867676, "lr": 0.0003716915405989264, "tps": 15360, "wall": 27058.4} {"step": 6342, "train_loss": 3.6737332344055176, "lr": 0.0003716812263133862, "tps": 15360, "wall": 27063.3} {"step": 6343, "train_loss": 3.6346426010131836, "lr": 0.0003716709103095929, "tps": 15359, "wall": 27068.2} {"step": 6344, "train_loss": 3.6600284576416016, "lr": 0.00037166059258766324, "tps": 15359, "wall": 27073.2} {"step": 6345, "train_loss": 3.6161909103393555, "lr": 0.0003716502731477142, "tps": 15358, "wall": 27078.1} {"step": 6346, "train_loss": 3.7511191368103027, "lr": 0.0003716399519898626, "tps": 15358, "wall": 27083.0} {"step": 6347, "train_loss": 3.7152626514434814, "lr": 0.0003716296291142255, "tps": 15358, "wall": 27088.0} {"step": 6348, "train_loss": 3.5708112716674805, "lr": 0.00037161930452091977, "tps": 15357, "wall": 27092.9} {"step": 6349, "train_loss": 3.711512565612793, "lr": 0.0003716089782100623, "tps": 15357, "wall": 27097.9} {"step": 6350, "train_loss": 3.717764377593994, "lr": 0.00037159865018177013, "tps": 15357, "wall": 27102.8} {"step": 6351, "train_loss": 3.6714916229248047, "lr": 0.0003715883204361603, "tps": 15356, "wall": 27107.8} {"step": 6352, "train_loss": 3.689427614212036, "lr": 0.00037157798897334977, "tps": 15356, "wall": 27112.7} {"step": 6353, "train_loss": 3.7271721363067627, "lr": 0.0003715676557934555, "tps": 15355, "wall": 27117.7} {"step": 6354, "train_loss": 3.6484169960021973, "lr": 0.00037155732089659473, "tps": 15355, "wall": 27122.7} {"step": 6355, "train_loss": 3.623075008392334, "lr": 0.0003715469842828844, "tps": 15355, "wall": 27127.6} {"step": 6356, "train_loss": 3.7548837661743164, "lr": 0.00037153664595244155, "tps": 15354, "wall": 27132.5} {"step": 6357, "train_loss": 3.602876663208008, "lr": 0.00037152630590538344, "tps": 15354, "wall": 27137.5} {"step": 6358, "train_loss": 3.6099514961242676, "lr": 0.0003715159641418272, "tps": 15353, "wall": 27142.4} {"step": 6359, "train_loss": 3.653867483139038, "lr": 0.0003715056206618899, "tps": 15353, "wall": 27147.4} {"step": 6360, "train_loss": 3.5519282817840576, "lr": 0.0003714952754656887, "tps": 15353, "wall": 27152.4} {"step": 6361, "train_loss": 3.5524020195007324, "lr": 0.0003714849285533407, "tps": 15352, "wall": 27157.4} {"step": 6362, "train_loss": 3.528531074523926, "lr": 0.0003714745799249634, "tps": 15352, "wall": 27162.4} {"step": 6363, "train_loss": 3.6863865852355957, "lr": 0.0003714642295806738, "tps": 15351, "wall": 27167.4} {"step": 6364, "train_loss": 3.698946475982666, "lr": 0.0003714538775205893, "tps": 15351, "wall": 27172.3} {"step": 6365, "train_loss": 3.6361961364746094, "lr": 0.00037144352374482697, "tps": 15351, "wall": 27177.4} {"step": 6366, "train_loss": 3.5998616218566895, "lr": 0.00037143316825350423, "tps": 15350, "wall": 27182.4} {"step": 6367, "train_loss": 3.643507480621338, "lr": 0.0003714228110467384, "tps": 15350, "wall": 27187.4} {"step": 6368, "train_loss": 3.7434744834899902, "lr": 0.0003714124521246468, "tps": 15349, "wall": 27192.4} {"step": 6369, "train_loss": 3.658216953277588, "lr": 0.00037140209148734673, "tps": 15349, "wall": 27197.4} {"step": 6370, "train_loss": 3.6405763626098633, "lr": 0.00037139172913495553, "tps": 15349, "wall": 27202.4} {"step": 6371, "train_loss": 3.6354193687438965, "lr": 0.0003713813650675907, "tps": 15348, "wall": 27207.4} {"step": 6372, "train_loss": 3.7227439880371094, "lr": 0.00037137099928536945, "tps": 15348, "wall": 27212.4} {"step": 6373, "train_loss": 3.7337286472320557, "lr": 0.0003713606317884095, "tps": 15347, "wall": 27217.4} {"step": 6374, "train_loss": 3.6428587436676025, "lr": 0.000371350262576828, "tps": 15347, "wall": 27222.4} {"step": 6375, "train_loss": 3.597170114517212, "lr": 0.00037133989165074265, "tps": 15346, "wall": 27227.4} {"step": 6376, "train_loss": 3.586106777191162, "lr": 0.00037132951901027074, "tps": 15346, "wall": 27232.4} {"step": 6377, "train_loss": 3.6539244651794434, "lr": 0.00037131914465552985, "tps": 15346, "wall": 27237.4} {"step": 6378, "train_loss": 3.666649103164673, "lr": 0.0003713087685866375, "tps": 15345, "wall": 27242.4} {"step": 6379, "train_loss": 3.5296640396118164, "lr": 0.00037129839080371127, "tps": 15345, "wall": 27247.4} {"step": 6380, "train_loss": 3.70505952835083, "lr": 0.0003712880113068687, "tps": 15344, "wall": 27252.4} {"step": 6381, "train_loss": 3.647850751876831, "lr": 0.0003712776300962273, "tps": 15344, "wall": 27257.3} {"step": 6382, "train_loss": 3.6394524574279785, "lr": 0.00037126724717190474, "tps": 15344, "wall": 27262.3} {"step": 6383, "train_loss": 3.6577539443969727, "lr": 0.00037125686253401864, "tps": 15343, "wall": 27267.3} {"step": 6384, "train_loss": 3.675112009048462, "lr": 0.0003712464761826866, "tps": 15343, "wall": 27272.3} {"step": 6385, "train_loss": 3.6037824153900146, "lr": 0.0003712360881180263, "tps": 15342, "wall": 27277.3} {"step": 6386, "train_loss": 3.6560487747192383, "lr": 0.0003712256983401554, "tps": 15342, "wall": 27282.3} {"step": 6387, "train_loss": 3.782650947570801, "lr": 0.00037121530684919155, "tps": 15342, "wall": 27287.2} {"step": 6388, "train_loss": 3.5822181701660156, "lr": 0.0003712049136452527, "tps": 15341, "wall": 27292.2} {"step": 6389, "train_loss": 3.734762668609619, "lr": 0.0003711945187284563, "tps": 15341, "wall": 27297.2} {"step": 6390, "train_loss": 3.798870086669922, "lr": 0.00037118412209892016, "tps": 15340, "wall": 27302.2} {"step": 6391, "train_loss": 3.5415263175964355, "lr": 0.0003711737237567622, "tps": 15340, "wall": 27307.2} {"step": 6392, "train_loss": 3.608741044998169, "lr": 0.00037116332370210005, "tps": 15340, "wall": 27312.2} {"step": 6393, "train_loss": 3.7172205448150635, "lr": 0.0003711529219350516, "tps": 15339, "wall": 27317.1} {"step": 6394, "train_loss": 3.6095008850097656, "lr": 0.00037114251845573465, "tps": 15339, "wall": 27322.1} {"step": 6395, "train_loss": 3.626384973526001, "lr": 0.00037113211326426714, "tps": 15338, "wall": 27327.1} {"step": 6396, "train_loss": 3.6542186737060547, "lr": 0.0003711217063607669, "tps": 15338, "wall": 27332.1} {"step": 6397, "train_loss": 3.7483410835266113, "lr": 0.0003711112977453517, "tps": 15338, "wall": 27337.1} {"step": 6398, "train_loss": 3.6350362300872803, "lr": 0.0003711008874181396, "tps": 15337, "wall": 27342.1} {"step": 6399, "train_loss": 3.7902283668518066, "lr": 0.00037109047537924847, "tps": 15337, "wall": 27347.3} {"step": 6400, "train_loss": 3.6505236625671387, "lr": 0.00037108006162879623, "tps": 15336, "wall": 27352.2} {"step": 6401, "train_loss": 3.639944553375244, "lr": 0.00037106964616690093, "tps": 15336, "wall": 27357.3} {"step": 6402, "train_loss": 3.6464736461639404, "lr": 0.0003710592289936805, "tps": 15335, "wall": 27362.3} {"step": 6403, "train_loss": 3.5512852668762207, "lr": 0.0003710488101092529, "tps": 15335, "wall": 27367.2} {"step": 6404, "train_loss": 3.65228533744812, "lr": 0.0003710383895137363, "tps": 15335, "wall": 27372.4} {"step": 6405, "train_loss": 3.7037949562072754, "lr": 0.00037102796720724855, "tps": 15334, "wall": 27377.4} {"step": 6406, "train_loss": 3.6204988956451416, "lr": 0.00037101754318990784, "tps": 15334, "wall": 27382.4} {"step": 6407, "train_loss": 3.731431484222412, "lr": 0.0003710071174618323, "tps": 15333, "wall": 27387.5} {"step": 6408, "train_loss": 3.6255569458007812, "lr": 0.0003709966900231399, "tps": 15333, "wall": 27392.5} {"step": 6409, "train_loss": 3.738400936126709, "lr": 0.0003709862608739488, "tps": 15333, "wall": 27397.4} {"step": 6410, "train_loss": 3.6792402267456055, "lr": 0.00037097583001437717, "tps": 15332, "wall": 27402.4} {"step": 6411, "train_loss": 3.620879650115967, "lr": 0.0003709653974445432, "tps": 15332, "wall": 27407.4} {"step": 6412, "train_loss": 3.698749303817749, "lr": 0.0003709549631645651, "tps": 15331, "wall": 27412.4} {"step": 6413, "train_loss": 3.63458251953125, "lr": 0.00037094452717456095, "tps": 15331, "wall": 27417.4} {"step": 6414, "train_loss": 3.666715145111084, "lr": 0.00037093408947464905, "tps": 15331, "wall": 27422.4} {"step": 6415, "train_loss": 3.6502952575683594, "lr": 0.00037092365006494756, "tps": 15330, "wall": 27427.4} {"step": 6416, "train_loss": 3.653247594833374, "lr": 0.0003709132089455749, "tps": 15330, "wall": 27432.3} {"step": 6417, "train_loss": 3.631610155105591, "lr": 0.0003709027661166491, "tps": 15329, "wall": 27437.3} {"step": 6418, "train_loss": 3.7048802375793457, "lr": 0.0003708923215782888, "tps": 15329, "wall": 27442.2} {"step": 6419, "train_loss": 3.6717047691345215, "lr": 0.00037088187533061196, "tps": 15329, "wall": 27447.2} {"step": 6420, "train_loss": 3.6840977668762207, "lr": 0.00037087142737373714, "tps": 15328, "wall": 27452.2} {"step": 6421, "train_loss": 3.7351791858673096, "lr": 0.0003708609777077826, "tps": 15328, "wall": 27457.2} {"step": 6422, "train_loss": 3.636042356491089, "lr": 0.00037085052633286676, "tps": 15327, "wall": 27462.2} {"step": 6423, "train_loss": 3.6859915256500244, "lr": 0.000370840073249108, "tps": 15327, "wall": 27467.2} {"step": 6424, "train_loss": 3.6463189125061035, "lr": 0.0003708296184566247, "tps": 15327, "wall": 27472.1} {"step": 6425, "train_loss": 3.558340072631836, "lr": 0.00037081916195553534, "tps": 15326, "wall": 27477.2} {"step": 6426, "train_loss": 3.6355018615722656, "lr": 0.00037080870374595835, "tps": 15326, "wall": 27482.1} {"step": 6427, "train_loss": 3.552415132522583, "lr": 0.00037079824382801223, "tps": 15325, "wall": 27487.1} {"step": 6428, "train_loss": 3.6593899726867676, "lr": 0.0003707877822018154, "tps": 15325, "wall": 27492.1} {"step": 6429, "train_loss": 3.6576247215270996, "lr": 0.0003707773188674865, "tps": 15325, "wall": 27497.0} {"step": 6430, "train_loss": 3.5931737422943115, "lr": 0.0003707668538251439, "tps": 15324, "wall": 27502.0} {"step": 6431, "train_loss": 3.7206919193267822, "lr": 0.0003707563870749062, "tps": 15324, "wall": 27507.0} {"step": 6432, "train_loss": 3.698869228363037, "lr": 0.0003707459186168921, "tps": 15324, "wall": 27511.9} {"step": 6433, "train_loss": 3.6820502281188965, "lr": 0.00037073544845121997, "tps": 15323, "wall": 27517.0} {"step": 6434, "train_loss": 3.663753032684326, "lr": 0.00037072497657800863, "tps": 15323, "wall": 27521.9} {"step": 6435, "train_loss": 3.5510735511779785, "lr": 0.00037071450299737646, "tps": 15322, "wall": 27526.9} {"step": 6436, "train_loss": 3.7258167266845703, "lr": 0.00037070402770944235, "tps": 15322, "wall": 27531.9} {"step": 6437, "train_loss": 3.6062004566192627, "lr": 0.00037069355071432485, "tps": 15322, "wall": 27536.9} {"step": 6438, "train_loss": 3.637462854385376, "lr": 0.00037068307201214263, "tps": 15321, "wall": 27541.9} {"step": 6439, "train_loss": 3.7909786701202393, "lr": 0.00037067259160301447, "tps": 15321, "wall": 27546.9} {"step": 6440, "train_loss": 3.584601879119873, "lr": 0.00037066210948705897, "tps": 15320, "wall": 27552.0} {"step": 6441, "train_loss": 3.570021390914917, "lr": 0.00037065162566439497, "tps": 15320, "wall": 27556.9} {"step": 6442, "train_loss": 3.570693016052246, "lr": 0.0003706411401351412, "tps": 15320, "wall": 27561.9} {"step": 6443, "train_loss": 3.5783438682556152, "lr": 0.0003706306528994165, "tps": 15319, "wall": 27566.9} {"step": 6444, "train_loss": 3.747122049331665, "lr": 0.00037062016395733957, "tps": 15319, "wall": 27572.0} {"step": 6445, "train_loss": 3.6920456886291504, "lr": 0.00037060967330902923, "tps": 15318, "wall": 27576.9} {"step": 6446, "train_loss": 3.692596435546875, "lr": 0.00037059918095460443, "tps": 15318, "wall": 27582.0} {"step": 6447, "train_loss": 3.6790120601654053, "lr": 0.00037058868689418393, "tps": 15317, "wall": 27586.9} {"step": 6448, "train_loss": 3.6834630966186523, "lr": 0.0003705781911278866, "tps": 15317, "wall": 27591.9} {"step": 6449, "train_loss": 3.572361946105957, "lr": 0.0003705676936558315, "tps": 15317, "wall": 27597.0} {"step": 6450, "train_loss": 3.599834442138672, "lr": 0.0003705571944781373, "tps": 15316, "wall": 27602.1} {"step": 6451, "train_loss": 3.7487735748291016, "lr": 0.0003705466935949231, "tps": 15316, "wall": 27607.0} {"step": 6452, "train_loss": 3.6671037673950195, "lr": 0.0003705361910063078, "tps": 15315, "wall": 27612.0} {"step": 6453, "train_loss": 3.7016336917877197, "lr": 0.0003705256867124104, "tps": 15315, "wall": 27617.0} {"step": 6454, "train_loss": 3.736954689025879, "lr": 0.00037051518071334986, "tps": 15315, "wall": 27622.0} {"step": 6455, "train_loss": 3.646667003631592, "lr": 0.00037050467300924525, "tps": 15314, "wall": 27626.9} {"step": 6456, "train_loss": 3.658104181289673, "lr": 0.00037049416360021554, "tps": 15314, "wall": 27632.3} {"step": 6457, "train_loss": 3.71050763130188, "lr": 0.00037048365248637977, "tps": 15313, "wall": 27637.4} {"step": 6458, "train_loss": 3.6366262435913086, "lr": 0.0003704731396678571, "tps": 15313, "wall": 27642.7} {"step": 6459, "train_loss": 3.6231589317321777, "lr": 0.00037046262514476647, "tps": 15312, "wall": 27647.9} {"step": 6460, "train_loss": 3.571880340576172, "lr": 0.0003704521089172272, "tps": 15312, "wall": 27653.1} {"step": 6461, "train_loss": 3.755681037902832, "lr": 0.00037044159098535825, "tps": 15311, "wall": 27658.4} {"step": 6462, "train_loss": 3.6176564693450928, "lr": 0.0003704310713492788, "tps": 15311, "wall": 27663.6} {"step": 6463, "train_loss": 3.733994960784912, "lr": 0.000370420550009108, "tps": 15310, "wall": 27668.9} {"step": 6464, "train_loss": 3.699979782104492, "lr": 0.00037041002696496514, "tps": 15309, "wall": 27674.1} {"step": 6465, "train_loss": 3.7392020225524902, "lr": 0.0003703995022169694, "tps": 15309, "wall": 27679.3} {"step": 6466, "train_loss": 3.6443915367126465, "lr": 0.00037038897576523985, "tps": 15308, "wall": 27684.5} {"step": 6467, "train_loss": 3.640657424926758, "lr": 0.0003703784476098959, "tps": 15308, "wall": 27689.7} {"step": 6468, "train_loss": 3.6521055698394775, "lr": 0.0003703679177510568, "tps": 15307, "wall": 27695.0} {"step": 6469, "train_loss": 3.61147141456604, "lr": 0.00037035738618884173, "tps": 15307, "wall": 27700.2} {"step": 6470, "train_loss": 3.666614532470703, "lr": 0.0003703468529233701, "tps": 15306, "wall": 27705.5} {"step": 6471, "train_loss": 3.6326873302459717, "lr": 0.0003703363179547611, "tps": 15306, "wall": 27710.7} {"step": 6472, "train_loss": 3.6092123985290527, "lr": 0.0003703257812831343, "tps": 15305, "wall": 27715.7} {"step": 6473, "train_loss": 3.594876289367676, "lr": 0.0003703152429086088, "tps": 15305, "wall": 27720.7} {"step": 6474, "train_loss": 3.631503105163574, "lr": 0.0003703047028313042, "tps": 15305, "wall": 27725.7} {"step": 6475, "train_loss": 3.7179360389709473, "lr": 0.0003702941610513397, "tps": 15304, "wall": 27730.7} {"step": 6476, "train_loss": 3.7563605308532715, "lr": 0.0003702836175688348, "tps": 15304, "wall": 27735.7} {"step": 6477, "train_loss": 3.7128968238830566, "lr": 0.00037027307238390894, "tps": 15303, "wall": 27740.6} {"step": 6478, "train_loss": 3.631397247314453, "lr": 0.0003702625254966817, "tps": 15303, "wall": 27745.6} {"step": 6479, "train_loss": 3.6651384830474854, "lr": 0.00037025197690727235, "tps": 15303, "wall": 27750.6} {"step": 6480, "train_loss": 3.5676605701446533, "lr": 0.0003702414266158005, "tps": 15302, "wall": 27755.6} {"step": 6481, "train_loss": 3.5475544929504395, "lr": 0.0003702308746223857, "tps": 15302, "wall": 27760.5} {"step": 6482, "train_loss": 3.50837779045105, "lr": 0.00037022032092714737, "tps": 15302, "wall": 27765.5} {"step": 6483, "train_loss": 3.5910754203796387, "lr": 0.00037020976553020507, "tps": 15301, "wall": 27770.5} {"step": 6484, "train_loss": 3.718966484069824, "lr": 0.0003701992084316785, "tps": 15301, "wall": 27775.5} {"step": 6485, "train_loss": 3.7050557136535645, "lr": 0.0003701886496316871, "tps": 15300, "wall": 27780.6} {"step": 6486, "train_loss": 3.6422996520996094, "lr": 0.0003701780891303506, "tps": 15300, "wall": 27785.7} {"step": 6487, "train_loss": 3.726921319961548, "lr": 0.00037016752692778864, "tps": 15299, "wall": 27790.9} {"step": 6488, "train_loss": 3.659738063812256, "lr": 0.0003701569630241207, "tps": 15299, "wall": 27796.2} {"step": 6489, "train_loss": 3.6030988693237305, "lr": 0.0003701463974194666, "tps": 15298, "wall": 27801.4} {"step": 6490, "train_loss": 3.6196422576904297, "lr": 0.000370135830113946, "tps": 15298, "wall": 27806.6} {"step": 6491, "train_loss": 3.6702687740325928, "lr": 0.0003701252611076786, "tps": 15297, "wall": 27811.8} {"step": 6492, "train_loss": 3.6816234588623047, "lr": 0.00037011469040078407, "tps": 15297, "wall": 27817.0} {"step": 6493, "train_loss": 3.695080518722534, "lr": 0.00037010411799338227, "tps": 15296, "wall": 27822.2} {"step": 6494, "train_loss": 3.644963502883911, "lr": 0.0003700935438855929, "tps": 15296, "wall": 27827.5} {"step": 6495, "train_loss": 3.6833274364471436, "lr": 0.0003700829680775357, "tps": 15295, "wall": 27832.7} {"step": 6496, "train_loss": 3.6081693172454834, "lr": 0.00037007239056933056, "tps": 15295, "wall": 27837.9} {"step": 6497, "train_loss": 3.7312188148498535, "lr": 0.0003700618113610972, "tps": 15294, "wall": 27843.1} {"step": 6498, "train_loss": 3.6526451110839844, "lr": 0.0003700512304529556, "tps": 15294, "wall": 27848.3} {"step": 6499, "train_loss": 3.592191219329834, "lr": 0.0003700406478450255, "tps": 15293, "wall": 27853.5} {"step": 6500, "train_loss": 3.704029083251953, "lr": 0.0003700300635374268, "tps": 15293, "wall": 27858.7} {"step": 6501, "train_loss": 3.6851248741149902, "lr": 0.0003700194775302795, "tps": 15292, "wall": 27864.1} {"step": 6502, "train_loss": 3.6087703704833984, "lr": 0.0003700088898237034, "tps": 15292, "wall": 27869.1} {"step": 6503, "train_loss": 3.532425880432129, "lr": 0.00036999830041781846, "tps": 15291, "wall": 27874.1} {"step": 6504, "train_loss": 3.6674442291259766, "lr": 0.00036998770931274467, "tps": 15291, "wall": 27879.0} {"step": 6505, "train_loss": 3.5098538398742676, "lr": 0.00036997711650860204, "tps": 15291, "wall": 27884.0} {"step": 6506, "train_loss": 3.6577234268188477, "lr": 0.00036996652200551043, "tps": 15290, "wall": 27888.9} {"step": 6507, "train_loss": 3.680748462677002, "lr": 0.00036995592580359003, "tps": 15290, "wall": 27893.9} {"step": 6508, "train_loss": 3.688791275024414, "lr": 0.00036994532790296075, "tps": 15290, "wall": 27898.8} {"step": 6509, "train_loss": 3.6536121368408203, "lr": 0.0003699347283037427, "tps": 15289, "wall": 27903.8} {"step": 6510, "train_loss": 3.568830966949463, "lr": 0.0003699241270060559, "tps": 15289, "wall": 27908.7} {"step": 6511, "train_loss": 3.648083448410034, "lr": 0.0003699135240100205, "tps": 15288, "wall": 27913.6} {"step": 6512, "train_loss": 3.549673557281494, "lr": 0.00036990291931575663, "tps": 15288, "wall": 27918.5} {"step": 6513, "train_loss": 3.7563343048095703, "lr": 0.00036989231292338434, "tps": 15288, "wall": 27923.5} {"step": 6514, "train_loss": 3.6355972290039062, "lr": 0.0003698817048330238, "tps": 15287, "wall": 27928.4} {"step": 6515, "train_loss": 3.570845603942871, "lr": 0.00036987109504479525, "tps": 15287, "wall": 27933.3} {"step": 6516, "train_loss": 3.61991548538208, "lr": 0.00036986048355881876, "tps": 15287, "wall": 27938.3} {"step": 6517, "train_loss": 3.6366825103759766, "lr": 0.0003698498703752146, "tps": 15286, "wall": 27943.2} {"step": 6518, "train_loss": 3.605609655380249, "lr": 0.0003698392554941031, "tps": 15286, "wall": 27948.1} {"step": 6519, "train_loss": 3.6748504638671875, "lr": 0.0003698286389156044, "tps": 15286, "wall": 27953.0} {"step": 6520, "train_loss": 3.678941249847412, "lr": 0.0003698180206398387, "tps": 15285, "wall": 27958.0} {"step": 6521, "train_loss": 3.7378649711608887, "lr": 0.0003698074006669264, "tps": 15285, "wall": 27962.9} {"step": 6522, "train_loss": 3.673020124435425, "lr": 0.0003697967789969877, "tps": 15285, "wall": 27967.8} {"step": 6523, "train_loss": 3.5794715881347656, "lr": 0.00036978615563014304, "tps": 15284, "wall": 27972.8} {"step": 6524, "train_loss": 3.513730049133301, "lr": 0.00036977553056651274, "tps": 15284, "wall": 27977.7} {"step": 6525, "train_loss": 3.596280574798584, "lr": 0.00036976490380621706, "tps": 15284, "wall": 27982.6} {"step": 6526, "train_loss": 3.578389883041382, "lr": 0.0003697542753493764, "tps": 15283, "wall": 27987.5} {"step": 6527, "train_loss": 3.675612449645996, "lr": 0.00036974364519611134, "tps": 15283, "wall": 27992.4} {"step": 6528, "train_loss": 3.6516551971435547, "lr": 0.00036973301334654204, "tps": 15283, "wall": 27997.4} {"step": 6529, "train_loss": 3.5741732120513916, "lr": 0.0003697223798007892, "tps": 15282, "wall": 28002.3} {"step": 6530, "train_loss": 3.6944580078125, "lr": 0.00036971174455897307, "tps": 15282, "wall": 28007.2} {"step": 6531, "train_loss": 3.6499788761138916, "lr": 0.0003697011076212142, "tps": 15281, "wall": 28012.1} {"step": 6532, "train_loss": 3.660705089569092, "lr": 0.00036969046898763306, "tps": 15281, "wall": 28017.1} {"step": 6533, "train_loss": 3.6967740058898926, "lr": 0.0003696798286583502, "tps": 15281, "wall": 28022.1} {"step": 6534, "train_loss": 3.7580151557922363, "lr": 0.00036966918663348616, "tps": 15280, "wall": 28027.0} {"step": 6535, "train_loss": 3.5989933013916016, "lr": 0.0003696585429131615, "tps": 15280, "wall": 28032.0} {"step": 6536, "train_loss": 3.693652629852295, "lr": 0.0003696478974974967, "tps": 15280, "wall": 28036.9} {"step": 6537, "train_loss": 3.6672589778900146, "lr": 0.0003696372503866125, "tps": 15279, "wall": 28041.8} {"step": 6538, "train_loss": 3.737095355987549, "lr": 0.0003696266015806294, "tps": 15279, "wall": 28046.8} {"step": 6539, "train_loss": 3.720266342163086, "lr": 0.00036961595107966804, "tps": 15279, "wall": 28051.7} {"step": 6540, "train_loss": 3.645051956176758, "lr": 0.0003696052988838491, "tps": 15278, "wall": 28056.6} {"step": 6541, "train_loss": 3.6372859477996826, "lr": 0.00036959464499329326, "tps": 15278, "wall": 28061.5} {"step": 6542, "train_loss": 3.686272144317627, "lr": 0.00036958398940812123, "tps": 15278, "wall": 28066.5} {"step": 6543, "train_loss": 3.6038525104522705, "lr": 0.0003695733321284536, "tps": 15277, "wall": 28071.4} {"step": 6544, "train_loss": 3.4893336296081543, "lr": 0.0003695626731544112, "tps": 15277, "wall": 28076.3} {"step": 6545, "train_loss": 3.615086317062378, "lr": 0.0003695520124861147, "tps": 15277, "wall": 28081.3} {"step": 6546, "train_loss": 3.695528745651245, "lr": 0.00036954135012368496, "tps": 15276, "wall": 28086.2} {"step": 6547, "train_loss": 3.6074442863464355, "lr": 0.00036953068606724275, "tps": 15276, "wall": 28091.1} {"step": 6548, "train_loss": 3.6117191314697266, "lr": 0.0003695200203169088, "tps": 15275, "wall": 28096.1} {"step": 6549, "train_loss": 3.6673402786254883, "lr": 0.00036950935287280396, "tps": 15275, "wall": 28101.0} {"step": 6550, "train_loss": 3.6916985511779785, "lr": 0.0003694986837350491, "tps": 15275, "wall": 28106.0} {"step": 6551, "train_loss": 3.5838232040405273, "lr": 0.00036948801290376504, "tps": 15274, "wall": 28110.9} {"step": 6552, "train_loss": 3.6052756309509277, "lr": 0.00036947734037907275, "tps": 15274, "wall": 28115.8} {"step": 6553, "train_loss": 3.6759393215179443, "lr": 0.000369466666161093, "tps": 15274, "wall": 28120.7} {"step": 6554, "train_loss": 3.7407169342041016, "lr": 0.00036945599024994674, "tps": 15273, "wall": 28125.7} {"step": 6555, "train_loss": 3.6585655212402344, "lr": 0.000369445312645755, "tps": 15273, "wall": 28130.6} {"step": 6556, "train_loss": 3.6265156269073486, "lr": 0.00036943463334863864, "tps": 15273, "wall": 28135.6} {"step": 6557, "train_loss": 3.6699318885803223, "lr": 0.0003694239523587187, "tps": 15272, "wall": 28140.5} {"step": 6558, "train_loss": 3.7305479049682617, "lr": 0.0003694132696761161, "tps": 15272, "wall": 28145.5} {"step": 6559, "train_loss": 3.638463020324707, "lr": 0.000369402585300952, "tps": 15272, "wall": 28150.4} {"step": 6560, "train_loss": 3.6549954414367676, "lr": 0.0003693918992333472, "tps": 15271, "wall": 28155.3} {"step": 6561, "train_loss": 3.5543148517608643, "lr": 0.0003693812114734229, "tps": 15271, "wall": 28160.3} {"step": 6562, "train_loss": 3.697507381439209, "lr": 0.00036937052202130026, "tps": 15271, "wall": 28165.2} {"step": 6563, "train_loss": 3.7102184295654297, "lr": 0.0003693598308771002, "tps": 15270, "wall": 28170.2} {"step": 6564, "train_loss": 3.634312868118286, "lr": 0.0003693491380409439, "tps": 15270, "wall": 28175.1} {"step": 6565, "train_loss": 3.6252212524414062, "lr": 0.0003693384435129524, "tps": 15269, "wall": 28180.1} {"step": 6566, "train_loss": 3.689314126968384, "lr": 0.0003693277472932471, "tps": 15269, "wall": 28185.0} {"step": 6567, "train_loss": 3.7103776931762695, "lr": 0.00036931704938194886, "tps": 15269, "wall": 28189.9} {"step": 6568, "train_loss": 3.6131174564361572, "lr": 0.000369306349779179, "tps": 15268, "wall": 28195.0} {"step": 6569, "train_loss": 3.6930789947509766, "lr": 0.00036929564848505884, "tps": 15268, "wall": 28199.9} {"step": 6570, "train_loss": 3.5509510040283203, "lr": 0.00036928494549970945, "tps": 15268, "wall": 28204.8} {"step": 6571, "train_loss": 3.565236806869507, "lr": 0.00036927424082325213, "tps": 15267, "wall": 28209.7} {"step": 6572, "train_loss": 3.7324090003967285, "lr": 0.0003692635344558081, "tps": 15267, "wall": 28214.7} {"step": 6573, "train_loss": 3.669010877609253, "lr": 0.0003692528263974987, "tps": 15267, "wall": 28219.6} {"step": 6574, "train_loss": 3.6869752407073975, "lr": 0.0003692421166484453, "tps": 15266, "wall": 28224.5} {"step": 6575, "train_loss": 3.600095272064209, "lr": 0.000369231405208769, "tps": 15266, "wall": 28229.5} {"step": 6576, "train_loss": 3.624523401260376, "lr": 0.0003692206920785913, "tps": 15266, "wall": 28234.4} {"step": 6577, "train_loss": 3.6563284397125244, "lr": 0.0003692099772580335, "tps": 15265, "wall": 28239.3} {"step": 6578, "train_loss": 3.6111090183258057, "lr": 0.00036919926074721707, "tps": 15265, "wall": 28244.2} {"step": 6579, "train_loss": 3.7111854553222656, "lr": 0.0003691885425462633, "tps": 15265, "wall": 28249.2} {"step": 6580, "train_loss": 3.6339848041534424, "lr": 0.00036917782265529365, "tps": 15264, "wall": 28254.2} {"step": 6581, "train_loss": 3.6797702312469482, "lr": 0.0003691671010744296, "tps": 15264, "wall": 28259.1} {"step": 6582, "train_loss": 3.5804271697998047, "lr": 0.00036915637780379247, "tps": 15264, "wall": 28264.0} {"step": 6583, "train_loss": 3.709106206893921, "lr": 0.0003691456528435039, "tps": 15263, "wall": 28268.9} {"step": 6584, "train_loss": 3.8261489868164062, "lr": 0.00036913492619368524, "tps": 15263, "wall": 28273.8} {"step": 6585, "train_loss": 3.5911002159118652, "lr": 0.00036912419785445816, "tps": 15263, "wall": 28278.8} {"step": 6586, "train_loss": 3.6607065200805664, "lr": 0.00036911346782594407, "tps": 15262, "wall": 28283.7} {"step": 6587, "train_loss": 3.716702699661255, "lr": 0.0003691027361082645, "tps": 15262, "wall": 28288.6} {"step": 6588, "train_loss": 3.6523256301879883, "lr": 0.0003690920027015411, "tps": 15261, "wall": 28293.6} {"step": 6589, "train_loss": 3.6862716674804688, "lr": 0.0003690812676058954, "tps": 15261, "wall": 28298.6} {"step": 6590, "train_loss": 3.7490999698638916, "lr": 0.00036907053082144907, "tps": 15261, "wall": 28303.6} {"step": 6591, "train_loss": 3.6552717685699463, "lr": 0.0003690597923483237, "tps": 15260, "wall": 28308.5} {"step": 6592, "train_loss": 3.6302223205566406, "lr": 0.00036904905218664095, "tps": 15260, "wall": 28313.5} {"step": 6593, "train_loss": 3.667080879211426, "lr": 0.00036903831033652246, "tps": 15260, "wall": 28318.6} {"step": 6594, "train_loss": 3.7141497135162354, "lr": 0.00036902756679808987, "tps": 15259, "wall": 28323.5} {"step": 6595, "train_loss": 3.6164302825927734, "lr": 0.000369016821571465, "tps": 15259, "wall": 28328.5} {"step": 6596, "train_loss": 3.7045788764953613, "lr": 0.00036900607465676955, "tps": 15259, "wall": 28333.4} {"step": 6597, "train_loss": 3.6195530891418457, "lr": 0.00036899532605412516, "tps": 15258, "wall": 28338.3} {"step": 6598, "train_loss": 3.6485774517059326, "lr": 0.0003689845757636537, "tps": 15258, "wall": 28343.3} {"step": 6599, "train_loss": 3.6684951782226562, "lr": 0.00036897382378547693, "tps": 15257, "wall": 28348.3} {"step": 6600, "train_loss": 3.6321911811828613, "lr": 0.00036896307011971655, "tps": 15257, "wall": 28353.3} {"step": 6601, "train_loss": 3.633038282394409, "lr": 0.0003689523147664944, "tps": 15257, "wall": 28358.2} {"step": 6602, "train_loss": 3.5994887351989746, "lr": 0.0003689415577259325, "tps": 15256, "wall": 28363.1} {"step": 6603, "train_loss": 3.6147303581237793, "lr": 0.00036893079899815253, "tps": 15256, "wall": 28368.0} {"step": 6604, "train_loss": 3.708527088165283, "lr": 0.0003689200385832764, "tps": 15256, "wall": 28373.0} {"step": 6605, "train_loss": 3.626297950744629, "lr": 0.0003689092764814261, "tps": 15255, "wall": 28378.0} {"step": 6606, "train_loss": 3.572157382965088, "lr": 0.00036889851269272334, "tps": 15255, "wall": 28382.9} {"step": 6607, "train_loss": 3.587120532989502, "lr": 0.00036888774721729025, "tps": 15255, "wall": 28387.8} {"step": 6608, "train_loss": 3.5650501251220703, "lr": 0.0003688769800552487, "tps": 15254, "wall": 28392.7} {"step": 6609, "train_loss": 3.8001136779785156, "lr": 0.0003688662112067206, "tps": 15254, "wall": 28397.7} {"step": 6610, "train_loss": 3.658646583557129, "lr": 0.00036885544067182804, "tps": 15254, "wall": 28402.6} {"step": 6611, "train_loss": 3.7949180603027344, "lr": 0.000368844668450693, "tps": 15253, "wall": 28407.6} {"step": 6612, "train_loss": 3.631366729736328, "lr": 0.00036883389454343753, "tps": 15253, "wall": 28412.5} {"step": 6613, "train_loss": 3.651751756668091, "lr": 0.00036882311895018364, "tps": 15253, "wall": 28417.4} {"step": 6614, "train_loss": 3.5325591564178467, "lr": 0.00036881234167105337, "tps": 15252, "wall": 28422.4} {"step": 6615, "train_loss": 3.6126298904418945, "lr": 0.0003688015627061689, "tps": 15252, "wall": 28427.3} {"step": 6616, "train_loss": 3.7210280895233154, "lr": 0.0003687907820556522, "tps": 15252, "wall": 28432.2} {"step": 6617, "train_loss": 3.7083117961883545, "lr": 0.0003687799997196255, "tps": 15251, "wall": 28437.2} {"step": 6618, "train_loss": 3.636852741241455, "lr": 0.00036876921569821094, "tps": 15251, "wall": 28442.1} {"step": 6619, "train_loss": 3.5926625728607178, "lr": 0.0003687584299915306, "tps": 15251, "wall": 28447.1} {"step": 6620, "train_loss": 3.6150810718536377, "lr": 0.0003687476425997068, "tps": 15250, "wall": 28452.0} {"step": 6621, "train_loss": 3.7250375747680664, "lr": 0.00036873685352286164, "tps": 15250, "wall": 28456.9} {"step": 6622, "train_loss": 3.663234233856201, "lr": 0.00036872606276111737, "tps": 15250, "wall": 28461.9} {"step": 6623, "train_loss": 3.4845669269561768, "lr": 0.0003687152703145962, "tps": 15249, "wall": 28466.8} {"step": 6624, "train_loss": 3.6235976219177246, "lr": 0.0003687044761834203, "tps": 15249, "wall": 28471.8} {"step": 6625, "train_loss": 3.60235595703125, "lr": 0.0003686936803677122, "tps": 15248, "wall": 28476.7} {"step": 6626, "train_loss": 3.5895137786865234, "lr": 0.0003686828828675939, "tps": 15248, "wall": 28481.7} {"step": 6627, "train_loss": 3.6558966636657715, "lr": 0.000368672083683188, "tps": 15248, "wall": 28486.6} {"step": 6628, "train_loss": 3.6023685932159424, "lr": 0.0003686612828146166, "tps": 15247, "wall": 28491.5} {"step": 6629, "train_loss": 3.644534111022949, "lr": 0.0003686504802620022, "tps": 15247, "wall": 28496.5} {"step": 6630, "train_loss": 3.662872791290283, "lr": 0.00036863967602546714, "tps": 15247, "wall": 28501.4} {"step": 6631, "train_loss": 3.728250503540039, "lr": 0.0003686288701051337, "tps": 15246, "wall": 28506.3} {"step": 6632, "train_loss": 3.5613646507263184, "lr": 0.0003686180625011245, "tps": 15246, "wall": 28511.3} {"step": 6633, "train_loss": 3.607276678085327, "lr": 0.0003686072532135617, "tps": 15246, "wall": 28516.2} {"step": 6634, "train_loss": 3.7678921222686768, "lr": 0.000368596442242568, "tps": 15245, "wall": 28521.1} {"step": 6635, "train_loss": 3.5855164527893066, "lr": 0.00036858562958826574, "tps": 15245, "wall": 28526.1} {"step": 6636, "train_loss": 3.561168670654297, "lr": 0.0003685748152507774, "tps": 15245, "wall": 28531.0} {"step": 6637, "train_loss": 3.672433853149414, "lr": 0.0003685639992302255, "tps": 15244, "wall": 28535.9} {"step": 6638, "train_loss": 3.6149539947509766, "lr": 0.00036855318152673264, "tps": 15244, "wall": 28540.8} {"step": 6639, "train_loss": 3.6176507472991943, "lr": 0.00036854236214042124, "tps": 15244, "wall": 28545.8} {"step": 6640, "train_loss": 3.6988837718963623, "lr": 0.000368531541071414, "tps": 15243, "wall": 28550.7} {"step": 6641, "train_loss": 3.6181514263153076, "lr": 0.0003685207183198334, "tps": 15243, "wall": 28555.7} {"step": 6642, "train_loss": 3.6904945373535156, "lr": 0.000368509893885802, "tps": 15243, "wall": 28560.6} {"step": 6643, "train_loss": 3.6835365295410156, "lr": 0.00036849906776944256, "tps": 15242, "wall": 28565.6} {"step": 6644, "train_loss": 3.6708755493164062, "lr": 0.0003684882399708777, "tps": 15242, "wall": 28570.5} {"step": 6645, "train_loss": 3.6977882385253906, "lr": 0.00036847741049022994, "tps": 15242, "wall": 28575.4} {"step": 6646, "train_loss": 3.7040956020355225, "lr": 0.000368466579327622, "tps": 15241, "wall": 28580.3} {"step": 6647, "train_loss": 3.6248927116394043, "lr": 0.0003684557464831767, "tps": 15241, "wall": 28585.3} {"step": 6648, "train_loss": 3.700674533843994, "lr": 0.0003684449119570167, "tps": 15241, "wall": 28590.2} {"step": 6649, "train_loss": 3.688239812850952, "lr": 0.0003684340757492646, "tps": 15240, "wall": 28595.1} {"step": 6650, "train_loss": 3.657355308532715, "lr": 0.00036842323786004334, "tps": 15240, "wall": 28600.0} {"step": 6651, "train_loss": 3.7227277755737305, "lr": 0.0003684123982894756, "tps": 15240, "wall": 28604.9} {"step": 6652, "train_loss": 3.585799217224121, "lr": 0.0003684015570376842, "tps": 15239, "wall": 28609.9} {"step": 6653, "train_loss": 3.6094417572021484, "lr": 0.00036839071410479186, "tps": 15239, "wall": 28614.9} {"step": 6654, "train_loss": 3.6405751705169678, "lr": 0.00036837986949092154, "tps": 15239, "wall": 28619.8} {"step": 6655, "train_loss": 3.7527146339416504, "lr": 0.000368369023196196, "tps": 15238, "wall": 28624.7} {"step": 6656, "train_loss": 3.5947909355163574, "lr": 0.00036835817522073815, "tps": 15238, "wall": 28629.6} {"step": 6657, "train_loss": 3.6488277912139893, "lr": 0.0003683473255646709, "tps": 15238, "wall": 28634.6} {"step": 6658, "train_loss": 3.696659803390503, "lr": 0.0003683364742281171, "tps": 15237, "wall": 28639.5} {"step": 6659, "train_loss": 3.7088961601257324, "lr": 0.0003683256212111997, "tps": 15237, "wall": 28644.4} {"step": 6660, "train_loss": 3.6433491706848145, "lr": 0.0003683147665140416, "tps": 15237, "wall": 28649.4} {"step": 6661, "train_loss": 3.628386974334717, "lr": 0.00036830391013676587, "tps": 15236, "wall": 28654.3} {"step": 6662, "train_loss": 3.664426803588867, "lr": 0.00036829305207949534, "tps": 15236, "wall": 28659.2} {"step": 6663, "train_loss": 3.7474653720855713, "lr": 0.00036828219234235314, "tps": 15236, "wall": 28664.2} {"step": 6664, "train_loss": 3.593859910964966, "lr": 0.0003682713309254622, "tps": 15235, "wall": 28669.1} {"step": 6665, "train_loss": 3.679258108139038, "lr": 0.0003682604678289457, "tps": 15235, "wall": 28674.1} {"step": 6666, "train_loss": 3.639651298522949, "lr": 0.00036824960305292646, "tps": 15235, "wall": 28679.0} {"step": 6667, "train_loss": 3.665785312652588, "lr": 0.0003682387365975278, "tps": 15234, "wall": 28683.9} {"step": 6668, "train_loss": 3.639430046081543, "lr": 0.0003682278684628727, "tps": 15234, "wall": 28688.8} {"step": 6669, "train_loss": 3.6607558727264404, "lr": 0.0003682169986490843, "tps": 15234, "wall": 28693.8} {"step": 6670, "train_loss": 3.6654739379882812, "lr": 0.0003682061271562857, "tps": 15233, "wall": 28698.7} {"step": 6671, "train_loss": 3.67549467086792, "lr": 0.00036819525398460004, "tps": 15233, "wall": 28703.6} {"step": 6672, "train_loss": 3.6928579807281494, "lr": 0.0003681843791341506, "tps": 15233, "wall": 28708.5} {"step": 6673, "train_loss": 3.6433420181274414, "lr": 0.00036817350260506045, "tps": 15232, "wall": 28713.5} {"step": 6674, "train_loss": 3.6548917293548584, "lr": 0.0003681626243974528, "tps": 15232, "wall": 28718.4} {"step": 6675, "train_loss": 3.6418654918670654, "lr": 0.00036815174451145096, "tps": 15232, "wall": 28723.4} {"step": 6676, "train_loss": 3.6537280082702637, "lr": 0.0003681408629471782, "tps": 15231, "wall": 28728.7} {"step": 6677, "train_loss": 3.619356632232666, "lr": 0.00036812997970475767, "tps": 15231, "wall": 28733.9} {"step": 6678, "train_loss": 3.573326826095581, "lr": 0.00036811909478431275, "tps": 15230, "wall": 28738.9} {"step": 6679, "train_loss": 3.715712547302246, "lr": 0.0003681082081859667, "tps": 15230, "wall": 28744.3} {"step": 6680, "train_loss": 3.632951498031616, "lr": 0.0003680973199098428, "tps": 15229, "wall": 28749.3} {"step": 6681, "train_loss": 3.7371954917907715, "lr": 0.0003680864299560645, "tps": 15229, "wall": 28754.4} {"step": 6682, "train_loss": 3.5748064517974854, "lr": 0.00036807553832475515, "tps": 15228, "wall": 28759.5} {"step": 6683, "train_loss": 3.76898193359375, "lr": 0.000368064645016038, "tps": 15228, "wall": 28764.5} {"step": 6684, "train_loss": 3.716284990310669, "lr": 0.00036805375003003663, "tps": 15228, "wall": 28769.7} {"step": 6685, "train_loss": 3.603679656982422, "lr": 0.0003680428533668743, "tps": 15227, "wall": 28774.9} {"step": 6686, "train_loss": 3.662777900695801, "lr": 0.00036803195502667455, "tps": 15227, "wall": 28779.9} {"step": 6687, "train_loss": 3.693500280380249, "lr": 0.0003680210550095609, "tps": 15226, "wall": 28785.0} {"step": 6688, "train_loss": 3.7523412704467773, "lr": 0.0003680101533156566, "tps": 15226, "wall": 28790.1} {"step": 6689, "train_loss": 3.5436906814575195, "lr": 0.0003679992499450853, "tps": 15225, "wall": 28795.3} {"step": 6690, "train_loss": 3.5942702293395996, "lr": 0.0003679883448979705, "tps": 15225, "wall": 28800.4} {"step": 6691, "train_loss": 3.704468250274658, "lr": 0.00036797743817443566, "tps": 15225, "wall": 28805.5} {"step": 6692, "train_loss": 3.6594901084899902, "lr": 0.0003679665297746045, "tps": 15224, "wall": 28810.5} {"step": 6693, "train_loss": 3.55295467376709, "lr": 0.00036795561969860043, "tps": 15224, "wall": 28815.7} {"step": 6694, "train_loss": 3.677708148956299, "lr": 0.00036794470794654713, "tps": 15223, "wall": 28820.8} {"step": 6695, "train_loss": 3.6603150367736816, "lr": 0.00036793379451856815, "tps": 15223, "wall": 28826.2} {"step": 6696, "train_loss": 3.6374690532684326, "lr": 0.00036792287941478716, "tps": 15222, "wall": 28831.3} {"step": 6697, "train_loss": 3.5885543823242188, "lr": 0.00036791196263532774, "tps": 15222, "wall": 28836.4} {"step": 6698, "train_loss": 3.6739485263824463, "lr": 0.00036790104418031366, "tps": 15222, "wall": 28841.4} {"step": 6699, "train_loss": 3.6938300132751465, "lr": 0.00036789012404986847, "tps": 15221, "wall": 28846.4} {"step": 6700, "train_loss": 3.7149734497070312, "lr": 0.0003678792022441161, "tps": 15221, "wall": 28851.6} {"step": 6701, "train_loss": 3.5865166187286377, "lr": 0.00036786827876318006, "tps": 15220, "wall": 28857.0} {"step": 6702, "train_loss": 3.6026298999786377, "lr": 0.0003678573536071841, "tps": 15220, "wall": 28862.1} {"step": 6703, "train_loss": 3.6031370162963867, "lr": 0.0003678464267762521, "tps": 15219, "wall": 28867.1} {"step": 6704, "train_loss": 3.584928035736084, "lr": 0.00036783549827050776, "tps": 15219, "wall": 28872.3} {"step": 6705, "train_loss": 3.6311094760894775, "lr": 0.00036782456809007487, "tps": 15218, "wall": 28877.5} {"step": 6706, "train_loss": 3.509751319885254, "lr": 0.0003678136362350773, "tps": 15218, "wall": 28882.5} {"step": 6707, "train_loss": 3.5902292728424072, "lr": 0.0003678027027056389, "tps": 15218, "wall": 28887.5} {"step": 6708, "train_loss": 3.6289899349212646, "lr": 0.00036779176750188346, "tps": 15217, "wall": 28892.8} {"step": 6709, "train_loss": 3.6233508586883545, "lr": 0.0003677808306239349, "tps": 15217, "wall": 28897.9} {"step": 6710, "train_loss": 3.6251718997955322, "lr": 0.00036776989207191704, "tps": 15216, "wall": 28903.1} {"step": 6711, "train_loss": 3.586168050765991, "lr": 0.0003677589518459539, "tps": 15216, "wall": 28908.1} {"step": 6712, "train_loss": 3.60923171043396, "lr": 0.0003677480099461693, "tps": 15216, "wall": 28913.1} {"step": 6713, "train_loss": 3.6340224742889404, "lr": 0.0003677370663726873, "tps": 15215, "wall": 28918.2} {"step": 6714, "train_loss": 3.608369827270508, "lr": 0.0003677261211256318, "tps": 15215, "wall": 28923.1} {"step": 6715, "train_loss": 3.6875734329223633, "lr": 0.00036771517420512684, "tps": 15214, "wall": 28928.2} {"step": 6716, "train_loss": 3.6095619201660156, "lr": 0.00036770422561129636, "tps": 15214, "wall": 28933.2} {"step": 6717, "train_loss": 3.659604072570801, "lr": 0.00036769327534426447, "tps": 15214, "wall": 28938.2} {"step": 6718, "train_loss": 3.6824307441711426, "lr": 0.0003676823234041551, "tps": 15213, "wall": 28943.1} {"step": 6719, "train_loss": 3.6371116638183594, "lr": 0.0003676713697910924, "tps": 15213, "wall": 28948.1} {"step": 6720, "train_loss": 3.6147303581237793, "lr": 0.00036766041450520047, "tps": 15213, "wall": 28953.1} {"step": 6721, "train_loss": 3.715806007385254, "lr": 0.0003676494575466033, "tps": 15212, "wall": 28958.2} {"step": 6722, "train_loss": 3.592714786529541, "lr": 0.0003676384989154252, "tps": 15212, "wall": 28963.3} {"step": 6723, "train_loss": 3.74265193939209, "lr": 0.00036762753861179013, "tps": 15211, "wall": 28968.4} {"step": 6724, "train_loss": 3.600969076156616, "lr": 0.0003676165766358223, "tps": 15211, "wall": 28973.6} {"step": 6725, "train_loss": 3.6125271320343018, "lr": 0.00036760561298764596, "tps": 15211, "wall": 28978.7} {"step": 6726, "train_loss": 3.6022789478302, "lr": 0.00036759464766738517, "tps": 15210, "wall": 28983.8} {"step": 6727, "train_loss": 3.6010804176330566, "lr": 0.0003675836806751643, "tps": 15209, "wall": 28989.3} {"step": 6728, "train_loss": 3.5668020248413086, "lr": 0.0003675727120111075, "tps": 15209, "wall": 28994.4} {"step": 6729, "train_loss": 3.7235429286956787, "lr": 0.00036756174167533906, "tps": 15209, "wall": 28999.5} {"step": 6730, "train_loss": 3.7183427810668945, "lr": 0.0003675507696679831, "tps": 15208, "wall": 29004.6} {"step": 6731, "train_loss": 3.5928261280059814, "lr": 0.0003675397959891642, "tps": 15208, "wall": 29009.7} {"step": 6732, "train_loss": 3.6320602893829346, "lr": 0.00036752882063900645, "tps": 15207, "wall": 29014.8} {"step": 6733, "train_loss": 3.68430757522583, "lr": 0.0003675178436176342, "tps": 15207, "wall": 29020.2} {"step": 6734, "train_loss": 3.656860828399658, "lr": 0.0003675068649251718, "tps": 15206, "wall": 29025.6} {"step": 6735, "train_loss": 3.705164909362793, "lr": 0.00036749588456174375, "tps": 15206, "wall": 29030.9} {"step": 6736, "train_loss": 3.6974472999572754, "lr": 0.0003674849025274743, "tps": 15205, "wall": 29036.2} {"step": 6737, "train_loss": 3.546126365661621, "lr": 0.00036747391882248787, "tps": 15205, "wall": 29041.5} {"step": 6738, "train_loss": 3.5917506217956543, "lr": 0.00036746293344690906, "tps": 15204, "wall": 29046.7} {"step": 6739, "train_loss": 3.585865020751953, "lr": 0.000367451946400862, "tps": 15204, "wall": 29052.0} {"step": 6740, "train_loss": 3.6244125366210938, "lr": 0.0003674409576844713, "tps": 15203, "wall": 29057.4} {"step": 6741, "train_loss": 3.730646848678589, "lr": 0.00036742996729786156, "tps": 15203, "wall": 29062.7} {"step": 6742, "train_loss": 3.73197078704834, "lr": 0.0003674189752411571, "tps": 15202, "wall": 29068.0} {"step": 6743, "train_loss": 3.656663417816162, "lr": 0.0003674079815144826, "tps": 15202, "wall": 29073.2} {"step": 6744, "train_loss": 3.6570565700531006, "lr": 0.00036739698611796244, "tps": 15201, "wall": 29078.6} {"step": 6745, "train_loss": 3.578481435775757, "lr": 0.00036738598905172124, "tps": 15201, "wall": 29084.0} {"step": 6746, "train_loss": 3.6510865688323975, "lr": 0.00036737499031588356, "tps": 15200, "wall": 29089.3} {"step": 6747, "train_loss": 3.6232411861419678, "lr": 0.0003673639899105741, "tps": 15199, "wall": 29094.7} {"step": 6748, "train_loss": 3.59312105178833, "lr": 0.00036735298783591733, "tps": 15199, "wall": 29100.0} {"step": 6749, "train_loss": 3.5383524894714355, "lr": 0.0003673419840920379, "tps": 15198, "wall": 29105.4} {"step": 6750, "train_loss": 3.6715779304504395, "lr": 0.0003673309786790606, "tps": 15198, "wall": 29110.7} {"step": 6751, "train_loss": 3.6190314292907715, "lr": 0.00036731997159710996, "tps": 15197, "wall": 29116.0} {"step": 6752, "train_loss": 3.6297073364257812, "lr": 0.00036730896284631077, "tps": 15197, "wall": 29121.4} {"step": 6753, "train_loss": 3.7287650108337402, "lr": 0.0003672979524267876, "tps": 15196, "wall": 29126.6} {"step": 6754, "train_loss": 3.6688666343688965, "lr": 0.00036728694033866526, "tps": 15196, "wall": 29131.7} {"step": 6755, "train_loss": 3.625153064727783, "lr": 0.00036727592658206853, "tps": 15195, "wall": 29136.7} {"step": 6756, "train_loss": 3.6830921173095703, "lr": 0.0003672649111571221, "tps": 15195, "wall": 29141.7} {"step": 6757, "train_loss": 3.5875000953674316, "lr": 0.0003672538940639508, "tps": 15195, "wall": 29146.6} {"step": 6758, "train_loss": 3.664680004119873, "lr": 0.0003672428753026795, "tps": 15194, "wall": 29151.6} {"step": 6759, "train_loss": 3.5765151977539062, "lr": 0.0003672318548734329, "tps": 15194, "wall": 29156.7} {"step": 6760, "train_loss": 3.5805742740631104, "lr": 0.0003672208327763358, "tps": 15194, "wall": 29161.7} {"step": 6761, "train_loss": 3.6509947776794434, "lr": 0.00036720980901151323, "tps": 15193, "wall": 29166.7} {"step": 6762, "train_loss": 3.5476889610290527, "lr": 0.00036719878357908996, "tps": 15193, "wall": 29171.7} {"step": 6763, "train_loss": 3.6677019596099854, "lr": 0.00036718775647919086, "tps": 15193, "wall": 29176.7} {"step": 6764, "train_loss": 3.621459484100342, "lr": 0.00036717672771194093, "tps": 15192, "wall": 29181.7} {"step": 6765, "train_loss": 3.5663909912109375, "lr": 0.00036716569727746507, "tps": 15192, "wall": 29186.8} {"step": 6766, "train_loss": 3.734099864959717, "lr": 0.00036715466517588824, "tps": 15192, "wall": 29191.8} {"step": 6767, "train_loss": 3.5873641967773438, "lr": 0.0003671436314073354, "tps": 15191, "wall": 29196.8} {"step": 6768, "train_loss": 3.6438817977905273, "lr": 0.0003671325959719315, "tps": 15191, "wall": 29201.9} {"step": 6769, "train_loss": 3.576859474182129, "lr": 0.0003671215588698016, "tps": 15190, "wall": 29207.0} {"step": 6770, "train_loss": 3.5829782485961914, "lr": 0.00036711052010107075, "tps": 15190, "wall": 29212.0} {"step": 6771, "train_loss": 3.685739755630493, "lr": 0.00036709947966586396, "tps": 15189, "wall": 29217.3} {"step": 6772, "train_loss": 3.6450355052948, "lr": 0.00036708843756430635, "tps": 15189, "wall": 29222.6} {"step": 6773, "train_loss": 3.7250285148620605, "lr": 0.00036707739379652295, "tps": 15189, "wall": 29227.7} {"step": 6774, "train_loss": 3.6612472534179688, "lr": 0.0003670663483626388, "tps": 15188, "wall": 29232.8} {"step": 6775, "train_loss": 3.557047128677368, "lr": 0.00036705530126277913, "tps": 15188, "wall": 29237.9} {"step": 6776, "train_loss": 3.611764907836914, "lr": 0.0003670442524970691, "tps": 15187, "wall": 29242.8} {"step": 6777, "train_loss": 3.627159357070923, "lr": 0.00036703320206563376, "tps": 15187, "wall": 29248.0} {"step": 6778, "train_loss": 3.555448055267334, "lr": 0.0003670221499685984, "tps": 15186, "wall": 29253.6} {"step": 6779, "train_loss": 3.572511672973633, "lr": 0.0003670110962060882, "tps": 15186, "wall": 29258.6} {"step": 6780, "train_loss": 3.5798988342285156, "lr": 0.00036700004077822826, "tps": 15186, "wall": 29263.7} {"step": 6781, "train_loss": 3.6640684604644775, "lr": 0.0003669889836851439, "tps": 15185, "wall": 29268.8} {"step": 6782, "train_loss": 3.659115791320801, "lr": 0.00036697792492696054, "tps": 15185, "wall": 29273.9} {"step": 6783, "train_loss": 3.6938750743865967, "lr": 0.00036696686450380316, "tps": 15184, "wall": 29279.0} {"step": 6784, "train_loss": 3.5941693782806396, "lr": 0.0003669558024157972, "tps": 15184, "wall": 29284.1} {"step": 6785, "train_loss": 3.6627612113952637, "lr": 0.000366944738663068, "tps": 15183, "wall": 29289.2} {"step": 6786, "train_loss": 3.568014621734619, "lr": 0.0003669336732457408, "tps": 15183, "wall": 29294.3} {"step": 6787, "train_loss": 3.5617003440856934, "lr": 0.0003669226061639411, "tps": 15183, "wall": 29299.4} {"step": 6788, "train_loss": 3.682084083557129, "lr": 0.00036691153741779406, "tps": 15182, "wall": 29304.5} {"step": 6789, "train_loss": 3.6308577060699463, "lr": 0.00036690046700742516, "tps": 15182, "wall": 29309.9} {"step": 6790, "train_loss": 3.637315511703491, "lr": 0.0003668893949329599, "tps": 15181, "wall": 29315.1} {"step": 6791, "train_loss": 3.715667724609375, "lr": 0.0003668783211945236, "tps": 15181, "wall": 29320.1} {"step": 6792, "train_loss": 3.6113693714141846, "lr": 0.00036686724579224175, "tps": 15180, "wall": 29325.3} {"step": 6793, "train_loss": 3.510035276412964, "lr": 0.0003668561687262398, "tps": 15180, "wall": 29330.6} {"step": 6794, "train_loss": 3.6974380016326904, "lr": 0.0003668450899966432, "tps": 15180, "wall": 29335.7} {"step": 6795, "train_loss": 3.6993792057037354, "lr": 0.0003668340096035775, "tps": 15179, "wall": 29340.7} {"step": 6796, "train_loss": 3.7098488807678223, "lr": 0.00036682292754716813, "tps": 15179, "wall": 29345.7} {"step": 6797, "train_loss": 3.5763533115386963, "lr": 0.00036681184382754076, "tps": 15178, "wall": 29350.8} {"step": 6798, "train_loss": 3.650312662124634, "lr": 0.00036680075844482086, "tps": 15178, "wall": 29356.0} {"step": 6799, "train_loss": 3.672910213470459, "lr": 0.000366789671399134, "tps": 15178, "wall": 29361.1} {"step": 6800, "train_loss": 3.6421451568603516, "lr": 0.00036677858269060584, "tps": 15177, "wall": 29366.3} {"step": 6801, "train_loss": 3.650458335876465, "lr": 0.000366767492319362, "tps": 15177, "wall": 29371.4} {"step": 6802, "train_loss": 3.707017660140991, "lr": 0.00036675640028552796, "tps": 15176, "wall": 29376.5} {"step": 6803, "train_loss": 3.6304068565368652, "lr": 0.0003667453065892295, "tps": 15176, "wall": 29381.6} {"step": 6804, "train_loss": 3.6707637310028076, "lr": 0.00036673421123059233, "tps": 15175, "wall": 29386.7} {"step": 6805, "train_loss": 3.610985279083252, "lr": 0.0003667231142097421, "tps": 15175, "wall": 29391.7} {"step": 6806, "train_loss": 3.6497764587402344, "lr": 0.00036671201552680434, "tps": 15175, "wall": 29396.9} {"step": 6807, "train_loss": 3.584012031555176, "lr": 0.00036670091518190505, "tps": 15174, "wall": 29402.2} {"step": 6808, "train_loss": 3.6120243072509766, "lr": 0.00036668981317516985, "tps": 15174, "wall": 29407.6} {"step": 6809, "train_loss": 3.718320846557617, "lr": 0.00036667870950672453, "tps": 15173, "wall": 29413.1} {"step": 6810, "train_loss": 3.656843423843384, "lr": 0.0003666676041766948, "tps": 15172, "wall": 29418.5} {"step": 6811, "train_loss": 3.740070104598999, "lr": 0.00036665649718520656, "tps": 15172, "wall": 29424.0} {"step": 6812, "train_loss": 3.6991946697235107, "lr": 0.0003666453885323855, "tps": 15171, "wall": 29429.3} {"step": 6813, "train_loss": 3.6701161861419678, "lr": 0.0003666342782183576, "tps": 15171, "wall": 29434.8} {"step": 6814, "train_loss": 3.625685214996338, "lr": 0.0003666231662432487, "tps": 15170, "wall": 29440.3} {"step": 6815, "train_loss": 3.593940258026123, "lr": 0.0003666120526071846, "tps": 15170, "wall": 29445.3} {"step": 6816, "train_loss": 3.574012041091919, "lr": 0.00036660093731029125, "tps": 15169, "wall": 29450.7} {"step": 6817, "train_loss": 3.70853853225708, "lr": 0.00036658982035269453, "tps": 15169, "wall": 29455.7} {"step": 6818, "train_loss": 3.5769505500793457, "lr": 0.0003665787017345204, "tps": 15168, "wall": 29460.8} {"step": 6819, "train_loss": 3.687047004699707, "lr": 0.00036656758145589487, "tps": 15168, "wall": 29466.3} {"step": 6820, "train_loss": 3.641907215118408, "lr": 0.00036655645951694384, "tps": 15167, "wall": 29471.7} {"step": 6821, "train_loss": 3.721383571624756, "lr": 0.0003665453359177932, "tps": 15167, "wall": 29477.1} {"step": 6822, "train_loss": 3.6114935874938965, "lr": 0.00036653421065856916, "tps": 15166, "wall": 29482.5} {"step": 6823, "train_loss": 3.6283373832702637, "lr": 0.00036652308373939763, "tps": 15166, "wall": 29487.7} {"step": 6824, "train_loss": 3.6604220867156982, "lr": 0.00036651195516040463, "tps": 15165, "wall": 29493.0} {"step": 6825, "train_loss": 3.648660659790039, "lr": 0.00036650082492171635, "tps": 15165, "wall": 29498.4} {"step": 6826, "train_loss": 3.7167983055114746, "lr": 0.0003664896930234587, "tps": 15164, "wall": 29503.7} {"step": 6827, "train_loss": 3.5982978343963623, "lr": 0.00036647855946575806, "tps": 15164, "wall": 29509.0} {"step": 6828, "train_loss": 3.652587413787842, "lr": 0.0003664674242487402, "tps": 15163, "wall": 29514.2} {"step": 6829, "train_loss": 3.61509370803833, "lr": 0.00036645628737253156, "tps": 15163, "wall": 29519.6} {"step": 6830, "train_loss": 3.7074530124664307, "lr": 0.0003664451488372581, "tps": 15162, "wall": 29525.0} {"step": 6831, "train_loss": 3.5969314575195312, "lr": 0.0003664340086430461, "tps": 15162, "wall": 29530.3} {"step": 6832, "train_loss": 3.6682825088500977, "lr": 0.00036642286679002174, "tps": 15161, "wall": 29535.5} {"step": 6833, "train_loss": 3.6790270805358887, "lr": 0.00036641172327831124, "tps": 15161, "wall": 29540.8} {"step": 6834, "train_loss": 3.59658145904541, "lr": 0.0003664005781080407, "tps": 15160, "wall": 29546.1} {"step": 6835, "train_loss": 3.6263113021850586, "lr": 0.00036638943127933663, "tps": 15160, "wall": 29551.6} {"step": 6836, "train_loss": 3.7490599155426025, "lr": 0.00036637828279232503, "tps": 15159, "wall": 29557.4} {"step": 6837, "train_loss": 3.6704647541046143, "lr": 0.0003663671326471324, "tps": 15158, "wall": 29563.3} {"step": 6838, "train_loss": 3.6564829349517822, "lr": 0.00036635598084388497, "tps": 15157, "wall": 29569.2} {"step": 6839, "train_loss": 3.702537775039673, "lr": 0.00036634482738270906, "tps": 15157, "wall": 29574.7} {"step": 6840, "train_loss": 3.639272689819336, "lr": 0.00036633367226373106, "tps": 15156, "wall": 29579.9} {"step": 6841, "train_loss": 3.6217174530029297, "lr": 0.00036632251548707727, "tps": 15156, "wall": 29585.3} {"step": 6842, "train_loss": 3.5816779136657715, "lr": 0.00036631135705287416, "tps": 15155, "wall": 29590.6} {"step": 6843, "train_loss": 3.5636067390441895, "lr": 0.00036630019696124805, "tps": 15155, "wall": 29595.9} {"step": 6844, "train_loss": 3.519483804702759, "lr": 0.0003662890352123254, "tps": 15154, "wall": 29601.3} {"step": 6845, "train_loss": 3.585566282272339, "lr": 0.0003662778718062326, "tps": 15154, "wall": 29606.6} {"step": 6846, "train_loss": 3.685377597808838, "lr": 0.0003662667067430962, "tps": 15153, "wall": 29611.8} {"step": 6847, "train_loss": 3.5784058570861816, "lr": 0.0003662555400230426, "tps": 15153, "wall": 29617.1} {"step": 6848, "train_loss": 3.637615203857422, "lr": 0.00036624437164619835, "tps": 15152, "wall": 29622.5} {"step": 6849, "train_loss": 3.7329037189483643, "lr": 0.00036623320161268996, "tps": 15152, "wall": 29627.7} {"step": 6850, "train_loss": 3.588107109069824, "lr": 0.00036622202992264393, "tps": 15151, "wall": 29632.8} {"step": 6851, "train_loss": 3.545224666595459, "lr": 0.00036621085657618683, "tps": 15151, "wall": 29638.0} {"step": 6852, "train_loss": 3.5792064666748047, "lr": 0.0003661996815734453, "tps": 15150, "wall": 29643.0} {"step": 6853, "train_loss": 3.55324387550354, "lr": 0.0003661885049145458, "tps": 15150, "wall": 29648.0} {"step": 6854, "train_loss": 3.59302020072937, "lr": 0.000366177326599615, "tps": 15150, "wall": 29653.0} {"step": 6855, "train_loss": 3.5862069129943848, "lr": 0.00036616614662877956, "tps": 15149, "wall": 29657.9} {"step": 6856, "train_loss": 3.7302393913269043, "lr": 0.0003661549650021661, "tps": 15149, "wall": 29662.9} {"step": 6857, "train_loss": 3.736231803894043, "lr": 0.00036614378171990136, "tps": 15149, "wall": 29667.9} {"step": 6858, "train_loss": 3.601620674133301, "lr": 0.00036613259678211187, "tps": 15148, "wall": 29672.9} {"step": 6859, "train_loss": 3.692718982696533, "lr": 0.0003661214101889244, "tps": 15148, "wall": 29678.4} {"step": 6860, "train_loss": 3.517911434173584, "lr": 0.00036611022194046574, "tps": 15147, "wall": 29683.8} {"step": 6861, "train_loss": 3.631253242492676, "lr": 0.0003660990320368626, "tps": 15147, "wall": 29688.7} {"step": 6862, "train_loss": 3.635425567626953, "lr": 0.00036608784047824166, "tps": 15147, "wall": 29693.7} {"step": 6863, "train_loss": 3.63913893699646, "lr": 0.00036607664726472983, "tps": 15146, "wall": 29698.8} {"step": 6864, "train_loss": 3.5520989894866943, "lr": 0.00036606545239645374, "tps": 15146, "wall": 29703.9} {"step": 6865, "train_loss": 3.696589946746826, "lr": 0.0003660542558735404, "tps": 15145, "wall": 29709.2} {"step": 6866, "train_loss": 3.7202000617980957, "lr": 0.00036604305769611647, "tps": 15145, "wall": 29714.4} {"step": 6867, "train_loss": 3.6344499588012695, "lr": 0.000366031857864309, "tps": 15144, "wall": 29719.8} {"step": 6868, "train_loss": 3.5728025436401367, "lr": 0.0003660206563782446, "tps": 15144, "wall": 29725.0} {"step": 6869, "train_loss": 3.614562511444092, "lr": 0.00036600945323805043, "tps": 15144, "wall": 29730.0} {"step": 6870, "train_loss": 3.5377397537231445, "lr": 0.00036599824844385314, "tps": 15143, "wall": 29735.0} {"step": 6871, "train_loss": 3.6434717178344727, "lr": 0.00036598704199577986, "tps": 15143, "wall": 29740.1} {"step": 6872, "train_loss": 3.620178699493408, "lr": 0.0003659758338939575, "tps": 15142, "wall": 29745.1} {"step": 6873, "train_loss": 3.6570165157318115, "lr": 0.000365964624138513, "tps": 15142, "wall": 29750.0} {"step": 6874, "train_loss": 3.5868682861328125, "lr": 0.0003659534127295733, "tps": 15142, "wall": 29755.2} {"step": 6875, "train_loss": 3.653843402862549, "lr": 0.00036594219966726543, "tps": 15141, "wall": 29760.2} {"step": 6876, "train_loss": 3.6048531532287598, "lr": 0.00036593098495171653, "tps": 15141, "wall": 29765.2} {"step": 6877, "train_loss": 3.5662362575531006, "lr": 0.00036591976858305346, "tps": 15141, "wall": 29770.2} {"step": 6878, "train_loss": 3.6699788570404053, "lr": 0.0003659085505614033, "tps": 15140, "wall": 29775.2} {"step": 6879, "train_loss": 3.6944785118103027, "lr": 0.0003658973308868933, "tps": 15140, "wall": 29780.3} {"step": 6880, "train_loss": 3.6573984622955322, "lr": 0.0003658861095596503, "tps": 15140, "wall": 29785.2} {"step": 6881, "train_loss": 3.6395585536956787, "lr": 0.0003658748865798017, "tps": 15139, "wall": 29790.1} {"step": 6882, "train_loss": 3.5808682441711426, "lr": 0.00036586366194747444, "tps": 15139, "wall": 29795.1} {"step": 6883, "train_loss": 3.6361732482910156, "lr": 0.0003658524356627957, "tps": 15139, "wall": 29800.1} {"step": 6884, "train_loss": 3.640953779220581, "lr": 0.00036584120772589274, "tps": 15138, "wall": 29805.1} {"step": 6885, "train_loss": 3.5566043853759766, "lr": 0.00036582997813689263, "tps": 15138, "wall": 29810.0} {"step": 6886, "train_loss": 3.668151378631592, "lr": 0.00036581874689592273, "tps": 15138, "wall": 29815.0} {"step": 6887, "train_loss": 3.6360251903533936, "lr": 0.0003658075140031101, "tps": 15137, "wall": 29820.0} {"step": 6888, "train_loss": 3.6239125728607178, "lr": 0.00036579627945858203, "tps": 15137, "wall": 29825.0} {"step": 6889, "train_loss": 3.506270170211792, "lr": 0.00036578504326246586, "tps": 15137, "wall": 29830.0} {"step": 6890, "train_loss": 3.5581626892089844, "lr": 0.00036577380541488887, "tps": 15136, "wall": 29834.9} {"step": 6891, "train_loss": 3.719383716583252, "lr": 0.0003657625659159783, "tps": 15136, "wall": 29839.9} {"step": 6892, "train_loss": 3.7067880630493164, "lr": 0.00036575132476586144, "tps": 15136, "wall": 29844.8} {"step": 6893, "train_loss": 3.6227822303771973, "lr": 0.0003657400819646658, "tps": 15135, "wall": 29849.8} {"step": 6894, "train_loss": 3.5687899589538574, "lr": 0.00036572883751251854, "tps": 15135, "wall": 29854.8} {"step": 6895, "train_loss": 3.687688112258911, "lr": 0.00036571759140954714, "tps": 15135, "wall": 29859.8} {"step": 6896, "train_loss": 3.6018738746643066, "lr": 0.000365706343655879, "tps": 15134, "wall": 29864.7} {"step": 6897, "train_loss": 3.62207293510437, "lr": 0.0003656950942516415, "tps": 15134, "wall": 29869.7} {"step": 6898, "train_loss": 3.7534444332122803, "lr": 0.0003656838431969621, "tps": 15134, "wall": 29874.8} {"step": 6899, "train_loss": 3.7367382049560547, "lr": 0.00036567259049196825, "tps": 15133, "wall": 29879.7} {"step": 6900, "train_loss": 3.583277702331543, "lr": 0.00036566133613678744, "tps": 15133, "wall": 29884.7} {"step": 6901, "train_loss": 3.661116123199463, "lr": 0.0003656500801315471, "tps": 15133, "wall": 29889.6} {"step": 6902, "train_loss": 3.6456799507141113, "lr": 0.0003656388224763747, "tps": 15133, "wall": 29894.6} {"step": 6903, "train_loss": 3.626929521560669, "lr": 0.00036562756317139796, "tps": 15132, "wall": 29899.5} {"step": 6904, "train_loss": 3.568314552307129, "lr": 0.00036561630221674423, "tps": 15132, "wall": 29904.6} {"step": 6905, "train_loss": 3.599231719970703, "lr": 0.0003656050396125412, "tps": 15131, "wall": 29910.3} {"step": 6906, "train_loss": 3.6217241287231445, "lr": 0.0003655937753589164, "tps": 15131, "wall": 29915.4} {"step": 6907, "train_loss": 3.6009552478790283, "lr": 0.00036558250945599745, "tps": 15130, "wall": 29920.6} {"step": 6908, "train_loss": 3.604665517807007, "lr": 0.00036557124190391186, "tps": 15130, "wall": 29925.7} {"step": 6909, "train_loss": 3.5908684730529785, "lr": 0.0003655599727027875, "tps": 15130, "wall": 29930.8} {"step": 6910, "train_loss": 3.622745990753174, "lr": 0.0003655487018527518, "tps": 15129, "wall": 29935.9} {"step": 6911, "train_loss": 3.623032569885254, "lr": 0.00036553742935393254, "tps": 15129, "wall": 29941.0} {"step": 6912, "train_loss": 3.5450119972229004, "lr": 0.00036552615520645746, "tps": 15128, "wall": 29946.1} {"step": 6913, "train_loss": 3.7247934341430664, "lr": 0.0003655148794104541, "tps": 15128, "wall": 29951.2} {"step": 6914, "train_loss": 3.5848124027252197, "lr": 0.00036550360196605045, "tps": 15128, "wall": 29956.3} {"step": 6915, "train_loss": 3.620663642883301, "lr": 0.000365492322873374, "tps": 15127, "wall": 29961.4} {"step": 6916, "train_loss": 3.5707309246063232, "lr": 0.00036548104213255284, "tps": 15127, "wall": 29966.4} {"step": 6917, "train_loss": 3.6552226543426514, "lr": 0.0003654697597437144, "tps": 15126, "wall": 29971.6} {"step": 6918, "train_loss": 3.5647568702697754, "lr": 0.00036545847570698675, "tps": 15126, "wall": 29976.6} {"step": 6919, "train_loss": 3.581247329711914, "lr": 0.00036544719002249755, "tps": 15126, "wall": 29981.7} {"step": 6920, "train_loss": 3.5860953330993652, "lr": 0.0003654359026903747, "tps": 15125, "wall": 29986.8} {"step": 6921, "train_loss": 3.6672627925872803, "lr": 0.0003654246137107461, "tps": 15125, "wall": 29991.9} {"step": 6922, "train_loss": 3.6683638095855713, "lr": 0.0003654133230837396, "tps": 15125, "wall": 29997.1} {"step": 6923, "train_loss": 3.6863131523132324, "lr": 0.00036540203080948313, "tps": 15124, "wall": 30002.2} {"step": 6924, "train_loss": 3.7301979064941406, "lr": 0.0003653907368881046, "tps": 15124, "wall": 30007.3} {"step": 6925, "train_loss": 3.613825559616089, "lr": 0.00036537944131973194, "tps": 15123, "wall": 30012.3} {"step": 6926, "train_loss": 3.6183080673217773, "lr": 0.00036536814410449307, "tps": 15123, "wall": 30017.4} {"step": 6927, "train_loss": 3.6099748611450195, "lr": 0.00036535684524251596, "tps": 15123, "wall": 30022.5} {"step": 6928, "train_loss": 3.569364547729492, "lr": 0.00036534554473392875, "tps": 15122, "wall": 30027.6} {"step": 6929, "train_loss": 3.6170451641082764, "lr": 0.0003653342425788592, "tps": 15122, "wall": 30032.7} {"step": 6930, "train_loss": 3.608977794647217, "lr": 0.0003653229387774356, "tps": 15121, "wall": 30037.7} {"step": 6931, "train_loss": 3.632883310317993, "lr": 0.0003653116333297859, "tps": 15121, "wall": 30042.8} {"step": 6932, "train_loss": 3.697582244873047, "lr": 0.0003653003262360381, "tps": 15121, "wall": 30047.9} {"step": 6933, "train_loss": 3.5738165378570557, "lr": 0.00036528901749632045, "tps": 15120, "wall": 30053.0} {"step": 6934, "train_loss": 3.638478994369507, "lr": 0.00036527770711076085, "tps": 15120, "wall": 30058.1} {"step": 6935, "train_loss": 3.568056583404541, "lr": 0.0003652663950794875, "tps": 15120, "wall": 30063.3} {"step": 6936, "train_loss": 3.4784011840820312, "lr": 0.00036525508140262865, "tps": 15119, "wall": 30068.4} {"step": 6937, "train_loss": 3.6165709495544434, "lr": 0.0003652437660803123, "tps": 15119, "wall": 30073.5} {"step": 6938, "train_loss": 3.6148061752319336, "lr": 0.00036523244911266676, "tps": 15118, "wall": 30078.6} {"step": 6939, "train_loss": 3.5561161041259766, "lr": 0.00036522113049982014, "tps": 15118, "wall": 30083.7} {"step": 6940, "train_loss": 3.659679889678955, "lr": 0.0003652098102419008, "tps": 15118, "wall": 30088.8} {"step": 6941, "train_loss": 3.7147648334503174, "lr": 0.00036519848833903675, "tps": 15117, "wall": 30093.9} {"step": 6942, "train_loss": 3.671574115753174, "lr": 0.0003651871647913564, "tps": 15117, "wall": 30099.0} {"step": 6943, "train_loss": 3.6217024326324463, "lr": 0.000365175839598988, "tps": 15116, "wall": 30104.1} {"step": 6944, "train_loss": 3.692270517349243, "lr": 0.0003651645127620598, "tps": 15116, "wall": 30109.3} {"step": 6945, "train_loss": 3.641357898712158, "lr": 0.0003651531842807003, "tps": 15116, "wall": 30114.5} {"step": 6946, "train_loss": 3.70276141166687, "lr": 0.00036514185415503753, "tps": 15115, "wall": 30119.6} {"step": 6947, "train_loss": 3.730060577392578, "lr": 0.0003651305223852, "tps": 15115, "wall": 30124.7} {"step": 6948, "train_loss": 3.701663017272949, "lr": 0.0003651191889713161, "tps": 15114, "wall": 30129.8} {"step": 6949, "train_loss": 3.619434356689453, "lr": 0.00036510785391351416, "tps": 15114, "wall": 30134.9} {"step": 6950, "train_loss": 3.5471434593200684, "lr": 0.0003650965172119226, "tps": 15114, "wall": 30140.0} {"step": 6951, "train_loss": 3.6956052780151367, "lr": 0.00036508517886666987, "tps": 15113, "wall": 30145.1} {"step": 6952, "train_loss": 3.7730064392089844, "lr": 0.00036507383887788436, "tps": 15113, "wall": 30150.2} {"step": 6953, "train_loss": 3.5195889472961426, "lr": 0.0003650624972456945, "tps": 15113, "wall": 30155.2} {"step": 6954, "train_loss": 3.7084646224975586, "lr": 0.0003650511539702289, "tps": 15112, "wall": 30160.3} {"step": 6955, "train_loss": 3.607302188873291, "lr": 0.00036503980905161596, "tps": 15112, "wall": 30165.4} {"step": 6956, "train_loss": 3.5386109352111816, "lr": 0.00036502846248998423, "tps": 15111, "wall": 30170.5} {"step": 6957, "train_loss": 3.604607105255127, "lr": 0.00036501711428546226, "tps": 15111, "wall": 30175.7} {"step": 6958, "train_loss": 3.5021252632141113, "lr": 0.0003650057644381785, "tps": 15111, "wall": 30180.8} {"step": 6959, "train_loss": 3.560518741607666, "lr": 0.00036499441294826157, "tps": 15110, "wall": 30185.9} {"step": 6960, "train_loss": 3.6968655586242676, "lr": 0.0003649830598158402, "tps": 15110, "wall": 30191.0} {"step": 6961, "train_loss": 3.663658618927002, "lr": 0.0003649717050410428, "tps": 15109, "wall": 30196.1} {"step": 6962, "train_loss": 3.5872678756713867, "lr": 0.0003649603486239981, "tps": 15109, "wall": 30201.2} {"step": 6963, "train_loss": 3.6607565879821777, "lr": 0.0003649489905648348, "tps": 15109, "wall": 30206.3} {"step": 6964, "train_loss": 3.6179895401000977, "lr": 0.00036493763086368136, "tps": 15108, "wall": 30211.4} {"step": 6965, "train_loss": 3.562051773071289, "lr": 0.0003649262695206667, "tps": 15108, "wall": 30216.5} {"step": 6966, "train_loss": 3.709506034851074, "lr": 0.0003649149065359194, "tps": 15108, "wall": 30221.6} {"step": 6967, "train_loss": 3.582146644592285, "lr": 0.00036490354190956814, "tps": 15107, "wall": 30226.7} {"step": 6968, "train_loss": 3.554962396621704, "lr": 0.0003648921756417418, "tps": 15107, "wall": 30231.8} {"step": 6969, "train_loss": 3.5741963386535645, "lr": 0.000364880807732569, "tps": 15106, "wall": 30236.9} {"step": 6970, "train_loss": 3.687490701675415, "lr": 0.0003648694381821786, "tps": 15106, "wall": 30242.1} {"step": 6971, "train_loss": 3.5416054725646973, "lr": 0.00036485806699069936, "tps": 15106, "wall": 30247.2} {"step": 6972, "train_loss": 3.5629758834838867, "lr": 0.0003648466941582601, "tps": 15105, "wall": 30252.3} {"step": 6973, "train_loss": 3.6170828342437744, "lr": 0.0003648353196849897, "tps": 15105, "wall": 30257.4} {"step": 6974, "train_loss": 3.660264015197754, "lr": 0.00036482394357101685, "tps": 15104, "wall": 30262.4} {"step": 6975, "train_loss": 3.6029512882232666, "lr": 0.0003648125658164706, "tps": 15104, "wall": 30267.5} {"step": 6976, "train_loss": 3.607311725616455, "lr": 0.0003648011864214798, "tps": 15104, "wall": 30272.6} {"step": 6977, "train_loss": 3.580813407897949, "lr": 0.00036478980538617325, "tps": 15103, "wall": 30277.7} {"step": 6978, "train_loss": 3.6635379791259766, "lr": 0.00036477842271068005, "tps": 15103, "wall": 30282.9} {"step": 6979, "train_loss": 3.7229394912719727, "lr": 0.000364767038395129, "tps": 15103, "wall": 30287.9} {"step": 6980, "train_loss": 3.698854923248291, "lr": 0.00036475565243964905, "tps": 15102, "wall": 30292.8} {"step": 6981, "train_loss": 3.56219482421875, "lr": 0.0003647442648443693, "tps": 15102, "wall": 30297.8} {"step": 6982, "train_loss": 3.519465923309326, "lr": 0.0003647328756094186, "tps": 15102, "wall": 30302.7} {"step": 6983, "train_loss": 3.659320592880249, "lr": 0.0003647214847349262, "tps": 15101, "wall": 30307.6} {"step": 6984, "train_loss": 3.75716233253479, "lr": 0.0003647100922210209, "tps": 15101, "wall": 30312.5} {"step": 6985, "train_loss": 3.679575204849243, "lr": 0.0003646986980678319, "tps": 15101, "wall": 30317.4} {"step": 6986, "train_loss": 3.8293917179107666, "lr": 0.00036468730227548815, "tps": 15101, "wall": 30322.4} {"step": 6987, "train_loss": 3.6290626525878906, "lr": 0.00036467590484411886, "tps": 15100, "wall": 30327.3} {"step": 6988, "train_loss": 3.657731533050537, "lr": 0.00036466450577385303, "tps": 15100, "wall": 30332.2} {"step": 6989, "train_loss": 3.6076767444610596, "lr": 0.00036465310506481996, "tps": 15100, "wall": 30337.1} {"step": 6990, "train_loss": 3.5953173637390137, "lr": 0.00036464170271714865, "tps": 15099, "wall": 30342.0} {"step": 6991, "train_loss": 3.6212270259857178, "lr": 0.00036463029873096825, "tps": 15099, "wall": 30346.9} {"step": 6992, "train_loss": 3.6522016525268555, "lr": 0.00036461889310640804, "tps": 15099, "wall": 30351.8} {"step": 6993, "train_loss": 3.502493381500244, "lr": 0.0003646074858435972, "tps": 15099, "wall": 30356.8} {"step": 6994, "train_loss": 3.5730690956115723, "lr": 0.00036459607694266493, "tps": 15098, "wall": 30361.7} {"step": 6995, "train_loss": 3.526841640472412, "lr": 0.0003645846664037405, "tps": 15098, "wall": 30366.6} {"step": 6996, "train_loss": 3.6257951259613037, "lr": 0.0003645732542269531, "tps": 15098, "wall": 30371.5} {"step": 6997, "train_loss": 3.569790840148926, "lr": 0.0003645618404124321, "tps": 15097, "wall": 30376.4} {"step": 6998, "train_loss": 3.6586849689483643, "lr": 0.0003645504249603067, "tps": 15097, "wall": 30381.3} {"step": 6999, "train_loss": 3.638550281524658, "lr": 0.0003645390078707063, "tps": 15097, "wall": 30386.2} {"step": 7000, "train_loss": 3.6491951942443848, "lr": 0.0003645275891437602, "tps": 15097, "wall": 30391.1, "val_loss_monitor": 3.645826636951802} {"step": 7001, "train_loss": 3.519995927810669, "lr": 0.0003645161687795978, "tps": 15073, "wall": 30443.8} {"step": 7002, "train_loss": 3.6518445014953613, "lr": 0.0003645047467783483, "tps": 15072, "wall": 30448.7} {"step": 7003, "train_loss": 3.590071201324463, "lr": 0.00036449332314014124, "tps": 15072, "wall": 30453.6} {"step": 7004, "train_loss": 3.6366515159606934, "lr": 0.00036448189786510604, "tps": 15072, "wall": 30458.5} {"step": 7005, "train_loss": 3.6250953674316406, "lr": 0.0003644704709533721, "tps": 15072, "wall": 30463.4} {"step": 7006, "train_loss": 3.6752688884735107, "lr": 0.00036445904240506885, "tps": 15071, "wall": 30468.3} {"step": 7007, "train_loss": 3.6298575401306152, "lr": 0.0003644476122203257, "tps": 15071, "wall": 30473.3} {"step": 7008, "train_loss": 3.6619813442230225, "lr": 0.00036443618039927217, "tps": 15071, "wall": 30478.3} {"step": 7009, "train_loss": 3.656832218170166, "lr": 0.00036442474694203786, "tps": 15070, "wall": 30483.2} {"step": 7010, "train_loss": 3.635903835296631, "lr": 0.0003644133118487522, "tps": 15070, "wall": 30488.2} {"step": 7011, "train_loss": 3.6569018363952637, "lr": 0.00036440187511954463, "tps": 15070, "wall": 30493.1} {"step": 7012, "train_loss": 3.7202658653259277, "lr": 0.0003643904367545449, "tps": 15069, "wall": 30498.0} {"step": 7013, "train_loss": 3.599639415740967, "lr": 0.00036437899675388245, "tps": 15069, "wall": 30502.9} {"step": 7014, "train_loss": 3.5440726280212402, "lr": 0.00036436755511768694, "tps": 15069, "wall": 30507.8} {"step": 7015, "train_loss": 3.6566855907440186, "lr": 0.000364356111846088, "tps": 15069, "wall": 30512.7} {"step": 7016, "train_loss": 3.643580913543701, "lr": 0.00036434466693921507, "tps": 15068, "wall": 30517.6} {"step": 7017, "train_loss": 3.57454776763916, "lr": 0.00036433322039719805, "tps": 15068, "wall": 30522.5} {"step": 7018, "train_loss": 3.6376752853393555, "lr": 0.00036432177222016647, "tps": 15068, "wall": 30527.4} {"step": 7019, "train_loss": 3.6699748039245605, "lr": 0.0003643103224082501, "tps": 15068, "wall": 30532.3} {"step": 7020, "train_loss": 3.531656265258789, "lr": 0.00036429887096157856, "tps": 15067, "wall": 30537.3} {"step": 7021, "train_loss": 3.556354522705078, "lr": 0.00036428741788028157, "tps": 15067, "wall": 30542.2} {"step": 7022, "train_loss": 3.6793389320373535, "lr": 0.0003642759631644889, "tps": 15067, "wall": 30547.1} {"step": 7023, "train_loss": 3.6415796279907227, "lr": 0.0003642645068143304, "tps": 15066, "wall": 30552.0} {"step": 7024, "train_loss": 3.736050605773926, "lr": 0.00036425304882993563, "tps": 15066, "wall": 30556.9} {"step": 7025, "train_loss": 3.5876150131225586, "lr": 0.00036424158921143465, "tps": 15066, "wall": 30561.8} {"step": 7026, "train_loss": 3.655975341796875, "lr": 0.0003642301279589571, "tps": 15066, "wall": 30566.7} {"step": 7027, "train_loss": 3.6887927055358887, "lr": 0.0003642186650726328, "tps": 15065, "wall": 30571.6} {"step": 7028, "train_loss": 3.575653553009033, "lr": 0.0003642072005525917, "tps": 15065, "wall": 30576.6} {"step": 7029, "train_loss": 3.6359262466430664, "lr": 0.0003641957343989636, "tps": 15065, "wall": 30581.4} {"step": 7030, "train_loss": 3.6185355186462402, "lr": 0.0003641842666118785, "tps": 15064, "wall": 30586.4} {"step": 7031, "train_loss": 3.6445438861846924, "lr": 0.00036417279719146617, "tps": 15064, "wall": 30591.3} {"step": 7032, "train_loss": 3.579420328140259, "lr": 0.00036416132613785663, "tps": 15064, "wall": 30596.2} {"step": 7033, "train_loss": 3.5594735145568848, "lr": 0.0003641498534511797, "tps": 15064, "wall": 30601.1} {"step": 7034, "train_loss": 3.6158227920532227, "lr": 0.00036413837913156557, "tps": 15063, "wall": 30606.0} {"step": 7035, "train_loss": 3.612809419631958, "lr": 0.000364126903179144, "tps": 15063, "wall": 30610.9} {"step": 7036, "train_loss": 3.7130260467529297, "lr": 0.00036411542559404507, "tps": 15063, "wall": 30615.8} {"step": 7037, "train_loss": 3.604182720184326, "lr": 0.0003641039463763988, "tps": 15063, "wall": 30620.7} {"step": 7038, "train_loss": 3.6454827785491943, "lr": 0.00036409246552633525, "tps": 15062, "wall": 30625.6} {"step": 7039, "train_loss": 3.5937182903289795, "lr": 0.0003640809830439845, "tps": 15062, "wall": 30630.5} {"step": 7040, "train_loss": 3.6239140033721924, "lr": 0.00036406949892947647, "tps": 15062, "wall": 30635.4} {"step": 7041, "train_loss": 3.6136229038238525, "lr": 0.0003640580131829414, "tps": 15062, "wall": 30640.3} {"step": 7042, "train_loss": 3.536947727203369, "lr": 0.0003640465258045094, "tps": 15061, "wall": 30645.1} {"step": 7043, "train_loss": 3.6510276794433594, "lr": 0.0003640350367943105, "tps": 15061, "wall": 30650.0} {"step": 7044, "train_loss": 3.7200207710266113, "lr": 0.000364023546152475, "tps": 15061, "wall": 30655.0} {"step": 7045, "train_loss": 3.7267205715179443, "lr": 0.000364012053879133, "tps": 15060, "wall": 30659.8} {"step": 7046, "train_loss": 3.6150951385498047, "lr": 0.0003640005599744146, "tps": 15060, "wall": 30664.7} {"step": 7047, "train_loss": 3.642580509185791, "lr": 0.00036398906443845, "tps": 15060, "wall": 30669.6} {"step": 7048, "train_loss": 3.6213274002075195, "lr": 0.00036397756727136956, "tps": 15060, "wall": 30674.5} {"step": 7049, "train_loss": 3.6043429374694824, "lr": 0.00036396606847330343, "tps": 15059, "wall": 30679.4} {"step": 7050, "train_loss": 3.6509451866149902, "lr": 0.0003639545680443819, "tps": 15059, "wall": 30684.3} {"step": 7051, "train_loss": 3.6739606857299805, "lr": 0.0003639430659847353, "tps": 15059, "wall": 30689.1} {"step": 7052, "train_loss": 3.6732499599456787, "lr": 0.0003639315622944938, "tps": 15059, "wall": 30694.0} {"step": 7053, "train_loss": 3.650920867919922, "lr": 0.0003639200569737877, "tps": 15058, "wall": 30698.9} {"step": 7054, "train_loss": 3.622746467590332, "lr": 0.00036390855002274753, "tps": 15058, "wall": 30703.8} {"step": 7055, "train_loss": 3.511474370956421, "lr": 0.00036389704144150346, "tps": 15058, "wall": 30708.7} {"step": 7056, "train_loss": 3.6714346408843994, "lr": 0.00036388553123018597, "tps": 15058, "wall": 30713.6} {"step": 7057, "train_loss": 3.5550506114959717, "lr": 0.00036387401938892534, "tps": 15057, "wall": 30718.5} {"step": 7058, "train_loss": 3.583766460418701, "lr": 0.00036386250591785205, "tps": 15057, "wall": 30723.4} {"step": 7059, "train_loss": 3.542898416519165, "lr": 0.0003638509908170965, "tps": 15057, "wall": 30728.3} {"step": 7060, "train_loss": 3.5944666862487793, "lr": 0.00036383947408678916, "tps": 15057, "wall": 30733.1} {"step": 7061, "train_loss": 3.5344200134277344, "lr": 0.00036382795572706053, "tps": 15056, "wall": 30738.0} {"step": 7062, "train_loss": 3.602060079574585, "lr": 0.0003638164357380409, "tps": 15056, "wall": 30742.9} {"step": 7063, "train_loss": 3.588672161102295, "lr": 0.00036380491411986104, "tps": 15056, "wall": 30747.8} {"step": 7064, "train_loss": 3.71738338470459, "lr": 0.00036379339087265125, "tps": 15056, "wall": 30752.6} {"step": 7065, "train_loss": 3.7119951248168945, "lr": 0.0003637818659965422, "tps": 15055, "wall": 30757.5} {"step": 7066, "train_loss": 3.5343799591064453, "lr": 0.00036377033949166435, "tps": 15055, "wall": 30762.4} {"step": 7067, "train_loss": 3.4976983070373535, "lr": 0.00036375881135814836, "tps": 15055, "wall": 30767.3} {"step": 7068, "train_loss": 3.6840131282806396, "lr": 0.00036374728159612477, "tps": 15054, "wall": 30772.1} {"step": 7069, "train_loss": 3.69950270652771, "lr": 0.0003637357502057242, "tps": 15054, "wall": 30777.1} {"step": 7070, "train_loss": 3.563570499420166, "lr": 0.0003637242171870772, "tps": 15054, "wall": 30781.9} {"step": 7071, "train_loss": 3.5703277587890625, "lr": 0.00036371268254031455, "tps": 15054, "wall": 30786.8} {"step": 7072, "train_loss": 3.565699577331543, "lr": 0.0003637011462655669, "tps": 15053, "wall": 30791.7} {"step": 7073, "train_loss": 3.575037717819214, "lr": 0.0003636896083629648, "tps": 15053, "wall": 30796.6} {"step": 7074, "train_loss": 3.650336980819702, "lr": 0.00036367806883263917, "tps": 15053, "wall": 30801.5} {"step": 7075, "train_loss": 3.5672760009765625, "lr": 0.00036366652767472044, "tps": 15053, "wall": 30806.3} {"step": 7076, "train_loss": 3.559231758117676, "lr": 0.0003636549848893396, "tps": 15052, "wall": 30811.2} {"step": 7077, "train_loss": 3.6806912422180176, "lr": 0.00036364344047662737, "tps": 15052, "wall": 30816.1} {"step": 7078, "train_loss": 3.636296033859253, "lr": 0.0003636318944367144, "tps": 15052, "wall": 30821.0} {"step": 7079, "train_loss": 3.6759307384490967, "lr": 0.0003636203467697316, "tps": 15052, "wall": 30825.8} {"step": 7080, "train_loss": 3.6211936473846436, "lr": 0.00036360879747580975, "tps": 15051, "wall": 30830.7} {"step": 7081, "train_loss": 3.6315133571624756, "lr": 0.0003635972465550796, "tps": 15051, "wall": 30835.6} {"step": 7082, "train_loss": 3.6558573246002197, "lr": 0.0003635856940076721, "tps": 15051, "wall": 30840.5} {"step": 7083, "train_loss": 3.734166383743286, "lr": 0.00036357413983371814, "tps": 15051, "wall": 30845.4} {"step": 7084, "train_loss": 3.6850266456604004, "lr": 0.0003635625840333486, "tps": 15050, "wall": 30850.2} {"step": 7085, "train_loss": 3.4935450553894043, "lr": 0.0003635510266066942, "tps": 15050, "wall": 30855.1} {"step": 7086, "train_loss": 3.5831758975982666, "lr": 0.0003635394675538861, "tps": 15050, "wall": 30860.0} {"step": 7087, "train_loss": 3.569394826889038, "lr": 0.00036352790687505513, "tps": 15050, "wall": 30864.9} {"step": 7088, "train_loss": 3.6023385524749756, "lr": 0.0003635163445703322, "tps": 15049, "wall": 30869.7} {"step": 7089, "train_loss": 3.7022552490234375, "lr": 0.00036350478063984845, "tps": 15049, "wall": 30874.6} {"step": 7090, "train_loss": 3.609534978866577, "lr": 0.0003634932150837348, "tps": 15049, "wall": 30879.5} {"step": 7091, "train_loss": 3.6378207206726074, "lr": 0.0003634816479021221, "tps": 15049, "wall": 30884.4} {"step": 7092, "train_loss": 3.695366382598877, "lr": 0.00036347007909514164, "tps": 15048, "wall": 30889.2} {"step": 7093, "train_loss": 3.6586127281188965, "lr": 0.0003634585086629244, "tps": 15048, "wall": 30894.2} {"step": 7094, "train_loss": 3.6537716388702393, "lr": 0.0003634469366056013, "tps": 15048, "wall": 30899.1} {"step": 7095, "train_loss": 3.597672462463379, "lr": 0.0003634353629233036, "tps": 15048, "wall": 30903.9} {"step": 7096, "train_loss": 3.682994842529297, "lr": 0.0003634237876161623, "tps": 15047, "wall": 30908.8} {"step": 7097, "train_loss": 3.712019920349121, "lr": 0.0003634122106843087, "tps": 15047, "wall": 30913.7} {"step": 7098, "train_loss": 3.64037823677063, "lr": 0.0003634006321278737, "tps": 15047, "wall": 30918.6} {"step": 7099, "train_loss": 3.6426563262939453, "lr": 0.00036338905194698863, "tps": 15047, "wall": 30923.5} {"step": 7100, "train_loss": 3.531639575958252, "lr": 0.0003633774701417846, "tps": 15046, "wall": 30928.3} {"step": 7101, "train_loss": 3.614497661590576, "lr": 0.00036336588671239284, "tps": 15046, "wall": 30933.2} {"step": 7102, "train_loss": 3.6326980590820312, "lr": 0.0003633543016589446, "tps": 15046, "wall": 30938.1} {"step": 7103, "train_loss": 3.673323631286621, "lr": 0.000363342714981571, "tps": 15046, "wall": 30942.9} {"step": 7104, "train_loss": 3.6005470752716064, "lr": 0.00036333112668040347, "tps": 15045, "wall": 30947.8} {"step": 7105, "train_loss": 3.718208074569702, "lr": 0.0003633195367555731, "tps": 15045, "wall": 30952.7} {"step": 7106, "train_loss": 3.5873115062713623, "lr": 0.0003633079452072113, "tps": 15045, "wall": 30957.6} {"step": 7107, "train_loss": 3.7201900482177734, "lr": 0.00036329635203544933, "tps": 15044, "wall": 30962.5} {"step": 7108, "train_loss": 3.6681652069091797, "lr": 0.00036328475724041855, "tps": 15044, "wall": 30967.4} {"step": 7109, "train_loss": 3.5237114429473877, "lr": 0.00036327316082225027, "tps": 15044, "wall": 30972.3} {"step": 7110, "train_loss": 3.582561492919922, "lr": 0.00036326156278107584, "tps": 15044, "wall": 30977.1} {"step": 7111, "train_loss": 3.6471550464630127, "lr": 0.00036324996311702673, "tps": 15043, "wall": 30982.0} {"step": 7112, "train_loss": 3.7096948623657227, "lr": 0.0003632383618302343, "tps": 15043, "wall": 30986.9} {"step": 7113, "train_loss": 3.511958122253418, "lr": 0.0003632267589208299, "tps": 15043, "wall": 30991.8} {"step": 7114, "train_loss": 3.6159355640411377, "lr": 0.00036321515438894505, "tps": 15043, "wall": 30996.6} {"step": 7115, "train_loss": 3.6117398738861084, "lr": 0.0003632035482347112, "tps": 15042, "wall": 31001.5} {"step": 7116, "train_loss": 3.6313796043395996, "lr": 0.0003631919404582598, "tps": 15042, "wall": 31006.4} {"step": 7117, "train_loss": 3.663675308227539, "lr": 0.00036318033105972234, "tps": 15042, "wall": 31011.3} {"step": 7118, "train_loss": 3.542616844177246, "lr": 0.0003631687200392303, "tps": 15042, "wall": 31016.2} {"step": 7119, "train_loss": 3.584329843521118, "lr": 0.00036315710739691533, "tps": 15041, "wall": 31021.1} {"step": 7120, "train_loss": 3.5592966079711914, "lr": 0.0003631454931329089, "tps": 15041, "wall": 31026.0} {"step": 7121, "train_loss": 3.7681756019592285, "lr": 0.0003631338772473425, "tps": 15041, "wall": 31030.8} {"step": 7122, "train_loss": 3.6936614513397217, "lr": 0.0003631222597403479, "tps": 15041, "wall": 31035.7} {"step": 7123, "train_loss": 3.5610315799713135, "lr": 0.00036311064061205655, "tps": 15040, "wall": 31040.6} {"step": 7124, "train_loss": 3.6155943870544434, "lr": 0.00036309901986260015, "tps": 15040, "wall": 31045.5} {"step": 7125, "train_loss": 3.616321563720703, "lr": 0.00036308739749211025, "tps": 15040, "wall": 31050.4} {"step": 7126, "train_loss": 3.6575510501861572, "lr": 0.0003630757735007186, "tps": 15040, "wall": 31055.2} {"step": 7127, "train_loss": 3.545637845993042, "lr": 0.00036306414788855683, "tps": 15039, "wall": 31060.1} {"step": 7128, "train_loss": 3.478327751159668, "lr": 0.0003630525206557567, "tps": 15039, "wall": 31065.0} {"step": 7129, "train_loss": 3.6489298343658447, "lr": 0.00036304089180244983, "tps": 15039, "wall": 31069.9} {"step": 7130, "train_loss": 3.7221240997314453, "lr": 0.00036302926132876804, "tps": 15039, "wall": 31074.8} {"step": 7131, "train_loss": 3.6578118801116943, "lr": 0.00036301762923484303, "tps": 15038, "wall": 31079.7} {"step": 7132, "train_loss": 3.7232275009155273, "lr": 0.0003630059955208066, "tps": 15038, "wall": 31084.5} {"step": 7133, "train_loss": 3.6046152114868164, "lr": 0.0003629943601867904, "tps": 15038, "wall": 31089.4} {"step": 7134, "train_loss": 3.5390515327453613, "lr": 0.0003629827232329265, "tps": 15038, "wall": 31094.3} {"step": 7135, "train_loss": 3.622408390045166, "lr": 0.00036297108465934655, "tps": 15037, "wall": 31099.2} {"step": 7136, "train_loss": 3.578284740447998, "lr": 0.0003629594444661824, "tps": 15037, "wall": 31104.0} {"step": 7137, "train_loss": 3.5237627029418945, "lr": 0.00036294780265356587, "tps": 15037, "wall": 31108.9} {"step": 7138, "train_loss": 3.585456609725952, "lr": 0.00036293615922162895, "tps": 15037, "wall": 31113.8} {"step": 7139, "train_loss": 3.6611454486846924, "lr": 0.00036292451417050347, "tps": 15036, "wall": 31118.7} {"step": 7140, "train_loss": 3.5908780097961426, "lr": 0.00036291286750032137, "tps": 15036, "wall": 31123.6} {"step": 7141, "train_loss": 3.5477890968322754, "lr": 0.00036290121921121456, "tps": 15036, "wall": 31128.4} {"step": 7142, "train_loss": 3.597146511077881, "lr": 0.000362889569303315, "tps": 15036, "wall": 31133.3} {"step": 7143, "train_loss": 3.5935373306274414, "lr": 0.0003628779177767547, "tps": 15035, "wall": 31138.2} {"step": 7144, "train_loss": 3.5682389736175537, "lr": 0.00036286626463166564, "tps": 15035, "wall": 31143.1} {"step": 7145, "train_loss": 3.620791435241699, "lr": 0.00036285460986817974, "tps": 15035, "wall": 31148.0} {"step": 7146, "train_loss": 3.6586570739746094, "lr": 0.0003628429534864292, "tps": 15035, "wall": 31152.9} {"step": 7147, "train_loss": 3.5403096675872803, "lr": 0.00036283129548654575, "tps": 15034, "wall": 31157.7} {"step": 7148, "train_loss": 3.7022595405578613, "lr": 0.0003628196358686618, "tps": 15034, "wall": 31162.6} {"step": 7149, "train_loss": 3.546219825744629, "lr": 0.00036280797463290936, "tps": 15034, "wall": 31167.5} {"step": 7150, "train_loss": 3.589747667312622, "lr": 0.00036279631177942034, "tps": 15034, "wall": 31172.4} {"step": 7151, "train_loss": 3.4805960655212402, "lr": 0.00036278464730832706, "tps": 15033, "wall": 31177.3} {"step": 7152, "train_loss": 3.6775126457214355, "lr": 0.00036277298121976145, "tps": 15033, "wall": 31182.1} {"step": 7153, "train_loss": 3.5830435752868652, "lr": 0.00036276131351385585, "tps": 15033, "wall": 31187.0} {"step": 7154, "train_loss": 3.5486271381378174, "lr": 0.00036274964419074235, "tps": 15033, "wall": 31191.9} {"step": 7155, "train_loss": 3.6442580223083496, "lr": 0.00036273797325055325, "tps": 15032, "wall": 31196.8} {"step": 7156, "train_loss": 3.6302366256713867, "lr": 0.0003627263006934206, "tps": 15032, "wall": 31201.7} {"step": 7157, "train_loss": 3.6239075660705566, "lr": 0.00036271462651947664, "tps": 15032, "wall": 31206.6} {"step": 7158, "train_loss": 3.6909303665161133, "lr": 0.00036270295072885373, "tps": 15032, "wall": 31211.4} {"step": 7159, "train_loss": 3.540245294570923, "lr": 0.0003626912733216841, "tps": 15031, "wall": 31216.3} {"step": 7160, "train_loss": 3.687180519104004, "lr": 0.0003626795942980999, "tps": 15031, "wall": 31221.2} {"step": 7161, "train_loss": 3.622021436691284, "lr": 0.0003626679136582337, "tps": 15031, "wall": 31226.0} {"step": 7162, "train_loss": 3.6319966316223145, "lr": 0.00036265623140221753, "tps": 15031, "wall": 31230.9} {"step": 7163, "train_loss": 3.5715508460998535, "lr": 0.00036264454753018386, "tps": 15030, "wall": 31235.8} {"step": 7164, "train_loss": 3.5377883911132812, "lr": 0.0003626328620422651, "tps": 15030, "wall": 31240.6} {"step": 7165, "train_loss": 3.6031696796417236, "lr": 0.00036262117493859354, "tps": 15030, "wall": 31245.5} {"step": 7166, "train_loss": 3.6168813705444336, "lr": 0.0003626094862193015, "tps": 15030, "wall": 31250.4} {"step": 7167, "train_loss": 3.5785675048828125, "lr": 0.00036259779588452163, "tps": 15029, "wall": 31255.3} {"step": 7168, "train_loss": 3.688326835632324, "lr": 0.00036258610393438614, "tps": 15029, "wall": 31260.2} {"step": 7169, "train_loss": 3.6224775314331055, "lr": 0.00036257441036902755, "tps": 15029, "wall": 31265.1} {"step": 7170, "train_loss": 3.5341649055480957, "lr": 0.00036256271518857837, "tps": 15029, "wall": 31269.9} {"step": 7171, "train_loss": 3.683276653289795, "lr": 0.00036255101839317096, "tps": 15028, "wall": 31274.8} {"step": 7172, "train_loss": 3.558161735534668, "lr": 0.000362539319982938, "tps": 15028, "wall": 31279.7} {"step": 7173, "train_loss": 3.610260009765625, "lr": 0.0003625276199580118, "tps": 15028, "wall": 31284.5} {"step": 7174, "train_loss": 3.6038978099823, "lr": 0.00036251591831852506, "tps": 15028, "wall": 31289.4} {"step": 7175, "train_loss": 3.589174747467041, "lr": 0.00036250421506461036, "tps": 15027, "wall": 31294.3} {"step": 7176, "train_loss": 3.667753219604492, "lr": 0.0003624925101964001, "tps": 15027, "wall": 31299.2} {"step": 7177, "train_loss": 3.645721912384033, "lr": 0.00036248080371402707, "tps": 15027, "wall": 31304.0} {"step": 7178, "train_loss": 3.597827672958374, "lr": 0.00036246909561762366, "tps": 15027, "wall": 31308.9} {"step": 7179, "train_loss": 3.62176513671875, "lr": 0.00036245738590732276, "tps": 15026, "wall": 31313.8} {"step": 7180, "train_loss": 3.694002151489258, "lr": 0.0003624456745832568, "tps": 15026, "wall": 31318.7} {"step": 7181, "train_loss": 3.646514415740967, "lr": 0.0003624339616455586, "tps": 15026, "wall": 31323.6} {"step": 7182, "train_loss": 3.5836472511291504, "lr": 0.00036242224709436075, "tps": 15026, "wall": 31328.5} {"step": 7183, "train_loss": 3.6474111080169678, "lr": 0.0003624105309297959, "tps": 15025, "wall": 31333.3} {"step": 7184, "train_loss": 3.50968074798584, "lr": 0.000362398813151997, "tps": 15025, "wall": 31338.2} {"step": 7185, "train_loss": 3.6120355129241943, "lr": 0.00036238709376109653, "tps": 15025, "wall": 31343.1} {"step": 7186, "train_loss": 3.6408324241638184, "lr": 0.0003623753727572274, "tps": 15025, "wall": 31347.9} {"step": 7187, "train_loss": 3.5920844078063965, "lr": 0.0003623636501405223, "tps": 15024, "wall": 31352.8} {"step": 7188, "train_loss": 3.665496349334717, "lr": 0.0003623519259111141, "tps": 15024, "wall": 31357.7} {"step": 7189, "train_loss": 3.725637197494507, "lr": 0.0003623402000691356, "tps": 15024, "wall": 31362.5} {"step": 7190, "train_loss": 3.676906108856201, "lr": 0.0003623284726147196, "tps": 15024, "wall": 31367.4} {"step": 7191, "train_loss": 3.597587823867798, "lr": 0.00036231674354799895, "tps": 15023, "wall": 31372.3} {"step": 7192, "train_loss": 3.6833152770996094, "lr": 0.00036230501286910655, "tps": 15023, "wall": 31377.2} {"step": 7193, "train_loss": 3.591998338699341, "lr": 0.00036229328057817525, "tps": 15023, "wall": 31382.1} {"step": 7194, "train_loss": 3.549154043197632, "lr": 0.00036228154667533797, "tps": 15023, "wall": 31386.9} {"step": 7195, "train_loss": 3.6176199913024902, "lr": 0.00036226981116072764, "tps": 15022, "wall": 31391.8} {"step": 7196, "train_loss": 3.644073009490967, "lr": 0.0003622580740344772, "tps": 15022, "wall": 31396.6} {"step": 7197, "train_loss": 3.62981915473938, "lr": 0.0003622463352967196, "tps": 15022, "wall": 31401.5} {"step": 7198, "train_loss": 3.645123243331909, "lr": 0.0003622345949475878, "tps": 15022, "wall": 31406.4} {"step": 7199, "train_loss": 3.648447275161743, "lr": 0.0003622228529872148, "tps": 15021, "wall": 31411.2} {"step": 7200, "train_loss": 3.7331082820892334, "lr": 0.0003622111094157337, "tps": 15021, "wall": 31416.1} {"step": 7201, "train_loss": 3.6674211025238037, "lr": 0.0003621993642332774, "tps": 15021, "wall": 31421.0} {"step": 7202, "train_loss": 3.5963892936706543, "lr": 0.000362187617439979, "tps": 15021, "wall": 31425.8} {"step": 7203, "train_loss": 3.536938428878784, "lr": 0.0003621758690359716, "tps": 15021, "wall": 31430.7} {"step": 7204, "train_loss": 3.7086973190307617, "lr": 0.0003621641190213883, "tps": 15020, "wall": 31435.7} {"step": 7205, "train_loss": 3.662194013595581, "lr": 0.0003621523673963621, "tps": 15020, "wall": 31440.5} {"step": 7206, "train_loss": 3.623192548751831, "lr": 0.00036214061416102623, "tps": 15020, "wall": 31445.4} {"step": 7207, "train_loss": 3.592930316925049, "lr": 0.0003621288593155138, "tps": 15020, "wall": 31450.3} {"step": 7208, "train_loss": 3.5143771171569824, "lr": 0.0003621171028599579, "tps": 15019, "wall": 31455.1} {"step": 7209, "train_loss": 3.6716628074645996, "lr": 0.00036210534479449183, "tps": 15019, "wall": 31460.0} {"step": 7210, "train_loss": 3.678593397140503, "lr": 0.0003620935851192487, "tps": 15019, "wall": 31464.9} {"step": 7211, "train_loss": 3.632850170135498, "lr": 0.00036208182383436183, "tps": 15019, "wall": 31469.8} {"step": 7212, "train_loss": 3.6341114044189453, "lr": 0.0003620700609399642, "tps": 15018, "wall": 31474.6} {"step": 7213, "train_loss": 3.64119291305542, "lr": 0.0003620582964361894, "tps": 15018, "wall": 31479.5} {"step": 7214, "train_loss": 3.6221694946289062, "lr": 0.00036204653032317045, "tps": 15018, "wall": 31484.4} {"step": 7215, "train_loss": 3.5710246562957764, "lr": 0.0003620347626010408, "tps": 15018, "wall": 31489.2} {"step": 7216, "train_loss": 3.7154178619384766, "lr": 0.00036202299326993357, "tps": 15017, "wall": 31494.2} {"step": 7217, "train_loss": 3.6591031551361084, "lr": 0.00036201122232998225, "tps": 15017, "wall": 31499.0} {"step": 7218, "train_loss": 3.5720629692077637, "lr": 0.0003619994497813201, "tps": 15017, "wall": 31503.9} {"step": 7219, "train_loss": 3.682039499282837, "lr": 0.0003619876756240805, "tps": 15017, "wall": 31508.7} {"step": 7220, "train_loss": 3.624162197113037, "lr": 0.0003619758998583969, "tps": 15016, "wall": 31513.6} {"step": 7221, "train_loss": 3.636108875274658, "lr": 0.00036196412248440255, "tps": 15016, "wall": 31518.5} {"step": 7222, "train_loss": 3.6793997287750244, "lr": 0.00036195234350223097, "tps": 15016, "wall": 31523.3} {"step": 7223, "train_loss": 3.5748636722564697, "lr": 0.0003619405629120155, "tps": 15016, "wall": 31528.2} {"step": 7224, "train_loss": 3.6448867321014404, "lr": 0.0003619287807138897, "tps": 15015, "wall": 31533.0} {"step": 7225, "train_loss": 3.623349189758301, "lr": 0.00036191699690798704, "tps": 15015, "wall": 31537.9} {"step": 7226, "train_loss": 3.5645089149475098, "lr": 0.0003619052114944409, "tps": 15015, "wall": 31542.8} {"step": 7227, "train_loss": 3.5830636024475098, "lr": 0.00036189342447338484, "tps": 15015, "wall": 31547.7} {"step": 7228, "train_loss": 3.6445484161376953, "lr": 0.00036188163584495247, "tps": 15014, "wall": 31552.5} {"step": 7229, "train_loss": 3.5595550537109375, "lr": 0.00036186984560927717, "tps": 15014, "wall": 31557.5} {"step": 7230, "train_loss": 3.6845703125, "lr": 0.0003618580537664926, "tps": 15014, "wall": 31562.3} {"step": 7231, "train_loss": 3.5875332355499268, "lr": 0.00036184626031673234, "tps": 15014, "wall": 31567.2} {"step": 7232, "train_loss": 3.5637612342834473, "lr": 0.00036183446526012996, "tps": 15013, "wall": 31572.1} {"step": 7233, "train_loss": 3.637556791305542, "lr": 0.0003618226685968191, "tps": 15013, "wall": 31576.9} {"step": 7234, "train_loss": 3.5259952545166016, "lr": 0.00036181087032693336, "tps": 15013, "wall": 31581.8} {"step": 7235, "train_loss": 3.65132474899292, "lr": 0.0003617990704506064, "tps": 15013, "wall": 31586.7} {"step": 7236, "train_loss": 3.7114334106445312, "lr": 0.00036178726896797194, "tps": 15013, "wall": 31591.5} {"step": 7237, "train_loss": 3.518362522125244, "lr": 0.00036177546587916364, "tps": 15012, "wall": 31596.4} {"step": 7238, "train_loss": 3.5629491806030273, "lr": 0.00036176366118431517, "tps": 15012, "wall": 31601.3} {"step": 7239, "train_loss": 3.5539157390594482, "lr": 0.0003617518548835602, "tps": 15012, "wall": 31606.2} {"step": 7240, "train_loss": 3.6382880210876465, "lr": 0.00036174004697703266, "tps": 15012, "wall": 31611.0} {"step": 7241, "train_loss": 3.6704134941101074, "lr": 0.00036172823746486615, "tps": 15011, "wall": 31615.9} {"step": 7242, "train_loss": 3.632993698120117, "lr": 0.00036171642634719446, "tps": 15011, "wall": 31620.8} {"step": 7243, "train_loss": 3.6363515853881836, "lr": 0.00036170461362415146, "tps": 15011, "wall": 31625.7} {"step": 7244, "train_loss": 3.5218183994293213, "lr": 0.00036169279929587096, "tps": 15011, "wall": 31630.5} {"step": 7245, "train_loss": 3.715602159500122, "lr": 0.00036168098336248673, "tps": 15010, "wall": 31635.4} {"step": 7246, "train_loss": 3.714663505554199, "lr": 0.0003616691658241327, "tps": 15010, "wall": 31640.3} {"step": 7247, "train_loss": 3.669466257095337, "lr": 0.00036165734668094267, "tps": 15010, "wall": 31645.2} {"step": 7248, "train_loss": 3.645137310028076, "lr": 0.00036164552593305054, "tps": 15010, "wall": 31650.0} {"step": 7249, "train_loss": 3.5865578651428223, "lr": 0.00036163370358059015, "tps": 15009, "wall": 31654.9} {"step": 7250, "train_loss": 3.5471982955932617, "lr": 0.00036162187962369567, "tps": 15009, "wall": 31659.7} {"step": 7251, "train_loss": 3.5447068214416504, "lr": 0.0003616100540625008, "tps": 15009, "wall": 31664.6} {"step": 7252, "train_loss": 3.6810741424560547, "lr": 0.00036159822689713956, "tps": 15009, "wall": 31669.5} {"step": 7253, "train_loss": 3.6148948669433594, "lr": 0.0003615863981277459, "tps": 15008, "wall": 31674.4} {"step": 7254, "train_loss": 3.6787731647491455, "lr": 0.00036157456775445394, "tps": 15008, "wall": 31679.3} {"step": 7255, "train_loss": 3.6721179485321045, "lr": 0.00036156273577739756, "tps": 15008, "wall": 31684.2} {"step": 7256, "train_loss": 3.5793240070343018, "lr": 0.0003615509021967109, "tps": 15008, "wall": 31689.0} {"step": 7257, "train_loss": 3.7748122215270996, "lr": 0.00036153906701252793, "tps": 15007, "wall": 31693.9} {"step": 7258, "train_loss": 3.476893424987793, "lr": 0.00036152723022498285, "tps": 15007, "wall": 31698.9} {"step": 7259, "train_loss": 3.600261926651001, "lr": 0.0003615153918342095, "tps": 15007, "wall": 31703.7} {"step": 7260, "train_loss": 3.6623055934906006, "lr": 0.00036150355184034225, "tps": 15007, "wall": 31708.6} {"step": 7261, "train_loss": 3.605621814727783, "lr": 0.00036149171024351507, "tps": 15006, "wall": 31713.5} {"step": 7262, "train_loss": 3.7073354721069336, "lr": 0.0003614798670438621, "tps": 15006, "wall": 31718.3} {"step": 7263, "train_loss": 3.6939053535461426, "lr": 0.0003614680222415176, "tps": 15006, "wall": 31723.2} {"step": 7264, "train_loss": 3.5972347259521484, "lr": 0.0003614561758366157, "tps": 15006, "wall": 31728.1} {"step": 7265, "train_loss": 3.5518617630004883, "lr": 0.00036144432782929056, "tps": 15006, "wall": 31732.9} {"step": 7266, "train_loss": 3.6163737773895264, "lr": 0.0003614324782196764, "tps": 15005, "wall": 31737.8} {"step": 7267, "train_loss": 3.5316367149353027, "lr": 0.00036142062700790745, "tps": 15005, "wall": 31742.7} {"step": 7268, "train_loss": 3.60007905960083, "lr": 0.000361408774194118, "tps": 15005, "wall": 31747.5} {"step": 7269, "train_loss": 3.6243016719818115, "lr": 0.0003613969197784424, "tps": 15005, "wall": 31752.4} {"step": 7270, "train_loss": 3.6502602100372314, "lr": 0.0003613850637610148, "tps": 15004, "wall": 31757.3} {"step": 7271, "train_loss": 3.6388919353485107, "lr": 0.00036137320614196955, "tps": 15004, "wall": 31762.1} {"step": 7272, "train_loss": 3.6239395141601562, "lr": 0.0003613613469214409, "tps": 15004, "wall": 31767.0} {"step": 7273, "train_loss": 3.6566483974456787, "lr": 0.00036134948609956334, "tps": 15004, "wall": 31771.9} {"step": 7274, "train_loss": 3.6469531059265137, "lr": 0.00036133762367647113, "tps": 15003, "wall": 31776.7} {"step": 7275, "train_loss": 3.6422741413116455, "lr": 0.00036132575965229865, "tps": 15003, "wall": 31781.6} {"step": 7276, "train_loss": 3.6387908458709717, "lr": 0.00036131389402718035, "tps": 15003, "wall": 31786.5} {"step": 7277, "train_loss": 3.6744132041931152, "lr": 0.00036130202680125065, "tps": 15003, "wall": 31791.3} {"step": 7278, "train_loss": 3.590043783187866, "lr": 0.00036129015797464384, "tps": 15002, "wall": 31796.2} {"step": 7279, "train_loss": 3.5242080688476562, "lr": 0.0003612782875474946, "tps": 15002, "wall": 31801.1} {"step": 7280, "train_loss": 3.6539742946624756, "lr": 0.00036126641551993715, "tps": 15002, "wall": 31806.0} {"step": 7281, "train_loss": 3.6374928951263428, "lr": 0.0003612545418921062, "tps": 15002, "wall": 31810.8} {"step": 7282, "train_loss": 3.6591241359710693, "lr": 0.0003612426666641361, "tps": 15001, "wall": 31815.7} {"step": 7283, "train_loss": 3.52329683303833, "lr": 0.0003612307898361615, "tps": 15001, "wall": 31820.5} {"step": 7284, "train_loss": 3.5958023071289062, "lr": 0.0003612189114083168, "tps": 15001, "wall": 31825.4} {"step": 7285, "train_loss": 3.6041932106018066, "lr": 0.00036120703138073666, "tps": 15001, "wall": 31830.3} {"step": 7286, "train_loss": 3.6517128944396973, "lr": 0.00036119514975355567, "tps": 15001, "wall": 31835.1} {"step": 7287, "train_loss": 3.6138453483581543, "lr": 0.0003611832665269083, "tps": 15000, "wall": 31840.0} {"step": 7288, "train_loss": 3.6353073120117188, "lr": 0.0003611713817009293, "tps": 15000, "wall": 31844.9} {"step": 7289, "train_loss": 3.6011428833007812, "lr": 0.00036115949527575325, "tps": 15000, "wall": 31849.7} {"step": 7290, "train_loss": 3.601426362991333, "lr": 0.0003611476072515148, "tps": 15000, "wall": 31854.7} {"step": 7291, "train_loss": 3.5474140644073486, "lr": 0.00036113571762834857, "tps": 14999, "wall": 31859.5} {"step": 7292, "train_loss": 3.63845157623291, "lr": 0.0003611238264063894, "tps": 14999, "wall": 31864.4} {"step": 7293, "train_loss": 3.713198184967041, "lr": 0.00036111193358577185, "tps": 14999, "wall": 31869.3} {"step": 7294, "train_loss": 3.7591493129730225, "lr": 0.0003611000391666306, "tps": 14999, "wall": 31874.1} {"step": 7295, "train_loss": 3.5364484786987305, "lr": 0.0003610881431491005, "tps": 14998, "wall": 31879.0} {"step": 7296, "train_loss": 3.6035759449005127, "lr": 0.00036107624553331633, "tps": 14998, "wall": 31883.8} {"step": 7297, "train_loss": 3.668574333190918, "lr": 0.00036106434631941284, "tps": 14998, "wall": 31888.7} {"step": 7298, "train_loss": 3.5852842330932617, "lr": 0.00036105244550752475, "tps": 14998, "wall": 31893.6} {"step": 7299, "train_loss": 3.4952712059020996, "lr": 0.000361040543097787, "tps": 14998, "wall": 31898.4} {"step": 7300, "train_loss": 3.6413357257843018, "lr": 0.00036102863909033426, "tps": 14997, "wall": 31903.3} {"step": 7301, "train_loss": 3.6203277111053467, "lr": 0.0003610167334853015, "tps": 14997, "wall": 31908.2} {"step": 7302, "train_loss": 3.580191135406494, "lr": 0.0003610048262828235, "tps": 14997, "wall": 31913.0} {"step": 7303, "train_loss": 3.5949177742004395, "lr": 0.00036099291748303527, "tps": 14997, "wall": 31917.9} {"step": 7304, "train_loss": 3.5364623069763184, "lr": 0.0003609810070860717, "tps": 14996, "wall": 31922.8} {"step": 7305, "train_loss": 3.5661704540252686, "lr": 0.0003609690950920675, "tps": 14996, "wall": 31927.6} {"step": 7306, "train_loss": 3.5570859909057617, "lr": 0.00036095718150115793, "tps": 14996, "wall": 31932.5} {"step": 7307, "train_loss": 3.6385340690612793, "lr": 0.0003609452663134776, "tps": 14996, "wall": 31937.3} {"step": 7308, "train_loss": 3.720916748046875, "lr": 0.0003609333495291618, "tps": 14995, "wall": 31942.2} {"step": 7309, "train_loss": 3.6080684661865234, "lr": 0.00036092143114834543, "tps": 14995, "wall": 31947.0} {"step": 7310, "train_loss": 3.5705647468566895, "lr": 0.00036090951117116336, "tps": 14995, "wall": 31951.9} {"step": 7311, "train_loss": 3.493854284286499, "lr": 0.0003608975895977508, "tps": 14995, "wall": 31956.8} {"step": 7312, "train_loss": 3.702807903289795, "lr": 0.00036088566642824264, "tps": 14995, "wall": 31961.6} {"step": 7313, "train_loss": 3.5766894817352295, "lr": 0.00036087374166277405, "tps": 14994, "wall": 31966.5} {"step": 7314, "train_loss": 3.6587870121002197, "lr": 0.0003608618153014801, "tps": 14994, "wall": 31971.6} {"step": 7315, "train_loss": 3.4915146827697754, "lr": 0.0003608498873444959, "tps": 14993, "wall": 31977.1} {"step": 7316, "train_loss": 3.6090142726898193, "lr": 0.0003608379577919566, "tps": 14993, "wall": 31982.2} {"step": 7317, "train_loss": 3.5500411987304688, "lr": 0.0003608260266439972, "tps": 14993, "wall": 31987.1} {"step": 7318, "train_loss": 3.7110486030578613, "lr": 0.000360814093900753, "tps": 14993, "wall": 31991.9} {"step": 7319, "train_loss": 3.5547776222229004, "lr": 0.00036080215956235917, "tps": 14992, "wall": 31996.8} {"step": 7320, "train_loss": 3.6136245727539062, "lr": 0.0003607902236289508, "tps": 14992, "wall": 32001.7} {"step": 7321, "train_loss": 3.624516010284424, "lr": 0.00036077828610066315, "tps": 14992, "wall": 32006.6} {"step": 7322, "train_loss": 3.614567279815674, "lr": 0.0003607663469776315, "tps": 14992, "wall": 32011.4} {"step": 7323, "train_loss": 3.6820902824401855, "lr": 0.000360754406259991, "tps": 14991, "wall": 32016.3} {"step": 7324, "train_loss": 3.597818374633789, "lr": 0.0003607424639478771, "tps": 14991, "wall": 32021.1} {"step": 7325, "train_loss": 3.554638385772705, "lr": 0.00036073052004142477, "tps": 14991, "wall": 32026.0} {"step": 7326, "train_loss": 3.572843074798584, "lr": 0.00036071857454076967, "tps": 14991, "wall": 32030.8} {"step": 7327, "train_loss": 3.5188236236572266, "lr": 0.00036070662744604686, "tps": 14990, "wall": 32035.7} {"step": 7328, "train_loss": 3.6498193740844727, "lr": 0.0003606946787573917, "tps": 14990, "wall": 32040.6} {"step": 7329, "train_loss": 3.605870246887207, "lr": 0.0003606827284749397, "tps": 14990, "wall": 32045.5} {"step": 7330, "train_loss": 3.5677032470703125, "lr": 0.0003606707765988261, "tps": 14990, "wall": 32050.3} {"step": 7331, "train_loss": 3.726407289505005, "lr": 0.0003606588231291864, "tps": 14990, "wall": 32055.2} {"step": 7332, "train_loss": 3.638843297958374, "lr": 0.0003606468680661559, "tps": 14989, "wall": 32060.0} {"step": 7333, "train_loss": 3.5661585330963135, "lr": 0.0003606349114098701, "tps": 14989, "wall": 32064.9} {"step": 7334, "train_loss": 3.6816415786743164, "lr": 0.0003606229531604643, "tps": 14989, "wall": 32069.7} {"step": 7335, "train_loss": 3.5253186225891113, "lr": 0.0003606109933180742, "tps": 14989, "wall": 32074.6} {"step": 7336, "train_loss": 3.6388585567474365, "lr": 0.0003605990318828351, "tps": 14988, "wall": 32079.4} {"step": 7337, "train_loss": 3.5754146575927734, "lr": 0.00036058706885488257, "tps": 14988, "wall": 32084.3} {"step": 7338, "train_loss": 3.544609308242798, "lr": 0.0003605751042343521, "tps": 14988, "wall": 32089.2} {"step": 7339, "train_loss": 3.7806105613708496, "lr": 0.00036056313802137926, "tps": 14988, "wall": 32094.1} {"step": 7340, "train_loss": 3.7170121669769287, "lr": 0.0003605511702160996, "tps": 14988, "wall": 32099.0} {"step": 7341, "train_loss": 3.624084949493408, "lr": 0.0003605392008186487, "tps": 14987, "wall": 32103.8} {"step": 7342, "train_loss": 3.593484878540039, "lr": 0.00036052722982916213, "tps": 14987, "wall": 32108.7} {"step": 7343, "train_loss": 3.5193979740142822, "lr": 0.0003605152572477755, "tps": 14987, "wall": 32113.5} {"step": 7344, "train_loss": 3.686721086502075, "lr": 0.0003605032830746244, "tps": 14987, "wall": 32118.4} {"step": 7345, "train_loss": 3.5621938705444336, "lr": 0.0003604913073098445, "tps": 14986, "wall": 32123.2} {"step": 7346, "train_loss": 3.599419116973877, "lr": 0.0003604793299535715, "tps": 14986, "wall": 32128.1} {"step": 7347, "train_loss": 3.667189121246338, "lr": 0.00036046735100594106, "tps": 14986, "wall": 32132.9} {"step": 7348, "train_loss": 3.528733730316162, "lr": 0.00036045537046708884, "tps": 14986, "wall": 32137.8} {"step": 7349, "train_loss": 3.573000907897949, "lr": 0.0003604433883371506, "tps": 14986, "wall": 32142.6} {"step": 7350, "train_loss": 3.5624988079071045, "lr": 0.0003604314046162621, "tps": 14985, "wall": 32147.5} {"step": 7351, "train_loss": 3.529928684234619, "lr": 0.00036041941930455896, "tps": 14985, "wall": 32152.3} {"step": 7352, "train_loss": 3.6617655754089355, "lr": 0.0003604074324021771, "tps": 14985, "wall": 32157.3} {"step": 7353, "train_loss": 3.5868735313415527, "lr": 0.0003603954439092522, "tps": 14985, "wall": 32162.1} {"step": 7354, "train_loss": 3.6272716522216797, "lr": 0.00036038345382592013, "tps": 14984, "wall": 32167.0} {"step": 7355, "train_loss": 3.639927864074707, "lr": 0.0003603714621523168, "tps": 14984, "wall": 32171.8} {"step": 7356, "train_loss": 3.6440024375915527, "lr": 0.00036035946888857785, "tps": 14984, "wall": 32176.7} {"step": 7357, "train_loss": 3.6486175060272217, "lr": 0.0003603474740348392, "tps": 14984, "wall": 32181.5} {"step": 7358, "train_loss": 3.609713554382324, "lr": 0.0003603354775912369, "tps": 14983, "wall": 32186.4} {"step": 7359, "train_loss": 3.5141148567199707, "lr": 0.00036032347955790664, "tps": 14983, "wall": 32191.2} {"step": 7360, "train_loss": 3.562854290008545, "lr": 0.00036031147993498443, "tps": 14983, "wall": 32196.1} {"step": 7361, "train_loss": 3.657677412033081, "lr": 0.00036029947872260617, "tps": 14983, "wall": 32200.9} {"step": 7362, "train_loss": 3.693392753601074, "lr": 0.0003602874759209078, "tps": 14983, "wall": 32205.8} {"step": 7363, "train_loss": 3.611112117767334, "lr": 0.0003602754715300254, "tps": 14982, "wall": 32210.6} {"step": 7364, "train_loss": 3.6255083084106445, "lr": 0.00036026346555009483, "tps": 14982, "wall": 32215.5} {"step": 7365, "train_loss": 3.6003360748291016, "lr": 0.0003602514579812521, "tps": 14982, "wall": 32220.4} {"step": 7366, "train_loss": 3.629798173904419, "lr": 0.0003602394488236333, "tps": 14982, "wall": 32225.3} {"step": 7367, "train_loss": 3.5700337886810303, "lr": 0.0003602274380773744, "tps": 14981, "wall": 32230.1} {"step": 7368, "train_loss": 3.531470775604248, "lr": 0.0003602154257426115, "tps": 14981, "wall": 32234.9} {"step": 7369, "train_loss": 3.5989906787872314, "lr": 0.00036020341181948077, "tps": 14981, "wall": 32239.8} {"step": 7370, "train_loss": 3.568384885787964, "lr": 0.00036019139630811815, "tps": 14981, "wall": 32244.6} {"step": 7371, "train_loss": 3.5736820697784424, "lr": 0.0003601793792086598, "tps": 14981, "wall": 32249.5} {"step": 7372, "train_loss": 3.585447311401367, "lr": 0.0003601673605212418, "tps": 14980, "wall": 32254.4} {"step": 7373, "train_loss": 3.527857780456543, "lr": 0.0003601553402460004, "tps": 14980, "wall": 32259.2} {"step": 7374, "train_loss": 3.63586688041687, "lr": 0.0003601433183830717, "tps": 14980, "wall": 32264.1} {"step": 7375, "train_loss": 3.5766329765319824, "lr": 0.000360131294932592, "tps": 14980, "wall": 32268.9} {"step": 7376, "train_loss": 3.5012683868408203, "lr": 0.0003601192698946973, "tps": 14979, "wall": 32273.8} {"step": 7377, "train_loss": 3.6014318466186523, "lr": 0.000360107243269524, "tps": 14979, "wall": 32278.7} {"step": 7378, "train_loss": 3.6624608039855957, "lr": 0.00036009521505720826, "tps": 14979, "wall": 32283.5} {"step": 7379, "train_loss": 3.52661395072937, "lr": 0.0003600831852578863, "tps": 14979, "wall": 32288.4} {"step": 7380, "train_loss": 3.5877485275268555, "lr": 0.0003600711538716945, "tps": 14979, "wall": 32293.2} {"step": 7381, "train_loss": 3.643826961517334, "lr": 0.00036005912089876905, "tps": 14978, "wall": 32298.1} {"step": 7382, "train_loss": 3.6569182872772217, "lr": 0.00036004708633924636, "tps": 14978, "wall": 32302.9} {"step": 7383, "train_loss": 3.6174376010894775, "lr": 0.0003600350501932626, "tps": 14978, "wall": 32307.8} {"step": 7384, "train_loss": 3.589034080505371, "lr": 0.0003600230124609543, "tps": 14978, "wall": 32312.6} {"step": 7385, "train_loss": 3.547262191772461, "lr": 0.00036001097314245775, "tps": 14977, "wall": 32317.5} {"step": 7386, "train_loss": 3.5864152908325195, "lr": 0.00035999893223790926, "tps": 14977, "wall": 32322.3} {"step": 7387, "train_loss": 3.6201932430267334, "lr": 0.0003599868897474453, "tps": 14977, "wall": 32327.2} {"step": 7388, "train_loss": 3.5801749229431152, "lr": 0.0003599748456712023, "tps": 14977, "wall": 32332.1} {"step": 7389, "train_loss": 3.5483908653259277, "lr": 0.0003599628000093166, "tps": 14977, "wall": 32336.9} {"step": 7390, "train_loss": 3.566464900970459, "lr": 0.00035995075276192484, "tps": 14976, "wall": 32341.8} {"step": 7391, "train_loss": 3.5786168575286865, "lr": 0.00035993870392916335, "tps": 14976, "wall": 32346.7} {"step": 7392, "train_loss": 3.655449390411377, "lr": 0.0003599266535111686, "tps": 14976, "wall": 32351.5} {"step": 7393, "train_loss": 3.592468738555908, "lr": 0.0003599146015080772, "tps": 14976, "wall": 32356.4} {"step": 7394, "train_loss": 3.5705878734588623, "lr": 0.00035990254792002565, "tps": 14975, "wall": 32361.2} {"step": 7395, "train_loss": 3.5879085063934326, "lr": 0.00035989049274715045, "tps": 14975, "wall": 32366.0} {"step": 7396, "train_loss": 3.593719959259033, "lr": 0.00035987843598958813, "tps": 14975, "wall": 32370.9} {"step": 7397, "train_loss": 3.5993075370788574, "lr": 0.0003598663776474754, "tps": 14975, "wall": 32375.8} {"step": 7398, "train_loss": 3.6586389541625977, "lr": 0.00035985431772094867, "tps": 14975, "wall": 32380.6} {"step": 7399, "train_loss": 3.623694658279419, "lr": 0.0003598422562101447, "tps": 14974, "wall": 32385.5} {"step": 7400, "train_loss": 3.5869524478912354, "lr": 0.00035983019311520016, "tps": 14974, "wall": 32390.3} {"step": 7401, "train_loss": 3.6392085552215576, "lr": 0.0003598181284362516, "tps": 14974, "wall": 32395.2} {"step": 7402, "train_loss": 3.6979010105133057, "lr": 0.0003598060621734356, "tps": 14974, "wall": 32400.0} {"step": 7403, "train_loss": 3.5470199584960938, "lr": 0.00035979399432688907, "tps": 14973, "wall": 32404.9} {"step": 7404, "train_loss": 3.6774277687072754, "lr": 0.00035978192489674864, "tps": 14973, "wall": 32409.7} {"step": 7405, "train_loss": 3.5983872413635254, "lr": 0.000359769853883151, "tps": 14973, "wall": 32414.6} {"step": 7406, "train_loss": 3.5931239128112793, "lr": 0.00035975778128623286, "tps": 14973, "wall": 32419.4} {"step": 7407, "train_loss": 3.5360653400421143, "lr": 0.00035974570710613094, "tps": 14973, "wall": 32424.3} {"step": 7408, "train_loss": 3.6625561714172363, "lr": 0.00035973363134298217, "tps": 14972, "wall": 32429.2} {"step": 7409, "train_loss": 3.601203441619873, "lr": 0.0003597215539969232, "tps": 14972, "wall": 32434.0} {"step": 7410, "train_loss": 3.6327285766601562, "lr": 0.00035970947506809103, "tps": 14972, "wall": 32438.8} {"step": 7411, "train_loss": 3.624204397201538, "lr": 0.00035969739455662226, "tps": 14972, "wall": 32443.7} {"step": 7412, "train_loss": 3.5122787952423096, "lr": 0.00035968531246265395, "tps": 14971, "wall": 32448.5} {"step": 7413, "train_loss": 3.586761474609375, "lr": 0.0003596732287863228, "tps": 14971, "wall": 32453.4} {"step": 7414, "train_loss": 3.610367774963379, "lr": 0.0003596611435277657, "tps": 14971, "wall": 32458.3} {"step": 7415, "train_loss": 3.586282968521118, "lr": 0.00035964905668711965, "tps": 14971, "wall": 32463.1} {"step": 7416, "train_loss": 3.596066951751709, "lr": 0.0003596369682645216, "tps": 14971, "wall": 32467.9} {"step": 7417, "train_loss": 3.5457170009613037, "lr": 0.0003596248782601083, "tps": 14970, "wall": 32472.8} {"step": 7418, "train_loss": 3.6480839252471924, "lr": 0.00035961278667401693, "tps": 14970, "wall": 32477.6} {"step": 7419, "train_loss": 3.7830820083618164, "lr": 0.00035960069350638433, "tps": 14970, "wall": 32482.5} {"step": 7420, "train_loss": 3.5493743419647217, "lr": 0.0003595885987573475, "tps": 14970, "wall": 32487.3} {"step": 7421, "train_loss": 3.6154401302337646, "lr": 0.0003595765024270435, "tps": 14969, "wall": 32492.2} {"step": 7422, "train_loss": 3.5904133319854736, "lr": 0.0003595644045156093, "tps": 14969, "wall": 32497.1} {"step": 7423, "train_loss": 3.531407117843628, "lr": 0.000359552305023182, "tps": 14969, "wall": 32501.9} {"step": 7424, "train_loss": 3.656606674194336, "lr": 0.0003595402039498986, "tps": 14969, "wall": 32506.8} {"step": 7425, "train_loss": 3.681279420852661, "lr": 0.0003595281012958962, "tps": 14969, "wall": 32511.6} {"step": 7426, "train_loss": 3.5562870502471924, "lr": 0.00035951599706131207, "tps": 14968, "wall": 32516.5} {"step": 7427, "train_loss": 3.556673765182495, "lr": 0.00035950389124628305, "tps": 14968, "wall": 32521.4} {"step": 7428, "train_loss": 3.5743680000305176, "lr": 0.0003594917838509464, "tps": 14968, "wall": 32526.2} {"step": 7429, "train_loss": 3.6049768924713135, "lr": 0.00035947967487543934, "tps": 14968, "wall": 32531.0} {"step": 7430, "train_loss": 3.5887317657470703, "lr": 0.00035946756431989895, "tps": 14968, "wall": 32535.9} {"step": 7431, "train_loss": 3.5678296089172363, "lr": 0.00035945545218446246, "tps": 14967, "wall": 32540.7} {"step": 7432, "train_loss": 3.5660653114318848, "lr": 0.000359443338469267, "tps": 14967, "wall": 32545.6} {"step": 7433, "train_loss": 3.555569887161255, "lr": 0.0003594312231744499, "tps": 14967, "wall": 32550.4} {"step": 7434, "train_loss": 3.6411824226379395, "lr": 0.0003594191063001484, "tps": 14967, "wall": 32555.2} {"step": 7435, "train_loss": 3.60068416595459, "lr": 0.0003594069878464997, "tps": 14966, "wall": 32560.1} {"step": 7436, "train_loss": 3.566828966140747, "lr": 0.00035939486781364107, "tps": 14966, "wall": 32564.9} {"step": 7437, "train_loss": 3.560746669769287, "lr": 0.00035938274620170985, "tps": 14966, "wall": 32569.8} {"step": 7438, "train_loss": 3.539299726486206, "lr": 0.00035937062301084335, "tps": 14966, "wall": 32574.7} {"step": 7439, "train_loss": 3.6237258911132812, "lr": 0.00035935849824117883, "tps": 14966, "wall": 32579.5} {"step": 7440, "train_loss": 3.6171770095825195, "lr": 0.0003593463718928538, "tps": 14965, "wall": 32584.4} {"step": 7441, "train_loss": 3.5229909420013428, "lr": 0.0003593342439660055, "tps": 14965, "wall": 32589.2} {"step": 7442, "train_loss": 3.5025131702423096, "lr": 0.0003593221144607713, "tps": 14965, "wall": 32594.1} {"step": 7443, "train_loss": 3.475924015045166, "lr": 0.00035930998337728866, "tps": 14965, "wall": 32598.9} {"step": 7444, "train_loss": 3.582763671875, "lr": 0.00035929785071569506, "tps": 14964, "wall": 32603.8} {"step": 7445, "train_loss": 3.539194107055664, "lr": 0.0003592857164761278, "tps": 14964, "wall": 32608.6} {"step": 7446, "train_loss": 3.553692579269409, "lr": 0.00035927358065872446, "tps": 14964, "wall": 32613.5} {"step": 7447, "train_loss": 3.5221662521362305, "lr": 0.00035926144326362246, "tps": 14964, "wall": 32618.3} {"step": 7448, "train_loss": 3.575387954711914, "lr": 0.00035924930429095925, "tps": 14964, "wall": 32623.1} {"step": 7449, "train_loss": 3.510361909866333, "lr": 0.0003592371637408724, "tps": 14963, "wall": 32628.0} {"step": 7450, "train_loss": 3.6069295406341553, "lr": 0.0003592250216134994, "tps": 14963, "wall": 32632.8} {"step": 7451, "train_loss": 3.5849719047546387, "lr": 0.0003592128779089779, "tps": 14963, "wall": 32637.7} {"step": 7452, "train_loss": 3.5949764251708984, "lr": 0.0003592007326274454, "tps": 14963, "wall": 32642.6} {"step": 7453, "train_loss": 3.594468355178833, "lr": 0.0003591885857690394, "tps": 14963, "wall": 32647.4} {"step": 7454, "train_loss": 3.608431816101074, "lr": 0.00035917643733389756, "tps": 14962, "wall": 32652.3} {"step": 7455, "train_loss": 3.507854700088501, "lr": 0.0003591642873221575, "tps": 14962, "wall": 32657.1} {"step": 7456, "train_loss": 3.618504047393799, "lr": 0.00035915213573395696, "tps": 14962, "wall": 32662.0} {"step": 7457, "train_loss": 3.641176223754883, "lr": 0.00035913998256943344, "tps": 14962, "wall": 32666.8} {"step": 7458, "train_loss": 3.668278217315674, "lr": 0.0003591278278287246, "tps": 14962, "wall": 32671.6} {"step": 7459, "train_loss": 3.5833094120025635, "lr": 0.00035911567151196834, "tps": 14961, "wall": 32676.5} {"step": 7460, "train_loss": 3.4966912269592285, "lr": 0.0003591035136193022, "tps": 14961, "wall": 32681.3} {"step": 7461, "train_loss": 3.549015522003174, "lr": 0.0003590913541508639, "tps": 14961, "wall": 32686.1} {"step": 7462, "train_loss": 3.5972280502319336, "lr": 0.0003590791931067912, "tps": 14961, "wall": 32691.0} {"step": 7463, "train_loss": 3.7056093215942383, "lr": 0.0003590670304872218, "tps": 14960, "wall": 32695.9} {"step": 7464, "train_loss": 3.5980896949768066, "lr": 0.0003590548662922937, "tps": 14960, "wall": 32700.7} {"step": 7465, "train_loss": 3.5742883682250977, "lr": 0.0003590427005221445, "tps": 14960, "wall": 32705.5} {"step": 7466, "train_loss": 3.6211628913879395, "lr": 0.000359030533176912, "tps": 14960, "wall": 32710.4} {"step": 7467, "train_loss": 3.666123151779175, "lr": 0.00035901836425673416, "tps": 14960, "wall": 32715.2} {"step": 7468, "train_loss": 3.5301856994628906, "lr": 0.0003590061937617488, "tps": 14959, "wall": 32720.1} {"step": 7469, "train_loss": 3.6133229732513428, "lr": 0.0003589940216920937, "tps": 14959, "wall": 32724.9} {"step": 7470, "train_loss": 3.5560317039489746, "lr": 0.0003589818480479068, "tps": 14959, "wall": 32729.7} {"step": 7471, "train_loss": 3.5305349826812744, "lr": 0.00035896967282932605, "tps": 14959, "wall": 32734.6} {"step": 7472, "train_loss": 3.6294827461242676, "lr": 0.00035895749603648936, "tps": 14959, "wall": 32739.4} {"step": 7473, "train_loss": 3.560594081878662, "lr": 0.00035894531766953456, "tps": 14958, "wall": 32744.2} {"step": 7474, "train_loss": 3.6308298110961914, "lr": 0.0003589331377285997, "tps": 14958, "wall": 32749.1} {"step": 7475, "train_loss": 3.648730754852295, "lr": 0.0003589209562138228, "tps": 14958, "wall": 32754.0} {"step": 7476, "train_loss": 3.481346607208252, "lr": 0.0003589087731253417, "tps": 14958, "wall": 32758.8} {"step": 7477, "train_loss": 3.5753417015075684, "lr": 0.0003588965884632946, "tps": 14957, "wall": 32763.7} {"step": 7478, "train_loss": 3.5741331577301025, "lr": 0.0003588844022278193, "tps": 14957, "wall": 32768.5} {"step": 7479, "train_loss": 3.677748680114746, "lr": 0.00035887221441905406, "tps": 14957, "wall": 32773.3} {"step": 7480, "train_loss": 3.7060928344726562, "lr": 0.0003588600250371369, "tps": 14957, "wall": 32778.2} {"step": 7481, "train_loss": 3.5024399757385254, "lr": 0.00035884783408220584, "tps": 14957, "wall": 32783.0} {"step": 7482, "train_loss": 3.581089496612549, "lr": 0.00035883564155439896, "tps": 14956, "wall": 32787.8} {"step": 7483, "train_loss": 3.64460825920105, "lr": 0.0003588234474538545, "tps": 14956, "wall": 32792.7} {"step": 7484, "train_loss": 3.5876102447509766, "lr": 0.00035881125178071043, "tps": 14956, "wall": 32797.5} {"step": 7485, "train_loss": 3.573892593383789, "lr": 0.00035879905453510503, "tps": 14956, "wall": 32802.4} {"step": 7486, "train_loss": 3.589087963104248, "lr": 0.0003587868557171764, "tps": 14956, "wall": 32807.2} {"step": 7487, "train_loss": 3.5944080352783203, "lr": 0.0003587746553270628, "tps": 14955, "wall": 32812.1} {"step": 7488, "train_loss": 3.623880386352539, "lr": 0.00035876245336490236, "tps": 14955, "wall": 32816.9} {"step": 7489, "train_loss": 3.597874164581299, "lr": 0.0003587502498308334, "tps": 14955, "wall": 32821.8} {"step": 7490, "train_loss": 3.689657211303711, "lr": 0.0003587380447249941, "tps": 14955, "wall": 32826.6} {"step": 7491, "train_loss": 3.6113319396972656, "lr": 0.00035872583804752266, "tps": 14955, "wall": 32831.5} {"step": 7492, "train_loss": 3.5942111015319824, "lr": 0.0003587136297985574, "tps": 14954, "wall": 32836.3} {"step": 7493, "train_loss": 3.6236484050750732, "lr": 0.00035870141997823676, "tps": 14954, "wall": 32841.1} {"step": 7494, "train_loss": 3.5258026123046875, "lr": 0.00035868920858669884, "tps": 14954, "wall": 32846.0} {"step": 7495, "train_loss": 3.618525505065918, "lr": 0.0003586769956240821, "tps": 14954, "wall": 32850.9} {"step": 7496, "train_loss": 3.642927885055542, "lr": 0.0003586647810905248, "tps": 14953, "wall": 32855.7} {"step": 7497, "train_loss": 3.6297707557678223, "lr": 0.0003586525649861654, "tps": 14953, "wall": 32860.5} {"step": 7498, "train_loss": 3.6093173027038574, "lr": 0.00035864034731114227, "tps": 14953, "wall": 32865.4} {"step": 7499, "train_loss": 3.5250258445739746, "lr": 0.00035862812806559377, "tps": 14953, "wall": 32870.2} {"step": 7500, "train_loss": 3.668349266052246, "lr": 0.0003586159072496583, "tps": 14953, "wall": 32875.2} {"step": 7501, "train_loss": 3.48691463470459, "lr": 0.00035860368486347434, "tps": 14952, "wall": 32880.2} {"step": 7502, "train_loss": 3.6528284549713135, "lr": 0.0003585914609071804, "tps": 14952, "wall": 32885.0} {"step": 7503, "train_loss": 3.716446876525879, "lr": 0.0003585792353809148, "tps": 14952, "wall": 32889.8} {"step": 7504, "train_loss": 3.53603458404541, "lr": 0.00035856700828481615, "tps": 14952, "wall": 32894.7} {"step": 7505, "train_loss": 3.6311450004577637, "lr": 0.000358554779619023, "tps": 14952, "wall": 32899.5} {"step": 7506, "train_loss": 3.634953022003174, "lr": 0.00035854254938367375, "tps": 14951, "wall": 32904.3} {"step": 7507, "train_loss": 3.598416328430176, "lr": 0.00035853031757890704, "tps": 14951, "wall": 32909.2} {"step": 7508, "train_loss": 3.6448469161987305, "lr": 0.00035851808420486134, "tps": 14951, "wall": 32914.0} {"step": 7509, "train_loss": 3.63265323638916, "lr": 0.0003585058492616753, "tps": 14951, "wall": 32918.8} {"step": 7510, "train_loss": 3.6431186199188232, "lr": 0.0003584936127494876, "tps": 14950, "wall": 32923.7} {"step": 7511, "train_loss": 3.598351001739502, "lr": 0.00035848137466843664, "tps": 14950, "wall": 32928.5} {"step": 7512, "train_loss": 3.648630380630493, "lr": 0.0003584691350186613, "tps": 14950, "wall": 32933.4} {"step": 7513, "train_loss": 3.655876874923706, "lr": 0.0003584568938003, "tps": 14950, "wall": 32938.3} {"step": 7514, "train_loss": 3.5783824920654297, "lr": 0.00035844465101349157, "tps": 14950, "wall": 32943.1} {"step": 7515, "train_loss": 3.5964012145996094, "lr": 0.0003584324066583746, "tps": 14949, "wall": 32947.9} {"step": 7516, "train_loss": 3.5733580589294434, "lr": 0.00035842016073508786, "tps": 14949, "wall": 32952.8} {"step": 7517, "train_loss": 3.559612989425659, "lr": 0.0003584079132437701, "tps": 14949, "wall": 32957.6} {"step": 7518, "train_loss": 3.5570473670959473, "lr": 0.00035839566418455996, "tps": 14949, "wall": 32962.4} {"step": 7519, "train_loss": 3.662888526916504, "lr": 0.00035838341355759625, "tps": 14949, "wall": 32967.3} {"step": 7520, "train_loss": 3.6249310970306396, "lr": 0.00035837116136301774, "tps": 14948, "wall": 32972.1} {"step": 7521, "train_loss": 3.692685127258301, "lr": 0.00035835890760096327, "tps": 14948, "wall": 32977.0} {"step": 7522, "train_loss": 3.5764873027801514, "lr": 0.00035834665227157155, "tps": 14948, "wall": 32981.8} {"step": 7523, "train_loss": 3.6912717819213867, "lr": 0.0003583343953749815, "tps": 14948, "wall": 32986.6} {"step": 7524, "train_loss": 3.524482250213623, "lr": 0.00035832213691133194, "tps": 14948, "wall": 32991.5} {"step": 7525, "train_loss": 3.4896724224090576, "lr": 0.0003583098768807617, "tps": 14947, "wall": 32996.4} {"step": 7526, "train_loss": 3.5971384048461914, "lr": 0.00035829761528340977, "tps": 14947, "wall": 33001.2} {"step": 7527, "train_loss": 3.5672271251678467, "lr": 0.0003582853521194149, "tps": 14947, "wall": 33006.1} {"step": 7528, "train_loss": 3.5583348274230957, "lr": 0.0003582730873889161, "tps": 14947, "wall": 33010.9} {"step": 7529, "train_loss": 3.6050710678100586, "lr": 0.0003582608210920523, "tps": 14946, "wall": 33015.8} {"step": 7530, "train_loss": 3.6576905250549316, "lr": 0.0003582485532289624, "tps": 14946, "wall": 33020.6} {"step": 7531, "train_loss": 3.4691195487976074, "lr": 0.0003582362837997855, "tps": 14946, "wall": 33025.4} {"step": 7532, "train_loss": 3.524116039276123, "lr": 0.0003582240128046604, "tps": 14946, "wall": 33030.3} {"step": 7533, "train_loss": 3.6244280338287354, "lr": 0.00035821174024372617, "tps": 14946, "wall": 33035.1} {"step": 7534, "train_loss": 3.6596174240112305, "lr": 0.00035819946611712197, "tps": 14945, "wall": 33039.9} {"step": 7535, "train_loss": 3.5910143852233887, "lr": 0.0003581871904249867, "tps": 14945, "wall": 33044.8} {"step": 7536, "train_loss": 3.5567474365234375, "lr": 0.0003581749131674595, "tps": 14945, "wall": 33049.6} {"step": 7537, "train_loss": 3.5429930686950684, "lr": 0.0003581626343446794, "tps": 14945, "wall": 33054.5} {"step": 7538, "train_loss": 3.597611427307129, "lr": 0.00035815035395678544, "tps": 14945, "wall": 33059.3} {"step": 7539, "train_loss": 3.639035224914551, "lr": 0.00035813807200391686, "tps": 14944, "wall": 33064.2} {"step": 7540, "train_loss": 3.697777509689331, "lr": 0.0003581257884862127, "tps": 14944, "wall": 33069.0} {"step": 7541, "train_loss": 3.6522607803344727, "lr": 0.00035811350340381214, "tps": 14944, "wall": 33073.9} {"step": 7542, "train_loss": 3.6385931968688965, "lr": 0.0003581012167568544, "tps": 14944, "wall": 33078.7} {"step": 7543, "train_loss": 3.712036371231079, "lr": 0.00035808892854547847, "tps": 14944, "wall": 33083.5} {"step": 7544, "train_loss": 3.702112913131714, "lr": 0.0003580766387698238, "tps": 14943, "wall": 33088.3} {"step": 7545, "train_loss": 3.5711517333984375, "lr": 0.0003580643474300294, "tps": 14943, "wall": 33093.2} {"step": 7546, "train_loss": 3.6310739517211914, "lr": 0.0003580520545262347, "tps": 14943, "wall": 33098.0} {"step": 7547, "train_loss": 3.5956902503967285, "lr": 0.0003580397600585788, "tps": 14943, "wall": 33102.8} {"step": 7548, "train_loss": 3.6360490322113037, "lr": 0.00035802746402720107, "tps": 14943, "wall": 33107.7} {"step": 7549, "train_loss": 3.556870698928833, "lr": 0.00035801516643224076, "tps": 14942, "wall": 33112.5} {"step": 7550, "train_loss": 3.6723971366882324, "lr": 0.00035800286727383717, "tps": 14942, "wall": 33117.4} {"step": 7551, "train_loss": 3.5923614501953125, "lr": 0.0003579905665521296, "tps": 14942, "wall": 33122.2} {"step": 7552, "train_loss": 3.6323561668395996, "lr": 0.00035797826426725744, "tps": 14942, "wall": 33127.1} {"step": 7553, "train_loss": 3.6446499824523926, "lr": 0.00035796596041936005, "tps": 14942, "wall": 33131.9} {"step": 7554, "train_loss": 3.556312084197998, "lr": 0.00035795365500857683, "tps": 14941, "wall": 33136.7} {"step": 7555, "train_loss": 3.5935914516448975, "lr": 0.00035794134803504715, "tps": 14941, "wall": 33141.6} {"step": 7556, "train_loss": 3.6183390617370605, "lr": 0.0003579290394989103, "tps": 14941, "wall": 33146.4} {"step": 7557, "train_loss": 3.6602001190185547, "lr": 0.00035791672940030595, "tps": 14941, "wall": 33151.2} {"step": 7558, "train_loss": 3.5368833541870117, "lr": 0.00035790441773937335, "tps": 14941, "wall": 33156.1} {"step": 7559, "train_loss": 3.5474071502685547, "lr": 0.0003578921045162521, "tps": 14940, "wall": 33160.9} {"step": 7560, "train_loss": 3.528545379638672, "lr": 0.0003578797897310816, "tps": 14940, "wall": 33165.8} {"step": 7561, "train_loss": 3.62807035446167, "lr": 0.0003578674733840014, "tps": 14940, "wall": 33170.6} {"step": 7562, "train_loss": 3.564981460571289, "lr": 0.000357855155475151, "tps": 14940, "wall": 33175.5} {"step": 7563, "train_loss": 3.684086799621582, "lr": 0.00035784283600466993, "tps": 14939, "wall": 33180.3} {"step": 7564, "train_loss": 3.5533039569854736, "lr": 0.0003578305149726978, "tps": 14939, "wall": 33185.2} {"step": 7565, "train_loss": 3.5813779830932617, "lr": 0.0003578181923793741, "tps": 14939, "wall": 33190.0} {"step": 7566, "train_loss": 3.5927371978759766, "lr": 0.0003578058682248384, "tps": 14939, "wall": 33194.8} {"step": 7567, "train_loss": 3.60237193107605, "lr": 0.00035779354250923043, "tps": 14939, "wall": 33199.7} {"step": 7568, "train_loss": 3.638439893722534, "lr": 0.0003577812152326898, "tps": 14938, "wall": 33204.5} {"step": 7569, "train_loss": 3.632692813873291, "lr": 0.00035776888639535605, "tps": 14938, "wall": 33209.3} {"step": 7570, "train_loss": 3.4776501655578613, "lr": 0.00035775655599736895, "tps": 14938, "wall": 33214.2} {"step": 7571, "train_loss": 3.589522361755371, "lr": 0.0003577442240388681, "tps": 14938, "wall": 33219.0} {"step": 7572, "train_loss": 3.585184097290039, "lr": 0.0003577318905199932, "tps": 14938, "wall": 33223.8} {"step": 7573, "train_loss": 3.584317684173584, "lr": 0.000357719555440884, "tps": 14938, "wall": 33228.6} {"step": 7574, "train_loss": 3.7276511192321777, "lr": 0.0003577072188016803, "tps": 14937, "wall": 33233.5} {"step": 7575, "train_loss": 3.6205644607543945, "lr": 0.0003576948806025217, "tps": 14937, "wall": 33238.4} {"step": 7576, "train_loss": 3.646303415298462, "lr": 0.000357682540843548, "tps": 14937, "wall": 33243.2} {"step": 7577, "train_loss": 3.6178927421569824, "lr": 0.0003576701995248992, "tps": 14937, "wall": 33248.1} {"step": 7578, "train_loss": 3.487717628479004, "lr": 0.00035765785664671477, "tps": 14936, "wall": 33252.9} {"step": 7579, "train_loss": 3.6050429344177246, "lr": 0.00035764551220913483, "tps": 14936, "wall": 33257.7} {"step": 7580, "train_loss": 3.654609441757202, "lr": 0.00035763316621229897, "tps": 14936, "wall": 33262.6} {"step": 7581, "train_loss": 3.6427431106567383, "lr": 0.00035762081865634715, "tps": 14936, "wall": 33267.4} {"step": 7582, "train_loss": 3.599674701690674, "lr": 0.0003576084695414193, "tps": 14936, "wall": 33272.2} {"step": 7583, "train_loss": 3.587655782699585, "lr": 0.0003575961188676552, "tps": 14935, "wall": 33277.1} {"step": 7584, "train_loss": 3.6988253593444824, "lr": 0.0003575837666351949, "tps": 14935, "wall": 33281.9} {"step": 7585, "train_loss": 3.526531219482422, "lr": 0.00035757141284417827, "tps": 14935, "wall": 33286.8} {"step": 7586, "train_loss": 3.638523578643799, "lr": 0.00035755905749474515, "tps": 14935, "wall": 33291.6} {"step": 7587, "train_loss": 3.5687646865844727, "lr": 0.00035754670058703563, "tps": 14935, "wall": 33296.5} {"step": 7588, "train_loss": 3.5231094360351562, "lr": 0.0003575343421211896, "tps": 14934, "wall": 33301.3} {"step": 7589, "train_loss": 3.5803327560424805, "lr": 0.00035752198209734715, "tps": 14934, "wall": 33306.2} {"step": 7590, "train_loss": 3.614427089691162, "lr": 0.00035750962051564825, "tps": 14934, "wall": 33311.0} {"step": 7591, "train_loss": 3.6997461318969727, "lr": 0.0003574972573762329, "tps": 14934, "wall": 33315.8} {"step": 7592, "train_loss": 3.6747732162475586, "lr": 0.0003574848926792412, "tps": 14934, "wall": 33320.6} {"step": 7593, "train_loss": 3.609982490539551, "lr": 0.0003574725264248132, "tps": 14933, "wall": 33325.5} {"step": 7594, "train_loss": 3.5361413955688477, "lr": 0.00035746015861308895, "tps": 14933, "wall": 33330.3} {"step": 7595, "train_loss": 3.611440896987915, "lr": 0.00035744778924420867, "tps": 14933, "wall": 33335.1} {"step": 7596, "train_loss": 3.618712902069092, "lr": 0.0003574354183183123, "tps": 14933, "wall": 33340.0} {"step": 7597, "train_loss": 3.5721986293792725, "lr": 0.0003574230458355401, "tps": 14933, "wall": 33344.8} {"step": 7598, "train_loss": 3.578023672103882, "lr": 0.0003574106717960322, "tps": 14932, "wall": 33349.6} {"step": 7599, "train_loss": 3.5138044357299805, "lr": 0.00035739829619992877, "tps": 14932, "wall": 33354.5} {"step": 7600, "train_loss": 3.740558624267578, "lr": 0.0003573859190473701, "tps": 14932, "wall": 33359.3} {"step": 7601, "train_loss": 3.4184231758117676, "lr": 0.00035737354033849625, "tps": 14932, "wall": 33364.2} {"step": 7602, "train_loss": 3.6391000747680664, "lr": 0.00035736116007344755, "tps": 14932, "wall": 33369.0} {"step": 7603, "train_loss": 3.5524344444274902, "lr": 0.00035734877825236404, "tps": 14931, "wall": 33373.8} {"step": 7604, "train_loss": 3.60201358795166, "lr": 0.0003573363948753863, "tps": 14931, "wall": 33378.7} {"step": 7605, "train_loss": 3.661724805831909, "lr": 0.00035732400994265435, "tps": 14931, "wall": 33383.5} {"step": 7606, "train_loss": 3.647045612335205, "lr": 0.0003573116234543086, "tps": 14931, "wall": 33388.3} {"step": 7607, "train_loss": 3.538816213607788, "lr": 0.0003572992354104894, "tps": 14931, "wall": 33393.2} {"step": 7608, "train_loss": 3.6493351459503174, "lr": 0.00035728684581133705, "tps": 14930, "wall": 33398.0} {"step": 7609, "train_loss": 3.612431049346924, "lr": 0.00035727445465699183, "tps": 14930, "wall": 33402.8} {"step": 7610, "train_loss": 3.6011791229248047, "lr": 0.00035726206194759414, "tps": 14930, "wall": 33407.7} {"step": 7611, "train_loss": 3.505748748779297, "lr": 0.00035724966768328444, "tps": 14930, "wall": 33412.5} {"step": 7612, "train_loss": 3.6086478233337402, "lr": 0.000357237271864203, "tps": 14930, "wall": 33417.4} {"step": 7613, "train_loss": 3.5364389419555664, "lr": 0.00035722487449049045, "tps": 14929, "wall": 33422.2} {"step": 7614, "train_loss": 3.674708366394043, "lr": 0.000357212475562287, "tps": 14929, "wall": 33427.1} {"step": 7615, "train_loss": 3.4965624809265137, "lr": 0.0003572000750797332, "tps": 14929, "wall": 33431.9} {"step": 7616, "train_loss": 3.6372416019439697, "lr": 0.00035718767304296963, "tps": 14929, "wall": 33436.7} {"step": 7617, "train_loss": 3.6630256175994873, "lr": 0.00035717526945213654, "tps": 14929, "wall": 33441.6} {"step": 7618, "train_loss": 3.549795150756836, "lr": 0.00035716286430737465, "tps": 14928, "wall": 33446.4} {"step": 7619, "train_loss": 3.5963315963745117, "lr": 0.00035715045760882446, "tps": 14928, "wall": 33451.2} {"step": 7620, "train_loss": 3.5011887550354004, "lr": 0.0003571380493566264, "tps": 14928, "wall": 33456.1} {"step": 7621, "train_loss": 3.5976381301879883, "lr": 0.0003571256395509211, "tps": 14928, "wall": 33460.9} {"step": 7622, "train_loss": 3.485797643661499, "lr": 0.00035711322819184915, "tps": 14928, "wall": 33465.7} {"step": 7623, "train_loss": 3.7101757526397705, "lr": 0.0003571008152795511, "tps": 14927, "wall": 33470.6} {"step": 7624, "train_loss": 3.6000208854675293, "lr": 0.00035708840081416764, "tps": 14927, "wall": 33475.4} {"step": 7625, "train_loss": 3.6609296798706055, "lr": 0.0003570759847958393, "tps": 14927, "wall": 33480.3} {"step": 7626, "train_loss": 3.617492437362671, "lr": 0.0003570635672247069, "tps": 14927, "wall": 33485.1} {"step": 7627, "train_loss": 3.5044751167297363, "lr": 0.0003570511481009109, "tps": 14927, "wall": 33490.0} {"step": 7628, "train_loss": 3.5728633403778076, "lr": 0.0003570387274245921, "tps": 14926, "wall": 33494.8} {"step": 7629, "train_loss": 3.5326642990112305, "lr": 0.0003570263051958912, "tps": 14926, "wall": 33499.7} {"step": 7630, "train_loss": 3.53347110748291, "lr": 0.0003570138814149489, "tps": 14926, "wall": 33504.5} {"step": 7631, "train_loss": 3.636049747467041, "lr": 0.00035700145608190593, "tps": 14926, "wall": 33509.3} {"step": 7632, "train_loss": 3.6673436164855957, "lr": 0.0003569890291969031, "tps": 14926, "wall": 33514.2} {"step": 7633, "train_loss": 3.6026158332824707, "lr": 0.000356976600760081, "tps": 14925, "wall": 33519.0} {"step": 7634, "train_loss": 3.5993528366088867, "lr": 0.0003569641707715807, "tps": 14925, "wall": 33523.8} {"step": 7635, "train_loss": 3.603865146636963, "lr": 0.00035695173923154283, "tps": 14925, "wall": 33528.7} {"step": 7636, "train_loss": 3.583156108856201, "lr": 0.00035693930614010824, "tps": 14925, "wall": 33533.5} {"step": 7637, "train_loss": 3.634296417236328, "lr": 0.0003569268714974178, "tps": 14925, "wall": 33538.4} {"step": 7638, "train_loss": 3.6103639602661133, "lr": 0.0003569144353036123, "tps": 14924, "wall": 33543.2} {"step": 7639, "train_loss": 3.461894989013672, "lr": 0.0003569019975588327, "tps": 14924, "wall": 33548.0} {"step": 7640, "train_loss": 3.6001229286193848, "lr": 0.0003568895582632199, "tps": 14924, "wall": 33552.9} {"step": 7641, "train_loss": 3.5031495094299316, "lr": 0.0003568771174169147, "tps": 14924, "wall": 33557.7} {"step": 7642, "train_loss": 3.5956687927246094, "lr": 0.00035686467502005816, "tps": 14924, "wall": 33562.5} {"step": 7643, "train_loss": 3.5808565616607666, "lr": 0.0003568522310727911, "tps": 14923, "wall": 33567.4} {"step": 7644, "train_loss": 3.622653007507324, "lr": 0.00035683978557525466, "tps": 14923, "wall": 33572.2} {"step": 7645, "train_loss": 3.5276718139648438, "lr": 0.00035682733852758974, "tps": 14923, "wall": 33577.0} {"step": 7646, "train_loss": 3.4900858402252197, "lr": 0.00035681488992993725, "tps": 14923, "wall": 33581.8} {"step": 7647, "train_loss": 3.639626979827881, "lr": 0.0003568024397824383, "tps": 14923, "wall": 33586.7} {"step": 7648, "train_loss": 3.5682287216186523, "lr": 0.00035678998808523396, "tps": 14922, "wall": 33591.5} {"step": 7649, "train_loss": 3.5968868732452393, "lr": 0.00035677753483846514, "tps": 14922, "wall": 33596.4} {"step": 7650, "train_loss": 3.548214912414551, "lr": 0.00035676508004227315, "tps": 14922, "wall": 33601.2} {"step": 7651, "train_loss": 3.5433413982391357, "lr": 0.00035675262369679885, "tps": 14922, "wall": 33606.1} {"step": 7652, "train_loss": 3.5878963470458984, "lr": 0.0003567401658021834, "tps": 14922, "wall": 33610.9} {"step": 7653, "train_loss": 3.602313280105591, "lr": 0.00035672770635856803, "tps": 14921, "wall": 33615.7} {"step": 7654, "train_loss": 3.5038294792175293, "lr": 0.0003567152453660938, "tps": 14921, "wall": 33620.5} {"step": 7655, "train_loss": 3.553006649017334, "lr": 0.00035670278282490177, "tps": 14921, "wall": 33625.4} {"step": 7656, "train_loss": 3.526472568511963, "lr": 0.00035669031873513334, "tps": 14921, "wall": 33630.2} {"step": 7657, "train_loss": 3.6641721725463867, "lr": 0.0003566778530969295, "tps": 14921, "wall": 33635.0} {"step": 7658, "train_loss": 3.6020307540893555, "lr": 0.0003566653859104316, "tps": 14921, "wall": 33639.8} {"step": 7659, "train_loss": 3.5994880199432373, "lr": 0.00035665291717578074, "tps": 14920, "wall": 33644.7} {"step": 7660, "train_loss": 3.524810314178467, "lr": 0.00035664044689311835, "tps": 14920, "wall": 33649.5} {"step": 7661, "train_loss": 3.6354928016662598, "lr": 0.0003566279750625855, "tps": 14920, "wall": 33654.4} {"step": 7662, "train_loss": 3.567962646484375, "lr": 0.00035661550168432355, "tps": 14920, "wall": 33659.3} {"step": 7663, "train_loss": 3.6002578735351562, "lr": 0.0003566030267584739, "tps": 14919, "wall": 33664.1} {"step": 7664, "train_loss": 3.6495962142944336, "lr": 0.0003565905502851777, "tps": 14919, "wall": 33668.9} {"step": 7665, "train_loss": 3.5856409072875977, "lr": 0.00035657807226457635, "tps": 14919, "wall": 33673.7} {"step": 7666, "train_loss": 3.567471504211426, "lr": 0.00035656559269681127, "tps": 14919, "wall": 33678.6} {"step": 7667, "train_loss": 3.588792562484741, "lr": 0.00035655311158202374, "tps": 14919, "wall": 33683.4} {"step": 7668, "train_loss": 3.5451250076293945, "lr": 0.0003565406289203551, "tps": 14918, "wall": 33688.3} {"step": 7669, "train_loss": 3.621274471282959, "lr": 0.0003565281447119469, "tps": 14918, "wall": 33693.1} {"step": 7670, "train_loss": 3.556790351867676, "lr": 0.0003565156589569405, "tps": 14918, "wall": 33698.0} {"step": 7671, "train_loss": 3.4954471588134766, "lr": 0.0003565031716554773, "tps": 14918, "wall": 33702.8} {"step": 7672, "train_loss": 3.7108612060546875, "lr": 0.00035649068280769883, "tps": 14918, "wall": 33707.6} {"step": 7673, "train_loss": 3.6574785709381104, "lr": 0.0003564781924137465, "tps": 14918, "wall": 33712.5} {"step": 7674, "train_loss": 3.4932708740234375, "lr": 0.0003564657004737618, "tps": 14917, "wall": 33717.4} {"step": 7675, "train_loss": 3.4902257919311523, "lr": 0.0003564532069878863, "tps": 14917, "wall": 33722.2} {"step": 7676, "train_loss": 3.5145740509033203, "lr": 0.00035644071195626144, "tps": 14917, "wall": 33727.0} {"step": 7677, "train_loss": 3.5270605087280273, "lr": 0.00035642821537902884, "tps": 14917, "wall": 33731.9} {"step": 7678, "train_loss": 3.505784273147583, "lr": 0.00035641571725633, "tps": 14917, "wall": 33736.7} {"step": 7679, "train_loss": 3.40533185005188, "lr": 0.0003564032175883066, "tps": 14916, "wall": 33741.5} {"step": 7680, "train_loss": 3.5276975631713867, "lr": 0.0003563907163751002, "tps": 14916, "wall": 33746.3} {"step": 7681, "train_loss": 3.571441888809204, "lr": 0.0003563782136168523, "tps": 14916, "wall": 33751.1} {"step": 7682, "train_loss": 3.556565284729004, "lr": 0.0003563657093137047, "tps": 14916, "wall": 33756.0} {"step": 7683, "train_loss": 3.6743228435516357, "lr": 0.00035635320346579885, "tps": 14916, "wall": 33760.8} {"step": 7684, "train_loss": 3.5803940296173096, "lr": 0.0003563406960732766, "tps": 14915, "wall": 33765.6} {"step": 7685, "train_loss": 3.5067665576934814, "lr": 0.00035632818713627956, "tps": 14915, "wall": 33770.4} {"step": 7686, "train_loss": 3.555396318435669, "lr": 0.00035631567665494947, "tps": 14915, "wall": 33775.3} {"step": 7687, "train_loss": 3.5086452960968018, "lr": 0.000356303164629428, "tps": 14915, "wall": 33780.1} {"step": 7688, "train_loss": 3.64683198928833, "lr": 0.0003562906510598569, "tps": 14915, "wall": 33785.0} {"step": 7689, "train_loss": 3.683335781097412, "lr": 0.000356278135946378, "tps": 14914, "wall": 33789.8} {"step": 7690, "train_loss": 3.5617241859436035, "lr": 0.0003562656192891329, "tps": 14914, "wall": 33794.6} {"step": 7691, "train_loss": 3.741952896118164, "lr": 0.0003562531010882635, "tps": 14914, "wall": 33799.5} {"step": 7692, "train_loss": 3.6681900024414062, "lr": 0.00035624058134391167, "tps": 14914, "wall": 33804.3} {"step": 7693, "train_loss": 3.5313172340393066, "lr": 0.0003562280600562191, "tps": 14914, "wall": 33809.1} {"step": 7694, "train_loss": 3.657571315765381, "lr": 0.00035621553722532776, "tps": 14913, "wall": 33814.0} {"step": 7695, "train_loss": 3.550947666168213, "lr": 0.0003562030128513794, "tps": 14913, "wall": 33818.8} {"step": 7696, "train_loss": 3.620171308517456, "lr": 0.000356190486934516, "tps": 14913, "wall": 33823.6} {"step": 7697, "train_loss": 3.650441884994507, "lr": 0.0003561779594748793, "tps": 14913, "wall": 33828.4} {"step": 7698, "train_loss": 3.558565139770508, "lr": 0.00035616543047261136, "tps": 14913, "wall": 33833.3} {"step": 7699, "train_loss": 3.5189099311828613, "lr": 0.00035615289992785407, "tps": 14912, "wall": 33838.1} {"step": 7700, "train_loss": 3.594137191772461, "lr": 0.00035614036784074936, "tps": 14912, "wall": 33843.0} {"step": 7701, "train_loss": 3.5926294326782227, "lr": 0.00035612783421143916, "tps": 14912, "wall": 33847.8} {"step": 7702, "train_loss": 3.6124448776245117, "lr": 0.00035611529904006555, "tps": 14912, "wall": 33852.6} {"step": 7703, "train_loss": 3.6142654418945312, "lr": 0.0003561027623267704, "tps": 14912, "wall": 33857.4} {"step": 7704, "train_loss": 3.6456961631774902, "lr": 0.00035609022407169586, "tps": 14912, "wall": 33862.3} {"step": 7705, "train_loss": 3.5409133434295654, "lr": 0.00035607768427498384, "tps": 14911, "wall": 33867.1} {"step": 7706, "train_loss": 3.656393051147461, "lr": 0.0003560651429367765, "tps": 14911, "wall": 33871.9} {"step": 7707, "train_loss": 3.6200594902038574, "lr": 0.0003560526000572158, "tps": 14911, "wall": 33876.7} {"step": 7708, "train_loss": 3.549800395965576, "lr": 0.000356040055636444, "tps": 14911, "wall": 33881.6} {"step": 7709, "train_loss": 3.4881577491760254, "lr": 0.00035602750967460295, "tps": 14911, "wall": 33886.4} {"step": 7710, "train_loss": 3.560225009918213, "lr": 0.000356014962171835, "tps": 14910, "wall": 33891.2} {"step": 7711, "train_loss": 3.4475409984588623, "lr": 0.00035600241312828214, "tps": 14910, "wall": 33896.1} {"step": 7712, "train_loss": 3.530383825302124, "lr": 0.00035598986254408663, "tps": 14910, "wall": 33900.9} {"step": 7713, "train_loss": 3.642298698425293, "lr": 0.0003559773104193906, "tps": 14910, "wall": 33905.7} {"step": 7714, "train_loss": 3.639490842819214, "lr": 0.0003559647567543363, "tps": 14910, "wall": 33910.5} {"step": 7715, "train_loss": 3.576359510421753, "lr": 0.0003559522015490658, "tps": 14909, "wall": 33915.4} {"step": 7716, "train_loss": 3.5604946613311768, "lr": 0.00035593964480372137, "tps": 14909, "wall": 33920.2} {"step": 7717, "train_loss": 3.6047067642211914, "lr": 0.0003559270865184453, "tps": 14909, "wall": 33925.0} {"step": 7718, "train_loss": 3.453577995300293, "lr": 0.00035591452669337997, "tps": 14909, "wall": 33929.8} {"step": 7719, "train_loss": 3.581822156906128, "lr": 0.0003559019653286674, "tps": 14909, "wall": 33934.7} {"step": 7720, "train_loss": 3.509478807449341, "lr": 0.00035588940242445, "tps": 14908, "wall": 33939.5} {"step": 7721, "train_loss": 3.509945869445801, "lr": 0.0003558768379808702, "tps": 14908, "wall": 33944.3} {"step": 7722, "train_loss": 3.537073850631714, "lr": 0.0003558642719980702, "tps": 14908, "wall": 33949.1} {"step": 7723, "train_loss": 3.636565685272217, "lr": 0.00035585170447619235, "tps": 14908, "wall": 33954.0} {"step": 7724, "train_loss": 3.627711057662964, "lr": 0.0003558391354153791, "tps": 14908, "wall": 33958.8} {"step": 7725, "train_loss": 3.567656993865967, "lr": 0.00035582656481577266, "tps": 14908, "wall": 33963.6} {"step": 7726, "train_loss": 3.4727444648742676, "lr": 0.0003558139926775156, "tps": 14907, "wall": 33968.5} {"step": 7727, "train_loss": 3.584872007369995, "lr": 0.0003558014190007503, "tps": 14907, "wall": 33973.3} {"step": 7728, "train_loss": 3.5016565322875977, "lr": 0.00035578884378561923, "tps": 14907, "wall": 33978.1} {"step": 7729, "train_loss": 3.6824021339416504, "lr": 0.00035577626703226466, "tps": 14907, "wall": 33982.9} {"step": 7730, "train_loss": 3.5808815956115723, "lr": 0.00035576368874082933, "tps": 14907, "wall": 33987.7} {"step": 7731, "train_loss": 3.711656093597412, "lr": 0.00035575110891145555, "tps": 14906, "wall": 33992.6} {"step": 7732, "train_loss": 3.6585769653320312, "lr": 0.0003557385275442858, "tps": 14906, "wall": 33997.4} {"step": 7733, "train_loss": 3.616392135620117, "lr": 0.00035572594463946267, "tps": 14906, "wall": 34002.2} {"step": 7734, "train_loss": 3.4910483360290527, "lr": 0.00035571336019712876, "tps": 14906, "wall": 34007.1} {"step": 7735, "train_loss": 3.5594325065612793, "lr": 0.0003557007742174265, "tps": 14906, "wall": 34011.9} {"step": 7736, "train_loss": 3.529942274093628, "lr": 0.00035568818670049865, "tps": 14905, "wall": 34016.8} {"step": 7737, "train_loss": 3.5551600456237793, "lr": 0.00035567559764648754, "tps": 14905, "wall": 34021.6} {"step": 7738, "train_loss": 3.560796022415161, "lr": 0.000355663007055536, "tps": 14905, "wall": 34026.4} {"step": 7739, "train_loss": 3.5626540184020996, "lr": 0.00035565041492778657, "tps": 14905, "wall": 34031.2} {"step": 7740, "train_loss": 3.6022441387176514, "lr": 0.00035563782126338186, "tps": 14905, "wall": 34036.1} {"step": 7741, "train_loss": 3.5809764862060547, "lr": 0.0003556252260624646, "tps": 14905, "wall": 34040.9} {"step": 7742, "train_loss": 3.5382280349731445, "lr": 0.00035561262932517747, "tps": 14904, "wall": 34045.7} {"step": 7743, "train_loss": 3.5157365798950195, "lr": 0.0003556000310516631, "tps": 14904, "wall": 34050.5} {"step": 7744, "train_loss": 3.5850613117218018, "lr": 0.00035558743124206423, "tps": 14904, "wall": 34055.3} {"step": 7745, "train_loss": 3.594116449356079, "lr": 0.0003555748298965236, "tps": 14904, "wall": 34060.2} {"step": 7746, "train_loss": 3.5084972381591797, "lr": 0.00035556222701518396, "tps": 14904, "wall": 34065.0} {"step": 7747, "train_loss": 3.499354839324951, "lr": 0.00035554962259818815, "tps": 14903, "wall": 34069.8} {"step": 7748, "train_loss": 3.7637906074523926, "lr": 0.0003555370166456788, "tps": 14903, "wall": 34074.7} {"step": 7749, "train_loss": 3.5557379722595215, "lr": 0.00035552440915779886, "tps": 14903, "wall": 34079.5} {"step": 7750, "train_loss": 3.656635284423828, "lr": 0.00035551180013469107, "tps": 14903, "wall": 34084.4} {"step": 7751, "train_loss": 3.571127414703369, "lr": 0.0003554991895764982, "tps": 14903, "wall": 34089.3} {"step": 7752, "train_loss": 3.514625072479248, "lr": 0.0003554865774833633, "tps": 14902, "wall": 34094.1} {"step": 7753, "train_loss": 3.5220842361450195, "lr": 0.00035547396385542904, "tps": 14902, "wall": 34098.9} {"step": 7754, "train_loss": 3.542454481124878, "lr": 0.0003554613486928384, "tps": 14902, "wall": 34103.8} {"step": 7755, "train_loss": 3.5923635959625244, "lr": 0.0003554487319957342, "tps": 14902, "wall": 34108.6} {"step": 7756, "train_loss": 3.5373964309692383, "lr": 0.0003554361137642596, "tps": 14902, "wall": 34113.4} {"step": 7757, "train_loss": 3.703627109527588, "lr": 0.00035542349399855723, "tps": 14901, "wall": 34118.2} {"step": 7758, "train_loss": 3.5321829319000244, "lr": 0.0003554108726987703, "tps": 14901, "wall": 34123.1} {"step": 7759, "train_loss": 3.5714621543884277, "lr": 0.0003553982498650416, "tps": 14901, "wall": 34127.9} {"step": 7760, "train_loss": 3.567990303039551, "lr": 0.00035538562549751424, "tps": 14901, "wall": 34132.7} {"step": 7761, "train_loss": 3.5392889976501465, "lr": 0.00035537299959633123, "tps": 14901, "wall": 34137.6} {"step": 7762, "train_loss": 3.618072271347046, "lr": 0.0003553603721616355, "tps": 14900, "wall": 34142.4} {"step": 7763, "train_loss": 3.605151653289795, "lr": 0.00035534774319357016, "tps": 14900, "wall": 34147.2} {"step": 7764, "train_loss": 3.593613624572754, "lr": 0.0003553351126922783, "tps": 14900, "wall": 34152.1} {"step": 7765, "train_loss": 3.5840182304382324, "lr": 0.0003553224806579029, "tps": 14900, "wall": 34156.9} {"step": 7766, "train_loss": 3.5100812911987305, "lr": 0.0003553098470905872, "tps": 14900, "wall": 34161.7} {"step": 7767, "train_loss": 3.5601820945739746, "lr": 0.0003552972119904741, "tps": 14900, "wall": 34166.5} {"step": 7768, "train_loss": 3.6127519607543945, "lr": 0.00035528457535770693, "tps": 14899, "wall": 34171.3} {"step": 7769, "train_loss": 3.6352450847625732, "lr": 0.0003552719371924288, "tps": 14899, "wall": 34176.2} {"step": 7770, "train_loss": 3.639317035675049, "lr": 0.00035525929749478284, "tps": 14899, "wall": 34181.0} {"step": 7771, "train_loss": 3.5677809715270996, "lr": 0.0003552466562649123, "tps": 14899, "wall": 34185.8} {"step": 7772, "train_loss": 3.5860702991485596, "lr": 0.00035523401350296026, "tps": 14899, "wall": 34190.6} {"step": 7773, "train_loss": 3.4754366874694824, "lr": 0.0003552213692090699, "tps": 14898, "wall": 34195.5} {"step": 7774, "train_loss": 3.5421085357666016, "lr": 0.0003552087233833847, "tps": 14898, "wall": 34200.3} {"step": 7775, "train_loss": 3.499692440032959, "lr": 0.0003551960760260477, "tps": 14898, "wall": 34205.1} {"step": 7776, "train_loss": 3.665775775909424, "lr": 0.00035518342713720225, "tps": 14898, "wall": 34210.0} {"step": 7777, "train_loss": 3.6218857765197754, "lr": 0.0003551707767169916, "tps": 14898, "wall": 34214.8} {"step": 7778, "train_loss": 3.5425243377685547, "lr": 0.0003551581247655591, "tps": 14898, "wall": 34219.6} {"step": 7779, "train_loss": 3.675377368927002, "lr": 0.00035514547128304814, "tps": 14897, "wall": 34224.4} {"step": 7780, "train_loss": 3.5704169273376465, "lr": 0.00035513281626960185, "tps": 14897, "wall": 34229.2} {"step": 7781, "train_loss": 3.5360984802246094, "lr": 0.00035512015972536374, "tps": 14897, "wall": 34234.1} {"step": 7782, "train_loss": 3.5490996837615967, "lr": 0.0003551075016504771, "tps": 14897, "wall": 34238.9} {"step": 7783, "train_loss": 3.695439577102661, "lr": 0.00035509484204508543, "tps": 14897, "wall": 34243.7} {"step": 7784, "train_loss": 3.580763339996338, "lr": 0.00035508218090933206, "tps": 14896, "wall": 34248.5} {"step": 7785, "train_loss": 3.598320484161377, "lr": 0.00035506951824336046, "tps": 14896, "wall": 34253.3} {"step": 7786, "train_loss": 3.5848846435546875, "lr": 0.000355056854047314, "tps": 14896, "wall": 34258.2} {"step": 7787, "train_loss": 3.5914065837860107, "lr": 0.0003550441883213363, "tps": 14896, "wall": 34263.0} {"step": 7788, "train_loss": 3.4624180793762207, "lr": 0.0003550315210655707, "tps": 14896, "wall": 34267.9} {"step": 7789, "train_loss": 3.642714262008667, "lr": 0.00035501885228016064, "tps": 14895, "wall": 34272.7} {"step": 7790, "train_loss": 3.6481335163116455, "lr": 0.0003550061819652498, "tps": 14895, "wall": 34277.5} {"step": 7791, "train_loss": 3.533621072769165, "lr": 0.00035499351012098154, "tps": 14895, "wall": 34282.3} {"step": 7792, "train_loss": 3.640519380569458, "lr": 0.00035498083674749954, "tps": 14895, "wall": 34287.2} {"step": 7793, "train_loss": 3.625199556350708, "lr": 0.0003549681618449473, "tps": 14895, "wall": 34292.0} {"step": 7794, "train_loss": 3.621809959411621, "lr": 0.0003549554854134685, "tps": 14895, "wall": 34296.8} {"step": 7795, "train_loss": 3.72519588470459, "lr": 0.0003549428074532066, "tps": 14894, "wall": 34301.6} {"step": 7796, "train_loss": 3.6082236766815186, "lr": 0.00035493012796430527, "tps": 14894, "wall": 34306.4} {"step": 7797, "train_loss": 3.5694074630737305, "lr": 0.00035491744694690814, "tps": 14894, "wall": 34311.2} {"step": 7798, "train_loss": 3.640160083770752, "lr": 0.0003549047644011589, "tps": 14894, "wall": 34316.1} {"step": 7799, "train_loss": 3.5918936729431152, "lr": 0.0003548920803272012, "tps": 14894, "wall": 34320.9} {"step": 7800, "train_loss": 3.746218681335449, "lr": 0.0003548793947251787, "tps": 14893, "wall": 34325.8} {"step": 7801, "train_loss": 3.4967238903045654, "lr": 0.00035486670759523513, "tps": 14893, "wall": 34330.6} {"step": 7802, "train_loss": 3.65859317779541, "lr": 0.00035485401893751414, "tps": 14893, "wall": 34335.4} {"step": 7803, "train_loss": 3.533949851989746, "lr": 0.0003548413287521596, "tps": 14893, "wall": 34340.2} {"step": 7804, "train_loss": 3.5854299068450928, "lr": 0.0003548286370393152, "tps": 14893, "wall": 34345.0} {"step": 7805, "train_loss": 3.610269546508789, "lr": 0.00035481594379912465, "tps": 14893, "wall": 34349.9} {"step": 7806, "train_loss": 3.5375266075134277, "lr": 0.00035480324903173187, "tps": 14892, "wall": 34354.7} {"step": 7807, "train_loss": 3.632659912109375, "lr": 0.00035479055273728054, "tps": 14892, "wall": 34359.9} {"step": 7808, "train_loss": 3.5626306533813477, "lr": 0.00035477785491591456, "tps": 14892, "wall": 34365.1} {"step": 7809, "train_loss": 3.6254332065582275, "lr": 0.0003547651555677777, "tps": 14891, "wall": 34370.2} {"step": 7810, "train_loss": 3.6642637252807617, "lr": 0.0003547524546930139, "tps": 14891, "wall": 34375.3} {"step": 7811, "train_loss": 3.4333906173706055, "lr": 0.000354739752291767, "tps": 14891, "wall": 34380.4} {"step": 7812, "train_loss": 3.5297722816467285, "lr": 0.00035472704836418087, "tps": 14890, "wall": 34385.8} {"step": 7813, "train_loss": 3.5733509063720703, "lr": 0.00035471434291039946, "tps": 14890, "wall": 34391.0} {"step": 7814, "train_loss": 3.672049045562744, "lr": 0.00035470163593056674, "tps": 14890, "wall": 34396.2} {"step": 7815, "train_loss": 3.4812324047088623, "lr": 0.00035468892742482653, "tps": 14889, "wall": 34401.5} {"step": 7816, "train_loss": 3.597053289413452, "lr": 0.0003546762173933229, "tps": 14889, "wall": 34406.7} {"step": 7817, "train_loss": 3.682821273803711, "lr": 0.00035466350583619977, "tps": 14889, "wall": 34411.7} {"step": 7818, "train_loss": 3.61427903175354, "lr": 0.00035465079275360124, "tps": 14888, "wall": 34416.6} {"step": 7819, "train_loss": 3.6034722328186035, "lr": 0.00035463807814567114, "tps": 14888, "wall": 34421.5} {"step": 7820, "train_loss": 3.52897310256958, "lr": 0.00035462536201255363, "tps": 14888, "wall": 34426.4} {"step": 7821, "train_loss": 3.696988105773926, "lr": 0.0003546126443543928, "tps": 14888, "wall": 34431.4} {"step": 7822, "train_loss": 3.5955023765563965, "lr": 0.0003545999251713326, "tps": 14887, "wall": 34436.5} {"step": 7823, "train_loss": 3.6449801921844482, "lr": 0.0003545872044635172, "tps": 14887, "wall": 34441.5} {"step": 7824, "train_loss": 3.527146816253662, "lr": 0.00035457448223109064, "tps": 14887, "wall": 34446.5} {"step": 7825, "train_loss": 3.541712760925293, "lr": 0.000354561758474197, "tps": 14887, "wall": 34451.5} {"step": 7826, "train_loss": 3.6561226844787598, "lr": 0.00035454903319298055, "tps": 14886, "wall": 34456.5} {"step": 7827, "train_loss": 3.6645965576171875, "lr": 0.0003545363063875854, "tps": 14886, "wall": 34461.5} {"step": 7828, "train_loss": 3.7063791751861572, "lr": 0.0003545235780581557, "tps": 14886, "wall": 34466.6} {"step": 7829, "train_loss": 3.564945697784424, "lr": 0.00035451084820483557, "tps": 14886, "wall": 34471.6} {"step": 7830, "train_loss": 3.5973246097564697, "lr": 0.0003544981168277693, "tps": 14885, "wall": 34476.6} {"step": 7831, "train_loss": 3.5638017654418945, "lr": 0.0003544853839271011, "tps": 14885, "wall": 34481.5} {"step": 7832, "train_loss": 3.5463171005249023, "lr": 0.00035447264950297516, "tps": 14885, "wall": 34486.4} {"step": 7833, "train_loss": 3.662339687347412, "lr": 0.00035445991355553575, "tps": 14885, "wall": 34491.3} {"step": 7834, "train_loss": 3.57096004486084, "lr": 0.0003544471760849272, "tps": 14884, "wall": 34496.2} {"step": 7835, "train_loss": 3.595770835876465, "lr": 0.0003544344370912938, "tps": 14884, "wall": 34501.1} {"step": 7836, "train_loss": 3.6778204441070557, "lr": 0.0003544216965747798, "tps": 14884, "wall": 34506.0} {"step": 7837, "train_loss": 3.513869524002075, "lr": 0.0003544089545355295, "tps": 14884, "wall": 34510.8} {"step": 7838, "train_loss": 3.592395782470703, "lr": 0.00035439621097368735, "tps": 14884, "wall": 34515.6} {"step": 7839, "train_loss": 3.568881034851074, "lr": 0.0003543834658893977, "tps": 14883, "wall": 34520.4} {"step": 7840, "train_loss": 3.645068883895874, "lr": 0.00035437071928280477, "tps": 14883, "wall": 34525.3} {"step": 7841, "train_loss": 3.5623013973236084, "lr": 0.00035435797115405314, "tps": 14883, "wall": 34530.1} {"step": 7842, "train_loss": 3.53824782371521, "lr": 0.0003543452215032871, "tps": 14883, "wall": 34534.9} {"step": 7843, "train_loss": 3.5857441425323486, "lr": 0.0003543324703306511, "tps": 14883, "wall": 34539.8} {"step": 7844, "train_loss": 3.5956437587738037, "lr": 0.00035431971763628966, "tps": 14882, "wall": 34544.9} {"step": 7845, "train_loss": 3.6817731857299805, "lr": 0.0003543069634203472, "tps": 14882, "wall": 34549.8} {"step": 7846, "train_loss": 3.5546340942382812, "lr": 0.00035429420768296816, "tps": 14882, "wall": 34554.8} {"step": 7847, "train_loss": 3.6032378673553467, "lr": 0.0003542814504242971, "tps": 14882, "wall": 34559.8} {"step": 7848, "train_loss": 3.563009023666382, "lr": 0.00035426869164447843, "tps": 14882, "wall": 34564.7} {"step": 7849, "train_loss": 3.5259976387023926, "lr": 0.00035425593134365686, "tps": 14881, "wall": 34569.7} {"step": 7850, "train_loss": 3.454711437225342, "lr": 0.00035424316952197677, "tps": 14881, "wall": 34574.9} {"step": 7851, "train_loss": 3.5327646732330322, "lr": 0.00035423040617958284, "tps": 14881, "wall": 34579.9} {"step": 7852, "train_loss": 3.5708439350128174, "lr": 0.0003542176413166196, "tps": 14880, "wall": 34585.3} {"step": 7853, "train_loss": 3.520237922668457, "lr": 0.0003542048749332316, "tps": 14880, "wall": 34590.7} {"step": 7854, "train_loss": 3.598262071609497, "lr": 0.0003541921070295635, "tps": 14879, "wall": 34596.0} {"step": 7855, "train_loss": 3.63210129737854, "lr": 0.00035417933760576006, "tps": 14879, "wall": 34600.9} {"step": 7856, "train_loss": 3.6037683486938477, "lr": 0.0003541665666619658, "tps": 14879, "wall": 34605.8} {"step": 7857, "train_loss": 3.6190032958984375, "lr": 0.0003541537941983254, "tps": 14879, "wall": 34610.8} {"step": 7858, "train_loss": 3.661322832107544, "lr": 0.00035414102021498353, "tps": 14878, "wall": 34615.8} {"step": 7859, "train_loss": 3.710348129272461, "lr": 0.0003541282447120849, "tps": 14878, "wall": 34620.8} {"step": 7860, "train_loss": 3.636280059814453, "lr": 0.0003541154676897743, "tps": 14878, "wall": 34625.7} {"step": 7861, "train_loss": 3.575737953186035, "lr": 0.00035410268914819643, "tps": 14878, "wall": 34630.6} {"step": 7862, "train_loss": 3.667660713195801, "lr": 0.00035408990908749607, "tps": 14878, "wall": 34635.5} {"step": 7863, "train_loss": 3.5951731204986572, "lr": 0.0003540771275078179, "tps": 14877, "wall": 34640.5} {"step": 7864, "train_loss": 3.6252198219299316, "lr": 0.0003540643444093068, "tps": 14877, "wall": 34645.3} {"step": 7865, "train_loss": 3.60756254196167, "lr": 0.0003540515597921076, "tps": 14877, "wall": 34650.3} {"step": 7866, "train_loss": 3.6567955017089844, "lr": 0.00035403877365636503, "tps": 14877, "wall": 34655.2} {"step": 7867, "train_loss": 3.664680242538452, "lr": 0.000354025986002224, "tps": 14876, "wall": 34660.1} {"step": 7868, "train_loss": 3.633150100708008, "lr": 0.0003540131968298293, "tps": 14876, "wall": 34665.1} {"step": 7869, "train_loss": 3.6570324897766113, "lr": 0.000354000406139326, "tps": 14876, "wall": 34670.0} {"step": 7870, "train_loss": 3.4486401081085205, "lr": 0.0003539876139308587, "tps": 14876, "wall": 34675.1} {"step": 7871, "train_loss": 3.621384859085083, "lr": 0.0003539748202045725, "tps": 14876, "wall": 34680.0} {"step": 7872, "train_loss": 3.640124797821045, "lr": 0.00035396202496061234, "tps": 14875, "wall": 34684.9} {"step": 7873, "train_loss": 3.534719228744507, "lr": 0.00035394922819912306, "tps": 14875, "wall": 34689.8} {"step": 7874, "train_loss": 3.5877444744110107, "lr": 0.00035393642992024964, "tps": 14875, "wall": 34694.7} {"step": 7875, "train_loss": 3.679318904876709, "lr": 0.0003539236301241372, "tps": 14875, "wall": 34699.6} {"step": 7876, "train_loss": 3.471762180328369, "lr": 0.0003539108288109305, "tps": 14874, "wall": 34704.5} {"step": 7877, "train_loss": 3.629364490509033, "lr": 0.0003538980259807748, "tps": 14874, "wall": 34709.5} {"step": 7878, "train_loss": 3.6349940299987793, "lr": 0.00035388522163381494, "tps": 14874, "wall": 34714.5} {"step": 7879, "train_loss": 3.578421115875244, "lr": 0.00035387241577019613, "tps": 14874, "wall": 34719.5} {"step": 7880, "train_loss": 3.6244895458221436, "lr": 0.00035385960839006336, "tps": 14873, "wall": 34724.5} {"step": 7881, "train_loss": 3.6183061599731445, "lr": 0.00035384679949356163, "tps": 14873, "wall": 34729.5} {"step": 7882, "train_loss": 3.632303237915039, "lr": 0.0003538339890808361, "tps": 14873, "wall": 34734.7} {"step": 7883, "train_loss": 3.543023109436035, "lr": 0.00035382117715203196, "tps": 14873, "wall": 34739.6} {"step": 7884, "train_loss": 3.54443097114563, "lr": 0.00035380836370729426, "tps": 14872, "wall": 34744.6} {"step": 7885, "train_loss": 3.539386749267578, "lr": 0.00035379554874676814, "tps": 14872, "wall": 34749.6} {"step": 7886, "train_loss": 3.604649543762207, "lr": 0.00035378273227059894, "tps": 14872, "wall": 34754.5} {"step": 7887, "train_loss": 3.6124227046966553, "lr": 0.0003537699142789316, "tps": 14872, "wall": 34759.5} {"step": 7888, "train_loss": 3.531467914581299, "lr": 0.00035375709477191146, "tps": 14871, "wall": 34764.5} {"step": 7889, "train_loss": 3.583303689956665, "lr": 0.00035374427374968364, "tps": 14871, "wall": 34769.5} {"step": 7890, "train_loss": 3.5861449241638184, "lr": 0.00035373145121239354, "tps": 14871, "wall": 34774.5} {"step": 7891, "train_loss": 3.583739757537842, "lr": 0.00035371862716018635, "tps": 14871, "wall": 34779.7} {"step": 7892, "train_loss": 3.59220814704895, "lr": 0.0003537058015932073, "tps": 14870, "wall": 34784.9} {"step": 7893, "train_loss": 3.5065975189208984, "lr": 0.00035369297451160164, "tps": 14870, "wall": 34790.1} {"step": 7894, "train_loss": 3.616872787475586, "lr": 0.00035368014591551474, "tps": 14869, "wall": 34795.4} {"step": 7895, "train_loss": 3.538957118988037, "lr": 0.000353667315805092, "tps": 14869, "wall": 34800.5} {"step": 7896, "train_loss": 3.668330192565918, "lr": 0.00035365448418047855, "tps": 14869, "wall": 34805.7} {"step": 7897, "train_loss": 3.721489906311035, "lr": 0.0003536416510418199, "tps": 14868, "wall": 34810.9} {"step": 7898, "train_loss": 3.5452327728271484, "lr": 0.0003536288163892615, "tps": 14868, "wall": 34816.1} {"step": 7899, "train_loss": 3.5457706451416016, "lr": 0.00035361598022294854, "tps": 14868, "wall": 34821.3} {"step": 7900, "train_loss": 3.5473952293395996, "lr": 0.00035360314254302656, "tps": 14867, "wall": 34826.5} {"step": 7901, "train_loss": 3.6321234703063965, "lr": 0.00035359030334964096, "tps": 14867, "wall": 34831.4} {"step": 7902, "train_loss": 3.566312313079834, "lr": 0.0003535774626429372, "tps": 14867, "wall": 34836.4} {"step": 7903, "train_loss": 3.63708233833313, "lr": 0.00035356462042306064, "tps": 14867, "wall": 34841.4} {"step": 7904, "train_loss": 3.627349376678467, "lr": 0.0003535517766901569, "tps": 14867, "wall": 34846.4} {"step": 7905, "train_loss": 3.560807704925537, "lr": 0.0003535389314443714, "tps": 14866, "wall": 34851.4} {"step": 7906, "train_loss": 3.615772008895874, "lr": 0.00035352608468584964, "tps": 14866, "wall": 34856.3} {"step": 7907, "train_loss": 3.5713841915130615, "lr": 0.0003535132364147372, "tps": 14866, "wall": 34861.1} {"step": 7908, "train_loss": 3.550352096557617, "lr": 0.0003535003866311796, "tps": 14866, "wall": 34866.0} {"step": 7909, "train_loss": 3.5815138816833496, "lr": 0.00035348753533532233, "tps": 14865, "wall": 34870.9} {"step": 7910, "train_loss": 3.514340877532959, "lr": 0.0003534746825273111, "tps": 14865, "wall": 34876.0} {"step": 7911, "train_loss": 3.547628879547119, "lr": 0.0003534618282072914, "tps": 14865, "wall": 34881.0} {"step": 7912, "train_loss": 3.6437458992004395, "lr": 0.0003534489723754089, "tps": 14865, "wall": 34886.0} {"step": 7913, "train_loss": 3.6083171367645264, "lr": 0.00035343611503180927, "tps": 14864, "wall": 34891.0} {"step": 7914, "train_loss": 3.5722575187683105, "lr": 0.00035342325617663807, "tps": 14864, "wall": 34896.0} {"step": 7915, "train_loss": 3.5534887313842773, "lr": 0.000353410395810041, "tps": 14864, "wall": 34901.0} {"step": 7916, "train_loss": 3.5610532760620117, "lr": 0.00035339753393216376, "tps": 14864, "wall": 34906.0} {"step": 7917, "train_loss": 3.5728635787963867, "lr": 0.000353384670543152, "tps": 14863, "wall": 34910.8} {"step": 7918, "train_loss": 3.478360176086426, "lr": 0.00035337180564315153, "tps": 14863, "wall": 34915.7} {"step": 7919, "train_loss": 3.5531482696533203, "lr": 0.00035335893923230804, "tps": 14863, "wall": 34920.5} {"step": 7920, "train_loss": 3.7008886337280273, "lr": 0.00035334607131076723, "tps": 14863, "wall": 34925.4} {"step": 7921, "train_loss": 3.6164445877075195, "lr": 0.0003533332018786749, "tps": 14863, "wall": 34930.2} {"step": 7922, "train_loss": 3.643214464187622, "lr": 0.0003533203309361769, "tps": 14863, "wall": 34935.1} {"step": 7923, "train_loss": 3.6113100051879883, "lr": 0.00035330745848341895, "tps": 14862, "wall": 34940.1} {"step": 7924, "train_loss": 3.5991740226745605, "lr": 0.00035329458452054696, "tps": 14862, "wall": 34945.2} {"step": 7925, "train_loss": 3.546510696411133, "lr": 0.0003532817090477066, "tps": 14862, "wall": 34950.2} {"step": 7926, "train_loss": 3.5488638877868652, "lr": 0.0003532688320650439, "tps": 14861, "wall": 34955.2} {"step": 7927, "train_loss": 3.7105624675750732, "lr": 0.00035325595357270465, "tps": 14861, "wall": 34960.2} {"step": 7928, "train_loss": 3.55755615234375, "lr": 0.0003532430735708347, "tps": 14861, "wall": 34965.2} {"step": 7929, "train_loss": 3.5575461387634277, "lr": 0.00035323019205958005, "tps": 14861, "wall": 34970.3} {"step": 7930, "train_loss": 3.7032129764556885, "lr": 0.0003532173090390866, "tps": 14860, "wall": 34975.5} {"step": 7931, "train_loss": 3.5802197456359863, "lr": 0.00035320442450950017, "tps": 14860, "wall": 34980.5} {"step": 7932, "train_loss": 3.647369623184204, "lr": 0.0003531915384709669, "tps": 14860, "wall": 34985.6} {"step": 7933, "train_loss": 3.592127799987793, "lr": 0.00035317865092363265, "tps": 14860, "wall": 34990.5} {"step": 7934, "train_loss": 3.644988536834717, "lr": 0.0003531657618676434, "tps": 14859, "wall": 34995.5} {"step": 7935, "train_loss": 3.547391653060913, "lr": 0.00035315287130314527, "tps": 14859, "wall": 35000.5} {"step": 7936, "train_loss": 3.6074178218841553, "lr": 0.0003531399792302842, "tps": 14859, "wall": 35005.5} {"step": 7937, "train_loss": 3.5308938026428223, "lr": 0.00035312708564920627, "tps": 14859, "wall": 35010.5} {"step": 7938, "train_loss": 3.610502243041992, "lr": 0.0003531141905600574, "tps": 14858, "wall": 35015.6} {"step": 7939, "train_loss": 3.5889430046081543, "lr": 0.00035310129396298387, "tps": 14858, "wall": 35020.9} {"step": 7940, "train_loss": 3.6792526245117188, "lr": 0.00035308839585813164, "tps": 14858, "wall": 35026.1} {"step": 7941, "train_loss": 3.513400077819824, "lr": 0.00035307549624564685, "tps": 14857, "wall": 35031.4} {"step": 7942, "train_loss": 3.590392827987671, "lr": 0.00035306259512567564, "tps": 14857, "wall": 35036.7} {"step": 7943, "train_loss": 3.5647974014282227, "lr": 0.00035304969249836424, "tps": 14857, "wall": 35041.9} {"step": 7944, "train_loss": 3.5861141681671143, "lr": 0.0003530367883638586, "tps": 14856, "wall": 35047.0} {"step": 7945, "train_loss": 3.50836181640625, "lr": 0.0003530238827223051, "tps": 14856, "wall": 35052.1} {"step": 7946, "train_loss": 3.4903292655944824, "lr": 0.00035301097557384985, "tps": 14856, "wall": 35057.1} {"step": 7947, "train_loss": 3.624526023864746, "lr": 0.00035299806691863907, "tps": 14855, "wall": 35062.4} {"step": 7948, "train_loss": 3.545714855194092, "lr": 0.000352985156756819, "tps": 14855, "wall": 35067.5} {"step": 7949, "train_loss": 3.5968215465545654, "lr": 0.00035297224508853585, "tps": 14855, "wall": 35072.5} {"step": 7950, "train_loss": 3.4728283882141113, "lr": 0.0003529593319139359, "tps": 14855, "wall": 35077.4} {"step": 7951, "train_loss": 3.620948553085327, "lr": 0.00035294641723316553, "tps": 14854, "wall": 35082.3} {"step": 7952, "train_loss": 3.5221152305603027, "lr": 0.0003529335010463709, "tps": 14854, "wall": 35087.1} {"step": 7953, "train_loss": 3.536004066467285, "lr": 0.00035292058335369836, "tps": 14854, "wall": 35092.0} {"step": 7954, "train_loss": 3.5568199157714844, "lr": 0.0003529076641552943, "tps": 14854, "wall": 35097.0} {"step": 7955, "train_loss": 3.6327965259552, "lr": 0.00035289474345130505, "tps": 14853, "wall": 35102.0} {"step": 7956, "train_loss": 3.612771987915039, "lr": 0.0003528818212418769, "tps": 14853, "wall": 35106.8} {"step": 7957, "train_loss": 3.5067553520202637, "lr": 0.0003528688975271563, "tps": 14853, "wall": 35111.7} {"step": 7958, "train_loss": 3.648301601409912, "lr": 0.0003528559723072897, "tps": 14853, "wall": 35116.6} {"step": 7959, "train_loss": 3.545640468597412, "lr": 0.0003528430455824234, "tps": 14853, "wall": 35121.4} {"step": 7960, "train_loss": 3.643122434616089, "lr": 0.0003528301173527039, "tps": 14853, "wall": 35126.3} {"step": 7961, "train_loss": 3.6791436672210693, "lr": 0.00035281718761827764, "tps": 14852, "wall": 35131.3} {"step": 7962, "train_loss": 3.563861608505249, "lr": 0.000352804256379291, "tps": 14852, "wall": 35136.3} {"step": 7963, "train_loss": 3.5097670555114746, "lr": 0.00035279132363589074, "tps": 14852, "wall": 35141.4} {"step": 7964, "train_loss": 3.61019229888916, "lr": 0.0003527783893882231, "tps": 14852, "wall": 35146.3} {"step": 7965, "train_loss": 3.586395740509033, "lr": 0.0003527654536364346, "tps": 14851, "wall": 35151.3} {"step": 7966, "train_loss": 3.686469554901123, "lr": 0.000352752516380672, "tps": 14851, "wall": 35156.4} {"step": 7967, "train_loss": 3.499451160430908, "lr": 0.0003527395776210817, "tps": 14851, "wall": 35161.5} {"step": 7968, "train_loss": 3.590489387512207, "lr": 0.0003527266373578102, "tps": 14850, "wall": 35166.4} {"step": 7969, "train_loss": 3.655648946762085, "lr": 0.0003527136955910042, "tps": 14850, "wall": 35171.5} {"step": 7970, "train_loss": 3.6415812969207764, "lr": 0.00035270075232081026, "tps": 14850, "wall": 35176.5} {"step": 7971, "train_loss": 3.55902099609375, "lr": 0.0003526878075473751, "tps": 14850, "wall": 35181.5} {"step": 7972, "train_loss": 3.549344778060913, "lr": 0.00035267486127084515, "tps": 14849, "wall": 35186.5} {"step": 7973, "train_loss": 3.561138153076172, "lr": 0.0003526619134913673, "tps": 14849, "wall": 35191.5} {"step": 7974, "train_loss": 3.6530115604400635, "lr": 0.00035264896420908806, "tps": 14849, "wall": 35196.5} {"step": 7975, "train_loss": 3.5366127490997314, "lr": 0.00035263601342415423, "tps": 14849, "wall": 35201.5} {"step": 7976, "train_loss": 3.64058780670166, "lr": 0.0003526230611367125, "tps": 14848, "wall": 35206.5} {"step": 7977, "train_loss": 3.5276317596435547, "lr": 0.0003526101073469094, "tps": 14848, "wall": 35211.4} {"step": 7978, "train_loss": 3.6119394302368164, "lr": 0.00035259715205489196, "tps": 14848, "wall": 35216.5} {"step": 7979, "train_loss": 3.5765488147735596, "lr": 0.0003525841952608068, "tps": 14848, "wall": 35221.5} {"step": 7980, "train_loss": 3.7542381286621094, "lr": 0.00035257123696480063, "tps": 14847, "wall": 35226.5} {"step": 7981, "train_loss": 3.6119446754455566, "lr": 0.0003525582771670204, "tps": 14847, "wall": 35231.5} {"step": 7982, "train_loss": 3.627509117126465, "lr": 0.0003525453158676128, "tps": 14847, "wall": 35236.6} {"step": 7983, "train_loss": 3.600576400756836, "lr": 0.00035253235306672464, "tps": 14847, "wall": 35241.6} {"step": 7984, "train_loss": 3.6048476696014404, "lr": 0.0003525193887645029, "tps": 14846, "wall": 35246.6} {"step": 7985, "train_loss": 3.5859057903289795, "lr": 0.0003525064229610943, "tps": 14846, "wall": 35251.6} {"step": 7986, "train_loss": 3.4614439010620117, "lr": 0.0003524934556566458, "tps": 14846, "wall": 35256.6} {"step": 7987, "train_loss": 3.57529878616333, "lr": 0.00035248048685130424, "tps": 14846, "wall": 35261.6} {"step": 7988, "train_loss": 3.6699490547180176, "lr": 0.00035246751654521656, "tps": 14845, "wall": 35266.6} {"step": 7989, "train_loss": 3.605451822280884, "lr": 0.00035245454473852966, "tps": 14845, "wall": 35271.6} {"step": 7990, "train_loss": 3.5500454902648926, "lr": 0.00035244157143139065, "tps": 14845, "wall": 35276.6} {"step": 7991, "train_loss": 3.573322296142578, "lr": 0.00035242859662394616, "tps": 14845, "wall": 35281.6} {"step": 7992, "train_loss": 3.574498176574707, "lr": 0.0003524156203163435, "tps": 14845, "wall": 35286.6} {"step": 7993, "train_loss": 3.654060125350952, "lr": 0.0003524026425087295, "tps": 14844, "wall": 35291.5} {"step": 7994, "train_loss": 3.6472764015197754, "lr": 0.0003523896632012512, "tps": 14844, "wall": 35296.5} {"step": 7995, "train_loss": 3.6493494510650635, "lr": 0.0003523766823940556, "tps": 14844, "wall": 35301.5} {"step": 7996, "train_loss": 3.634290933609009, "lr": 0.0003523637000872898, "tps": 14844, "wall": 35306.5} {"step": 7997, "train_loss": 3.5752248764038086, "lr": 0.00035235071628110086, "tps": 14843, "wall": 35311.4} {"step": 7998, "train_loss": 3.6909608840942383, "lr": 0.00035233773097563585, "tps": 14843, "wall": 35316.4} {"step": 7999, "train_loss": 3.5687503814697266, "lr": 0.00035232474417104184, "tps": 14843, "wall": 35321.4} {"step": 8000, "train_loss": 3.6296088695526123, "lr": 0.00035231175586746596, "tps": 14843, "wall": 35326.3, "val_loss_monitor": 3.604597478708445} {"step": 8001, "train_loss": 3.593122959136963, "lr": 0.0003522987660650554, "tps": 14822, "wall": 35379.2} {"step": 8002, "train_loss": 3.6386003494262695, "lr": 0.0003522857747639572, "tps": 14822, "wall": 35384.2} {"step": 8003, "train_loss": 3.537245035171509, "lr": 0.0003522727819643186, "tps": 14822, "wall": 35389.3} {"step": 8004, "train_loss": 3.6100547313690186, "lr": 0.0003522597876662868, "tps": 14821, "wall": 35394.4} {"step": 8005, "train_loss": 3.611814498901367, "lr": 0.000352246791870009, "tps": 14821, "wall": 35399.4} {"step": 8006, "train_loss": 3.5304088592529297, "lr": 0.0003522337945756323, "tps": 14821, "wall": 35404.5} {"step": 8007, "train_loss": 3.5566742420196533, "lr": 0.0003522207957833041, "tps": 14821, "wall": 35409.6} {"step": 8008, "train_loss": 3.626307487487793, "lr": 0.0003522077954931715, "tps": 14820, "wall": 35414.7} {"step": 8009, "train_loss": 3.605459690093994, "lr": 0.0003521947937053819, "tps": 14820, "wall": 35419.7} {"step": 8010, "train_loss": 3.6636345386505127, "lr": 0.0003521817904200825, "tps": 14820, "wall": 35424.8} {"step": 8011, "train_loss": 3.5855579376220703, "lr": 0.00035216878563742066, "tps": 14820, "wall": 35429.9} {"step": 8012, "train_loss": 3.5217995643615723, "lr": 0.0003521557793575436, "tps": 14819, "wall": 35435.0} {"step": 8013, "train_loss": 3.559777021408081, "lr": 0.0003521427715805988, "tps": 14819, "wall": 35440.1} {"step": 8014, "train_loss": 3.6078877449035645, "lr": 0.0003521297623067335, "tps": 14819, "wall": 35445.1} {"step": 8015, "train_loss": 3.5675206184387207, "lr": 0.00035211675153609505, "tps": 14819, "wall": 35450.2} {"step": 8016, "train_loss": 3.5212814807891846, "lr": 0.0003521037392688309, "tps": 14818, "wall": 35455.3} {"step": 8017, "train_loss": 3.549067497253418, "lr": 0.0003520907255050885, "tps": 14818, "wall": 35460.3} {"step": 8018, "train_loss": 3.581188440322876, "lr": 0.0003520777102450152, "tps": 14818, "wall": 35465.4} {"step": 8019, "train_loss": 3.525632619857788, "lr": 0.00035206469348875847, "tps": 14817, "wall": 35470.5} {"step": 8020, "train_loss": 3.540052890777588, "lr": 0.00035205167523646573, "tps": 14817, "wall": 35475.6} {"step": 8021, "train_loss": 3.6446876525878906, "lr": 0.0003520386554882845, "tps": 14817, "wall": 35480.6} {"step": 8022, "train_loss": 3.6180622577667236, "lr": 0.00035202563424436217, "tps": 14817, "wall": 35485.6} {"step": 8023, "train_loss": 3.610116958618164, "lr": 0.00035201261150484634, "tps": 14816, "wall": 35490.6} {"step": 8024, "train_loss": 3.5519540309906006, "lr": 0.0003519995872698846, "tps": 14816, "wall": 35495.7} {"step": 8025, "train_loss": 3.699282646179199, "lr": 0.00035198656153962425, "tps": 14816, "wall": 35500.7} {"step": 8026, "train_loss": 3.5454249382019043, "lr": 0.00035197353431421305, "tps": 14816, "wall": 35505.7} {"step": 8027, "train_loss": 3.5818819999694824, "lr": 0.0003519605055937985, "tps": 14815, "wall": 35510.8} {"step": 8028, "train_loss": 3.583580255508423, "lr": 0.00035194747537852823, "tps": 14815, "wall": 35515.8} {"step": 8029, "train_loss": 3.567873001098633, "lr": 0.0003519344436685498, "tps": 14815, "wall": 35520.9} {"step": 8030, "train_loss": 3.670227289199829, "lr": 0.0003519214104640109, "tps": 14815, "wall": 35525.9} {"step": 8031, "train_loss": 3.5019290447235107, "lr": 0.00035190837576505905, "tps": 14814, "wall": 35530.9} {"step": 8032, "train_loss": 3.672123908996582, "lr": 0.00035189533957184207, "tps": 14814, "wall": 35536.0} {"step": 8033, "train_loss": 3.4690895080566406, "lr": 0.0003518823018845075, "tps": 14814, "wall": 35541.0} {"step": 8034, "train_loss": 3.679675579071045, "lr": 0.00035186926270320304, "tps": 14814, "wall": 35546.0} {"step": 8035, "train_loss": 3.5879876613616943, "lr": 0.0003518562220280765, "tps": 14813, "wall": 35551.0} {"step": 8036, "train_loss": 3.5766406059265137, "lr": 0.00035184317985927554, "tps": 14813, "wall": 35556.0} {"step": 8037, "train_loss": 3.5808181762695312, "lr": 0.00035183013619694784, "tps": 14813, "wall": 35561.0} {"step": 8038, "train_loss": 3.572880744934082, "lr": 0.00035181709104124126, "tps": 14813, "wall": 35566.0} {"step": 8039, "train_loss": 3.5787668228149414, "lr": 0.00035180404439230363, "tps": 14812, "wall": 35571.2} {"step": 8040, "train_loss": 3.4662909507751465, "lr": 0.0003517909962502825, "tps": 14812, "wall": 35576.2} {"step": 8041, "train_loss": 3.5633087158203125, "lr": 0.00035177794661532595, "tps": 14812, "wall": 35581.6} {"step": 8042, "train_loss": 3.5320029258728027, "lr": 0.0003517648954875816, "tps": 14811, "wall": 35586.9} {"step": 8043, "train_loss": 3.4945051670074463, "lr": 0.0003517518428671975, "tps": 14811, "wall": 35592.2} {"step": 8044, "train_loss": 3.510395050048828, "lr": 0.0003517387887543213, "tps": 14811, "wall": 35597.4} {"step": 8045, "train_loss": 3.676112174987793, "lr": 0.000351725733149101, "tps": 14810, "wall": 35602.7} {"step": 8046, "train_loss": 3.680732011795044, "lr": 0.00035171267605168453, "tps": 14810, "wall": 35608.1} {"step": 8047, "train_loss": 3.5612123012542725, "lr": 0.00035169961746221967, "tps": 14810, "wall": 35613.3} {"step": 8048, "train_loss": 3.593893051147461, "lr": 0.00035168655738085445, "tps": 14809, "wall": 35618.6} {"step": 8049, "train_loss": 3.5100696086883545, "lr": 0.00035167349580773676, "tps": 14809, "wall": 35623.8} {"step": 8050, "train_loss": 3.5608434677124023, "lr": 0.0003516604327430146, "tps": 14808, "wall": 35629.1} {"step": 8051, "train_loss": 3.5829200744628906, "lr": 0.0003516473681868359, "tps": 14808, "wall": 35634.2} {"step": 8052, "train_loss": 3.6041455268859863, "lr": 0.0003516343021393488, "tps": 14808, "wall": 35639.3} {"step": 8053, "train_loss": 3.4793922901153564, "lr": 0.00035162123460070105, "tps": 14808, "wall": 35644.4} {"step": 8054, "train_loss": 3.679189920425415, "lr": 0.0003516081655710409, "tps": 14807, "wall": 35649.7} {"step": 8055, "train_loss": 3.5729923248291016, "lr": 0.00035159509505051635, "tps": 14807, "wall": 35655.0} {"step": 8056, "train_loss": 3.5319647789001465, "lr": 0.0003515820230392755, "tps": 14807, "wall": 35660.2} {"step": 8057, "train_loss": 3.600985527038574, "lr": 0.00035156894953746625, "tps": 14806, "wall": 35665.4} {"step": 8058, "train_loss": 3.474374771118164, "lr": 0.00035155587454523693, "tps": 14806, "wall": 35670.4} {"step": 8059, "train_loss": 3.4180335998535156, "lr": 0.0003515427980627355, "tps": 14806, "wall": 35675.4} {"step": 8060, "train_loss": 3.5825071334838867, "lr": 0.0003515297200901101, "tps": 14806, "wall": 35680.4} {"step": 8061, "train_loss": 3.535402774810791, "lr": 0.00035151664062750895, "tps": 14805, "wall": 35685.4} {"step": 8062, "train_loss": 3.5881540775299072, "lr": 0.0003515035596750802, "tps": 14805, "wall": 35690.4} {"step": 8063, "train_loss": 3.5665910243988037, "lr": 0.000351490477232972, "tps": 14805, "wall": 35695.5} {"step": 8064, "train_loss": 3.5957956314086914, "lr": 0.0003514773933013326, "tps": 14805, "wall": 35700.5} {"step": 8065, "train_loss": 3.4870309829711914, "lr": 0.00035146430788031007, "tps": 14804, "wall": 35705.5} {"step": 8066, "train_loss": 3.6082448959350586, "lr": 0.0003514512209700529, "tps": 14804, "wall": 35710.5} {"step": 8067, "train_loss": 3.5108723640441895, "lr": 0.000351438132570709, "tps": 14804, "wall": 35715.5} {"step": 8068, "train_loss": 3.61618709564209, "lr": 0.0003514250426824269, "tps": 14804, "wall": 35720.5} {"step": 8069, "train_loss": 3.5511412620544434, "lr": 0.00035141195130535484, "tps": 14803, "wall": 35725.5} {"step": 8070, "train_loss": 3.50071382522583, "lr": 0.0003513988584396411, "tps": 14803, "wall": 35730.5} {"step": 8071, "train_loss": 3.4680545330047607, "lr": 0.000351385764085434, "tps": 14803, "wall": 35735.5} {"step": 8072, "train_loss": 3.716442108154297, "lr": 0.00035137266824288173, "tps": 14803, "wall": 35740.5} {"step": 8073, "train_loss": 3.5858571529388428, "lr": 0.00035135957091213287, "tps": 14802, "wall": 35745.4} {"step": 8074, "train_loss": 3.670501232147217, "lr": 0.00035134647209333566, "tps": 14802, "wall": 35750.4} {"step": 8075, "train_loss": 3.5848875045776367, "lr": 0.00035133337178663854, "tps": 14802, "wall": 35755.6} {"step": 8076, "train_loss": 3.5855298042297363, "lr": 0.0003513202699921898, "tps": 14802, "wall": 35760.5} {"step": 8077, "train_loss": 3.560492753982544, "lr": 0.000351307166710138, "tps": 14802, "wall": 35765.4} {"step": 8078, "train_loss": 3.553854465484619, "lr": 0.0003512940619406315, "tps": 14801, "wall": 35770.3} {"step": 8079, "train_loss": 3.519502639770508, "lr": 0.0003512809556838188, "tps": 14801, "wall": 35775.3} {"step": 8080, "train_loss": 3.6767971515655518, "lr": 0.00035126784793984827, "tps": 14801, "wall": 35780.1} {"step": 8081, "train_loss": 3.750561475753784, "lr": 0.0003512547387088685, "tps": 14801, "wall": 35785.0} {"step": 8082, "train_loss": 3.5639357566833496, "lr": 0.0003512416279910279, "tps": 14801, "wall": 35789.8} {"step": 8083, "train_loss": 3.6556925773620605, "lr": 0.0003512285157864751, "tps": 14800, "wall": 35794.7} {"step": 8084, "train_loss": 3.521949052810669, "lr": 0.0003512154020953586, "tps": 14800, "wall": 35799.5} {"step": 8085, "train_loss": 3.591461658477783, "lr": 0.0003512022869178268, "tps": 14800, "wall": 35804.4} {"step": 8086, "train_loss": 3.6455039978027344, "lr": 0.00035118917025402845, "tps": 14800, "wall": 35809.2} {"step": 8087, "train_loss": 3.615884780883789, "lr": 0.0003511760521041121, "tps": 14800, "wall": 35814.1} {"step": 8088, "train_loss": 3.679652690887451, "lr": 0.0003511629324682263, "tps": 14800, "wall": 35818.9} {"step": 8089, "train_loss": 3.5220947265625, "lr": 0.0003511498113465198, "tps": 14799, "wall": 35823.8} {"step": 8090, "train_loss": 3.5555005073547363, "lr": 0.00035113668873914107, "tps": 14799, "wall": 35828.7} {"step": 8091, "train_loss": 3.5665154457092285, "lr": 0.00035112356464623884, "tps": 14799, "wall": 35833.5} {"step": 8092, "train_loss": 3.644116163253784, "lr": 0.00035111043906796175, "tps": 14799, "wall": 35838.4} {"step": 8093, "train_loss": 3.5244150161743164, "lr": 0.00035109731200445854, "tps": 14799, "wall": 35843.2} {"step": 8094, "train_loss": 3.591315746307373, "lr": 0.0003510841834558779, "tps": 14798, "wall": 35848.0} {"step": 8095, "train_loss": 3.5622212886810303, "lr": 0.0003510710534223685, "tps": 14798, "wall": 35852.9} {"step": 8096, "train_loss": 3.613647937774658, "lr": 0.00035105792190407917, "tps": 14798, "wall": 35857.8} {"step": 8097, "train_loss": 3.442241668701172, "lr": 0.00035104478890115866, "tps": 14798, "wall": 35862.6} {"step": 8098, "train_loss": 3.6119909286499023, "lr": 0.0003510316544137556, "tps": 14798, "wall": 35867.4} {"step": 8099, "train_loss": 3.4820244312286377, "lr": 0.00035101851844201884, "tps": 14798, "wall": 35872.3} {"step": 8100, "train_loss": 3.5544586181640625, "lr": 0.00035100538098609726, "tps": 14797, "wall": 35877.1} {"step": 8101, "train_loss": 3.581000328063965, "lr": 0.00035099224204613964, "tps": 14797, "wall": 35882.0} {"step": 8102, "train_loss": 3.5612099170684814, "lr": 0.00035097910162229485, "tps": 14797, "wall": 35886.8} {"step": 8103, "train_loss": 3.5407052040100098, "lr": 0.00035096595971471163, "tps": 14797, "wall": 35891.7} {"step": 8104, "train_loss": 3.5921525955200195, "lr": 0.000350952816323539, "tps": 14797, "wall": 35896.5} {"step": 8105, "train_loss": 3.7229807376861572, "lr": 0.0003509396714489258, "tps": 14797, "wall": 35901.4} {"step": 8106, "train_loss": 3.614352226257324, "lr": 0.00035092652509102084, "tps": 14796, "wall": 35906.2} {"step": 8107, "train_loss": 3.572585105895996, "lr": 0.00035091337724997324, "tps": 14796, "wall": 35911.1} {"step": 8108, "train_loss": 3.6232123374938965, "lr": 0.0003509002279259317, "tps": 14796, "wall": 35916.0} {"step": 8109, "train_loss": 3.5819106101989746, "lr": 0.00035088707711904534, "tps": 14796, "wall": 35920.8} {"step": 8110, "train_loss": 3.5475192070007324, "lr": 0.0003508739248294631, "tps": 14796, "wall": 35925.7} {"step": 8111, "train_loss": 3.621445894241333, "lr": 0.00035086077105733396, "tps": 14795, "wall": 35930.6} {"step": 8112, "train_loss": 3.5595016479492188, "lr": 0.0003508476158028069, "tps": 14795, "wall": 35935.5} {"step": 8113, "train_loss": 3.582969903945923, "lr": 0.00035083445906603097, "tps": 14795, "wall": 35940.4} {"step": 8114, "train_loss": 3.6154983043670654, "lr": 0.0003508213008471552, "tps": 14795, "wall": 35945.3} {"step": 8115, "train_loss": 3.6831297874450684, "lr": 0.0003508081411463287, "tps": 14795, "wall": 35950.2} {"step": 8116, "train_loss": 3.5644989013671875, "lr": 0.0003507949799637005, "tps": 14795, "wall": 35955.0} {"step": 8117, "train_loss": 3.5845742225646973, "lr": 0.00035078181729941964, "tps": 14794, "wall": 35959.9} {"step": 8118, "train_loss": 3.5752975940704346, "lr": 0.0003507686531536353, "tps": 14794, "wall": 35964.8} {"step": 8119, "train_loss": 3.550506591796875, "lr": 0.0003507554875264966, "tps": 14794, "wall": 35969.6} {"step": 8120, "train_loss": 3.6128897666931152, "lr": 0.00035074232041815265, "tps": 14794, "wall": 35974.5} {"step": 8121, "train_loss": 3.678041458129883, "lr": 0.0003507291518287526, "tps": 14794, "wall": 35979.3} {"step": 8122, "train_loss": 3.596785068511963, "lr": 0.0003507159817584457, "tps": 14793, "wall": 35984.1} {"step": 8123, "train_loss": 3.6033153533935547, "lr": 0.00035070281020738105, "tps": 14793, "wall": 35989.0} {"step": 8124, "train_loss": 3.522508144378662, "lr": 0.00035068963717570787, "tps": 14793, "wall": 35993.8} {"step": 8125, "train_loss": 3.620882034301758, "lr": 0.0003506764626635755, "tps": 14793, "wall": 35998.9} {"step": 8126, "train_loss": 3.4420337677001953, "lr": 0.00035066328667113304, "tps": 14793, "wall": 36003.9} {"step": 8127, "train_loss": 3.5688650608062744, "lr": 0.00035065010919852976, "tps": 14792, "wall": 36008.8} {"step": 8128, "train_loss": 3.548945426940918, "lr": 0.00035063693024591506, "tps": 14792, "wall": 36013.8} {"step": 8129, "train_loss": 3.5891640186309814, "lr": 0.00035062374981343806, "tps": 14792, "wall": 36018.8} {"step": 8130, "train_loss": 3.6356072425842285, "lr": 0.0003506105679012482, "tps": 14792, "wall": 36023.8} {"step": 8131, "train_loss": 3.6154439449310303, "lr": 0.00035059738450949474, "tps": 14792, "wall": 36028.7} {"step": 8132, "train_loss": 3.599564552307129, "lr": 0.0003505841996383271, "tps": 14791, "wall": 36033.7} {"step": 8133, "train_loss": 3.560121536254883, "lr": 0.0003505710132878945, "tps": 14791, "wall": 36038.7} {"step": 8134, "train_loss": 3.584146022796631, "lr": 0.00035055782545834646, "tps": 14791, "wall": 36043.7} {"step": 8135, "train_loss": 3.6214120388031006, "lr": 0.00035054463614983224, "tps": 14791, "wall": 36048.7} {"step": 8136, "train_loss": 3.6074459552764893, "lr": 0.00035053144536250144, "tps": 14790, "wall": 36053.6} {"step": 8137, "train_loss": 3.544952869415283, "lr": 0.00035051825309650325, "tps": 14790, "wall": 36058.7} {"step": 8138, "train_loss": 3.6629810333251953, "lr": 0.0003505050593519873, "tps": 14790, "wall": 36063.7} {"step": 8139, "train_loss": 3.510468006134033, "lr": 0.0003504918641291029, "tps": 14790, "wall": 36068.7} {"step": 8140, "train_loss": 3.5644845962524414, "lr": 0.0003504786674279997, "tps": 14789, "wall": 36073.7} {"step": 8141, "train_loss": 3.6162643432617188, "lr": 0.000350465469248827, "tps": 14789, "wall": 36078.7} {"step": 8142, "train_loss": 3.640066623687744, "lr": 0.0003504522695917345, "tps": 14789, "wall": 36083.7} {"step": 8143, "train_loss": 3.645524024963379, "lr": 0.00035043906845687154, "tps": 14789, "wall": 36088.6} {"step": 8144, "train_loss": 3.646958112716675, "lr": 0.0003504258658443878, "tps": 14789, "wall": 36093.6} {"step": 8145, "train_loss": 3.471257209777832, "lr": 0.00035041266175443275, "tps": 14788, "wall": 36098.6} {"step": 8146, "train_loss": 3.53433895111084, "lr": 0.00035039945618715613, "tps": 14788, "wall": 36103.6} {"step": 8147, "train_loss": 3.5804502964019775, "lr": 0.0003503862491427074, "tps": 14788, "wall": 36108.5} {"step": 8148, "train_loss": 3.638047218322754, "lr": 0.00035037304062123604, "tps": 14788, "wall": 36113.5} {"step": 8149, "train_loss": 3.633998155593872, "lr": 0.000350359830622892, "tps": 14787, "wall": 36118.6} {"step": 8150, "train_loss": 3.5596137046813965, "lr": 0.0003503466191478246, "tps": 14787, "wall": 36123.6} {"step": 8151, "train_loss": 3.6013965606689453, "lr": 0.0003503334061961837, "tps": 14787, "wall": 36128.6} {"step": 8152, "train_loss": 3.572408437728882, "lr": 0.00035032019176811896, "tps": 14787, "wall": 36133.6} {"step": 8153, "train_loss": 3.6086177825927734, "lr": 0.00035030697586377996, "tps": 14786, "wall": 36138.6} {"step": 8154, "train_loss": 3.5876030921936035, "lr": 0.0003502937584833166, "tps": 14786, "wall": 36143.6} {"step": 8155, "train_loss": 3.591353178024292, "lr": 0.0003502805396268784, "tps": 14786, "wall": 36148.6} {"step": 8156, "train_loss": 3.50850772857666, "lr": 0.0003502673192946153, "tps": 14786, "wall": 36153.6} {"step": 8157, "train_loss": 3.4479358196258545, "lr": 0.0003502540974866768, "tps": 14786, "wall": 36158.7} {"step": 8158, "train_loss": 3.6343204975128174, "lr": 0.00035024087420321295, "tps": 14785, "wall": 36163.7} {"step": 8159, "train_loss": 3.5175788402557373, "lr": 0.0003502276494443734, "tps": 14785, "wall": 36168.8} {"step": 8160, "train_loss": 3.5889461040496826, "lr": 0.00035021442321030806, "tps": 14785, "wall": 36174.0} {"step": 8161, "train_loss": 3.566161632537842, "lr": 0.0003502011955011666, "tps": 14784, "wall": 36179.1} {"step": 8162, "train_loss": 3.56256103515625, "lr": 0.00035018796631709894, "tps": 14784, "wall": 36184.0} {"step": 8163, "train_loss": 3.620744228363037, "lr": 0.00035017473565825504, "tps": 14784, "wall": 36188.8} {"step": 8164, "train_loss": 3.6029536724090576, "lr": 0.0003501615035247846, "tps": 14784, "wall": 36193.6} {"step": 8165, "train_loss": 3.547907829284668, "lr": 0.00035014826991683774, "tps": 14784, "wall": 36198.4} {"step": 8166, "train_loss": 3.5258538722991943, "lr": 0.0003501350348345641, "tps": 14784, "wall": 36203.4} {"step": 8167, "train_loss": 3.4987380504608154, "lr": 0.0003501217982781138, "tps": 14783, "wall": 36208.2} {"step": 8168, "train_loss": 3.4844303131103516, "lr": 0.00035010856024763676, "tps": 14783, "wall": 36213.0} {"step": 8169, "train_loss": 3.5557355880737305, "lr": 0.0003500953207432829, "tps": 14783, "wall": 36217.8} {"step": 8170, "train_loss": 3.449471950531006, "lr": 0.00035008207976520213, "tps": 14783, "wall": 36222.6} {"step": 8171, "train_loss": 3.583150625228882, "lr": 0.0003500688373135446, "tps": 14783, "wall": 36227.5} {"step": 8172, "train_loss": 3.4977145195007324, "lr": 0.00035005559338846027, "tps": 14783, "wall": 36232.3} {"step": 8173, "train_loss": 3.552295207977295, "lr": 0.00035004234799009904, "tps": 14782, "wall": 36237.2} {"step": 8174, "train_loss": 3.5895485877990723, "lr": 0.00035002910111861117, "tps": 14782, "wall": 36242.1} {"step": 8175, "train_loss": 3.6157968044281006, "lr": 0.00035001585277414656, "tps": 14782, "wall": 36246.9} {"step": 8176, "train_loss": 3.5603322982788086, "lr": 0.00035000260295685526, "tps": 14782, "wall": 36251.8} {"step": 8177, "train_loss": 3.5065150260925293, "lr": 0.00034998935166688754, "tps": 14782, "wall": 36256.7} {"step": 8178, "train_loss": 3.5445985794067383, "lr": 0.00034997609890439335, "tps": 14782, "wall": 36261.6} {"step": 8179, "train_loss": 3.5459916591644287, "lr": 0.00034996284466952296, "tps": 14781, "wall": 36266.4} {"step": 8180, "train_loss": 3.595451593399048, "lr": 0.00034994958896242636, "tps": 14781, "wall": 36271.3} {"step": 8181, "train_loss": 3.4734103679656982, "lr": 0.00034993633178325383, "tps": 14781, "wall": 36276.1} {"step": 8182, "train_loss": 3.519932508468628, "lr": 0.0003499230731321554, "tps": 14781, "wall": 36281.0} {"step": 8183, "train_loss": 3.586013078689575, "lr": 0.00034990981300928156, "tps": 14781, "wall": 36285.8} {"step": 8184, "train_loss": 3.640058755874634, "lr": 0.00034989655141478226, "tps": 14781, "wall": 36290.6} {"step": 8185, "train_loss": 3.59694242477417, "lr": 0.00034988328834880766, "tps": 14780, "wall": 36295.6} {"step": 8186, "train_loss": 3.5362112522125244, "lr": 0.0003498700238115083, "tps": 14780, "wall": 36300.4} {"step": 8187, "train_loss": 3.6009788513183594, "lr": 0.0003498567578030342, "tps": 14780, "wall": 36305.2} {"step": 8188, "train_loss": 3.624134063720703, "lr": 0.0003498434903235358, "tps": 14780, "wall": 36310.1} {"step": 8189, "train_loss": 3.464168071746826, "lr": 0.0003498302213731632, "tps": 14780, "wall": 36314.9} {"step": 8190, "train_loss": 3.599500894546509, "lr": 0.00034981695095206696, "tps": 14779, "wall": 36319.8} {"step": 8191, "train_loss": 3.660562753677368, "lr": 0.0003498036790603972, "tps": 14779, "wall": 36324.6} {"step": 8192, "train_loss": 3.61822509765625, "lr": 0.0003497904056983043, "tps": 14779, "wall": 36329.4} {"step": 8193, "train_loss": 3.579592227935791, "lr": 0.0003497771308659388, "tps": 14779, "wall": 36334.3} {"step": 8194, "train_loss": 3.613184690475464, "lr": 0.0003497638545634509, "tps": 14779, "wall": 36339.1} {"step": 8195, "train_loss": 3.5844156742095947, "lr": 0.00034975057679099096, "tps": 14779, "wall": 36344.0} {"step": 8196, "train_loss": 3.5366597175598145, "lr": 0.0003497372975487095, "tps": 14778, "wall": 36348.8} {"step": 8197, "train_loss": 3.5505282878875732, "lr": 0.00034972401683675697, "tps": 14778, "wall": 36353.6} {"step": 8198, "train_loss": 3.628157138824463, "lr": 0.00034971073465528364, "tps": 14778, "wall": 36358.5} {"step": 8199, "train_loss": 3.6115341186523438, "lr": 0.00034969745100444017, "tps": 14778, "wall": 36363.4} {"step": 8200, "train_loss": 3.6140942573547363, "lr": 0.00034968416588437694, "tps": 14778, "wall": 36368.2} {"step": 8201, "train_loss": 3.6044485569000244, "lr": 0.0003496708792952445, "tps": 14778, "wall": 36373.0} {"step": 8202, "train_loss": 3.5704736709594727, "lr": 0.0003496575912371933, "tps": 14777, "wall": 36377.9} {"step": 8203, "train_loss": 3.621772289276123, "lr": 0.0003496443017103739, "tps": 14777, "wall": 36382.7} {"step": 8204, "train_loss": 3.5947046279907227, "lr": 0.0003496310107149368, "tps": 14777, "wall": 36387.5} {"step": 8205, "train_loss": 3.638101100921631, "lr": 0.0003496177182510326, "tps": 14777, "wall": 36392.4} {"step": 8206, "train_loss": 3.5451669692993164, "lr": 0.0003496044243188119, "tps": 14777, "wall": 36397.2} {"step": 8207, "train_loss": 3.617448329925537, "lr": 0.0003495911289184252, "tps": 14777, "wall": 36402.1} {"step": 8208, "train_loss": 3.522352457046509, "lr": 0.0003495778320500233, "tps": 14777, "wall": 36406.9} {"step": 8209, "train_loss": 3.644787311553955, "lr": 0.00034956453371375664, "tps": 14776, "wall": 36411.8} {"step": 8210, "train_loss": 3.6527838706970215, "lr": 0.000349551233909776, "tps": 14776, "wall": 36416.7} {"step": 8211, "train_loss": 3.536860942840576, "lr": 0.0003495379326382319, "tps": 14776, "wall": 36421.5} {"step": 8212, "train_loss": 3.548666000366211, "lr": 0.0003495246298992751, "tps": 14776, "wall": 36426.4} {"step": 8213, "train_loss": 3.6956114768981934, "lr": 0.0003495113256930563, "tps": 14776, "wall": 36431.3} {"step": 8214, "train_loss": 3.585153579711914, "lr": 0.0003494980200197262, "tps": 14775, "wall": 36436.1} {"step": 8215, "train_loss": 3.5556914806365967, "lr": 0.0003494847128794355, "tps": 14775, "wall": 36441.0} {"step": 8216, "train_loss": 3.5871505737304688, "lr": 0.000349471404272335, "tps": 14775, "wall": 36445.9} {"step": 8217, "train_loss": 3.5729918479919434, "lr": 0.0003494580941985754, "tps": 14775, "wall": 36450.9} {"step": 8218, "train_loss": 3.5907700061798096, "lr": 0.0003494447826583075, "tps": 14775, "wall": 36455.8} {"step": 8219, "train_loss": 3.5498733520507812, "lr": 0.00034943146965168216, "tps": 14774, "wall": 36460.8} {"step": 8220, "train_loss": 3.6197681427001953, "lr": 0.00034941815517885007, "tps": 14774, "wall": 36465.8} {"step": 8221, "train_loss": 3.572484016418457, "lr": 0.00034940483923996213, "tps": 14774, "wall": 36470.7} {"step": 8222, "train_loss": 3.6298837661743164, "lr": 0.0003493915218351692, "tps": 14774, "wall": 36475.8} {"step": 8223, "train_loss": 3.5832901000976562, "lr": 0.00034937820296462207, "tps": 14774, "wall": 36480.7} {"step": 8224, "train_loss": 3.536499500274658, "lr": 0.00034936488262847173, "tps": 14773, "wall": 36485.7} {"step": 8225, "train_loss": 3.5178189277648926, "lr": 0.0003493515608268689, "tps": 14773, "wall": 36490.6} {"step": 8226, "train_loss": 3.5736021995544434, "lr": 0.0003493382375599646, "tps": 14773, "wall": 36495.6} {"step": 8227, "train_loss": 3.619851589202881, "lr": 0.0003493249128279098, "tps": 14773, "wall": 36500.6} {"step": 8228, "train_loss": 3.5295987129211426, "lr": 0.0003493115866308554, "tps": 14772, "wall": 36505.5} {"step": 8229, "train_loss": 3.64877986907959, "lr": 0.0003492982589689523, "tps": 14772, "wall": 36510.5} {"step": 8230, "train_loss": 3.6362051963806152, "lr": 0.0003492849298423516, "tps": 14772, "wall": 36515.4} {"step": 8231, "train_loss": 3.606172561645508, "lr": 0.0003492715992512041, "tps": 14772, "wall": 36520.4} {"step": 8232, "train_loss": 3.6044206619262695, "lr": 0.0003492582671956611, "tps": 14772, "wall": 36525.4} {"step": 8233, "train_loss": 3.6407816410064697, "lr": 0.0003492449336758733, "tps": 14771, "wall": 36530.4} {"step": 8234, "train_loss": 3.555924415588379, "lr": 0.00034923159869199196, "tps": 14771, "wall": 36535.4} {"step": 8235, "train_loss": 3.5082249641418457, "lr": 0.00034921826224416805, "tps": 14771, "wall": 36540.4} {"step": 8236, "train_loss": 3.490586757659912, "lr": 0.00034920492433255276, "tps": 14771, "wall": 36545.4} {"step": 8237, "train_loss": 3.5341198444366455, "lr": 0.000349191584957297, "tps": 14771, "wall": 36550.4} {"step": 8238, "train_loss": 3.693019390106201, "lr": 0.000349178244118552, "tps": 14770, "wall": 36555.4} {"step": 8239, "train_loss": 3.480769395828247, "lr": 0.0003491649018164689, "tps": 14770, "wall": 36560.3} {"step": 8240, "train_loss": 3.522540330886841, "lr": 0.0003491515580511988, "tps": 14770, "wall": 36565.3} {"step": 8241, "train_loss": 3.5287551879882812, "lr": 0.0003491382128228928, "tps": 14770, "wall": 36570.3} {"step": 8242, "train_loss": 3.5349063873291016, "lr": 0.00034912486613170225, "tps": 14769, "wall": 36575.3} {"step": 8243, "train_loss": 3.490907907485962, "lr": 0.00034911151797777817, "tps": 14769, "wall": 36580.3} {"step": 8244, "train_loss": 3.6507153511047363, "lr": 0.0003490981683612718, "tps": 14769, "wall": 36585.3} {"step": 8245, "train_loss": 3.659397602081299, "lr": 0.0003490848172823344, "tps": 14769, "wall": 36590.3} {"step": 8246, "train_loss": 3.5898938179016113, "lr": 0.0003490714647411172, "tps": 14768, "wall": 36595.3} {"step": 8247, "train_loss": 3.5927910804748535, "lr": 0.00034905811073777156, "tps": 14768, "wall": 36600.3} {"step": 8248, "train_loss": 3.533482313156128, "lr": 0.0003490447552724486, "tps": 14768, "wall": 36605.3} {"step": 8249, "train_loss": 3.517289400100708, "lr": 0.0003490313983452996, "tps": 14768, "wall": 36610.3} {"step": 8250, "train_loss": 3.5741281509399414, "lr": 0.00034901803995647605, "tps": 14768, "wall": 36615.3} {"step": 8251, "train_loss": 3.593386650085449, "lr": 0.00034900468010612906, "tps": 14767, "wall": 36620.3} {"step": 8252, "train_loss": 3.568706512451172, "lr": 0.0003489913187944102, "tps": 14767, "wall": 36625.3} {"step": 8253, "train_loss": 3.5983786582946777, "lr": 0.0003489779560214706, "tps": 14767, "wall": 36630.2} {"step": 8254, "train_loss": 3.576277017593384, "lr": 0.00034896459178746176, "tps": 14767, "wall": 36635.2} {"step": 8255, "train_loss": 3.5655441284179688, "lr": 0.000348951226092535, "tps": 14766, "wall": 36640.3} {"step": 8256, "train_loss": 3.6283817291259766, "lr": 0.00034893785893684186, "tps": 14766, "wall": 36645.4} {"step": 8257, "train_loss": 3.6238694190979004, "lr": 0.0003489244903205337, "tps": 14766, "wall": 36650.4} {"step": 8258, "train_loss": 3.5647854804992676, "lr": 0.0003489111202437618, "tps": 14766, "wall": 36655.4} {"step": 8259, "train_loss": 3.5837771892547607, "lr": 0.0003488977487066779, "tps": 14766, "wall": 36660.2} {"step": 8260, "train_loss": 3.5030016899108887, "lr": 0.0003488843757094333, "tps": 14765, "wall": 36665.1} {"step": 8261, "train_loss": 3.554332971572876, "lr": 0.00034887100125217946, "tps": 14765, "wall": 36670.0} {"step": 8262, "train_loss": 3.487513542175293, "lr": 0.000348857625335068, "tps": 14765, "wall": 36674.8} {"step": 8263, "train_loss": 3.605640411376953, "lr": 0.00034884424795825035, "tps": 14765, "wall": 36679.6} {"step": 8264, "train_loss": 3.4341254234313965, "lr": 0.0003488308691218781, "tps": 14765, "wall": 36684.4} {"step": 8265, "train_loss": 3.567121744155884, "lr": 0.0003488174888261028, "tps": 14765, "wall": 36689.3} {"step": 8266, "train_loss": 3.602250099182129, "lr": 0.00034880410707107605, "tps": 14764, "wall": 36694.3} {"step": 8267, "train_loss": 3.5112252235412598, "lr": 0.00034879072385694934, "tps": 14764, "wall": 36699.2} {"step": 8268, "train_loss": 3.5742998123168945, "lr": 0.0003487773391838744, "tps": 14764, "wall": 36704.2} {"step": 8269, "train_loss": 3.575239658355713, "lr": 0.0003487639530520028, "tps": 14764, "wall": 36709.2} {"step": 8270, "train_loss": 3.5540361404418945, "lr": 0.0003487505654614861, "tps": 14764, "wall": 36714.1} {"step": 8271, "train_loss": 3.6258645057678223, "lr": 0.0003487371764124761, "tps": 14763, "wall": 36719.1} {"step": 8272, "train_loss": 3.5661449432373047, "lr": 0.0003487237859051244, "tps": 14763, "wall": 36724.1} {"step": 8273, "train_loss": 3.5194907188415527, "lr": 0.00034871039393958263, "tps": 14763, "wall": 36729.0} {"step": 8274, "train_loss": 3.5800423622131348, "lr": 0.0003486970005160027, "tps": 14763, "wall": 36734.0} {"step": 8275, "train_loss": 3.545680284500122, "lr": 0.000348683605634536, "tps": 14762, "wall": 36739.0} {"step": 8276, "train_loss": 3.566155433654785, "lr": 0.0003486702092953345, "tps": 14762, "wall": 36743.9} {"step": 8277, "train_loss": 3.5174026489257812, "lr": 0.00034865681149855, "tps": 14762, "wall": 36748.9} {"step": 8278, "train_loss": 3.4810643196105957, "lr": 0.0003486434122443341, "tps": 14762, "wall": 36753.8} {"step": 8279, "train_loss": 3.5896339416503906, "lr": 0.0003486300115328387, "tps": 14762, "wall": 36758.8} {"step": 8280, "train_loss": 3.5916407108306885, "lr": 0.00034861660936421555, "tps": 14761, "wall": 36763.7} {"step": 8281, "train_loss": 3.567003011703491, "lr": 0.0003486032057386165, "tps": 14761, "wall": 36768.7} {"step": 8282, "train_loss": 3.6576039791107178, "lr": 0.0003485898006561933, "tps": 14761, "wall": 36773.7} {"step": 8283, "train_loss": 3.442640781402588, "lr": 0.00034857639411709797, "tps": 14761, "wall": 36778.7} {"step": 8284, "train_loss": 3.574626922607422, "lr": 0.0003485629861214823, "tps": 14761, "wall": 36783.7} {"step": 8285, "train_loss": 3.530149221420288, "lr": 0.0003485495766694982, "tps": 14760, "wall": 36788.7} {"step": 8286, "train_loss": 3.577815294265747, "lr": 0.00034853616576129747, "tps": 14760, "wall": 36793.6} {"step": 8287, "train_loss": 3.605736494064331, "lr": 0.00034852275339703213, "tps": 14760, "wall": 36798.6} {"step": 8288, "train_loss": 3.539764165878296, "lr": 0.00034850933957685404, "tps": 14760, "wall": 36803.6} {"step": 8289, "train_loss": 3.448493003845215, "lr": 0.00034849592430091526, "tps": 14759, "wall": 36808.6} {"step": 8290, "train_loss": 3.4847850799560547, "lr": 0.00034848250756936767, "tps": 14759, "wall": 36813.6} {"step": 8291, "train_loss": 3.4740984439849854, "lr": 0.0003484690893823633, "tps": 14759, "wall": 36818.5} {"step": 8292, "train_loss": 3.5717835426330566, "lr": 0.00034845566974005406, "tps": 14759, "wall": 36823.5} {"step": 8293, "train_loss": 3.6012954711914062, "lr": 0.00034844224864259216, "tps": 14759, "wall": 36828.5} {"step": 8294, "train_loss": 3.5183186531066895, "lr": 0.0003484288260901294, "tps": 14758, "wall": 36833.4} {"step": 8295, "train_loss": 3.561089277267456, "lr": 0.000348415402082818, "tps": 14758, "wall": 36838.4} {"step": 8296, "train_loss": 3.5157384872436523, "lr": 0.0003484019766208101, "tps": 14758, "wall": 36843.4} {"step": 8297, "train_loss": 3.5534205436706543, "lr": 0.0003483885497042575, "tps": 14758, "wall": 36848.4} {"step": 8298, "train_loss": 3.61307692527771, "lr": 0.00034837512133331254, "tps": 14758, "wall": 36853.3} {"step": 8299, "train_loss": 3.6086225509643555, "lr": 0.0003483616915081272, "tps": 14757, "wall": 36858.3} {"step": 8300, "train_loss": 3.537777900695801, "lr": 0.0003483482602288537, "tps": 14757, "wall": 36863.3} {"step": 8301, "train_loss": 3.6023337841033936, "lr": 0.0003483348274956443, "tps": 14757, "wall": 36868.3} {"step": 8302, "train_loss": 3.4733691215515137, "lr": 0.0003483213933086508, "tps": 14757, "wall": 36873.2} {"step": 8303, "train_loss": 3.506263256072998, "lr": 0.00034830795766802573, "tps": 14756, "wall": 36878.2} {"step": 8304, "train_loss": 3.5324110984802246, "lr": 0.0003482945205739212, "tps": 14756, "wall": 36883.2} {"step": 8305, "train_loss": 3.5600345134735107, "lr": 0.0003482810820264893, "tps": 14756, "wall": 36888.1} {"step": 8306, "train_loss": 3.455990791320801, "lr": 0.00034826764202588247, "tps": 14756, "wall": 36893.1} {"step": 8307, "train_loss": 3.5003275871276855, "lr": 0.0003482542005722528, "tps": 14756, "wall": 36898.1} {"step": 8308, "train_loss": 3.625906229019165, "lr": 0.0003482407576657526, "tps": 14755, "wall": 36903.1} {"step": 8309, "train_loss": 3.5910277366638184, "lr": 0.0003482273133065342, "tps": 14755, "wall": 36908.1} {"step": 8310, "train_loss": 3.5472207069396973, "lr": 0.00034821386749474986, "tps": 14755, "wall": 36913.0} {"step": 8311, "train_loss": 3.4360833168029785, "lr": 0.0003482004202305518, "tps": 14755, "wall": 36918.0} {"step": 8312, "train_loss": 3.609678268432617, "lr": 0.00034818697151409254, "tps": 14755, "wall": 36922.9} {"step": 8313, "train_loss": 3.4352152347564697, "lr": 0.00034817352134552433, "tps": 14754, "wall": 36927.9} {"step": 8314, "train_loss": 3.466141939163208, "lr": 0.0003481600697249995, "tps": 14754, "wall": 36932.9} {"step": 8315, "train_loss": 3.494246006011963, "lr": 0.00034814661665267047, "tps": 14754, "wall": 36937.8} {"step": 8316, "train_loss": 3.667904853820801, "lr": 0.0003481331621286897, "tps": 14754, "wall": 36942.8} {"step": 8317, "train_loss": 3.5108284950256348, "lr": 0.00034811970615320945, "tps": 14754, "wall": 36947.7} {"step": 8318, "train_loss": 3.590334892272949, "lr": 0.00034810624872638225, "tps": 14753, "wall": 36952.7} {"step": 8319, "train_loss": 3.4975662231445312, "lr": 0.0003480927898483606, "tps": 14753, "wall": 36957.8} {"step": 8320, "train_loss": 3.5547170639038086, "lr": 0.00034807932951929683, "tps": 14753, "wall": 36962.8} {"step": 8321, "train_loss": 3.577014923095703, "lr": 0.0003480658677393435, "tps": 14753, "wall": 36967.7} {"step": 8322, "train_loss": 3.5751123428344727, "lr": 0.0003480524045086531, "tps": 14752, "wall": 36972.9} {"step": 8323, "train_loss": 3.636655330657959, "lr": 0.00034803893982737814, "tps": 14752, "wall": 36977.9} {"step": 8324, "train_loss": 3.5772767066955566, "lr": 0.00034802547369567114, "tps": 14752, "wall": 36983.0} {"step": 8325, "train_loss": 3.5811407566070557, "lr": 0.0003480120061136846, "tps": 14752, "wall": 36987.9} {"step": 8326, "train_loss": 3.6311535835266113, "lr": 0.0003479985370815712, "tps": 14751, "wall": 36992.9} {"step": 8327, "train_loss": 3.544605255126953, "lr": 0.0003479850665994834, "tps": 14751, "wall": 36997.8} {"step": 8328, "train_loss": 3.606006383895874, "lr": 0.00034797159466757384, "tps": 14751, "wall": 37002.8} {"step": 8329, "train_loss": 3.5025248527526855, "lr": 0.0003479581212859952, "tps": 14751, "wall": 37007.8} {"step": 8330, "train_loss": 3.500532388687134, "lr": 0.0003479446464549, "tps": 14751, "wall": 37012.8} {"step": 8331, "train_loss": 3.5898241996765137, "lr": 0.0003479311701744409, "tps": 14750, "wall": 37017.9} {"step": 8332, "train_loss": 3.499692916870117, "lr": 0.00034791769244477057, "tps": 14750, "wall": 37022.8} {"step": 8333, "train_loss": 3.602090358734131, "lr": 0.00034790421326604177, "tps": 14750, "wall": 37027.7} {"step": 8334, "train_loss": 3.7031383514404297, "lr": 0.00034789073263840703, "tps": 14750, "wall": 37032.8} {"step": 8335, "train_loss": 3.6104607582092285, "lr": 0.0003478772505620192, "tps": 14750, "wall": 37037.8} {"step": 8336, "train_loss": 3.621671199798584, "lr": 0.00034786376703703096, "tps": 14749, "wall": 37042.8} {"step": 8337, "train_loss": 3.5556204319000244, "lr": 0.00034785028206359505, "tps": 14749, "wall": 37047.9} {"step": 8338, "train_loss": 3.6312038898468018, "lr": 0.0003478367956418642, "tps": 14749, "wall": 37053.0} {"step": 8339, "train_loss": 3.546438694000244, "lr": 0.0003478233077719913, "tps": 14748, "wall": 37058.2} {"step": 8340, "train_loss": 3.6567487716674805, "lr": 0.000347809818454129, "tps": 14748, "wall": 37063.4} {"step": 8341, "train_loss": 3.589301347732544, "lr": 0.00034779632768843014, "tps": 14748, "wall": 37068.5} {"step": 8342, "train_loss": 3.593742847442627, "lr": 0.0003477828354750476, "tps": 14748, "wall": 37073.4} {"step": 8343, "train_loss": 3.632861852645874, "lr": 0.0003477693418141342, "tps": 14747, "wall": 37078.4} {"step": 8344, "train_loss": 3.47640323638916, "lr": 0.0003477558467058427, "tps": 14747, "wall": 37083.3} {"step": 8345, "train_loss": 3.540431499481201, "lr": 0.0003477423501503261, "tps": 14747, "wall": 37088.3} {"step": 8346, "train_loss": 3.5886409282684326, "lr": 0.00034772885214773725, "tps": 14747, "wall": 37093.2} {"step": 8347, "train_loss": 3.701862335205078, "lr": 0.00034771535269822914, "tps": 14747, "wall": 37098.2} {"step": 8348, "train_loss": 3.667175769805908, "lr": 0.0003477018518019545, "tps": 14746, "wall": 37103.2} {"step": 8349, "train_loss": 3.5788493156433105, "lr": 0.0003476883494590664, "tps": 14746, "wall": 37108.2} {"step": 8350, "train_loss": 3.5492300987243652, "lr": 0.00034767484566971776, "tps": 14746, "wall": 37113.0} {"step": 8351, "train_loss": 3.4838218688964844, "lr": 0.00034766134043406156, "tps": 14746, "wall": 37117.8} {"step": 8352, "train_loss": 3.6214141845703125, "lr": 0.0003476478337522508, "tps": 14746, "wall": 37122.6} {"step": 8353, "train_loss": 3.6032934188842773, "lr": 0.0003476343256244385, "tps": 14746, "wall": 37127.4} {"step": 8354, "train_loss": 3.48886775970459, "lr": 0.0003476208160507776, "tps": 14746, "wall": 37132.2} {"step": 8355, "train_loss": 3.563317060470581, "lr": 0.00034760730503142123, "tps": 14745, "wall": 37137.0} {"step": 8356, "train_loss": 3.627920150756836, "lr": 0.00034759379256652244, "tps": 14745, "wall": 37141.8} {"step": 8357, "train_loss": 3.6096537113189697, "lr": 0.0003475802786562342, "tps": 14745, "wall": 37146.6} {"step": 8358, "train_loss": 3.603700876235962, "lr": 0.0003475667633007097, "tps": 14745, "wall": 37151.4} {"step": 8359, "train_loss": 3.5207695960998535, "lr": 0.00034755324650010197, "tps": 14745, "wall": 37156.3} {"step": 8360, "train_loss": 3.548832893371582, "lr": 0.00034753972825456414, "tps": 14745, "wall": 37161.1} {"step": 8361, "train_loss": 3.436110258102417, "lr": 0.00034752620856424944, "tps": 14745, "wall": 37165.9} {"step": 8362, "train_loss": 3.6214070320129395, "lr": 0.0003475126874293109, "tps": 14744, "wall": 37170.8} {"step": 8363, "train_loss": 3.6496033668518066, "lr": 0.00034749916484990177, "tps": 14744, "wall": 37175.6} {"step": 8364, "train_loss": 3.520709991455078, "lr": 0.0003474856408261752, "tps": 14744, "wall": 37180.4} {"step": 8365, "train_loss": 3.555239200592041, "lr": 0.0003474721153582844, "tps": 14744, "wall": 37185.2} {"step": 8366, "train_loss": 3.5393590927124023, "lr": 0.00034745858844638253, "tps": 14744, "wall": 37190.0} {"step": 8367, "train_loss": 3.7542989253997803, "lr": 0.0003474450600906229, "tps": 14744, "wall": 37194.9} {"step": 8368, "train_loss": 3.6887366771698, "lr": 0.0003474315302911588, "tps": 14743, "wall": 37199.7} {"step": 8369, "train_loss": 3.5962090492248535, "lr": 0.0003474179990481433, "tps": 14743, "wall": 37204.5} {"step": 8370, "train_loss": 3.5406763553619385, "lr": 0.00034740446636172994, "tps": 14743, "wall": 37209.4} {"step": 8371, "train_loss": 3.592014789581299, "lr": 0.0003473909322320718, "tps": 14743, "wall": 37214.3} {"step": 8372, "train_loss": 3.580127716064453, "lr": 0.00034737739665932236, "tps": 14743, "wall": 37219.1} {"step": 8373, "train_loss": 3.5305495262145996, "lr": 0.00034736385964363487, "tps": 14743, "wall": 37223.9} {"step": 8374, "train_loss": 3.5131173133850098, "lr": 0.0003473503211851627, "tps": 14743, "wall": 37228.7} {"step": 8375, "train_loss": 3.5228500366210938, "lr": 0.00034733678128405916, "tps": 14742, "wall": 37233.5} {"step": 8376, "train_loss": 3.593804359436035, "lr": 0.00034732323994047766, "tps": 14742, "wall": 37238.3} {"step": 8377, "train_loss": 3.5926456451416016, "lr": 0.0003473096971545716, "tps": 14742, "wall": 37243.1} {"step": 8378, "train_loss": 3.5695993900299072, "lr": 0.00034729615292649447, "tps": 14742, "wall": 37248.1} {"step": 8379, "train_loss": 3.565056800842285, "lr": 0.0003472826072563996, "tps": 14742, "wall": 37253.0} {"step": 8380, "train_loss": 3.583256244659424, "lr": 0.0003472690601444404, "tps": 14741, "wall": 37258.0} {"step": 8381, "train_loss": 3.570486307144165, "lr": 0.00034725551159077054, "tps": 14741, "wall": 37263.0} {"step": 8382, "train_loss": 3.537405490875244, "lr": 0.0003472419615955433, "tps": 14741, "wall": 37268.0} {"step": 8383, "train_loss": 3.5252695083618164, "lr": 0.00034722841015891225, "tps": 14741, "wall": 37272.9} {"step": 8384, "train_loss": 3.5924782752990723, "lr": 0.0003472148572810308, "tps": 14741, "wall": 37278.0} {"step": 8385, "train_loss": 3.5530710220336914, "lr": 0.0003472013029620527, "tps": 14740, "wall": 37283.0} {"step": 8386, "train_loss": 3.50486421585083, "lr": 0.0003471877472021312, "tps": 14740, "wall": 37287.9} {"step": 8387, "train_loss": 3.5374338626861572, "lr": 0.0003471741900014201, "tps": 14740, "wall": 37292.9} {"step": 8388, "train_loss": 3.519002914428711, "lr": 0.0003471606313600729, "tps": 14740, "wall": 37297.9} {"step": 8389, "train_loss": 3.6291420459747314, "lr": 0.0003471470712782432, "tps": 14740, "wall": 37302.9} {"step": 8390, "train_loss": 3.520419120788574, "lr": 0.0003471335097560846, "tps": 14739, "wall": 37307.8} {"step": 8391, "train_loss": 3.547130823135376, "lr": 0.0003471199467937507, "tps": 14739, "wall": 37312.8} {"step": 8392, "train_loss": 3.557060718536377, "lr": 0.00034710638239139515, "tps": 14739, "wall": 37317.8} {"step": 8393, "train_loss": 3.5961897373199463, "lr": 0.0003470928165491716, "tps": 14739, "wall": 37322.8} {"step": 8394, "train_loss": 3.598822593688965, "lr": 0.0003470792492672339, "tps": 14739, "wall": 37327.7} {"step": 8395, "train_loss": 3.592970371246338, "lr": 0.0003470656805457354, "tps": 14738, "wall": 37332.7} {"step": 8396, "train_loss": 3.5739588737487793, "lr": 0.00034705211038483017, "tps": 14738, "wall": 37337.6} {"step": 8397, "train_loss": 3.504058361053467, "lr": 0.00034703853878467164, "tps": 14738, "wall": 37342.6} {"step": 8398, "train_loss": 3.533720016479492, "lr": 0.0003470249657454137, "tps": 14738, "wall": 37347.5} {"step": 8399, "train_loss": 3.6369097232818604, "lr": 0.00034701139126721013, "tps": 14738, "wall": 37352.5} {"step": 8400, "train_loss": 3.5637316703796387, "lr": 0.0003469978153502146, "tps": 14737, "wall": 37357.5} {"step": 8401, "train_loss": 3.549351215362549, "lr": 0.0003469842379945809, "tps": 14737, "wall": 37362.4} {"step": 8402, "train_loss": 3.5319855213165283, "lr": 0.0003469706592004629, "tps": 14737, "wall": 37367.4} {"step": 8403, "train_loss": 3.548948287963867, "lr": 0.0003469570789680145, "tps": 14737, "wall": 37372.3} {"step": 8404, "train_loss": 3.49566388130188, "lr": 0.0003469434972973893, "tps": 14737, "wall": 37377.3} {"step": 8405, "train_loss": 3.5725998878479004, "lr": 0.0003469299141887414, "tps": 14736, "wall": 37382.4} {"step": 8406, "train_loss": 3.6187727451324463, "lr": 0.0003469163296422245, "tps": 14736, "wall": 37387.7} {"step": 8407, "train_loss": 3.5842533111572266, "lr": 0.0003469027436579926, "tps": 14736, "wall": 37392.7} {"step": 8408, "train_loss": 3.6063106060028076, "lr": 0.00034688915623619956, "tps": 14736, "wall": 37397.7} {"step": 8409, "train_loss": 3.5132665634155273, "lr": 0.00034687556737699924, "tps": 14735, "wall": 37402.6} {"step": 8410, "train_loss": 3.5797476768493652, "lr": 0.00034686197708054566, "tps": 14735, "wall": 37407.6} {"step": 8411, "train_loss": 3.5485963821411133, "lr": 0.0003468483853469928, "tps": 14735, "wall": 37412.4} {"step": 8412, "train_loss": 3.534376621246338, "lr": 0.00034683479217649445, "tps": 14735, "wall": 37417.3} {"step": 8413, "train_loss": 3.5812389850616455, "lr": 0.00034682119756920484, "tps": 14735, "wall": 37422.2} {"step": 8414, "train_loss": 3.6025547981262207, "lr": 0.00034680760152527775, "tps": 14734, "wall": 37427.1} {"step": 8415, "train_loss": 3.5386009216308594, "lr": 0.0003467940040448673, "tps": 14734, "wall": 37431.9} {"step": 8416, "train_loss": 3.4797730445861816, "lr": 0.0003467804051281275, "tps": 14734, "wall": 37436.8} {"step": 8417, "train_loss": 3.5254268646240234, "lr": 0.0003467668047752125, "tps": 14734, "wall": 37441.7} {"step": 8418, "train_loss": 3.54537296295166, "lr": 0.0003467532029862762, "tps": 14734, "wall": 37446.5} {"step": 8419, "train_loss": 3.5353283882141113, "lr": 0.0003467395997614728, "tps": 14734, "wall": 37451.4} {"step": 8420, "train_loss": 3.561079978942871, "lr": 0.00034672599510095626, "tps": 14733, "wall": 37456.5} {"step": 8421, "train_loss": 3.645188808441162, "lr": 0.0003467123890048809, "tps": 14733, "wall": 37461.8} {"step": 8422, "train_loss": 3.4287545680999756, "lr": 0.0003466987814734007, "tps": 14733, "wall": 37466.7} {"step": 8423, "train_loss": 3.422400951385498, "lr": 0.0003466851725066699, "tps": 14733, "wall": 37471.6} {"step": 8424, "train_loss": 3.5574498176574707, "lr": 0.00034667156210484255, "tps": 14732, "wall": 37476.5} {"step": 8425, "train_loss": 3.6223721504211426, "lr": 0.0003466579502680729, "tps": 14732, "wall": 37481.6} {"step": 8426, "train_loss": 3.6632137298583984, "lr": 0.0003466443369965152, "tps": 14732, "wall": 37486.7} {"step": 8427, "train_loss": 3.659346103668213, "lr": 0.0003466307222903235, "tps": 14732, "wall": 37491.8} {"step": 8428, "train_loss": 3.6034998893737793, "lr": 0.0003466171061496522, "tps": 14731, "wall": 37497.3} {"step": 8429, "train_loss": 3.6416826248168945, "lr": 0.00034660348857465547, "tps": 14731, "wall": 37502.5} {"step": 8430, "train_loss": 3.590268135070801, "lr": 0.00034658986956548755, "tps": 14731, "wall": 37507.5} {"step": 8431, "train_loss": 3.538116455078125, "lr": 0.0003465762491223027, "tps": 14731, "wall": 37512.4} {"step": 8432, "train_loss": 3.6138062477111816, "lr": 0.0003465626272452553, "tps": 14730, "wall": 37517.4} {"step": 8433, "train_loss": 3.590120792388916, "lr": 0.00034654900393449957, "tps": 14730, "wall": 37522.3} {"step": 8434, "train_loss": 3.6563942432403564, "lr": 0.0003465353791901899, "tps": 14730, "wall": 37527.2} {"step": 8435, "train_loss": 3.513826370239258, "lr": 0.00034652175301248063, "tps": 14730, "wall": 37532.1} {"step": 8436, "train_loss": 3.623818874359131, "lr": 0.00034650812540152617, "tps": 14730, "wall": 37537.0} {"step": 8437, "train_loss": 3.723086357116699, "lr": 0.0003464944963574807, "tps": 14729, "wall": 37542.1} {"step": 8438, "train_loss": 3.5176525115966797, "lr": 0.00034648086588049873, "tps": 14729, "wall": 37547.0} {"step": 8439, "train_loss": 3.668012857437134, "lr": 0.00034646723397073476, "tps": 14729, "wall": 37552.0} {"step": 8440, "train_loss": 3.659386157989502, "lr": 0.000346453600628343, "tps": 14729, "wall": 37556.9} {"step": 8441, "train_loss": 3.4730443954467773, "lr": 0.0003464399658534781, "tps": 14729, "wall": 37561.8} {"step": 8442, "train_loss": 3.580142021179199, "lr": 0.0003464263296462944, "tps": 14728, "wall": 37566.9} {"step": 8443, "train_loss": 3.581859588623047, "lr": 0.0003464126920069464, "tps": 14728, "wall": 37571.7} {"step": 8444, "train_loss": 3.5827596187591553, "lr": 0.0003463990529355887, "tps": 14728, "wall": 37576.6} {"step": 8445, "train_loss": 3.6152167320251465, "lr": 0.0003463854124323755, "tps": 14728, "wall": 37581.7} {"step": 8446, "train_loss": 3.6956660747528076, "lr": 0.0003463717704974616, "tps": 14728, "wall": 37586.6} {"step": 8447, "train_loss": 3.646181106567383, "lr": 0.0003463581271310014, "tps": 14727, "wall": 37591.5} {"step": 8448, "train_loss": 3.5793297290802, "lr": 0.00034634448233314955, "tps": 14727, "wall": 37596.5} {"step": 8449, "train_loss": 3.581627607345581, "lr": 0.0003463308361040606, "tps": 14727, "wall": 37601.5} {"step": 8450, "train_loss": 3.599041700363159, "lr": 0.0003463171884438891, "tps": 14727, "wall": 37606.4} {"step": 8451, "train_loss": 3.5933609008789062, "lr": 0.0003463035393527896, "tps": 14727, "wall": 37611.4} {"step": 8452, "train_loss": 3.5520029067993164, "lr": 0.00034628988883091675, "tps": 14726, "wall": 37616.4} {"step": 8453, "train_loss": 3.453665256500244, "lr": 0.00034627623687842526, "tps": 14726, "wall": 37621.3} {"step": 8454, "train_loss": 3.4535861015319824, "lr": 0.00034626258349546973, "tps": 14726, "wall": 37626.3} {"step": 8455, "train_loss": 3.473849296569824, "lr": 0.0003462489286822048, "tps": 14726, "wall": 37631.2} {"step": 8456, "train_loss": 3.542210102081299, "lr": 0.0003462352724387852, "tps": 14726, "wall": 37636.2} {"step": 8457, "train_loss": 3.42852783203125, "lr": 0.0003462216147653656, "tps": 14726, "wall": 37641.1} {"step": 8458, "train_loss": 3.4509732723236084, "lr": 0.0003462079556621007, "tps": 14725, "wall": 37646.1} {"step": 8459, "train_loss": 3.498749256134033, "lr": 0.00034619429512914527, "tps": 14725, "wall": 37651.0} {"step": 8460, "train_loss": 3.5232303142547607, "lr": 0.00034618063316665406, "tps": 14725, "wall": 37656.0} {"step": 8461, "train_loss": 3.6634020805358887, "lr": 0.0003461669697747817, "tps": 14725, "wall": 37660.9} {"step": 8462, "train_loss": 3.618152141571045, "lr": 0.0003461533049536832, "tps": 14725, "wall": 37665.9} {"step": 8463, "train_loss": 3.6325037479400635, "lr": 0.0003461396387035132, "tps": 14724, "wall": 37670.8} {"step": 8464, "train_loss": 3.5974843502044678, "lr": 0.0003461259710244266, "tps": 14724, "wall": 37675.9} {"step": 8465, "train_loss": 3.5979249477386475, "lr": 0.00034611230191657815, "tps": 14724, "wall": 37680.9} {"step": 8466, "train_loss": 3.487480401992798, "lr": 0.00034609863138012264, "tps": 14724, "wall": 37685.9} {"step": 8467, "train_loss": 3.584313154220581, "lr": 0.0003460849594152151, "tps": 14723, "wall": 37690.9} {"step": 8468, "train_loss": 3.5342397689819336, "lr": 0.00034607128602201026, "tps": 14723, "wall": 37695.9} {"step": 8469, "train_loss": 3.523242473602295, "lr": 0.00034605761120066304, "tps": 14723, "wall": 37701.9} {"step": 8470, "train_loss": 3.65114426612854, "lr": 0.00034604393495132847, "tps": 14722, "wall": 37707.1} {"step": 8471, "train_loss": 3.5503597259521484, "lr": 0.00034603025727416133, "tps": 14722, "wall": 37712.2} {"step": 8472, "train_loss": 3.660064935684204, "lr": 0.00034601657816931666, "tps": 14722, "wall": 37717.4} {"step": 8473, "train_loss": 3.503448486328125, "lr": 0.00034600289763694935, "tps": 14722, "wall": 37722.6} {"step": 8474, "train_loss": 3.523367404937744, "lr": 0.0003459892156772144, "tps": 14721, "wall": 37727.8} {"step": 8475, "train_loss": 3.5305819511413574, "lr": 0.0003459755322902668, "tps": 14721, "wall": 37732.9} {"step": 8476, "train_loss": 3.664705753326416, "lr": 0.0003459618474762616, "tps": 14721, "wall": 37738.1} {"step": 8477, "train_loss": 3.665165424346924, "lr": 0.00034594816123535374, "tps": 14720, "wall": 37743.3} {"step": 8478, "train_loss": 3.533048391342163, "lr": 0.0003459344735676983, "tps": 14720, "wall": 37748.5} {"step": 8479, "train_loss": 3.466732978820801, "lr": 0.0003459207844734503, "tps": 14720, "wall": 37753.7} {"step": 8480, "train_loss": 3.5676989555358887, "lr": 0.00034590709395276485, "tps": 14720, "wall": 37758.8} {"step": 8481, "train_loss": 3.573132038116455, "lr": 0.00034589340200579704, "tps": 14719, "wall": 37764.0} {"step": 8482, "train_loss": 3.5703067779541016, "lr": 0.000345879708632702, "tps": 14719, "wall": 37769.2} {"step": 8483, "train_loss": 3.456389904022217, "lr": 0.00034586601383363477, "tps": 14719, "wall": 37774.4} {"step": 8484, "train_loss": 3.493730068206787, "lr": 0.0003458523176087505, "tps": 14718, "wall": 37779.6} {"step": 8485, "train_loss": 3.4923856258392334, "lr": 0.0003458386199582044, "tps": 14718, "wall": 37784.7} {"step": 8486, "train_loss": 3.467804193496704, "lr": 0.0003458249208821516, "tps": 14718, "wall": 37789.9} {"step": 8487, "train_loss": 3.6005358695983887, "lr": 0.00034581122038074736, "tps": 14718, "wall": 37795.1} {"step": 8488, "train_loss": 3.5693156719207764, "lr": 0.0003457975184541467, "tps": 14717, "wall": 37800.1} {"step": 8489, "train_loss": 3.477133274078369, "lr": 0.00034578381510250503, "tps": 14717, "wall": 37805.1} {"step": 8490, "train_loss": 3.608840227127075, "lr": 0.0003457701103259774, "tps": 14717, "wall": 37810.0} {"step": 8491, "train_loss": 3.6021082401275635, "lr": 0.0003457564041247192, "tps": 14717, "wall": 37815.0} {"step": 8492, "train_loss": 3.5920424461364746, "lr": 0.0003457426964988857, "tps": 14715, "wall": 37822.7} {"step": 8493, "train_loss": 3.6032090187072754, "lr": 0.0003457289874486321, "tps": 14715, "wall": 37829.2} {"step": 8494, "train_loss": 3.5848727226257324, "lr": 0.0003457152769741137, "tps": 14714, "wall": 37834.7} {"step": 8495, "train_loss": 3.5272104740142822, "lr": 0.0003457015650754858, "tps": 14714, "wall": 37840.1} {"step": 8496, "train_loss": 3.5757203102111816, "lr": 0.0003456878517529039, "tps": 14714, "wall": 37845.3} {"step": 8497, "train_loss": 3.5055601596832275, "lr": 0.0003456741370065232, "tps": 14713, "wall": 37850.5} {"step": 8498, "train_loss": 3.541203022003174, "lr": 0.00034566042083649897, "tps": 14713, "wall": 37855.7} {"step": 8499, "train_loss": 3.4944965839385986, "lr": 0.00034564670324298676, "tps": 14713, "wall": 37860.9} {"step": 8500, "train_loss": 3.5689902305603027, "lr": 0.0003456329842261419, "tps": 14712, "wall": 37866.1} {"step": 8501, "train_loss": 3.6089179515838623, "lr": 0.0003456192637861198, "tps": 14712, "wall": 37871.4} {"step": 8502, "train_loss": 3.508803129196167, "lr": 0.0003456055419230759, "tps": 14712, "wall": 37876.6} {"step": 8503, "train_loss": 3.6132922172546387, "lr": 0.0003455918186371655, "tps": 14712, "wall": 37881.8} {"step": 8504, "train_loss": 3.559792995452881, "lr": 0.00034557809392854434, "tps": 14711, "wall": 37887.0} {"step": 8505, "train_loss": 3.588618040084839, "lr": 0.0003455643677973677, "tps": 14711, "wall": 37892.2} {"step": 8506, "train_loss": 3.436896800994873, "lr": 0.00034555064024379106, "tps": 14711, "wall": 37897.4} {"step": 8507, "train_loss": 3.5143308639526367, "lr": 0.00034553691126797, "tps": 14710, "wall": 37902.6} {"step": 8508, "train_loss": 3.557990789413452, "lr": 0.00034552318087006, "tps": 14710, "wall": 37907.8} {"step": 8509, "train_loss": 3.5850002765655518, "lr": 0.00034550944905021664, "tps": 14710, "wall": 37912.9} {"step": 8510, "train_loss": 3.553328514099121, "lr": 0.0003454957158085955, "tps": 14710, "wall": 37918.1} {"step": 8511, "train_loss": 3.5168824195861816, "lr": 0.000345481981145352, "tps": 14709, "wall": 37923.4} {"step": 8512, "train_loss": 3.497727394104004, "lr": 0.0003454682450606419, "tps": 14709, "wall": 37928.6} {"step": 8513, "train_loss": 3.5354866981506348, "lr": 0.0003454545075546207, "tps": 14709, "wall": 37933.9} {"step": 8514, "train_loss": 3.500481605529785, "lr": 0.00034544076862744405, "tps": 14708, "wall": 37939.1} {"step": 8515, "train_loss": 3.6312103271484375, "lr": 0.00034542702827926764, "tps": 14708, "wall": 37944.3} {"step": 8516, "train_loss": 3.6533150672912598, "lr": 0.00034541328651024704, "tps": 14708, "wall": 37949.6} {"step": 8517, "train_loss": 3.530514717102051, "lr": 0.0003453995433205379, "tps": 14707, "wall": 37954.6} {"step": 8518, "train_loss": 3.582439661026001, "lr": 0.000345385798710296, "tps": 14707, "wall": 37959.5} {"step": 8519, "train_loss": 3.6063647270202637, "lr": 0.00034537205267967696, "tps": 14707, "wall": 37964.5} {"step": 8520, "train_loss": 3.384835720062256, "lr": 0.00034535830522883655, "tps": 14707, "wall": 37969.4} {"step": 8521, "train_loss": 3.5383620262145996, "lr": 0.0003453445563579304, "tps": 14707, "wall": 37974.4} {"step": 8522, "train_loss": 3.5985422134399414, "lr": 0.00034533080606711445, "tps": 14706, "wall": 37979.4} {"step": 8523, "train_loss": 3.482450485229492, "lr": 0.00034531705435654426, "tps": 14706, "wall": 37984.4} {"step": 8524, "train_loss": 3.4487671852111816, "lr": 0.0003453033012263758, "tps": 14706, "wall": 37989.4} {"step": 8525, "train_loss": 3.5870070457458496, "lr": 0.00034528954667676465, "tps": 14706, "wall": 37994.4} {"step": 8526, "train_loss": 3.6014270782470703, "lr": 0.0003452757907078668, "tps": 14706, "wall": 37999.4} {"step": 8527, "train_loss": 3.5813794136047363, "lr": 0.00034526203331983803, "tps": 14705, "wall": 38004.3} {"step": 8528, "train_loss": 3.531865119934082, "lr": 0.0003452482745128341, "tps": 14705, "wall": 38009.3} {"step": 8529, "train_loss": 3.593773126602173, "lr": 0.000345234514287011, "tps": 14705, "wall": 38014.3} {"step": 8530, "train_loss": 3.5468578338623047, "lr": 0.00034522075264252456, "tps": 14705, "wall": 38019.3} {"step": 8531, "train_loss": 3.5826056003570557, "lr": 0.0003452069895795306, "tps": 14705, "wall": 38024.5} {"step": 8532, "train_loss": 3.6025562286376953, "lr": 0.00034519322509818514, "tps": 14704, "wall": 38029.7} {"step": 8533, "train_loss": 3.532224178314209, "lr": 0.000345179459198644, "tps": 14704, "wall": 38034.9} {"step": 8534, "train_loss": 3.618452548980713, "lr": 0.00034516569188106327, "tps": 14704, "wall": 38040.1} {"step": 8535, "train_loss": 3.4447925090789795, "lr": 0.00034515192314559873, "tps": 14703, "wall": 38045.4} {"step": 8536, "train_loss": 3.5023651123046875, "lr": 0.00034513815299240644, "tps": 14703, "wall": 38050.6} {"step": 8537, "train_loss": 3.5762648582458496, "lr": 0.0003451243814216424, "tps": 14703, "wall": 38055.8} {"step": 8538, "train_loss": 3.5075488090515137, "lr": 0.0003451106084334626, "tps": 14702, "wall": 38061.1} {"step": 8539, "train_loss": 3.49471378326416, "lr": 0.00034509683402802305, "tps": 14702, "wall": 38066.3} {"step": 8540, "train_loss": 3.499175548553467, "lr": 0.00034508305820547976, "tps": 14702, "wall": 38071.5} {"step": 8541, "train_loss": 3.491672992706299, "lr": 0.0003450692809659889, "tps": 14702, "wall": 38076.7} {"step": 8542, "train_loss": 3.523449182510376, "lr": 0.0003450555023097064, "tps": 14701, "wall": 38081.8} {"step": 8543, "train_loss": 3.605790138244629, "lr": 0.0003450417222367885, "tps": 14701, "wall": 38086.8} {"step": 8544, "train_loss": 3.4987316131591797, "lr": 0.0003450279407473911, "tps": 14701, "wall": 38091.8} {"step": 8545, "train_loss": 3.491950750350952, "lr": 0.00034501415784167044, "tps": 14701, "wall": 38096.9} {"step": 8546, "train_loss": 3.6212830543518066, "lr": 0.00034500037351978263, "tps": 14701, "wall": 38101.6} {"step": 8547, "train_loss": 3.5713114738464355, "lr": 0.00034498658778188385, "tps": 14700, "wall": 38106.4} {"step": 8548, "train_loss": 3.4929072856903076, "lr": 0.00034497280062813023, "tps": 14700, "wall": 38111.2} {"step": 8549, "train_loss": 3.5406675338745117, "lr": 0.000344959012058678, "tps": 14700, "wall": 38116.0} {"step": 8550, "train_loss": 3.476574420928955, "lr": 0.0003449452220736833, "tps": 14700, "wall": 38120.9} {"step": 8551, "train_loss": 3.6422696113586426, "lr": 0.00034493143067330234, "tps": 14700, "wall": 38125.7} {"step": 8552, "train_loss": 3.531306266784668, "lr": 0.00034491763785769134, "tps": 14700, "wall": 38130.5} {"step": 8553, "train_loss": 3.600497245788574, "lr": 0.00034490384362700666, "tps": 14700, "wall": 38135.4} {"step": 8554, "train_loss": 3.5547308921813965, "lr": 0.0003448900479814045, "tps": 14699, "wall": 38140.3} {"step": 8555, "train_loss": 3.454242467880249, "lr": 0.00034487625092104103, "tps": 14699, "wall": 38145.2} {"step": 8556, "train_loss": 3.4819822311401367, "lr": 0.0003448624524460727, "tps": 14699, "wall": 38150.2} {"step": 8557, "train_loss": 3.4777822494506836, "lr": 0.0003448486525566557, "tps": 14699, "wall": 38155.2} {"step": 8558, "train_loss": 3.51275372505188, "lr": 0.00034483485125294647, "tps": 14699, "wall": 38160.2} {"step": 8559, "train_loss": 3.502002716064453, "lr": 0.00034482104853510127, "tps": 14698, "wall": 38165.1} {"step": 8560, "train_loss": 3.550907611846924, "lr": 0.00034480724440327646, "tps": 14698, "wall": 38170.1} {"step": 8561, "train_loss": 3.454542636871338, "lr": 0.0003447934388576285, "tps": 14698, "wall": 38175.0} {"step": 8562, "train_loss": 3.5509817600250244, "lr": 0.00034477963189831365, "tps": 14698, "wall": 38180.0} {"step": 8563, "train_loss": 3.515157699584961, "lr": 0.0003447658235254883, "tps": 14698, "wall": 38185.0} {"step": 8564, "train_loss": 3.506199836730957, "lr": 0.0003447520137393091, "tps": 14698, "wall": 38189.9} {"step": 8565, "train_loss": 3.564748764038086, "lr": 0.0003447382025399323, "tps": 14697, "wall": 38194.9} {"step": 8566, "train_loss": 3.533895492553711, "lr": 0.00034472438992751435, "tps": 14697, "wall": 38199.8} {"step": 8567, "train_loss": 3.366428852081299, "lr": 0.00034471057590221174, "tps": 14697, "wall": 38204.8} {"step": 8568, "train_loss": 3.561487913131714, "lr": 0.00034469676046418107, "tps": 14697, "wall": 38209.8} {"step": 8569, "train_loss": 3.5798892974853516, "lr": 0.0003446829436135787, "tps": 14696, "wall": 38214.9} {"step": 8570, "train_loss": 3.5563502311706543, "lr": 0.0003446691253505612, "tps": 14696, "wall": 38219.9} {"step": 8571, "train_loss": 3.5892162322998047, "lr": 0.00034465530567528513, "tps": 14696, "wall": 38224.8} {"step": 8572, "train_loss": 3.4550631046295166, "lr": 0.000344641484587907, "tps": 14696, "wall": 38229.8} {"step": 8573, "train_loss": 3.4509284496307373, "lr": 0.0003446276620885833, "tps": 14696, "wall": 38234.8} {"step": 8574, "train_loss": 3.5206685066223145, "lr": 0.00034461383817747086, "tps": 14696, "wall": 38239.7} {"step": 8575, "train_loss": 3.466099739074707, "lr": 0.000344600012854726, "tps": 14695, "wall": 38244.5} {"step": 8576, "train_loss": 3.5513081550598145, "lr": 0.00034458618612050553, "tps": 14695, "wall": 38249.4} {"step": 8577, "train_loss": 3.5721569061279297, "lr": 0.000344572357974966, "tps": 14695, "wall": 38254.4} {"step": 8578, "train_loss": 3.5794384479522705, "lr": 0.00034455852841826397, "tps": 14695, "wall": 38259.3} {"step": 8579, "train_loss": 3.5170929431915283, "lr": 0.0003445446974505563, "tps": 14695, "wall": 38264.3} {"step": 8580, "train_loss": 3.5814011096954346, "lr": 0.00034453086507199945, "tps": 14694, "wall": 38269.2} {"step": 8581, "train_loss": 3.592935562133789, "lr": 0.00034451703128275034, "tps": 14694, "wall": 38274.2} {"step": 8582, "train_loss": 3.597748279571533, "lr": 0.0003445031960829655, "tps": 14694, "wall": 38279.3} {"step": 8583, "train_loss": 3.5423264503479004, "lr": 0.00034448935947280175, "tps": 14694, "wall": 38284.3} {"step": 8584, "train_loss": 3.50080943107605, "lr": 0.0003444755214524158, "tps": 14694, "wall": 38289.3} {"step": 8585, "train_loss": 3.441629648208618, "lr": 0.00034446168202196436, "tps": 14693, "wall": 38294.4} {"step": 8586, "train_loss": 3.5474250316619873, "lr": 0.00034444784118160425, "tps": 14693, "wall": 38299.6} {"step": 8587, "train_loss": 3.439267635345459, "lr": 0.0003444339989314923, "tps": 14693, "wall": 38304.8} {"step": 8588, "train_loss": 3.58937668800354, "lr": 0.00034442015527178524, "tps": 14692, "wall": 38310.0} {"step": 8589, "train_loss": 3.471853494644165, "lr": 0.00034440631020264, "tps": 14692, "wall": 38315.2} {"step": 8590, "train_loss": 3.532698392868042, "lr": 0.00034439246372421333, "tps": 14692, "wall": 38320.4} {"step": 8591, "train_loss": 3.620521068572998, "lr": 0.000344378615836662, "tps": 14692, "wall": 38325.6} {"step": 8592, "train_loss": 3.493964672088623, "lr": 0.00034436476654014315, "tps": 14691, "wall": 38330.7} {"step": 8593, "train_loss": 3.5087203979492188, "lr": 0.00034435091583481336, "tps": 14691, "wall": 38336.0} {"step": 8594, "train_loss": 3.6936349868774414, "lr": 0.0003443370637208298, "tps": 14691, "wall": 38341.1} {"step": 8595, "train_loss": 3.4804506301879883, "lr": 0.0003443232101983491, "tps": 14691, "wall": 38346.3} {"step": 8596, "train_loss": 3.5398154258728027, "lr": 0.00034430935526752845, "tps": 14690, "wall": 38351.5} {"step": 8597, "train_loss": 3.5326666831970215, "lr": 0.0003442954989285247, "tps": 14690, "wall": 38356.7} {"step": 8598, "train_loss": 3.595848560333252, "lr": 0.00034428164118149477, "tps": 14690, "wall": 38361.9} {"step": 8599, "train_loss": 3.5049219131469727, "lr": 0.0003442677820265957, "tps": 14689, "wall": 38367.0} {"step": 8600, "train_loss": 3.608738899230957, "lr": 0.0003442539214639844, "tps": 14689, "wall": 38372.0} {"step": 8601, "train_loss": 3.5896077156066895, "lr": 0.00034424005949381807, "tps": 14689, "wall": 38377.3} {"step": 8602, "train_loss": 3.494065761566162, "lr": 0.00034422619611625355, "tps": 14689, "wall": 38382.5} {"step": 8603, "train_loss": 3.4439620971679688, "lr": 0.00034421233133144805, "tps": 14688, "wall": 38387.7} {"step": 8604, "train_loss": 3.609113931655884, "lr": 0.0003441984651395584, "tps": 14688, "wall": 38392.9} {"step": 8605, "train_loss": 3.5007195472717285, "lr": 0.00034418459754074197, "tps": 14688, "wall": 38398.1} {"step": 8606, "train_loss": 3.4679574966430664, "lr": 0.0003441707285351556, "tps": 14688, "wall": 38403.3} {"step": 8607, "train_loss": 3.5499427318573, "lr": 0.00034415685812295657, "tps": 14687, "wall": 38408.4} {"step": 8608, "train_loss": 3.5648155212402344, "lr": 0.0003441429863043018, "tps": 14687, "wall": 38413.5} {"step": 8609, "train_loss": 3.6434648036956787, "lr": 0.00034412911307934877, "tps": 14687, "wall": 38418.7} {"step": 8610, "train_loss": 3.510237693786621, "lr": 0.0003441152384482543, "tps": 14686, "wall": 38423.9} {"step": 8611, "train_loss": 3.646512508392334, "lr": 0.0003441013624111757, "tps": 14686, "wall": 38428.9} {"step": 8612, "train_loss": 3.626312494277954, "lr": 0.00034408748496827016, "tps": 14686, "wall": 38433.9} {"step": 8613, "train_loss": 3.544252872467041, "lr": 0.0003440736061196949, "tps": 14686, "wall": 38438.8} {"step": 8614, "train_loss": 3.5546345710754395, "lr": 0.00034405972586560706, "tps": 14686, "wall": 38443.8} {"step": 8615, "train_loss": 3.632615566253662, "lr": 0.00034404584420616403, "tps": 14685, "wall": 38448.8} {"step": 8616, "train_loss": 3.52803111076355, "lr": 0.00034403196114152294, "tps": 14685, "wall": 38453.6} {"step": 8617, "train_loss": 3.492219924926758, "lr": 0.00034401807667184105, "tps": 14685, "wall": 38458.5} {"step": 8618, "train_loss": 3.5453743934631348, "lr": 0.0003440041907972757, "tps": 14685, "wall": 38463.2} {"step": 8619, "train_loss": 3.571258544921875, "lr": 0.0003439903035179841, "tps": 14685, "wall": 38468.0} {"step": 8620, "train_loss": 3.52799129486084, "lr": 0.00034397641483412377, "tps": 14685, "wall": 38472.8} {"step": 8621, "train_loss": 3.531290054321289, "lr": 0.00034396252474585176, "tps": 14685, "wall": 38477.6} {"step": 8622, "train_loss": 3.5417137145996094, "lr": 0.00034394863325332565, "tps": 14685, "wall": 38482.4} {"step": 8623, "train_loss": 3.45065975189209, "lr": 0.00034393474035670265, "tps": 14684, "wall": 38487.2} {"step": 8624, "train_loss": 3.5882420539855957, "lr": 0.0003439208460561403, "tps": 14684, "wall": 38492.0} {"step": 8625, "train_loss": 3.493960380554199, "lr": 0.00034390695035179584, "tps": 14684, "wall": 38496.9} {"step": 8626, "train_loss": 3.6113462448120117, "lr": 0.0003438930532438268, "tps": 14684, "wall": 38501.8} {"step": 8627, "train_loss": 3.488023281097412, "lr": 0.0003438791547323905, "tps": 14684, "wall": 38506.6} {"step": 8628, "train_loss": 3.6354660987854004, "lr": 0.00034386525481764436, "tps": 14684, "wall": 38511.3} {"step": 8629, "train_loss": 3.601383924484253, "lr": 0.000343851353499746, "tps": 14684, "wall": 38516.2} {"step": 8630, "train_loss": 3.538447856903076, "lr": 0.0003438374507788528, "tps": 14683, "wall": 38521.1} {"step": 8631, "train_loss": 3.5811591148376465, "lr": 0.0003438235466551223, "tps": 14683, "wall": 38525.9} {"step": 8632, "train_loss": 3.5102572441101074, "lr": 0.0003438096411287119, "tps": 14683, "wall": 38530.7} {"step": 8633, "train_loss": 3.4275736808776855, "lr": 0.0003437957341997793, "tps": 14683, "wall": 38535.5} {"step": 8634, "train_loss": 3.5790834426879883, "lr": 0.0003437818258684818, "tps": 14683, "wall": 38540.3} {"step": 8635, "train_loss": 3.517052173614502, "lr": 0.0003437679161349771, "tps": 14683, "wall": 38545.1} {"step": 8636, "train_loss": 3.603311777114868, "lr": 0.00034375400499942274, "tps": 14683, "wall": 38549.9} {"step": 8637, "train_loss": 3.5595455169677734, "lr": 0.0003437400924619764, "tps": 14683, "wall": 38554.7} {"step": 8638, "train_loss": 3.470057487487793, "lr": 0.00034372617852279554, "tps": 14682, "wall": 38559.5} {"step": 8639, "train_loss": 3.504429340362549, "lr": 0.00034371226318203783, "tps": 14682, "wall": 38564.3} {"step": 8640, "train_loss": 3.513563632965088, "lr": 0.00034369834643986093, "tps": 14682, "wall": 38569.3} {"step": 8641, "train_loss": 3.5682806968688965, "lr": 0.0003436844282964225, "tps": 14682, "wall": 38574.4} {"step": 8642, "train_loss": 3.5323805809020996, "lr": 0.00034367050875188006, "tps": 14682, "wall": 38579.4} {"step": 8643, "train_loss": 3.527726888656616, "lr": 0.00034365658780639147, "tps": 14681, "wall": 38584.4} {"step": 8644, "train_loss": 3.4916019439697266, "lr": 0.00034364266546011444, "tps": 14681, "wall": 38589.3} {"step": 8645, "train_loss": 3.5851385593414307, "lr": 0.0003436287417132065, "tps": 14681, "wall": 38594.3} {"step": 8646, "train_loss": 3.5534045696258545, "lr": 0.0003436148165658255, "tps": 14681, "wall": 38599.1} {"step": 8647, "train_loss": 3.6370973587036133, "lr": 0.0003436008900181292, "tps": 14681, "wall": 38603.9} {"step": 8648, "train_loss": 3.502943992614746, "lr": 0.0003435869620702754, "tps": 14681, "wall": 38608.8} {"step": 8649, "train_loss": 3.5790019035339355, "lr": 0.00034357303272242174, "tps": 14680, "wall": 38613.7} {"step": 8650, "train_loss": 3.5085301399230957, "lr": 0.000343559101974726, "tps": 14680, "wall": 38618.6} {"step": 8651, "train_loss": 3.6018805503845215, "lr": 0.00034354516982734615, "tps": 14680, "wall": 38623.5} {"step": 8652, "train_loss": 3.5492215156555176, "lr": 0.00034353123628044, "tps": 14680, "wall": 38628.4} {"step": 8653, "train_loss": 3.4804177284240723, "lr": 0.0003435173013341652, "tps": 14680, "wall": 38633.3} {"step": 8654, "train_loss": 3.6044461727142334, "lr": 0.0003435033649886798, "tps": 14680, "wall": 38638.4} {"step": 8655, "train_loss": 3.5501370429992676, "lr": 0.00034348942724414153, "tps": 14679, "wall": 38643.3} {"step": 8656, "train_loss": 3.5687997341156006, "lr": 0.0003434754881007084, "tps": 14679, "wall": 38648.3} {"step": 8657, "train_loss": 3.569244861602783, "lr": 0.0003434615475585382, "tps": 14679, "wall": 38653.3} {"step": 8658, "train_loss": 3.4199957847595215, "lr": 0.00034344760561778897, "tps": 14679, "wall": 38658.2} {"step": 8659, "train_loss": 3.472693920135498, "lr": 0.0003434336622786186, "tps": 14679, "wall": 38663.0} {"step": 8660, "train_loss": 3.5470709800720215, "lr": 0.000343419717541185, "tps": 14679, "wall": 38667.9} {"step": 8661, "train_loss": 3.4755618572235107, "lr": 0.0003434057714056462, "tps": 14678, "wall": 38672.7} {"step": 8662, "train_loss": 3.4962806701660156, "lr": 0.00034339182387216013, "tps": 14678, "wall": 38677.5} {"step": 8663, "train_loss": 3.510659694671631, "lr": 0.00034337787494088473, "tps": 14678, "wall": 38682.4} {"step": 8664, "train_loss": 3.4992117881774902, "lr": 0.00034336392461197825, "tps": 14678, "wall": 38687.3} {"step": 8665, "train_loss": 3.672419548034668, "lr": 0.0003433499728855984, "tps": 14678, "wall": 38692.2} {"step": 8666, "train_loss": 3.6234030723571777, "lr": 0.0003433360197619034, "tps": 14678, "wall": 38697.2} {"step": 8667, "train_loss": 3.554953098297119, "lr": 0.00034332206524105135, "tps": 14677, "wall": 38702.2} {"step": 8668, "train_loss": 3.551457405090332, "lr": 0.00034330810932320025, "tps": 14677, "wall": 38707.2} {"step": 8669, "train_loss": 3.4993152618408203, "lr": 0.0003432941520085082, "tps": 14677, "wall": 38712.1} {"step": 8670, "train_loss": 3.509697198867798, "lr": 0.0003432801932971334, "tps": 14677, "wall": 38717.1} {"step": 8671, "train_loss": 3.521516799926758, "lr": 0.0003432662331892338, "tps": 14677, "wall": 38722.1} {"step": 8672, "train_loss": 3.6195685863494873, "lr": 0.00034325227168496776, "tps": 14676, "wall": 38727.1} {"step": 8673, "train_loss": 3.582961082458496, "lr": 0.0003432383087844932, "tps": 14676, "wall": 38732.0} {"step": 8674, "train_loss": 3.581794261932373, "lr": 0.00034322434448796847, "tps": 14676, "wall": 38737.0} {"step": 8675, "train_loss": 3.448812246322632, "lr": 0.0003432103787955517, "tps": 14676, "wall": 38741.9} {"step": 8676, "train_loss": 3.5012643337249756, "lr": 0.0003431964117074011, "tps": 14676, "wall": 38746.9} {"step": 8677, "train_loss": 3.6115660667419434, "lr": 0.00034318244322367487, "tps": 14675, "wall": 38751.8} {"step": 8678, "train_loss": 3.4908676147460938, "lr": 0.00034316847334453125, "tps": 14675, "wall": 38756.9} {"step": 8679, "train_loss": 3.6553592681884766, "lr": 0.00034315450207012856, "tps": 14675, "wall": 38761.9} {"step": 8680, "train_loss": 3.5555076599121094, "lr": 0.0003431405294006249, "tps": 14675, "wall": 38766.9} {"step": 8681, "train_loss": 3.6497867107391357, "lr": 0.00034312655533617876, "tps": 14675, "wall": 38771.9} {"step": 8682, "train_loss": 3.5457496643066406, "lr": 0.00034311257987694823, "tps": 14674, "wall": 38776.8} {"step": 8683, "train_loss": 3.50095796585083, "lr": 0.0003430986030230918, "tps": 14674, "wall": 38781.9} {"step": 8684, "train_loss": 3.5659003257751465, "lr": 0.0003430846247747678, "tps": 14674, "wall": 38787.2} {"step": 8685, "train_loss": 3.5491042137145996, "lr": 0.0003430706451321344, "tps": 14674, "wall": 38792.4} {"step": 8686, "train_loss": 3.5792903900146484, "lr": 0.00034305666409535017, "tps": 14673, "wall": 38797.6} {"step": 8687, "train_loss": 3.4980978965759277, "lr": 0.0003430426816645733, "tps": 14673, "wall": 38802.8} {"step": 8688, "train_loss": 3.545151710510254, "lr": 0.0003430286978399624, "tps": 14673, "wall": 38808.3} {"step": 8689, "train_loss": 3.4782521724700928, "lr": 0.00034301471262167564, "tps": 14672, "wall": 38813.4} {"step": 8690, "train_loss": 3.650679588317871, "lr": 0.00034300072600987157, "tps": 14672, "wall": 38818.7} {"step": 8691, "train_loss": 3.5868513584136963, "lr": 0.00034298673800470865, "tps": 14672, "wall": 38823.9} {"step": 8692, "train_loss": 3.4064676761627197, "lr": 0.0003429727486063453, "tps": 14672, "wall": 38829.1} {"step": 8693, "train_loss": 3.5701518058776855, "lr": 0.00034295875781494, "tps": 14671, "wall": 38834.3} {"step": 8694, "train_loss": 3.475271463394165, "lr": 0.0003429447656306513, "tps": 14671, "wall": 38839.3} {"step": 8695, "train_loss": 3.624021291732788, "lr": 0.00034293077205363757, "tps": 14671, "wall": 38844.3} {"step": 8696, "train_loss": 3.4086875915527344, "lr": 0.00034291677708405744, "tps": 14671, "wall": 38849.3} {"step": 8697, "train_loss": 3.443779945373535, "lr": 0.00034290278072206937, "tps": 14671, "wall": 38854.2} {"step": 8698, "train_loss": 3.5071287155151367, "lr": 0.00034288878296783197, "tps": 14670, "wall": 38859.3} {"step": 8699, "train_loss": 3.641078472137451, "lr": 0.0003428747838215038, "tps": 14670, "wall": 38864.3} {"step": 8700, "train_loss": 3.515216827392578, "lr": 0.00034286078328324345, "tps": 14670, "wall": 38869.2} {"step": 8701, "train_loss": 3.5273687839508057, "lr": 0.00034284678135320946, "tps": 14670, "wall": 38874.2} {"step": 8702, "train_loss": 3.5047922134399414, "lr": 0.0003428327780315605, "tps": 14670, "wall": 38879.2} {"step": 8703, "train_loss": 3.531435489654541, "lr": 0.00034281877331845517, "tps": 14669, "wall": 38884.2} {"step": 8704, "train_loss": 3.4483118057250977, "lr": 0.00034280476721405216, "tps": 14669, "wall": 38889.2} {"step": 8705, "train_loss": 3.6100025177001953, "lr": 0.00034279075971851004, "tps": 14669, "wall": 38894.0} {"step": 8706, "train_loss": 3.6167399883270264, "lr": 0.00034277675083198766, "tps": 14669, "wall": 38898.8} {"step": 8707, "train_loss": 3.6560726165771484, "lr": 0.0003427627405546435, "tps": 14669, "wall": 38903.7} {"step": 8708, "train_loss": 3.510462999343872, "lr": 0.00034274872888663646, "tps": 14669, "wall": 38908.5} {"step": 8709, "train_loss": 3.5878007411956787, "lr": 0.0003427347158281251, "tps": 14668, "wall": 38913.6} {"step": 8710, "train_loss": 3.581900119781494, "lr": 0.00034272070137926833, "tps": 14668, "wall": 38918.4} {"step": 8711, "train_loss": 3.5799400806427, "lr": 0.00034270668554022476, "tps": 14668, "wall": 38923.2} {"step": 8712, "train_loss": 3.537473678588867, "lr": 0.0003426926683111532, "tps": 14668, "wall": 38928.0} {"step": 8713, "train_loss": 3.6073834896087646, "lr": 0.0003426786496922124, "tps": 14668, "wall": 38932.9} {"step": 8714, "train_loss": 3.5612239837646484, "lr": 0.0003426646296835614, "tps": 14668, "wall": 38937.7} {"step": 8715, "train_loss": 3.6377878189086914, "lr": 0.0003426506082853587, "tps": 14668, "wall": 38942.6} {"step": 8716, "train_loss": 3.5379514694213867, "lr": 0.0003426365854977633, "tps": 14667, "wall": 38947.5} {"step": 8717, "train_loss": 3.4924778938293457, "lr": 0.00034262256132093407, "tps": 14667, "wall": 38952.4} {"step": 8718, "train_loss": 3.5911178588867188, "lr": 0.0003426085357550298, "tps": 14667, "wall": 38957.4} {"step": 8719, "train_loss": 3.535161018371582, "lr": 0.00034259450880020937, "tps": 14667, "wall": 38962.4} {"step": 8720, "train_loss": 3.6316728591918945, "lr": 0.0003425804804566318, "tps": 14667, "wall": 38967.3} {"step": 8721, "train_loss": 3.6078357696533203, "lr": 0.00034256645072445585, "tps": 14666, "wall": 38972.3} {"step": 8722, "train_loss": 3.5660805702209473, "lr": 0.0003425524196038405, "tps": 14666, "wall": 38977.2} {"step": 8723, "train_loss": 3.5127081871032715, "lr": 0.00034253838709494473, "tps": 14666, "wall": 38982.2} {"step": 8724, "train_loss": 3.582383871078491, "lr": 0.00034252435319792753, "tps": 14666, "wall": 38987.1} {"step": 8725, "train_loss": 3.6032016277313232, "lr": 0.0003425103179129478, "tps": 14666, "wall": 38992.1} {"step": 8726, "train_loss": 3.6669833660125732, "lr": 0.0003424962812401645, "tps": 14666, "wall": 38997.1} {"step": 8727, "train_loss": 3.609066963195801, "lr": 0.0003424822431797368, "tps": 14665, "wall": 39002.0} {"step": 8728, "train_loss": 3.6328651905059814, "lr": 0.00034246820373182353, "tps": 14665, "wall": 39007.0} {"step": 8729, "train_loss": 3.4050986766815186, "lr": 0.0003424541628965838, "tps": 14665, "wall": 39012.0} {"step": 8730, "train_loss": 3.48466420173645, "lr": 0.00034244012067417677, "tps": 14665, "wall": 39016.9} {"step": 8731, "train_loss": 3.616766929626465, "lr": 0.0003424260770647614, "tps": 14665, "wall": 39021.8} {"step": 8732, "train_loss": 3.5992941856384277, "lr": 0.0003424120320684969, "tps": 14664, "wall": 39026.8} {"step": 8733, "train_loss": 3.526616096496582, "lr": 0.0003423979856855421, "tps": 14664, "wall": 39031.8} {"step": 8734, "train_loss": 3.511303424835205, "lr": 0.00034238393791605643, "tps": 14664, "wall": 39036.7} {"step": 8735, "train_loss": 3.597250461578369, "lr": 0.0003423698887601988, "tps": 14664, "wall": 39041.7} {"step": 8736, "train_loss": 3.5630440711975098, "lr": 0.00034235583821812856, "tps": 14664, "wall": 39046.7} {"step": 8737, "train_loss": 3.556224822998047, "lr": 0.0003423417862900047, "tps": 14664, "wall": 39051.7} {"step": 8738, "train_loss": 3.5441133975982666, "lr": 0.0003423277329759864, "tps": 14663, "wall": 39056.6} {"step": 8739, "train_loss": 3.562053680419922, "lr": 0.00034231367827623304, "tps": 14663, "wall": 39061.6} {"step": 8740, "train_loss": 3.6159749031066895, "lr": 0.0003422996221909037, "tps": 14663, "wall": 39066.7} {"step": 8741, "train_loss": 3.4870493412017822, "lr": 0.0003422855647201576, "tps": 14663, "wall": 39071.7} {"step": 8742, "train_loss": 3.449370861053467, "lr": 0.00034227150586415395, "tps": 14662, "wall": 39076.7} {"step": 8743, "train_loss": 3.540970802307129, "lr": 0.00034225744562305213, "tps": 14662, "wall": 39081.9} {"step": 8744, "train_loss": 3.4713451862335205, "lr": 0.0003422433839970113, "tps": 14662, "wall": 39087.1} {"step": 8745, "train_loss": 3.434896230697632, "lr": 0.00034222932098619085, "tps": 14662, "wall": 39092.4} {"step": 8746, "train_loss": 3.578979015350342, "lr": 0.00034221525659075005, "tps": 14661, "wall": 39097.6} {"step": 8747, "train_loss": 3.549935817718506, "lr": 0.00034220119081084817, "tps": 14661, "wall": 39102.8} {"step": 8748, "train_loss": 3.585400342941284, "lr": 0.00034218712364664466, "tps": 14661, "wall": 39108.1} {"step": 8749, "train_loss": 3.5834951400756836, "lr": 0.00034217305509829873, "tps": 14660, "wall": 39113.3} {"step": 8750, "train_loss": 3.5726022720336914, "lr": 0.00034215898516596987, "tps": 14660, "wall": 39118.6} {"step": 8751, "train_loss": 3.6526219844818115, "lr": 0.0003421449138498174, "tps": 14660, "wall": 39123.9} {"step": 8752, "train_loss": 3.513869047164917, "lr": 0.00034213084115000073, "tps": 14660, "wall": 39129.1} {"step": 8753, "train_loss": 3.5355629920959473, "lr": 0.0003421167670666793, "tps": 14659, "wall": 39134.3} {"step": 8754, "train_loss": 3.5112271308898926, "lr": 0.00034210269160001245, "tps": 14659, "wall": 39139.5} {"step": 8755, "train_loss": 3.5688462257385254, "lr": 0.0003420886147501598, "tps": 14659, "wall": 39144.8} {"step": 8756, "train_loss": 3.5551815032958984, "lr": 0.0003420745365172806, "tps": 14658, "wall": 39150.0} {"step": 8757, "train_loss": 3.5580978393554688, "lr": 0.00034206045690153455, "tps": 14658, "wall": 39155.2} {"step": 8758, "train_loss": 3.6223011016845703, "lr": 0.0003420463759030811, "tps": 14658, "wall": 39160.3} {"step": 8759, "train_loss": 3.514198064804077, "lr": 0.0003420322935220796, "tps": 14658, "wall": 39165.3} {"step": 8760, "train_loss": 3.5424671173095703, "lr": 0.0003420182097586897, "tps": 14658, "wall": 39170.3} {"step": 8761, "train_loss": 3.5107407569885254, "lr": 0.0003420041246130709, "tps": 14657, "wall": 39175.4} {"step": 8762, "train_loss": 3.460615634918213, "lr": 0.0003419900380853828, "tps": 14657, "wall": 39180.7} {"step": 8763, "train_loss": 3.583839178085327, "lr": 0.000341975950175785, "tps": 14657, "wall": 39185.9} {"step": 8764, "train_loss": 3.6463849544525146, "lr": 0.000341961860884437, "tps": 14656, "wall": 39191.1} {"step": 8765, "train_loss": 3.523547649383545, "lr": 0.00034194777021149836, "tps": 14656, "wall": 39196.4} {"step": 8766, "train_loss": 3.529071569442749, "lr": 0.00034193367815712886, "tps": 14656, "wall": 39201.6} {"step": 8767, "train_loss": 3.55350399017334, "lr": 0.000341919584721488, "tps": 14656, "wall": 39206.8} {"step": 8768, "train_loss": 3.541368007659912, "lr": 0.0003419054899047356, "tps": 14655, "wall": 39212.0} {"step": 8769, "train_loss": 3.5784261226654053, "lr": 0.0003418913937070311, "tps": 14655, "wall": 39217.2} {"step": 8770, "train_loss": 3.5067572593688965, "lr": 0.0003418772961285344, "tps": 14655, "wall": 39222.3} {"step": 8771, "train_loss": 3.488727331161499, "lr": 0.000341863197169405, "tps": 14655, "wall": 39227.5} {"step": 8772, "train_loss": 3.521451950073242, "lr": 0.0003418490968298028, "tps": 14654, "wall": 39232.5} {"step": 8773, "train_loss": 3.4957351684570312, "lr": 0.00034183499510988735, "tps": 14654, "wall": 39237.5} {"step": 8774, "train_loss": 3.4607725143432617, "lr": 0.0003418208920098185, "tps": 14654, "wall": 39242.4} {"step": 8775, "train_loss": 3.5204784870147705, "lr": 0.00034180678752975603, "tps": 14654, "wall": 39247.2} {"step": 8776, "train_loss": 3.482233762741089, "lr": 0.00034179268166985966, "tps": 14654, "wall": 39252.0} {"step": 8777, "train_loss": 3.5420210361480713, "lr": 0.00034177857443028924, "tps": 14654, "wall": 39256.8} {"step": 8778, "train_loss": 3.4536144733428955, "lr": 0.00034176446581120454, "tps": 14654, "wall": 39261.6} {"step": 8779, "train_loss": 3.5873818397521973, "lr": 0.0003417503558127653, "tps": 14653, "wall": 39266.3} {"step": 8780, "train_loss": 3.5988454818725586, "lr": 0.0003417362444351315, "tps": 14653, "wall": 39271.1} {"step": 8781, "train_loss": 3.5770020484924316, "lr": 0.0003417221316784629, "tps": 14653, "wall": 39276.0} {"step": 8782, "train_loss": 3.575394868850708, "lr": 0.0003417080175429195, "tps": 14653, "wall": 39280.9} {"step": 8783, "train_loss": 3.605386972427368, "lr": 0.00034169390202866103, "tps": 14653, "wall": 39285.8} {"step": 8784, "train_loss": 3.535409927368164, "lr": 0.00034167978513584746, "tps": 14653, "wall": 39290.7} {"step": 8785, "train_loss": 3.618971586227417, "lr": 0.0003416656668646387, "tps": 14652, "wall": 39295.7} {"step": 8786, "train_loss": 3.5543317794799805, "lr": 0.0003416515472151947, "tps": 14652, "wall": 39300.8} {"step": 8787, "train_loss": 3.554551839828491, "lr": 0.0003416374261876754, "tps": 14652, "wall": 39305.7} {"step": 8788, "train_loss": 3.553729295730591, "lr": 0.00034162330378224073, "tps": 14652, "wall": 39310.7} {"step": 8789, "train_loss": 3.5965495109558105, "lr": 0.00034160917999905065, "tps": 14652, "wall": 39315.6} {"step": 8790, "train_loss": 3.596282482147217, "lr": 0.00034159505483826526, "tps": 14652, "wall": 39320.5} {"step": 8791, "train_loss": 3.504148006439209, "lr": 0.00034158092830004455, "tps": 14651, "wall": 39325.5} {"step": 8792, "train_loss": 3.4444189071655273, "lr": 0.0003415668003845484, "tps": 14651, "wall": 39330.4} {"step": 8793, "train_loss": 3.680626630783081, "lr": 0.000341552671091937, "tps": 14651, "wall": 39335.4} {"step": 8794, "train_loss": 3.5960612297058105, "lr": 0.00034153854042237044, "tps": 14651, "wall": 39340.3} {"step": 8795, "train_loss": 3.5639243125915527, "lr": 0.00034152440837600863, "tps": 14651, "wall": 39345.3} {"step": 8796, "train_loss": 3.531841278076172, "lr": 0.0003415102749530118, "tps": 14651, "wall": 39350.2} {"step": 8797, "train_loss": 3.546724796295166, "lr": 0.00034149614015354, "tps": 14650, "wall": 39355.2} {"step": 8798, "train_loss": 3.5409584045410156, "lr": 0.00034148200397775334, "tps": 14650, "wall": 39360.2} {"step": 8799, "train_loss": 3.4415886402130127, "lr": 0.00034146786642581193, "tps": 14650, "wall": 39365.2} {"step": 8800, "train_loss": 3.5685787200927734, "lr": 0.000341453727497876, "tps": 14650, "wall": 39370.1} {"step": 8801, "train_loss": 3.495879888534546, "lr": 0.00034143958719410564, "tps": 14650, "wall": 39375.1} {"step": 8802, "train_loss": 3.45974063873291, "lr": 0.00034142544551466115, "tps": 14649, "wall": 39380.0} {"step": 8803, "train_loss": 3.5774431228637695, "lr": 0.00034141130245970253, "tps": 14649, "wall": 39385.0} {"step": 8804, "train_loss": 3.48455548286438, "lr": 0.00034139715802939015, "tps": 14649, "wall": 39390.0} {"step": 8805, "train_loss": 3.4924285411834717, "lr": 0.00034138301222388424, "tps": 14649, "wall": 39394.9} {"step": 8806, "train_loss": 3.5871965885162354, "lr": 0.00034136886504334494, "tps": 14649, "wall": 39399.9} {"step": 8807, "train_loss": 3.602661609649658, "lr": 0.0003413547164879326, "tps": 14648, "wall": 39404.9} {"step": 8808, "train_loss": 3.5130057334899902, "lr": 0.0003413405665578075, "tps": 14648, "wall": 39409.8} {"step": 8809, "train_loss": 3.5010905265808105, "lr": 0.0003413264152531298, "tps": 14648, "wall": 39414.9} {"step": 8810, "train_loss": 3.4005961418151855, "lr": 0.00034131226257405996, "tps": 14648, "wall": 39419.9} {"step": 8811, "train_loss": 3.460700511932373, "lr": 0.00034129810852075827, "tps": 14648, "wall": 39424.8} {"step": 8812, "train_loss": 3.5382955074310303, "lr": 0.00034128395309338504, "tps": 14648, "wall": 39429.8} {"step": 8813, "train_loss": 3.5885910987854004, "lr": 0.00034126979629210056, "tps": 14647, "wall": 39434.8} {"step": 8814, "train_loss": 3.632424831390381, "lr": 0.00034125563811706537, "tps": 14647, "wall": 39439.7} {"step": 8815, "train_loss": 3.5525007247924805, "lr": 0.00034124147856843975, "tps": 14647, "wall": 39444.7} {"step": 8816, "train_loss": 3.4369752407073975, "lr": 0.00034122731764638407, "tps": 14647, "wall": 39449.7} {"step": 8817, "train_loss": 3.5825443267822266, "lr": 0.0003412131553510587, "tps": 14647, "wall": 39454.7} {"step": 8818, "train_loss": 3.432788372039795, "lr": 0.00034119899168262417, "tps": 14646, "wall": 39459.7} {"step": 8819, "train_loss": 3.5343446731567383, "lr": 0.00034118482664124094, "tps": 14646, "wall": 39464.6} {"step": 8820, "train_loss": 3.474602222442627, "lr": 0.0003411706602270695, "tps": 14646, "wall": 39469.6} {"step": 8821, "train_loss": 3.6486997604370117, "lr": 0.0003411564924402702, "tps": 14646, "wall": 39474.6} {"step": 8822, "train_loss": 3.532134532928467, "lr": 0.0003411423232810036, "tps": 14646, "wall": 39479.6} {"step": 8823, "train_loss": 3.624141216278076, "lr": 0.00034112815274943024, "tps": 14645, "wall": 39484.5} {"step": 8824, "train_loss": 3.484485626220703, "lr": 0.00034111398084571057, "tps": 14645, "wall": 39489.5} {"step": 8825, "train_loss": 3.640348434448242, "lr": 0.0003410998075700052, "tps": 14645, "wall": 39494.5} {"step": 8826, "train_loss": 3.594454288482666, "lr": 0.00034108563292247466, "tps": 14645, "wall": 39499.4} {"step": 8827, "train_loss": 3.4562528133392334, "lr": 0.0003410714569032795, "tps": 14645, "wall": 39504.4} {"step": 8828, "train_loss": 3.562762498855591, "lr": 0.0003410572795125803, "tps": 14645, "wall": 39509.5} {"step": 8829, "train_loss": 3.5983164310455322, "lr": 0.00034104310075053776, "tps": 14644, "wall": 39514.5} {"step": 8830, "train_loss": 3.5818252563476562, "lr": 0.00034102892061731237, "tps": 14644, "wall": 39519.5} {"step": 8831, "train_loss": 3.4810476303100586, "lr": 0.00034101473911306486, "tps": 14644, "wall": 39524.5} {"step": 8832, "train_loss": 3.516575813293457, "lr": 0.00034100055623795586, "tps": 14644, "wall": 39529.5} {"step": 8833, "train_loss": 3.538587808609009, "lr": 0.00034098637199214595, "tps": 14644, "wall": 39534.5} {"step": 8834, "train_loss": 3.510894298553467, "lr": 0.0003409721863757959, "tps": 14643, "wall": 39539.6} {"step": 8835, "train_loss": 3.666050434112549, "lr": 0.00034095799938906637, "tps": 14643, "wall": 39544.7} {"step": 8836, "train_loss": 3.465386152267456, "lr": 0.00034094381103211806, "tps": 14643, "wall": 39549.7} {"step": 8837, "train_loss": 3.6107888221740723, "lr": 0.00034092962130511176, "tps": 14643, "wall": 39554.7} {"step": 8838, "train_loss": 3.6345937252044678, "lr": 0.00034091543020820815, "tps": 14642, "wall": 39559.7} {"step": 8839, "train_loss": 3.6026270389556885, "lr": 0.000340901237741568, "tps": 14642, "wall": 39564.7} {"step": 8840, "train_loss": 3.5252554416656494, "lr": 0.00034088704390535207, "tps": 14642, "wall": 39569.7} {"step": 8841, "train_loss": 3.587528705596924, "lr": 0.0003408728486997212, "tps": 14642, "wall": 39574.7} {"step": 8842, "train_loss": 3.545802593231201, "lr": 0.00034085865212483615, "tps": 14642, "wall": 39579.7} {"step": 8843, "train_loss": 3.5986382961273193, "lr": 0.0003408444541808577, "tps": 14642, "wall": 39584.6} {"step": 8844, "train_loss": 3.5562143325805664, "lr": 0.0003408302548679468, "tps": 14641, "wall": 39589.6} {"step": 8845, "train_loss": 3.5904436111450195, "lr": 0.0003408160541862643, "tps": 14641, "wall": 39594.7} {"step": 8846, "train_loss": 3.5291428565979004, "lr": 0.00034080185213597084, "tps": 14641, "wall": 39599.7} {"step": 8847, "train_loss": 3.482171058654785, "lr": 0.00034078764871722756, "tps": 14641, "wall": 39604.7} {"step": 8848, "train_loss": 3.519885778427124, "lr": 0.0003407734439301953, "tps": 14641, "wall": 39609.7} {"step": 8849, "train_loss": 3.5178699493408203, "lr": 0.00034075923777503484, "tps": 14640, "wall": 39614.7} {"step": 8850, "train_loss": 3.5298404693603516, "lr": 0.00034074503025190725, "tps": 14640, "wall": 39619.7} {"step": 8851, "train_loss": 3.5436739921569824, "lr": 0.00034073082136097346, "tps": 14640, "wall": 39624.8} {"step": 8852, "train_loss": 3.520024061203003, "lr": 0.0003407166111023943, "tps": 14640, "wall": 39629.8} {"step": 8853, "train_loss": 3.502058982849121, "lr": 0.0003407023994763309, "tps": 14640, "wall": 39634.8} {"step": 8854, "train_loss": 3.4641032218933105, "lr": 0.0003406881864829442, "tps": 14639, "wall": 39639.8} {"step": 8855, "train_loss": 3.5638132095336914, "lr": 0.0003406739721223951, "tps": 14639, "wall": 39644.8} {"step": 8856, "train_loss": 3.5174224376678467, "lr": 0.0003406597563948448, "tps": 14639, "wall": 39649.7} {"step": 8857, "train_loss": 3.563457727432251, "lr": 0.00034064553930045427, "tps": 14639, "wall": 39654.7} {"step": 8858, "train_loss": 3.460888385772705, "lr": 0.00034063132083938456, "tps": 14638, "wall": 39660.0} {"step": 8859, "train_loss": 3.444772720336914, "lr": 0.0003406171010117966, "tps": 14638, "wall": 39665.3} {"step": 8860, "train_loss": 3.5863256454467773, "lr": 0.00034060287981785173, "tps": 14638, "wall": 39670.3} {"step": 8861, "train_loss": 3.5709285736083984, "lr": 0.00034058865725771083, "tps": 14638, "wall": 39675.1} {"step": 8862, "train_loss": 3.6730124950408936, "lr": 0.00034057443333153516, "tps": 14638, "wall": 39679.9} {"step": 8863, "train_loss": 3.579866886138916, "lr": 0.0003405602080394857, "tps": 14638, "wall": 39684.8} {"step": 8864, "train_loss": 3.6000616550445557, "lr": 0.00034054598138172376, "tps": 14638, "wall": 39689.6} {"step": 8865, "train_loss": 3.5437750816345215, "lr": 0.00034053175335841036, "tps": 14637, "wall": 39694.4} {"step": 8866, "train_loss": 3.5112669467926025, "lr": 0.00034051752396970674, "tps": 14637, "wall": 39699.2} {"step": 8867, "train_loss": 3.5002400875091553, "lr": 0.0003405032932157742, "tps": 14637, "wall": 39703.9} {"step": 8868, "train_loss": 3.5846099853515625, "lr": 0.0003404890610967737, "tps": 14637, "wall": 39708.7} {"step": 8869, "train_loss": 3.6467862129211426, "lr": 0.0003404748276128666, "tps": 14637, "wall": 39713.5} {"step": 8870, "train_loss": 3.5573713779449463, "lr": 0.00034046059276421424, "tps": 14637, "wall": 39718.4} {"step": 8871, "train_loss": 3.499380350112915, "lr": 0.00034044635655097765, "tps": 14637, "wall": 39723.2} {"step": 8872, "train_loss": 3.4935638904571533, "lr": 0.00034043211897331833, "tps": 14637, "wall": 39728.1} {"step": 8873, "train_loss": 3.65630841255188, "lr": 0.0003404178800313974, "tps": 14636, "wall": 39732.9} {"step": 8874, "train_loss": 3.38869571685791, "lr": 0.00034040363972537616, "tps": 14636, "wall": 39737.7} {"step": 8875, "train_loss": 3.5059070587158203, "lr": 0.000340389398055416, "tps": 14636, "wall": 39742.6} {"step": 8876, "train_loss": 3.5857338905334473, "lr": 0.00034037515502167835, "tps": 14636, "wall": 39747.4} {"step": 8877, "train_loss": 3.6045939922332764, "lr": 0.0003403609106243243, "tps": 14636, "wall": 39752.3} {"step": 8878, "train_loss": 3.564363479614258, "lr": 0.00034034666486351537, "tps": 14636, "wall": 39757.2} {"step": 8879, "train_loss": 3.476780414581299, "lr": 0.0003403324177394129, "tps": 14635, "wall": 39762.2} {"step": 8880, "train_loss": 3.540099620819092, "lr": 0.00034031816925217834, "tps": 14635, "wall": 39767.2} {"step": 8881, "train_loss": 3.620342969894409, "lr": 0.000340303919401973, "tps": 14635, "wall": 39772.2} {"step": 8882, "train_loss": 3.5432028770446777, "lr": 0.0003402896681889584, "tps": 14635, "wall": 39777.4} {"step": 8883, "train_loss": 3.553952217102051, "lr": 0.0003402754156132959, "tps": 14635, "wall": 39782.6} {"step": 8884, "train_loss": 3.6291239261627197, "lr": 0.00034026116167514697, "tps": 14634, "wall": 39787.6} {"step": 8885, "train_loss": 3.5476179122924805, "lr": 0.0003402469063746731, "tps": 14634, "wall": 39792.6} {"step": 8886, "train_loss": 3.5596041679382324, "lr": 0.0003402326497120358, "tps": 14634, "wall": 39797.6} {"step": 8887, "train_loss": 3.511385440826416, "lr": 0.00034021839168739653, "tps": 14634, "wall": 39802.6} {"step": 8888, "train_loss": 3.5627551078796387, "lr": 0.0003402041323009168, "tps": 14634, "wall": 39807.6} {"step": 8889, "train_loss": 3.608152151107788, "lr": 0.00034018987155275815, "tps": 14633, "wall": 39812.5} {"step": 8890, "train_loss": 3.676340341567993, "lr": 0.00034017560944308217, "tps": 14633, "wall": 39817.6} {"step": 8891, "train_loss": 3.5517663955688477, "lr": 0.0003401613459720504, "tps": 14633, "wall": 39822.5} {"step": 8892, "train_loss": 3.5310463905334473, "lr": 0.00034014708113982425, "tps": 14633, "wall": 39827.5} {"step": 8893, "train_loss": 3.570984363555908, "lr": 0.0003401328149465656, "tps": 14633, "wall": 39832.5} {"step": 8894, "train_loss": 3.607297658920288, "lr": 0.00034011854739243594, "tps": 14632, "wall": 39837.6} {"step": 8895, "train_loss": 3.5408003330230713, "lr": 0.00034010427847759687, "tps": 14632, "wall": 39842.6} {"step": 8896, "train_loss": 3.529613494873047, "lr": 0.00034009000820220994, "tps": 14632, "wall": 39847.6} {"step": 8897, "train_loss": 3.460993766784668, "lr": 0.00034007573656643703, "tps": 14632, "wall": 39852.6} {"step": 8898, "train_loss": 3.5098443031311035, "lr": 0.00034006146357043953, "tps": 14632, "wall": 39857.6} {"step": 8899, "train_loss": 3.584421157836914, "lr": 0.0003400471892143794, "tps": 14632, "wall": 39862.6} {"step": 8900, "train_loss": 3.5553715229034424, "lr": 0.00034003291349841817, "tps": 14631, "wall": 39867.6} {"step": 8901, "train_loss": 3.549315929412842, "lr": 0.00034001863642271757, "tps": 14631, "wall": 39872.6} {"step": 8902, "train_loss": 3.4500060081481934, "lr": 0.0003400043579874395, "tps": 14631, "wall": 39877.5} {"step": 8903, "train_loss": 3.612365245819092, "lr": 0.00033999007819274544, "tps": 14631, "wall": 39882.4} {"step": 8904, "train_loss": 3.6182608604431152, "lr": 0.0003399757970387973, "tps": 14631, "wall": 39887.4} {"step": 8905, "train_loss": 3.5201330184936523, "lr": 0.00033996151452575686, "tps": 14630, "wall": 39892.4} {"step": 8906, "train_loss": 3.512643337249756, "lr": 0.00033994723065378584, "tps": 14630, "wall": 39897.4} {"step": 8907, "train_loss": 3.5843424797058105, "lr": 0.0003399329454230462, "tps": 14630, "wall": 39902.5} {"step": 8908, "train_loss": 3.504591941833496, "lr": 0.0003399186588336996, "tps": 14630, "wall": 39907.5} {"step": 8909, "train_loss": 3.580034017562866, "lr": 0.000339904370885908, "tps": 14630, "wall": 39912.5} {"step": 8910, "train_loss": 3.538651704788208, "lr": 0.0003398900815798331, "tps": 14629, "wall": 39917.5} {"step": 8911, "train_loss": 3.5938150882720947, "lr": 0.000339875790915637, "tps": 14629, "wall": 39922.5} {"step": 8912, "train_loss": 3.549301862716675, "lr": 0.0003398614988934813, "tps": 14629, "wall": 39927.5} {"step": 8913, "train_loss": 3.5584511756896973, "lr": 0.0003398472055135282, "tps": 14629, "wall": 39932.5} {"step": 8914, "train_loss": 3.477673053741455, "lr": 0.0003398329107759394, "tps": 14629, "wall": 39937.5} {"step": 8915, "train_loss": 3.607309103012085, "lr": 0.0003398186146808769, "tps": 14629, "wall": 39942.5} {"step": 8916, "train_loss": 3.5380547046661377, "lr": 0.00033980431722850266, "tps": 14628, "wall": 39947.5} {"step": 8917, "train_loss": 3.590060234069824, "lr": 0.0003397900184189786, "tps": 14628, "wall": 39952.5} {"step": 8918, "train_loss": 3.598799705505371, "lr": 0.00033977571825246684, "tps": 14628, "wall": 39957.5} {"step": 8919, "train_loss": 3.5589699745178223, "lr": 0.00033976141672912923, "tps": 14628, "wall": 39962.5} {"step": 8920, "train_loss": 3.5258703231811523, "lr": 0.0003397471138491277, "tps": 14628, "wall": 39967.5} {"step": 8921, "train_loss": 3.513857364654541, "lr": 0.00033973280961262453, "tps": 14627, "wall": 39972.5} {"step": 8922, "train_loss": 3.6122658252716064, "lr": 0.00033971850401978156, "tps": 14627, "wall": 39977.5} {"step": 8923, "train_loss": 3.6184329986572266, "lr": 0.0003397041970707609, "tps": 14627, "wall": 39982.4} {"step": 8924, "train_loss": 3.5285403728485107, "lr": 0.0003396898887657246, "tps": 14627, "wall": 39987.4} {"step": 8925, "train_loss": 3.482748031616211, "lr": 0.0003396755791048348, "tps": 14627, "wall": 39992.4} {"step": 8926, "train_loss": 3.5233473777770996, "lr": 0.0003396612680882535, "tps": 14626, "wall": 39997.4} {"step": 8927, "train_loss": 3.624911308288574, "lr": 0.0003396469557161429, "tps": 14626, "wall": 40002.4} {"step": 8928, "train_loss": 3.5940637588500977, "lr": 0.00033963264198866517, "tps": 14626, "wall": 40007.4} {"step": 8929, "train_loss": 3.5416972637176514, "lr": 0.00033961832690598235, "tps": 14626, "wall": 40012.4} {"step": 8930, "train_loss": 3.572779655456543, "lr": 0.00033960401046825666, "tps": 14626, "wall": 40017.4} {"step": 8931, "train_loss": 3.5721702575683594, "lr": 0.0003395896926756503, "tps": 14625, "wall": 40022.4} {"step": 8932, "train_loss": 3.4309000968933105, "lr": 0.0003395753735283254, "tps": 14625, "wall": 40027.4} {"step": 8933, "train_loss": 3.530107021331787, "lr": 0.0003395610530264442, "tps": 14625, "wall": 40032.4} {"step": 8934, "train_loss": 3.546812057495117, "lr": 0.00033954673117016893, "tps": 14625, "wall": 40037.4} {"step": 8935, "train_loss": 3.428621768951416, "lr": 0.0003395324079596618, "tps": 14625, "wall": 40042.4} {"step": 8936, "train_loss": 3.4662466049194336, "lr": 0.00033951808339508513, "tps": 14625, "wall": 40047.3} {"step": 8937, "train_loss": 3.440096378326416, "lr": 0.00033950375747660114, "tps": 14624, "wall": 40052.3} {"step": 8938, "train_loss": 3.5795798301696777, "lr": 0.0003394894302043721, "tps": 14624, "wall": 40057.3} {"step": 8939, "train_loss": 3.5708510875701904, "lr": 0.0003394751015785603, "tps": 14624, "wall": 40062.3} {"step": 8940, "train_loss": 3.6424756050109863, "lr": 0.00033946077159932814, "tps": 14624, "wall": 40067.3} {"step": 8941, "train_loss": 3.533076763153076, "lr": 0.0003394464402668379, "tps": 14624, "wall": 40072.3} {"step": 8942, "train_loss": 3.5137314796447754, "lr": 0.0003394321075812518, "tps": 14623, "wall": 40077.3} {"step": 8943, "train_loss": 3.475067615509033, "lr": 0.0003394177735427325, "tps": 14623, "wall": 40082.3} {"step": 8944, "train_loss": 3.5555050373077393, "lr": 0.00033940343815144205, "tps": 14623, "wall": 40087.3} {"step": 8945, "train_loss": 3.5209555625915527, "lr": 0.00033938910140754317, "tps": 14623, "wall": 40092.3} {"step": 8946, "train_loss": 3.4233524799346924, "lr": 0.000339374763311198, "tps": 14623, "wall": 40097.3} {"step": 8947, "train_loss": 3.51983904838562, "lr": 0.000339360423862569, "tps": 14623, "wall": 40102.2} {"step": 8948, "train_loss": 3.643350839614868, "lr": 0.00033934608306181873, "tps": 14622, "wall": 40107.2} {"step": 8949, "train_loss": 3.660719394683838, "lr": 0.0003393317409091095, "tps": 14622, "wall": 40112.2} {"step": 8950, "train_loss": 3.5088865756988525, "lr": 0.00033931739740460397, "tps": 14622, "wall": 40117.2} {"step": 8951, "train_loss": 3.580362319946289, "lr": 0.00033930305254846433, "tps": 14622, "wall": 40122.2} {"step": 8952, "train_loss": 3.5449538230895996, "lr": 0.0003392887063408534, "tps": 14622, "wall": 40127.1} {"step": 8953, "train_loss": 3.571936845779419, "lr": 0.00033927435878193356, "tps": 14621, "wall": 40132.2} {"step": 8954, "train_loss": 3.5964040756225586, "lr": 0.0003392600098718673, "tps": 14621, "wall": 40137.2} {"step": 8955, "train_loss": 3.5783262252807617, "lr": 0.00033924565961081715, "tps": 14621, "wall": 40142.2} {"step": 8956, "train_loss": 3.565960168838501, "lr": 0.0003392313079989457, "tps": 14621, "wall": 40147.2} {"step": 8957, "train_loss": 3.538397789001465, "lr": 0.0003392169550364156, "tps": 14621, "wall": 40152.1} {"step": 8958, "train_loss": 3.6171140670776367, "lr": 0.0003392026007233894, "tps": 14620, "wall": 40157.1} {"step": 8959, "train_loss": 3.5312905311584473, "lr": 0.00033918824506002965, "tps": 14620, "wall": 40162.1} {"step": 8960, "train_loss": 3.531538963317871, "lr": 0.00033917388804649903, "tps": 14620, "wall": 40167.1} {"step": 8961, "train_loss": 3.564075469970703, "lr": 0.0003391595296829602, "tps": 14620, "wall": 40172.1} {"step": 8962, "train_loss": 3.591083288192749, "lr": 0.00033914516996957564, "tps": 14620, "wall": 40177.5} {"step": 8963, "train_loss": 3.527041435241699, "lr": 0.0003391308089065083, "tps": 14619, "wall": 40182.5} {"step": 8964, "train_loss": 3.5793983936309814, "lr": 0.00033911644649392065, "tps": 14619, "wall": 40187.5} {"step": 8965, "train_loss": 3.4573936462402344, "lr": 0.00033910208273197544, "tps": 14619, "wall": 40192.5} {"step": 8966, "train_loss": 3.6250782012939453, "lr": 0.0003390877176208354, "tps": 14619, "wall": 40197.5} {"step": 8967, "train_loss": 3.542614459991455, "lr": 0.0003390733511606633, "tps": 14619, "wall": 40202.5} {"step": 8968, "train_loss": 3.674595594406128, "lr": 0.0003390589833516218, "tps": 14618, "wall": 40207.5} {"step": 8969, "train_loss": 3.565566062927246, "lr": 0.00033904461419387365, "tps": 14618, "wall": 40212.4} {"step": 8970, "train_loss": 3.4458165168762207, "lr": 0.00033903024368758176, "tps": 14618, "wall": 40217.4} {"step": 8971, "train_loss": 3.5190632343292236, "lr": 0.00033901587183290873, "tps": 14618, "wall": 40222.4} {"step": 8972, "train_loss": 3.4961905479431152, "lr": 0.00033900149863001755, "tps": 14618, "wall": 40227.4} {"step": 8973, "train_loss": 3.522876024246216, "lr": 0.0003389871240790709, "tps": 14618, "wall": 40232.4} {"step": 8974, "train_loss": 3.506350517272949, "lr": 0.0003389727481802317, "tps": 14617, "wall": 40237.4} {"step": 8975, "train_loss": 3.574326992034912, "lr": 0.00033895837093366274, "tps": 14617, "wall": 40242.3} {"step": 8976, "train_loss": 3.5252068042755127, "lr": 0.000338943992339527, "tps": 14617, "wall": 40247.4} {"step": 8977, "train_loss": 3.4355177879333496, "lr": 0.00033892961239798716, "tps": 14617, "wall": 40252.3} {"step": 8978, "train_loss": 3.6013755798339844, "lr": 0.00033891523110920633, "tps": 14617, "wall": 40257.4} {"step": 8979, "train_loss": 3.5872294902801514, "lr": 0.00033890084847334724, "tps": 14616, "wall": 40262.4} {"step": 8980, "train_loss": 3.5563275814056396, "lr": 0.000338886464490573, "tps": 14616, "wall": 40267.3} {"step": 8981, "train_loss": 3.6134705543518066, "lr": 0.00033887207916104636, "tps": 14616, "wall": 40272.3} {"step": 8982, "train_loss": 3.5357742309570312, "lr": 0.0003388576924849305, "tps": 14616, "wall": 40277.2} {"step": 8983, "train_loss": 3.583702564239502, "lr": 0.00033884330446238816, "tps": 14616, "wall": 40282.2} {"step": 8984, "train_loss": 3.560265302658081, "lr": 0.0003388289150935825, "tps": 14616, "wall": 40287.2} {"step": 8985, "train_loss": 3.4967641830444336, "lr": 0.00033881452437867644, "tps": 14615, "wall": 40292.2} {"step": 8986, "train_loss": 3.4743752479553223, "lr": 0.00033880013231783306, "tps": 14615, "wall": 40297.1} {"step": 8987, "train_loss": 3.6397314071655273, "lr": 0.00033878573891121534, "tps": 14615, "wall": 40302.1} {"step": 8988, "train_loss": 3.5203397274017334, "lr": 0.0003387713441589863, "tps": 14615, "wall": 40307.1} {"step": 8989, "train_loss": 3.563783884048462, "lr": 0.00033875694806130904, "tps": 14615, "wall": 40312.1} {"step": 8990, "train_loss": 3.550394058227539, "lr": 0.00033874255061834666, "tps": 14615, "wall": 40317.1} {"step": 8991, "train_loss": 3.476496696472168, "lr": 0.00033872815183026234, "tps": 14614, "wall": 40322.1} {"step": 8992, "train_loss": 3.512540578842163, "lr": 0.000338713751697219, "tps": 14614, "wall": 40327.0} {"step": 8993, "train_loss": 3.625431776046753, "lr": 0.00033869935021937984, "tps": 14614, "wall": 40332.0} {"step": 8994, "train_loss": 3.6320743560791016, "lr": 0.00033868494739690806, "tps": 14614, "wall": 40337.0} {"step": 8995, "train_loss": 3.5727388858795166, "lr": 0.0003386705432299667, "tps": 14614, "wall": 40341.9} {"step": 8996, "train_loss": 3.4988701343536377, "lr": 0.00033865613771871914, "tps": 14613, "wall": 40346.9} {"step": 8997, "train_loss": 3.537385940551758, "lr": 0.0003386417308633284, "tps": 14613, "wall": 40351.8} {"step": 8998, "train_loss": 3.648744583129883, "lr": 0.00033862732266395765, "tps": 14613, "wall": 40356.9} {"step": 8999, "train_loss": 3.4685909748077393, "lr": 0.0003386129131207702, "tps": 14613, "wall": 40361.8} {"step": 9000, "train_loss": 3.5856552124023438, "lr": 0.00033859850223392926, "tps": 14613, "wall": 40366.8, "val_loss_monitor": 3.569185431684418} {"step": 9001, "train_loss": 3.528911590576172, "lr": 0.0003385840900035981, "tps": 14595, "wall": 40419.4} {"step": 9002, "train_loss": 3.4942619800567627, "lr": 0.0003385696764299399, "tps": 14595, "wall": 40424.4} {"step": 9003, "train_loss": 3.496640205383301, "lr": 0.000338555261513118, "tps": 14595, "wall": 40429.4} {"step": 9004, "train_loss": 3.564969062805176, "lr": 0.0003385408452532957, "tps": 14595, "wall": 40434.5} {"step": 9005, "train_loss": 3.550222158432007, "lr": 0.0003385264276506363, "tps": 14595, "wall": 40439.5} {"step": 9006, "train_loss": 3.520620822906494, "lr": 0.00033851200870530315, "tps": 14594, "wall": 40444.5} {"step": 9007, "train_loss": 3.5540993213653564, "lr": 0.00033849758841745945, "tps": 14594, "wall": 40449.5} {"step": 9008, "train_loss": 3.636338710784912, "lr": 0.00033848316678726867, "tps": 14594, "wall": 40454.4} {"step": 9009, "train_loss": 3.349604845046997, "lr": 0.00033846874381489425, "tps": 14594, "wall": 40459.4} {"step": 9010, "train_loss": 3.575888156890869, "lr": 0.00033845431950049943, "tps": 14594, "wall": 40464.4} {"step": 9011, "train_loss": 3.5624728202819824, "lr": 0.0003384398938442477, "tps": 14593, "wall": 40469.4} {"step": 9012, "train_loss": 3.625882387161255, "lr": 0.00033842546684630245, "tps": 14593, "wall": 40474.4} {"step": 9013, "train_loss": 3.5729174613952637, "lr": 0.00033841103850682706, "tps": 14593, "wall": 40479.4} {"step": 9014, "train_loss": 3.5359408855438232, "lr": 0.0003383966088259851, "tps": 14593, "wall": 40484.4} {"step": 9015, "train_loss": 3.5797119140625, "lr": 0.00033838217780393984, "tps": 14593, "wall": 40489.4} {"step": 9016, "train_loss": 3.5740818977355957, "lr": 0.000338367745440855, "tps": 14593, "wall": 40494.4} {"step": 9017, "train_loss": 3.661572217941284, "lr": 0.00033835331173689384, "tps": 14592, "wall": 40499.4} {"step": 9018, "train_loss": 3.5596580505371094, "lr": 0.00033833887669222, "tps": 14592, "wall": 40504.3} {"step": 9019, "train_loss": 3.5807290077209473, "lr": 0.0003383244403069969, "tps": 14592, "wall": 40509.3} {"step": 9020, "train_loss": 3.508484363555908, "lr": 0.00033831000258138815, "tps": 14592, "wall": 40514.3} {"step": 9021, "train_loss": 3.5472586154937744, "lr": 0.0003382955635155574, "tps": 14592, "wall": 40519.3} {"step": 9022, "train_loss": 3.4397058486938477, "lr": 0.000338281123109668, "tps": 14592, "wall": 40524.3} {"step": 9023, "train_loss": 3.5775485038757324, "lr": 0.0003382666813638837, "tps": 14591, "wall": 40529.3} {"step": 9024, "train_loss": 3.517763614654541, "lr": 0.000338252238278368, "tps": 14591, "wall": 40534.2} {"step": 9025, "train_loss": 3.5326974391937256, "lr": 0.0003382377938532845, "tps": 14591, "wall": 40539.2} {"step": 9026, "train_loss": 3.438631057739258, "lr": 0.000338223348088797, "tps": 14591, "wall": 40544.2} {"step": 9027, "train_loss": 3.56320858001709, "lr": 0.0003382089009850689, "tps": 14591, "wall": 40549.1} {"step": 9028, "train_loss": 3.5523531436920166, "lr": 0.0003381944525422641, "tps": 14590, "wall": 40554.1} {"step": 9029, "train_loss": 3.5696394443511963, "lr": 0.000338180002760546, "tps": 14590, "wall": 40559.1} {"step": 9030, "train_loss": 3.5151872634887695, "lr": 0.00033816555164007853, "tps": 14590, "wall": 40564.0} {"step": 9031, "train_loss": 3.5909276008605957, "lr": 0.0003381510991810253, "tps": 14590, "wall": 40569.0} {"step": 9032, "train_loss": 3.5002963542938232, "lr": 0.00033813664538355, "tps": 14590, "wall": 40574.0} {"step": 9033, "train_loss": 3.570901393890381, "lr": 0.00033812219024781636, "tps": 14590, "wall": 40578.9} {"step": 9034, "train_loss": 3.567009210586548, "lr": 0.00033810773377398817, "tps": 14589, "wall": 40583.9} {"step": 9035, "train_loss": 3.603844165802002, "lr": 0.0003380932759622292, "tps": 14589, "wall": 40588.8} {"step": 9036, "train_loss": 3.4620778560638428, "lr": 0.00033807881681270326, "tps": 14589, "wall": 40593.8} {"step": 9037, "train_loss": 3.585174322128296, "lr": 0.000338064356325574, "tps": 14589, "wall": 40598.8} {"step": 9038, "train_loss": 3.4711461067199707, "lr": 0.0003380498945010053, "tps": 14589, "wall": 40603.7} {"step": 9039, "train_loss": 3.563751220703125, "lr": 0.0003380354313391611, "tps": 14589, "wall": 40608.7} {"step": 9040, "train_loss": 3.504081964492798, "lr": 0.0003380209668402052, "tps": 14588, "wall": 40613.6} {"step": 9041, "train_loss": 3.501171827316284, "lr": 0.0003380065010043013, "tps": 14588, "wall": 40618.6} {"step": 9042, "train_loss": 3.539940595626831, "lr": 0.0003379920338316134, "tps": 14588, "wall": 40623.6} {"step": 9043, "train_loss": 3.482074737548828, "lr": 0.00033797756532230535, "tps": 14588, "wall": 40628.5} {"step": 9044, "train_loss": 3.5994069576263428, "lr": 0.00033796309547654105, "tps": 14588, "wall": 40633.5} {"step": 9045, "train_loss": 3.550391435623169, "lr": 0.00033794862429448446, "tps": 14588, "wall": 40638.5} {"step": 9046, "train_loss": 3.530508279800415, "lr": 0.00033793415177629945, "tps": 14587, "wall": 40643.4} {"step": 9047, "train_loss": 3.5597751140594482, "lr": 0.00033791967792215, "tps": 14587, "wall": 40648.4} {"step": 9048, "train_loss": 3.643155336380005, "lr": 0.0003379052027322001, "tps": 14587, "wall": 40653.3} {"step": 9049, "train_loss": 3.5619566440582275, "lr": 0.0003378907262066136, "tps": 14587, "wall": 40658.3} {"step": 9050, "train_loss": 3.5205886363983154, "lr": 0.0003378762483455546, "tps": 14587, "wall": 40663.2} {"step": 9051, "train_loss": 3.5853307247161865, "lr": 0.0003378617691491871, "tps": 14587, "wall": 40668.1} {"step": 9052, "train_loss": 3.4973011016845703, "lr": 0.00033784728861767507, "tps": 14586, "wall": 40673.1} {"step": 9053, "train_loss": 3.473803997039795, "lr": 0.0003378328067511826, "tps": 14586, "wall": 40678.1} {"step": 9054, "train_loss": 3.533369779586792, "lr": 0.0003378183235498738, "tps": 14586, "wall": 40683.1} {"step": 9055, "train_loss": 3.6138601303100586, "lr": 0.00033780383901391256, "tps": 14586, "wall": 40688.0} {"step": 9056, "train_loss": 3.6733779907226562, "lr": 0.0003377893531434631, "tps": 14586, "wall": 40693.0} {"step": 9057, "train_loss": 3.5958709716796875, "lr": 0.0003377748659386894, "tps": 14586, "wall": 40697.9} {"step": 9058, "train_loss": 3.5630040168762207, "lr": 0.00033776037739975575, "tps": 14585, "wall": 40702.9} {"step": 9059, "train_loss": 3.554478168487549, "lr": 0.0003377458875268261, "tps": 14585, "wall": 40707.8} {"step": 9060, "train_loss": 3.5207715034484863, "lr": 0.0003377313963200647, "tps": 14585, "wall": 40712.8} {"step": 9061, "train_loss": 3.494629144668579, "lr": 0.00033771690377963566, "tps": 14585, "wall": 40717.8} {"step": 9062, "train_loss": 3.583034038543701, "lr": 0.0003377024099057032, "tps": 14585, "wall": 40722.7} {"step": 9063, "train_loss": 3.439840078353882, "lr": 0.00033768791469843145, "tps": 14585, "wall": 40727.7} {"step": 9064, "train_loss": 3.5538783073425293, "lr": 0.0003376734181579846, "tps": 14584, "wall": 40732.6} {"step": 9065, "train_loss": 3.555349826812744, "lr": 0.000337658920284527, "tps": 14584, "wall": 40737.6} {"step": 9066, "train_loss": 3.5261404514312744, "lr": 0.00033764442107822265, "tps": 14584, "wall": 40742.6} {"step": 9067, "train_loss": 3.646503210067749, "lr": 0.0003376299205392361, "tps": 14584, "wall": 40747.5} {"step": 9068, "train_loss": 3.6499691009521484, "lr": 0.0003376154186677313, "tps": 14584, "wall": 40752.5} {"step": 9069, "train_loss": 3.5120749473571777, "lr": 0.0003376009154638727, "tps": 14584, "wall": 40757.4} {"step": 9070, "train_loss": 3.4718236923217773, "lr": 0.0003375864109278246, "tps": 14583, "wall": 40762.4} {"step": 9071, "train_loss": 3.607391357421875, "lr": 0.00033757190505975126, "tps": 14583, "wall": 40767.4} {"step": 9072, "train_loss": 3.4775874614715576, "lr": 0.0003375573978598171, "tps": 14583, "wall": 40772.3} {"step": 9073, "train_loss": 3.5299832820892334, "lr": 0.0003375428893281862, "tps": 14583, "wall": 40777.3} {"step": 9074, "train_loss": 3.5751686096191406, "lr": 0.00033752837946502323, "tps": 14583, "wall": 40782.2} {"step": 9075, "train_loss": 3.52346134185791, "lr": 0.0003375138682704924, "tps": 14583, "wall": 40787.2} {"step": 9076, "train_loss": 3.4975194931030273, "lr": 0.0003374993557447581, "tps": 14582, "wall": 40792.1} {"step": 9077, "train_loss": 3.5604066848754883, "lr": 0.00033748484188798476, "tps": 14582, "wall": 40797.2} {"step": 9078, "train_loss": 3.686473846435547, "lr": 0.00033747032670033674, "tps": 14582, "wall": 40802.1} {"step": 9079, "train_loss": 3.549931526184082, "lr": 0.00033745581018197854, "tps": 14582, "wall": 40807.1} {"step": 9080, "train_loss": 3.5159339904785156, "lr": 0.00033744129233307453, "tps": 14582, "wall": 40812.0} {"step": 9081, "train_loss": 3.5549895763397217, "lr": 0.00033742677315378925, "tps": 14582, "wall": 40817.0} {"step": 9082, "train_loss": 3.593123435974121, "lr": 0.00033741225264428704, "tps": 14581, "wall": 40822.0} {"step": 9083, "train_loss": 3.5509982109069824, "lr": 0.00033739773080473256, "tps": 14581, "wall": 40826.9} {"step": 9084, "train_loss": 3.575277328491211, "lr": 0.0003373832076352902, "tps": 14581, "wall": 40831.9} {"step": 9085, "train_loss": 3.5011913776397705, "lr": 0.00033736868313612455, "tps": 14581, "wall": 40836.9} {"step": 9086, "train_loss": 3.5084683895111084, "lr": 0.0003373541573074001, "tps": 14581, "wall": 40841.8} {"step": 9087, "train_loss": 3.539719581604004, "lr": 0.00033733963014928136, "tps": 14581, "wall": 40846.8} {"step": 9088, "train_loss": 3.6183600425720215, "lr": 0.00033732510166193297, "tps": 14580, "wall": 40851.7} {"step": 9089, "train_loss": 3.598822832107544, "lr": 0.0003373105718455195, "tps": 14580, "wall": 40856.8} {"step": 9090, "train_loss": 3.672987937927246, "lr": 0.0003372960407002055, "tps": 14580, "wall": 40861.7} {"step": 9091, "train_loss": 3.4812488555908203, "lr": 0.0003372815082261557, "tps": 14580, "wall": 40866.6} {"step": 9092, "train_loss": 3.6186437606811523, "lr": 0.0003372669744235345, "tps": 14580, "wall": 40871.6} {"step": 9093, "train_loss": 3.537238597869873, "lr": 0.00033725243929250674, "tps": 14580, "wall": 40876.6} {"step": 9094, "train_loss": 3.533031702041626, "lr": 0.000337237902833237, "tps": 14579, "wall": 40881.5} {"step": 9095, "train_loss": 3.498868465423584, "lr": 0.00033722336504588994, "tps": 14579, "wall": 40886.5} {"step": 9096, "train_loss": 3.523132801055908, "lr": 0.0003372088259306303, "tps": 14579, "wall": 40891.4} {"step": 9097, "train_loss": 3.5455551147460938, "lr": 0.00033719428548762266, "tps": 14579, "wall": 40896.4} {"step": 9098, "train_loss": 3.5569796562194824, "lr": 0.00033717974371703187, "tps": 14579, "wall": 40901.4} {"step": 9099, "train_loss": 3.5293970108032227, "lr": 0.00033716520061902254, "tps": 14579, "wall": 40906.3} {"step": 9100, "train_loss": 3.51088809967041, "lr": 0.0003371506561937595, "tps": 14578, "wall": 40911.3} {"step": 9101, "train_loss": 3.547609329223633, "lr": 0.00033713611044140757, "tps": 14578, "wall": 40916.3} {"step": 9102, "train_loss": 3.5031347274780273, "lr": 0.00033712156336213137, "tps": 14578, "wall": 40921.3} {"step": 9103, "train_loss": 3.613952159881592, "lr": 0.0003371070149560958, "tps": 14578, "wall": 40926.2} {"step": 9104, "train_loss": 3.493231773376465, "lr": 0.0003370924652234656, "tps": 14578, "wall": 40931.2} {"step": 9105, "train_loss": 3.5700082778930664, "lr": 0.00033707791416440566, "tps": 14578, "wall": 40936.2} {"step": 9106, "train_loss": 3.5595033168792725, "lr": 0.0003370633617790807, "tps": 14577, "wall": 40941.1} {"step": 9107, "train_loss": 3.495922088623047, "lr": 0.0003370488080676557, "tps": 14577, "wall": 40946.1} {"step": 9108, "train_loss": 3.523254632949829, "lr": 0.0003370342530302955, "tps": 14577, "wall": 40951.0} {"step": 9109, "train_loss": 3.6149394512176514, "lr": 0.00033701969666716485, "tps": 14577, "wall": 40956.0} {"step": 9110, "train_loss": 3.5999808311462402, "lr": 0.00033700513897842884, "tps": 14577, "wall": 40960.9} {"step": 9111, "train_loss": 3.482285261154175, "lr": 0.00033699057996425225, "tps": 14577, "wall": 40965.8} {"step": 9112, "train_loss": 3.541181802749634, "lr": 0.0003369760196248, "tps": 14576, "wall": 40970.8} {"step": 9113, "train_loss": 3.4817495346069336, "lr": 0.00033696145796023716, "tps": 14576, "wall": 40975.8} {"step": 9114, "train_loss": 3.598158836364746, "lr": 0.0003369468949707285, "tps": 14576, "wall": 40980.7} {"step": 9115, "train_loss": 3.5619263648986816, "lr": 0.0003369323306564392, "tps": 14576, "wall": 40985.7} {"step": 9116, "train_loss": 3.5653762817382812, "lr": 0.000336917765017534, "tps": 14576, "wall": 40990.6} {"step": 9117, "train_loss": 3.5869483947753906, "lr": 0.00033690319805417814, "tps": 14576, "wall": 40995.6} {"step": 9118, "train_loss": 3.5368967056274414, "lr": 0.00033688862976653653, "tps": 14575, "wall": 41000.5} {"step": 9119, "train_loss": 3.559749126434326, "lr": 0.0003368740601547741, "tps": 14575, "wall": 41005.4} {"step": 9120, "train_loss": 3.5110039710998535, "lr": 0.0003368594892190561, "tps": 14575, "wall": 41010.4} {"step": 9121, "train_loss": 3.538270950317383, "lr": 0.00033684491695954745, "tps": 14575, "wall": 41015.4} {"step": 9122, "train_loss": 3.517178535461426, "lr": 0.0003368303433764132, "tps": 14575, "wall": 41020.3} {"step": 9123, "train_loss": 3.5219216346740723, "lr": 0.00033681576846981856, "tps": 14575, "wall": 41025.3} {"step": 9124, "train_loss": 3.516085147857666, "lr": 0.0003368011922399286, "tps": 14575, "wall": 41030.2} {"step": 9125, "train_loss": 3.537848949432373, "lr": 0.0003367866146869083, "tps": 14574, "wall": 41035.2} {"step": 9126, "train_loss": 3.614967107772827, "lr": 0.000336772035810923, "tps": 14574, "wall": 41040.2} {"step": 9127, "train_loss": 3.5649008750915527, "lr": 0.0003367574556121378, "tps": 14574, "wall": 41045.1} {"step": 9128, "train_loss": 3.5230705738067627, "lr": 0.00033674287409071773, "tps": 14574, "wall": 41050.1} {"step": 9129, "train_loss": 3.461639881134033, "lr": 0.00033672829124682815, "tps": 14574, "wall": 41055.1} {"step": 9130, "train_loss": 3.498236894607544, "lr": 0.0003367137070806341, "tps": 14574, "wall": 41060.0} {"step": 9131, "train_loss": 3.565103054046631, "lr": 0.0003366991215923009, "tps": 14573, "wall": 41065.0} {"step": 9132, "train_loss": 3.6256327629089355, "lr": 0.00033668453478199377, "tps": 14573, "wall": 41069.9} {"step": 9133, "train_loss": 3.533259391784668, "lr": 0.00033666994664987784, "tps": 14573, "wall": 41074.9} {"step": 9134, "train_loss": 3.4983315467834473, "lr": 0.0003366553571961185, "tps": 14573, "wall": 41079.9} {"step": 9135, "train_loss": 3.5114922523498535, "lr": 0.00033664076642088095, "tps": 14573, "wall": 41084.8} {"step": 9136, "train_loss": 3.5633082389831543, "lr": 0.00033662617432433044, "tps": 14573, "wall": 41089.8} {"step": 9137, "train_loss": 3.561047077178955, "lr": 0.00033661158090663243, "tps": 14572, "wall": 41094.8} {"step": 9138, "train_loss": 3.5578274726867676, "lr": 0.00033659698616795203, "tps": 14572, "wall": 41099.8} {"step": 9139, "train_loss": 3.56178879737854, "lr": 0.00033658239010845475, "tps": 14572, "wall": 41104.8} {"step": 9140, "train_loss": 3.4376015663146973, "lr": 0.00033656779272830576, "tps": 14572, "wall": 41109.8} {"step": 9141, "train_loss": 3.5876734256744385, "lr": 0.0003365531940276705, "tps": 14572, "wall": 41114.7} {"step": 9142, "train_loss": 3.504134178161621, "lr": 0.00033653859400671436, "tps": 14571, "wall": 41119.7} {"step": 9143, "train_loss": 3.6505544185638428, "lr": 0.0003365239926656028, "tps": 14571, "wall": 41124.6} {"step": 9144, "train_loss": 3.445556879043579, "lr": 0.00033650939000450105, "tps": 14571, "wall": 41129.6} {"step": 9145, "train_loss": 3.620204448699951, "lr": 0.0003364947860235747, "tps": 14571, "wall": 41134.6} {"step": 9146, "train_loss": 3.5976016521453857, "lr": 0.0003364801807229891, "tps": 14571, "wall": 41139.5} {"step": 9147, "train_loss": 3.5645570755004883, "lr": 0.0003364655741029097, "tps": 14571, "wall": 41144.5} {"step": 9148, "train_loss": 3.5960681438446045, "lr": 0.0003364509661635019, "tps": 14571, "wall": 41149.4} {"step": 9149, "train_loss": 3.583437204360962, "lr": 0.0003364363569049314, "tps": 14570, "wall": 41154.4} {"step": 9150, "train_loss": 3.5585427284240723, "lr": 0.00033642174632736346, "tps": 14570, "wall": 41159.4} {"step": 9151, "train_loss": 3.45694637298584, "lr": 0.00033640713443096364, "tps": 14570, "wall": 41164.3} {"step": 9152, "train_loss": 3.5349607467651367, "lr": 0.0003363925212158976, "tps": 14570, "wall": 41169.3} {"step": 9153, "train_loss": 3.5612375736236572, "lr": 0.00033637790668233073, "tps": 14570, "wall": 41174.3} {"step": 9154, "train_loss": 3.6130740642547607, "lr": 0.0003363632908304287, "tps": 14570, "wall": 41179.2} {"step": 9155, "train_loss": 3.5347914695739746, "lr": 0.0003363486736603569, "tps": 14569, "wall": 41184.2} {"step": 9156, "train_loss": 3.5236318111419678, "lr": 0.0003363340551722811, "tps": 14569, "wall": 41189.1} {"step": 9157, "train_loss": 3.5337464809417725, "lr": 0.00033631943536636684, "tps": 14569, "wall": 41194.1} {"step": 9158, "train_loss": 3.611176013946533, "lr": 0.00033630481424277975, "tps": 14569, "wall": 41199.0} {"step": 9159, "train_loss": 3.5134081840515137, "lr": 0.0003362901918016854, "tps": 14569, "wall": 41204.0} {"step": 9160, "train_loss": 3.5896687507629395, "lr": 0.00033627556804324946, "tps": 14569, "wall": 41209.0} {"step": 9161, "train_loss": 3.5104310512542725, "lr": 0.0003362609429676375, "tps": 14568, "wall": 41213.9} {"step": 9162, "train_loss": 3.547250509262085, "lr": 0.0003362463165750154, "tps": 14568, "wall": 41219.0} {"step": 9163, "train_loss": 3.5709571838378906, "lr": 0.00033623168886554874, "tps": 14568, "wall": 41223.9} {"step": 9164, "train_loss": 3.592294931411743, "lr": 0.0003362170598394032, "tps": 14568, "wall": 41228.9} {"step": 9165, "train_loss": 3.517759323120117, "lr": 0.0003362024294967445, "tps": 14568, "wall": 41233.8} {"step": 9166, "train_loss": 3.452960968017578, "lr": 0.0003361877978377385, "tps": 14568, "wall": 41238.8} {"step": 9167, "train_loss": 3.52284836769104, "lr": 0.00033617316486255064, "tps": 14567, "wall": 41243.8} {"step": 9168, "train_loss": 3.5178024768829346, "lr": 0.00033615853057134703, "tps": 14567, "wall": 41248.7} {"step": 9169, "train_loss": 3.5565390586853027, "lr": 0.00033614389496429333, "tps": 14567, "wall": 41253.7} {"step": 9170, "train_loss": 3.51046085357666, "lr": 0.00033612925804155514, "tps": 14567, "wall": 41258.7} {"step": 9171, "train_loss": 3.5240840911865234, "lr": 0.00033611461980329857, "tps": 14567, "wall": 41263.6} {"step": 9172, "train_loss": 3.535670280456543, "lr": 0.0003360999802496893, "tps": 14567, "wall": 41268.6} {"step": 9173, "train_loss": 3.4662632942199707, "lr": 0.0003360853393808931, "tps": 14566, "wall": 41273.6} {"step": 9174, "train_loss": 3.493967294692993, "lr": 0.00033607069719707595, "tps": 14566, "wall": 41278.6} {"step": 9175, "train_loss": 3.3848915100097656, "lr": 0.00033605605369840363, "tps": 14566, "wall": 41283.5} {"step": 9176, "train_loss": 3.4266114234924316, "lr": 0.0003360414088850421, "tps": 14566, "wall": 41288.5} {"step": 9177, "train_loss": 3.559115171432495, "lr": 0.00033602676275715714, "tps": 14566, "wall": 41293.5} {"step": 9178, "train_loss": 3.5154173374176025, "lr": 0.0003360121153149148, "tps": 14566, "wall": 41298.4} {"step": 9179, "train_loss": 3.5732128620147705, "lr": 0.00033599746655848097, "tps": 14565, "wall": 41303.4} {"step": 9180, "train_loss": 3.6647908687591553, "lr": 0.0003359828164880215, "tps": 14565, "wall": 41308.3} {"step": 9181, "train_loss": 3.5541272163391113, "lr": 0.00033596816510370243, "tps": 14565, "wall": 41313.3} {"step": 9182, "train_loss": 3.5982837677001953, "lr": 0.0003359535124056897, "tps": 14565, "wall": 41318.3} {"step": 9183, "train_loss": 3.477020740509033, "lr": 0.0003359388583941493, "tps": 14565, "wall": 41323.2} {"step": 9184, "train_loss": 3.500274181365967, "lr": 0.0003359242030692472, "tps": 14565, "wall": 41328.2} {"step": 9185, "train_loss": 3.702497720718384, "lr": 0.0003359095464311496, "tps": 14564, "wall": 41333.1} {"step": 9186, "train_loss": 3.525813579559326, "lr": 0.0003358948884800223, "tps": 14564, "wall": 41338.1} {"step": 9187, "train_loss": 3.7147345542907715, "lr": 0.0003358802292160314, "tps": 14564, "wall": 41343.0} {"step": 9188, "train_loss": 3.530292510986328, "lr": 0.00033586556863934305, "tps": 14564, "wall": 41348.0} {"step": 9189, "train_loss": 3.4603285789489746, "lr": 0.00033585090675012323, "tps": 14564, "wall": 41353.0} {"step": 9190, "train_loss": 3.5159621238708496, "lr": 0.0003358362435485381, "tps": 14564, "wall": 41357.9} {"step": 9191, "train_loss": 3.4239630699157715, "lr": 0.00033582157903475367, "tps": 14563, "wall": 41362.9} {"step": 9192, "train_loss": 3.691619634628296, "lr": 0.0003358069132089362, "tps": 14563, "wall": 41367.9} {"step": 9193, "train_loss": 3.5452399253845215, "lr": 0.00033579224607125177, "tps": 14563, "wall": 41372.8} {"step": 9194, "train_loss": 3.5442280769348145, "lr": 0.00033577757762186646, "tps": 14563, "wall": 41377.8} {"step": 9195, "train_loss": 3.5438807010650635, "lr": 0.0003357629078609465, "tps": 14563, "wall": 41382.7} {"step": 9196, "train_loss": 3.6094329357147217, "lr": 0.00033574823678865804, "tps": 14563, "wall": 41387.7} {"step": 9197, "train_loss": 3.5519025325775146, "lr": 0.00033573356440516736, "tps": 14562, "wall": 41392.7} {"step": 9198, "train_loss": 3.6719279289245605, "lr": 0.0003357188907106405, "tps": 14562, "wall": 41397.7} {"step": 9199, "train_loss": 3.5040364265441895, "lr": 0.0003357042157052439, "tps": 14562, "wall": 41402.7} {"step": 9200, "train_loss": 3.5675177574157715, "lr": 0.00033568953938914356, "tps": 14562, "wall": 41407.7} {"step": 9201, "train_loss": 3.5438551902770996, "lr": 0.00033567486176250597, "tps": 14562, "wall": 41412.6} {"step": 9202, "train_loss": 3.6041250228881836, "lr": 0.00033566018282549725, "tps": 14562, "wall": 41417.5} {"step": 9203, "train_loss": 3.612278461456299, "lr": 0.0003356455025782837, "tps": 14561, "wall": 41422.5} {"step": 9204, "train_loss": 3.5088272094726562, "lr": 0.00033563082102103166, "tps": 14561, "wall": 41427.5} {"step": 9205, "train_loss": 3.4631428718566895, "lr": 0.0003356161381539074, "tps": 14561, "wall": 41432.5} {"step": 9206, "train_loss": 3.5280988216400146, "lr": 0.0003356014539770773, "tps": 14561, "wall": 41437.4} {"step": 9207, "train_loss": 3.6509995460510254, "lr": 0.00033558676849070767, "tps": 14561, "wall": 41442.4} {"step": 9208, "train_loss": 3.6347718238830566, "lr": 0.0003355720816949649, "tps": 14561, "wall": 41447.4} {"step": 9209, "train_loss": 3.516422748565674, "lr": 0.0003355573935900153, "tps": 14560, "wall": 41452.3} {"step": 9210, "train_loss": 3.5880331993103027, "lr": 0.0003355427041760253, "tps": 14560, "wall": 41457.3} {"step": 9211, "train_loss": 3.5494182109832764, "lr": 0.00033552801345316125, "tps": 14560, "wall": 41462.3} {"step": 9212, "train_loss": 3.5063350200653076, "lr": 0.00033551332142158966, "tps": 14560, "wall": 41467.2} {"step": 9213, "train_loss": 3.556033134460449, "lr": 0.0003354986280814769, "tps": 14560, "wall": 41472.2} {"step": 9214, "train_loss": 3.54257869720459, "lr": 0.00033548393343298946, "tps": 14560, "wall": 41477.2} {"step": 9215, "train_loss": 3.4651551246643066, "lr": 0.00033546923747629375, "tps": 14560, "wall": 41482.1} {"step": 9216, "train_loss": 3.4748787879943848, "lr": 0.0003354545402115563, "tps": 14559, "wall": 41487.1} {"step": 9217, "train_loss": 3.6261250972747803, "lr": 0.0003354398416389436, "tps": 14559, "wall": 41492.0} {"step": 9218, "train_loss": 3.473304510116577, "lr": 0.0003354251417586221, "tps": 14559, "wall": 41497.0} {"step": 9219, "train_loss": 3.6214046478271484, "lr": 0.0003354104405707583, "tps": 14559, "wall": 41501.9} {"step": 9220, "train_loss": 3.452610492706299, "lr": 0.00033539573807551883, "tps": 14559, "wall": 41506.9} {"step": 9221, "train_loss": 3.5192034244537354, "lr": 0.00033538103427307016, "tps": 14559, "wall": 41511.8} {"step": 9222, "train_loss": 3.5312652587890625, "lr": 0.0003353663291635789, "tps": 14558, "wall": 41516.8} {"step": 9223, "train_loss": 3.638885974884033, "lr": 0.0003353516227472117, "tps": 14558, "wall": 41521.8} {"step": 9224, "train_loss": 3.479084014892578, "lr": 0.000335336915024135, "tps": 14558, "wall": 41526.8} {"step": 9225, "train_loss": 3.606069564819336, "lr": 0.0003353222059945155, "tps": 14558, "wall": 41531.7} {"step": 9226, "train_loss": 3.666882038116455, "lr": 0.0003353074956585199, "tps": 14558, "wall": 41536.7} {"step": 9227, "train_loss": 3.553248405456543, "lr": 0.0003352927840163146, "tps": 14558, "wall": 41541.7} {"step": 9228, "train_loss": 3.544088363647461, "lr": 0.00033527807106806647, "tps": 14557, "wall": 41546.6} {"step": 9229, "train_loss": 3.5874180793762207, "lr": 0.00033526335681394214, "tps": 14557, "wall": 41551.6} {"step": 9230, "train_loss": 3.5273914337158203, "lr": 0.0003352486412541082, "tps": 14557, "wall": 41556.6} {"step": 9231, "train_loss": 3.4962799549102783, "lr": 0.0003352339243887315, "tps": 14557, "wall": 41561.5} {"step": 9232, "train_loss": 3.6264991760253906, "lr": 0.0003352192062179786, "tps": 14557, "wall": 41566.5} {"step": 9233, "train_loss": 3.529679775238037, "lr": 0.00033520448674201635, "tps": 14557, "wall": 41571.4} {"step": 9234, "train_loss": 3.485429048538208, "lr": 0.0003351897659610114, "tps": 14556, "wall": 41576.4} {"step": 9235, "train_loss": 3.558143138885498, "lr": 0.00033517504387513064, "tps": 14556, "wall": 41581.4} {"step": 9236, "train_loss": 3.619070053100586, "lr": 0.00033516032048454064, "tps": 14556, "wall": 41586.3} {"step": 9237, "train_loss": 3.61529803276062, "lr": 0.00033514559578940833, "tps": 14556, "wall": 41591.3} {"step": 9238, "train_loss": 3.4886441230773926, "lr": 0.0003351308697899005, "tps": 14556, "wall": 41596.2} {"step": 9239, "train_loss": 3.503511428833008, "lr": 0.0003351161424861839, "tps": 14556, "wall": 41601.2} {"step": 9240, "train_loss": 3.4893758296966553, "lr": 0.0003351014138784255, "tps": 14555, "wall": 41606.2} {"step": 9241, "train_loss": 3.56371808052063, "lr": 0.000335086683966792, "tps": 14555, "wall": 41611.2} {"step": 9242, "train_loss": 3.5450353622436523, "lr": 0.0003350719527514503, "tps": 14555, "wall": 41616.1} {"step": 9243, "train_loss": 3.495074510574341, "lr": 0.00033505722023256736, "tps": 14555, "wall": 41621.1} {"step": 9244, "train_loss": 3.533724308013916, "lr": 0.00033504248641031, "tps": 14555, "wall": 41626.0} {"step": 9245, "train_loss": 3.561830759048462, "lr": 0.00033502775128484505, "tps": 14555, "wall": 41631.0} {"step": 9246, "train_loss": 3.4925503730773926, "lr": 0.00033501301485633963, "tps": 14554, "wall": 41636.0} {"step": 9247, "train_loss": 3.556262969970703, "lr": 0.00033499827712496044, "tps": 14554, "wall": 41640.9} {"step": 9248, "train_loss": 3.6850810050964355, "lr": 0.00033498353809087455, "tps": 14554, "wall": 41645.9} {"step": 9249, "train_loss": 3.4317469596862793, "lr": 0.000334968797754249, "tps": 14554, "wall": 41650.9} {"step": 9250, "train_loss": 3.529402256011963, "lr": 0.0003349540561152506, "tps": 14554, "wall": 41655.9} {"step": 9251, "train_loss": 3.631253719329834, "lr": 0.00033493931317404656, "tps": 14554, "wall": 41660.8} {"step": 9252, "train_loss": 3.4678540229797363, "lr": 0.0003349245689308036, "tps": 14554, "wall": 41665.8} {"step": 9253, "train_loss": 3.595170259475708, "lr": 0.00033490982338568905, "tps": 14553, "wall": 41670.7} {"step": 9254, "train_loss": 3.4950380325317383, "lr": 0.0003348950765388698, "tps": 14553, "wall": 41675.7} {"step": 9255, "train_loss": 3.5384459495544434, "lr": 0.0003348803283905128, "tps": 14553, "wall": 41680.7} {"step": 9256, "train_loss": 3.505164623260498, "lr": 0.00033486557894078523, "tps": 14553, "wall": 41685.6} {"step": 9257, "train_loss": 3.6006178855895996, "lr": 0.00033485082818985424, "tps": 14553, "wall": 41690.5} {"step": 9258, "train_loss": 3.5357353687286377, "lr": 0.0003348360761378869, "tps": 14553, "wall": 41695.6} {"step": 9259, "train_loss": 3.650632381439209, "lr": 0.00033482132278505017, "tps": 14552, "wall": 41700.6} {"step": 9260, "train_loss": 3.5042848587036133, "lr": 0.0003348065681315113, "tps": 14552, "wall": 41705.6} {"step": 9261, "train_loss": 3.4691262245178223, "lr": 0.0003347918121774375, "tps": 14552, "wall": 41710.5} {"step": 9262, "train_loss": 3.6035594940185547, "lr": 0.00033477705492299575, "tps": 14552, "wall": 41715.5} {"step": 9263, "train_loss": 3.551785707473755, "lr": 0.0003347622963683533, "tps": 14552, "wall": 41720.4} {"step": 9264, "train_loss": 3.597228527069092, "lr": 0.0003347475365136774, "tps": 14551, "wall": 41725.8} {"step": 9265, "train_loss": 3.513195037841797, "lr": 0.00033473277535913515, "tps": 14551, "wall": 41730.8} {"step": 9266, "train_loss": 3.5232324600219727, "lr": 0.00033471801290489386, "tps": 14551, "wall": 41735.8} {"step": 9267, "train_loss": 3.629995346069336, "lr": 0.0003347032491511207, "tps": 14551, "wall": 41740.8} {"step": 9268, "train_loss": 3.5910956859588623, "lr": 0.0003346884840979829, "tps": 14551, "wall": 41745.7} {"step": 9269, "train_loss": 3.469982862472534, "lr": 0.0003346737177456478, "tps": 14551, "wall": 41750.7} {"step": 9270, "train_loss": 3.5377306938171387, "lr": 0.00033465895009428265, "tps": 14550, "wall": 41755.7} {"step": 9271, "train_loss": 3.5513648986816406, "lr": 0.00033464418114405466, "tps": 14550, "wall": 41760.7} {"step": 9272, "train_loss": 3.4325852394104004, "lr": 0.00033462941089513115, "tps": 14550, "wall": 41765.7} {"step": 9273, "train_loss": 3.5194411277770996, "lr": 0.0003346146393476795, "tps": 14550, "wall": 41770.6} {"step": 9274, "train_loss": 3.5801379680633545, "lr": 0.0003345998665018671, "tps": 14550, "wall": 41775.6} {"step": 9275, "train_loss": 3.595918893814087, "lr": 0.0003345850923578611, "tps": 14550, "wall": 41780.5} {"step": 9276, "train_loss": 3.5498833656311035, "lr": 0.000334570316915829, "tps": 14549, "wall": 41785.5} {"step": 9277, "train_loss": 3.6464345455169678, "lr": 0.0003345555401759382, "tps": 14549, "wall": 41790.4} {"step": 9278, "train_loss": 3.5008862018585205, "lr": 0.000334540762138356, "tps": 14549, "wall": 41795.4} {"step": 9279, "train_loss": 3.5361990928649902, "lr": 0.0003345259828032498, "tps": 14549, "wall": 41800.3} {"step": 9280, "train_loss": 3.565364122390747, "lr": 0.0003345112021707872, "tps": 14549, "wall": 41805.3} {"step": 9281, "train_loss": 3.417448043823242, "lr": 0.0003344964202411354, "tps": 14549, "wall": 41810.2} {"step": 9282, "train_loss": 3.5053508281707764, "lr": 0.00033448163701446193, "tps": 14549, "wall": 41815.3} {"step": 9283, "train_loss": 3.5089035034179688, "lr": 0.00033446685249093435, "tps": 14548, "wall": 41820.2} {"step": 9284, "train_loss": 3.602118730545044, "lr": 0.0003344520666707201, "tps": 14548, "wall": 41825.2} {"step": 9285, "train_loss": 3.5493226051330566, "lr": 0.0003344372795539866, "tps": 14548, "wall": 41830.1} {"step": 9286, "train_loss": 3.5049121379852295, "lr": 0.0003344224911409014, "tps": 14548, "wall": 41835.1} {"step": 9287, "train_loss": 3.364675998687744, "lr": 0.0003344077014316321, "tps": 14548, "wall": 41840.0} {"step": 9288, "train_loss": 3.5683200359344482, "lr": 0.0003343929104263461, "tps": 14548, "wall": 41845.0} {"step": 9289, "train_loss": 3.582369327545166, "lr": 0.0003343781181252111, "tps": 14547, "wall": 41849.9} {"step": 9290, "train_loss": 3.551488161087036, "lr": 0.00033436332452839446, "tps": 14547, "wall": 41854.9} {"step": 9291, "train_loss": 3.5168728828430176, "lr": 0.00033434852963606395, "tps": 14547, "wall": 41859.9} {"step": 9292, "train_loss": 3.6242289543151855, "lr": 0.0003343337334483872, "tps": 14547, "wall": 41864.8} {"step": 9293, "train_loss": 3.5217080116271973, "lr": 0.0003343189359655316, "tps": 14547, "wall": 41869.8} {"step": 9294, "train_loss": 3.519585132598877, "lr": 0.000334304137187665, "tps": 14547, "wall": 41874.8} {"step": 9295, "train_loss": 3.500709056854248, "lr": 0.0003342893371149549, "tps": 14546, "wall": 41879.7} {"step": 9296, "train_loss": 3.4545724391937256, "lr": 0.000334274535747569, "tps": 14546, "wall": 41884.7} {"step": 9297, "train_loss": 3.577577829360962, "lr": 0.00033425973308567495, "tps": 14546, "wall": 41889.6} {"step": 9298, "train_loss": 3.5590593814849854, "lr": 0.0003342449291294406, "tps": 14546, "wall": 41894.6} {"step": 9299, "train_loss": 3.502467632293701, "lr": 0.00033423012387903336, "tps": 14546, "wall": 41899.6} {"step": 9300, "train_loss": 3.5792953968048096, "lr": 0.0003342153173346212, "tps": 14546, "wall": 41904.5} {"step": 9301, "train_loss": 3.6024346351623535, "lr": 0.0003342005094963717, "tps": 14546, "wall": 41909.5} {"step": 9302, "train_loss": 3.4241018295288086, "lr": 0.0003341857003644526, "tps": 14545, "wall": 41914.5} {"step": 9303, "train_loss": 3.573275089263916, "lr": 0.00033417088993903187, "tps": 14545, "wall": 41919.4} {"step": 9304, "train_loss": 3.496129274368286, "lr": 0.000334156078220277, "tps": 14545, "wall": 41924.9} {"step": 9305, "train_loss": 3.437389850616455, "lr": 0.0003341412652083559, "tps": 14545, "wall": 41929.8} {"step": 9306, "train_loss": 3.602051258087158, "lr": 0.0003341264509034364, "tps": 14545, "wall": 41934.8} {"step": 9307, "train_loss": 3.6013710498809814, "lr": 0.00033411163530568626, "tps": 14544, "wall": 41940.2} {"step": 9308, "train_loss": 3.542086601257324, "lr": 0.00033409681841527336, "tps": 14544, "wall": 41945.4} {"step": 9309, "train_loss": 3.484182357788086, "lr": 0.00033408200023236554, "tps": 14544, "wall": 41950.5} {"step": 9310, "train_loss": 3.5485572814941406, "lr": 0.00033406718075713063, "tps": 14544, "wall": 41955.7} {"step": 9311, "train_loss": 3.5902676582336426, "lr": 0.0003340523599897365, "tps": 14543, "wall": 41960.9} {"step": 9312, "train_loss": 3.4652724266052246, "lr": 0.00033403753793035117, "tps": 14543, "wall": 41966.2} {"step": 9313, "train_loss": 3.643228054046631, "lr": 0.00033402271457914234, "tps": 14543, "wall": 41971.2} {"step": 9314, "train_loss": 3.4995625019073486, "lr": 0.0003340078899362781, "tps": 14543, "wall": 41976.1} {"step": 9315, "train_loss": 3.488253116607666, "lr": 0.00033399306400192625, "tps": 14543, "wall": 41981.1} {"step": 9316, "train_loss": 3.5380640029907227, "lr": 0.0003339782367762548, "tps": 14542, "wall": 41986.0} {"step": 9317, "train_loss": 3.534456729888916, "lr": 0.0003339634082594318, "tps": 14542, "wall": 41990.9} {"step": 9318, "train_loss": 3.390895366668701, "lr": 0.00033394857845162507, "tps": 14542, "wall": 41995.9} {"step": 9319, "train_loss": 3.5296847820281982, "lr": 0.00033393374735300274, "tps": 14542, "wall": 42000.9} {"step": 9320, "train_loss": 3.541386127471924, "lr": 0.0003339189149637327, "tps": 14542, "wall": 42005.9} {"step": 9321, "train_loss": 3.4508044719696045, "lr": 0.00033390408128398306, "tps": 14542, "wall": 42010.8} {"step": 9322, "train_loss": 3.501655101776123, "lr": 0.00033388924631392176, "tps": 14541, "wall": 42015.9} {"step": 9323, "train_loss": 3.481719732284546, "lr": 0.000333874410053717, "tps": 14541, "wall": 42020.9} {"step": 9324, "train_loss": 3.5463316440582275, "lr": 0.0003338595725035367, "tps": 14541, "wall": 42026.1} {"step": 9325, "train_loss": 3.593140125274658, "lr": 0.00033384473366354905, "tps": 14541, "wall": 42031.1} {"step": 9326, "train_loss": 3.543076992034912, "lr": 0.00033382989353392215, "tps": 14541, "wall": 42036.0} {"step": 9327, "train_loss": 3.3846940994262695, "lr": 0.00033381505211482396, "tps": 14541, "wall": 42041.1} {"step": 9328, "train_loss": 3.492305278778076, "lr": 0.00033380020940642274, "tps": 14540, "wall": 42046.0} {"step": 9329, "train_loss": 3.580028533935547, "lr": 0.0003337853654088866, "tps": 14540, "wall": 42051.1} {"step": 9330, "train_loss": 3.376004695892334, "lr": 0.00033377052012238364, "tps": 14540, "wall": 42056.1} {"step": 9331, "train_loss": 3.4739508628845215, "lr": 0.00033375567354708213, "tps": 14540, "wall": 42061.2} {"step": 9332, "train_loss": 3.564406156539917, "lr": 0.0003337408256831502, "tps": 14540, "wall": 42066.2} {"step": 9333, "train_loss": 3.4604368209838867, "lr": 0.000333725976530756, "tps": 14539, "wall": 42071.1} {"step": 9334, "train_loss": 3.5721254348754883, "lr": 0.00033371112609006774, "tps": 14539, "wall": 42076.1} {"step": 9335, "train_loss": 3.53464674949646, "lr": 0.0003336962743612538, "tps": 14539, "wall": 42081.0} {"step": 9336, "train_loss": 3.531907796859741, "lr": 0.00033368142134448226, "tps": 14539, "wall": 42086.0} {"step": 9337, "train_loss": 3.425631523132324, "lr": 0.0003336665670399214, "tps": 14539, "wall": 42091.0} {"step": 9338, "train_loss": 3.5411627292633057, "lr": 0.00033365171144773956, "tps": 14539, "wall": 42095.9} {"step": 9339, "train_loss": 3.5666069984436035, "lr": 0.000333636854568105, "tps": 14539, "wall": 42100.9} {"step": 9340, "train_loss": 3.5029711723327637, "lr": 0.000333621996401186, "tps": 14538, "wall": 42105.8} {"step": 9341, "train_loss": 3.5947999954223633, "lr": 0.0003336071369471508, "tps": 14538, "wall": 42110.8} {"step": 9342, "train_loss": 3.502127170562744, "lr": 0.00033359227620616787, "tps": 14538, "wall": 42115.9} {"step": 9343, "train_loss": 3.491719961166382, "lr": 0.0003335774141784055, "tps": 14538, "wall": 42120.8} {"step": 9344, "train_loss": 3.482607841491699, "lr": 0.000333562550864032, "tps": 14538, "wall": 42125.8} {"step": 9345, "train_loss": 3.6602559089660645, "lr": 0.0003335476862632158, "tps": 14538, "wall": 42130.8} {"step": 9346, "train_loss": 3.548710346221924, "lr": 0.0003335328203761253, "tps": 14537, "wall": 42135.7} {"step": 9347, "train_loss": 3.446223258972168, "lr": 0.00033351795320292883, "tps": 14537, "wall": 42140.6} {"step": 9348, "train_loss": 3.5617501735687256, "lr": 0.00033350308474379485, "tps": 14537, "wall": 42145.6} {"step": 9349, "train_loss": 3.508361339569092, "lr": 0.0003334882149988918, "tps": 14537, "wall": 42150.5} {"step": 9350, "train_loss": 3.563385248184204, "lr": 0.0003334733439683881, "tps": 14537, "wall": 42155.4} {"step": 9351, "train_loss": 3.51100492477417, "lr": 0.0003334584716524522, "tps": 14537, "wall": 42160.3} {"step": 9352, "train_loss": 3.4248206615448, "lr": 0.00033344359805125267, "tps": 14537, "wall": 42165.3} {"step": 9353, "train_loss": 3.4128036499023438, "lr": 0.00033342872316495785, "tps": 14536, "wall": 42170.2} {"step": 9354, "train_loss": 3.547527551651001, "lr": 0.00033341384699373634, "tps": 14536, "wall": 42175.3} {"step": 9355, "train_loss": 3.4358344078063965, "lr": 0.0003333989695377566, "tps": 14536, "wall": 42180.2} {"step": 9356, "train_loss": 3.5448825359344482, "lr": 0.00033338409079718725, "tps": 14536, "wall": 42185.2} {"step": 9357, "train_loss": 3.4926795959472656, "lr": 0.00033336921077219676, "tps": 14536, "wall": 42190.1} {"step": 9358, "train_loss": 3.449002742767334, "lr": 0.0003333543294629537, "tps": 14536, "wall": 42195.0} {"step": 9359, "train_loss": 3.575650930404663, "lr": 0.0003333394468696267, "tps": 14535, "wall": 42200.0} {"step": 9360, "train_loss": 3.6189773082733154, "lr": 0.0003333245629923843, "tps": 14535, "wall": 42204.9} {"step": 9361, "train_loss": 3.5750832557678223, "lr": 0.00033330967783139513, "tps": 14535, "wall": 42209.9} {"step": 9362, "train_loss": 3.558124542236328, "lr": 0.00033329479138682774, "tps": 14535, "wall": 42214.8} {"step": 9363, "train_loss": 3.5285356044769287, "lr": 0.00033327990365885095, "tps": 14535, "wall": 42219.8} {"step": 9364, "train_loss": 3.6518194675445557, "lr": 0.00033326501464763317, "tps": 14535, "wall": 42224.8} {"step": 9365, "train_loss": 3.483150005340576, "lr": 0.00033325012435334327, "tps": 14535, "wall": 42229.7} {"step": 9366, "train_loss": 3.593207836151123, "lr": 0.00033323523277614973, "tps": 14534, "wall": 42234.7} {"step": 9367, "train_loss": 3.52577805519104, "lr": 0.00033322033991622143, "tps": 14534, "wall": 42239.6} {"step": 9368, "train_loss": 3.573291778564453, "lr": 0.000333205445773727, "tps": 14534, "wall": 42244.6} {"step": 9369, "train_loss": 3.5461020469665527, "lr": 0.00033319055034883505, "tps": 14534, "wall": 42249.5} {"step": 9370, "train_loss": 3.536210775375366, "lr": 0.00033317565364171444, "tps": 14534, "wall": 42254.5} {"step": 9371, "train_loss": 3.5062644481658936, "lr": 0.000333160755652534, "tps": 14534, "wall": 42259.4} {"step": 9372, "train_loss": 3.4716176986694336, "lr": 0.0003331458563814624, "tps": 14533, "wall": 42264.4} {"step": 9373, "train_loss": 3.525756597518921, "lr": 0.0003331309558286684, "tps": 14533, "wall": 42269.3} {"step": 9374, "train_loss": 3.536799192428589, "lr": 0.0003331160539943207, "tps": 14533, "wall": 42274.2} {"step": 9375, "train_loss": 3.50679087638855, "lr": 0.0003331011508785883, "tps": 14533, "wall": 42279.2} {"step": 9376, "train_loss": 3.484395980834961, "lr": 0.00033308624648163996, "tps": 14533, "wall": 42284.1} {"step": 9377, "train_loss": 3.4472713470458984, "lr": 0.0003330713408036445, "tps": 14533, "wall": 42289.1} {"step": 9378, "train_loss": 3.475109577178955, "lr": 0.00033305643384477074, "tps": 14533, "wall": 42294.0} {"step": 9379, "train_loss": 3.5613462924957275, "lr": 0.0003330415256051876, "tps": 14532, "wall": 42299.0} {"step": 9380, "train_loss": 3.539271831512451, "lr": 0.000333026616085064, "tps": 14532, "wall": 42304.0} {"step": 9381, "train_loss": 3.594578742980957, "lr": 0.0003330117052845687, "tps": 14532, "wall": 42308.9} {"step": 9382, "train_loss": 3.4892959594726562, "lr": 0.00033299679320387065, "tps": 14532, "wall": 42313.9} {"step": 9383, "train_loss": 3.5867819786071777, "lr": 0.0003329818798431389, "tps": 14532, "wall": 42318.8} {"step": 9384, "train_loss": 3.6737611293792725, "lr": 0.00033296696520254226, "tps": 14532, "wall": 42323.8} {"step": 9385, "train_loss": 3.440703868865967, "lr": 0.00033295204928224974, "tps": 14531, "wall": 42328.8} {"step": 9386, "train_loss": 3.514106512069702, "lr": 0.00033293713208243033, "tps": 14531, "wall": 42333.7} {"step": 9387, "train_loss": 3.5711700916290283, "lr": 0.000332922213603253, "tps": 14531, "wall": 42338.7} {"step": 9388, "train_loss": 3.5806119441986084, "lr": 0.00033290729384488664, "tps": 14531, "wall": 42343.6} {"step": 9389, "train_loss": 3.5936427116394043, "lr": 0.00033289237280750036, "tps": 14531, "wall": 42348.6} {"step": 9390, "train_loss": 3.5432448387145996, "lr": 0.0003328774504912632, "tps": 14531, "wall": 42353.5} {"step": 9391, "train_loss": 3.624319076538086, "lr": 0.00033286252689634417, "tps": 14531, "wall": 42358.5} {"step": 9392, "train_loss": 3.580331802368164, "lr": 0.00033284760202291236, "tps": 14530, "wall": 42363.5} {"step": 9393, "train_loss": 3.5777957439422607, "lr": 0.00033283267587113675, "tps": 14530, "wall": 42368.5} {"step": 9394, "train_loss": 3.5844473838806152, "lr": 0.0003328177484411866, "tps": 14530, "wall": 42373.4} {"step": 9395, "train_loss": 3.531722068786621, "lr": 0.0003328028197332307, "tps": 14530, "wall": 42378.4} {"step": 9396, "train_loss": 3.587022542953491, "lr": 0.0003327878897474385, "tps": 14530, "wall": 42383.3} {"step": 9397, "train_loss": 3.4517433643341064, "lr": 0.00033277295848397893, "tps": 14530, "wall": 42388.3} {"step": 9398, "train_loss": 3.5253829956054688, "lr": 0.00033275802594302117, "tps": 14529, "wall": 42393.2} {"step": 9399, "train_loss": 3.543964385986328, "lr": 0.00033274309212473447, "tps": 14529, "wall": 42398.2} {"step": 9400, "train_loss": 3.4938454627990723, "lr": 0.0003327281570292879, "tps": 14529, "wall": 42403.2} {"step": 9401, "train_loss": 3.5581161975860596, "lr": 0.00033271322065685064, "tps": 14529, "wall": 42408.1} {"step": 9402, "train_loss": 3.5640761852264404, "lr": 0.0003326982830075919, "tps": 14529, "wall": 42413.1} {"step": 9403, "train_loss": 3.613675594329834, "lr": 0.0003326833440816809, "tps": 14529, "wall": 42418.3} {"step": 9404, "train_loss": 3.5041325092315674, "lr": 0.00033266840387928694, "tps": 14528, "wall": 42423.2} {"step": 9405, "train_loss": 3.539475917816162, "lr": 0.00033265346240057917, "tps": 14528, "wall": 42428.2} {"step": 9406, "train_loss": 3.528313398361206, "lr": 0.0003326385196457269, "tps": 14528, "wall": 42433.1} {"step": 9407, "train_loss": 3.518996477127075, "lr": 0.0003326235756148994, "tps": 14528, "wall": 42438.1} {"step": 9408, "train_loss": 3.4865453243255615, "lr": 0.00033260863030826595, "tps": 14528, "wall": 42443.2} {"step": 9409, "train_loss": 3.587423324584961, "lr": 0.0003325936837259958, "tps": 14528, "wall": 42448.4} {"step": 9410, "train_loss": 3.532106876373291, "lr": 0.0003325787358682583, "tps": 14527, "wall": 42453.4} {"step": 9411, "train_loss": 3.4467036724090576, "lr": 0.00033256378673522283, "tps": 14527, "wall": 42458.3} {"step": 9412, "train_loss": 3.493272542953491, "lr": 0.00033254883632705866, "tps": 14527, "wall": 42463.3} {"step": 9413, "train_loss": 3.650986909866333, "lr": 0.0003325338846439352, "tps": 14527, "wall": 42468.2} {"step": 9414, "train_loss": 3.5659706592559814, "lr": 0.0003325189316860218, "tps": 14527, "wall": 42473.2} {"step": 9415, "train_loss": 3.532317638397217, "lr": 0.00033250397745348783, "tps": 14527, "wall": 42478.2} {"step": 9416, "train_loss": 3.545471429824829, "lr": 0.0003324890219465028, "tps": 14526, "wall": 42483.2} {"step": 9417, "train_loss": 3.370105266571045, "lr": 0.00033247406516523603, "tps": 14526, "wall": 42488.1} {"step": 9418, "train_loss": 3.52968430519104, "lr": 0.00033245910710985686, "tps": 14526, "wall": 42493.1} {"step": 9419, "train_loss": 3.4798078536987305, "lr": 0.000332444147780535, "tps": 14526, "wall": 42498.1} {"step": 9420, "train_loss": 3.5321011543273926, "lr": 0.0003324291871774396, "tps": 14526, "wall": 42503.1} {"step": 9421, "train_loss": 3.4702630043029785, "lr": 0.00033241422530074036, "tps": 14526, "wall": 42508.2} {"step": 9422, "train_loss": 3.469743251800537, "lr": 0.00033239926215060666, "tps": 14525, "wall": 42513.2} {"step": 9423, "train_loss": 3.5474724769592285, "lr": 0.0003323842977272081, "tps": 14525, "wall": 42518.4} {"step": 9424, "train_loss": 3.6160147190093994, "lr": 0.0003323693320307141, "tps": 14525, "wall": 42523.5} {"step": 9425, "train_loss": 3.533843994140625, "lr": 0.0003323543650612942, "tps": 14525, "wall": 42528.6} {"step": 9426, "train_loss": 3.556947708129883, "lr": 0.000332339396819118, "tps": 14525, "wall": 42533.5} {"step": 9427, "train_loss": 3.704106569290161, "lr": 0.00033232442730435504, "tps": 14524, "wall": 42538.8} {"step": 9428, "train_loss": 3.3720321655273438, "lr": 0.0003323094565171749, "tps": 14524, "wall": 42544.0} {"step": 9429, "train_loss": 3.590963363647461, "lr": 0.00033229448445774715, "tps": 14524, "wall": 42549.1} {"step": 9430, "train_loss": 3.5897321701049805, "lr": 0.00033227951112624137, "tps": 14524, "wall": 42554.3} {"step": 9431, "train_loss": 3.583310604095459, "lr": 0.0003322645365228273, "tps": 14524, "wall": 42559.5} {"step": 9432, "train_loss": 3.532085418701172, "lr": 0.00033224956064767435, "tps": 14523, "wall": 42564.7} {"step": 9433, "train_loss": 3.508833408355713, "lr": 0.0003322345835009524, "tps": 14523, "wall": 42569.9} {"step": 9434, "train_loss": 3.4710774421691895, "lr": 0.00033221960508283103, "tps": 14523, "wall": 42574.8} {"step": 9435, "train_loss": 3.4119434356689453, "lr": 0.0003322046253934799, "tps": 14523, "wall": 42579.8} {"step": 9436, "train_loss": 3.5127995014190674, "lr": 0.00033218964443306864, "tps": 14523, "wall": 42584.8} {"step": 9437, "train_loss": 3.506164073944092, "lr": 0.0003321746622017671, "tps": 14522, "wall": 42589.9} {"step": 9438, "train_loss": 3.537736415863037, "lr": 0.00033215967869974484, "tps": 14522, "wall": 42594.9} {"step": 9439, "train_loss": 3.5546810626983643, "lr": 0.0003321446939271717, "tps": 14522, "wall": 42599.8} {"step": 9440, "train_loss": 3.441854476928711, "lr": 0.00033212970788421735, "tps": 14522, "wall": 42604.8} {"step": 9441, "train_loss": 3.564385175704956, "lr": 0.00033211472057105166, "tps": 14522, "wall": 42609.7} {"step": 9442, "train_loss": 3.406341075897217, "lr": 0.00033209973198784434, "tps": 14522, "wall": 42614.6} {"step": 9443, "train_loss": 3.5584070682525635, "lr": 0.0003320847421347653, "tps": 14522, "wall": 42619.6} {"step": 9444, "train_loss": 3.492382287979126, "lr": 0.0003320697510119841, "tps": 14521, "wall": 42624.5} {"step": 9445, "train_loss": 3.5469870567321777, "lr": 0.00033205475861967075, "tps": 14521, "wall": 42629.5} {"step": 9446, "train_loss": 3.4604015350341797, "lr": 0.00033203976495799496, "tps": 14521, "wall": 42634.4} {"step": 9447, "train_loss": 3.453518867492676, "lr": 0.0003320247700271267, "tps": 14521, "wall": 42639.4} {"step": 9448, "train_loss": 3.6144371032714844, "lr": 0.0003320097738272359, "tps": 14521, "wall": 42644.3} {"step": 9449, "train_loss": 3.5393588542938232, "lr": 0.00033199477635849215, "tps": 14521, "wall": 42649.3} {"step": 9450, "train_loss": 3.5537009239196777, "lr": 0.00033197977762106556, "tps": 14520, "wall": 42654.2} {"step": 9451, "train_loss": 3.4901442527770996, "lr": 0.000331964777615126, "tps": 14520, "wall": 42659.2} {"step": 9452, "train_loss": 3.503188133239746, "lr": 0.00033194977634084345, "tps": 14520, "wall": 42664.1} {"step": 9453, "train_loss": 3.4734039306640625, "lr": 0.0003319347737983877, "tps": 14520, "wall": 42669.1} {"step": 9454, "train_loss": 3.4391632080078125, "lr": 0.0003319197699879288, "tps": 14520, "wall": 42674.0} {"step": 9455, "train_loss": 3.4939045906066895, "lr": 0.0003319047649096367, "tps": 14520, "wall": 42679.0} {"step": 9456, "train_loss": 3.4669029712677, "lr": 0.0003318897585636813, "tps": 14520, "wall": 42684.0} {"step": 9457, "train_loss": 3.474029779434204, "lr": 0.0003318747509502328, "tps": 14519, "wall": 42688.9} {"step": 9458, "train_loss": 3.4944348335266113, "lr": 0.00033185974206946094, "tps": 14519, "wall": 42693.8} {"step": 9459, "train_loss": 3.5457849502563477, "lr": 0.0003318447319215359, "tps": 14519, "wall": 42698.8} {"step": 9460, "train_loss": 3.5341382026672363, "lr": 0.00033182972050662773, "tps": 14519, "wall": 42703.7} {"step": 9461, "train_loss": 3.5639986991882324, "lr": 0.0003318147078249064, "tps": 14519, "wall": 42708.7} {"step": 9462, "train_loss": 3.5165247917175293, "lr": 0.0003317996938765421, "tps": 14519, "wall": 42713.6} {"step": 9463, "train_loss": 3.624535322189331, "lr": 0.0003317846786617047, "tps": 14519, "wall": 42718.6} {"step": 9464, "train_loss": 3.498253345489502, "lr": 0.00033176966218056444, "tps": 14518, "wall": 42723.5} {"step": 9465, "train_loss": 3.5134096145629883, "lr": 0.0003317546444332914, "tps": 14518, "wall": 42728.5} {"step": 9466, "train_loss": 3.3915152549743652, "lr": 0.0003317396254200557, "tps": 14518, "wall": 42733.4} {"step": 9467, "train_loss": 3.529928684234619, "lr": 0.0003317246051410275, "tps": 14518, "wall": 42738.4} {"step": 9468, "train_loss": 3.412010431289673, "lr": 0.0003317095835963769, "tps": 14518, "wall": 42743.4} {"step": 9469, "train_loss": 3.604764938354492, "lr": 0.0003316945607862742, "tps": 14518, "wall": 42748.3} {"step": 9470, "train_loss": 3.3243777751922607, "lr": 0.00033167953671088936, "tps": 14517, "wall": 42753.3} {"step": 9471, "train_loss": 3.519923210144043, "lr": 0.0003316645113703927, "tps": 14517, "wall": 42758.2} {"step": 9472, "train_loss": 3.4828851222991943, "lr": 0.00033164948476495446, "tps": 14517, "wall": 42763.1} {"step": 9473, "train_loss": 3.519832134246826, "lr": 0.0003316344568947448, "tps": 14517, "wall": 42768.1} {"step": 9474, "train_loss": 3.552659273147583, "lr": 0.00033161942775993393, "tps": 14517, "wall": 42773.0} {"step": 9475, "train_loss": 3.5251901149749756, "lr": 0.00033160439736069214, "tps": 14517, "wall": 42778.0} {"step": 9476, "train_loss": 3.597017765045166, "lr": 0.0003315893656971898, "tps": 14517, "wall": 42782.9} {"step": 9477, "train_loss": 3.583226203918457, "lr": 0.00033157433276959704, "tps": 14516, "wall": 42787.9} {"step": 9478, "train_loss": 3.57177472114563, "lr": 0.0003315592985780841, "tps": 14516, "wall": 42792.8} {"step": 9479, "train_loss": 3.424678325653076, "lr": 0.0003315442631228215, "tps": 14516, "wall": 42797.8} {"step": 9480, "train_loss": 3.5687713623046875, "lr": 0.00033152922640397944, "tps": 14516, "wall": 42802.7} {"step": 9481, "train_loss": 3.505690097808838, "lr": 0.00033151418842172824, "tps": 14516, "wall": 42807.6} {"step": 9482, "train_loss": 3.4874649047851562, "lr": 0.00033149914917623833, "tps": 14516, "wall": 42812.6} {"step": 9483, "train_loss": 3.6180343627929688, "lr": 0.00033148410866767994, "tps": 14516, "wall": 42817.6} {"step": 9484, "train_loss": 3.5390751361846924, "lr": 0.0003314690668962237, "tps": 14515, "wall": 42822.5} {"step": 9485, "train_loss": 3.496896982192993, "lr": 0.00033145402386203964, "tps": 14515, "wall": 42827.5} {"step": 9486, "train_loss": 3.5488767623901367, "lr": 0.0003314389795652985, "tps": 14515, "wall": 42832.4} {"step": 9487, "train_loss": 3.4702112674713135, "lr": 0.0003314239340061705, "tps": 14515, "wall": 42837.4} {"step": 9488, "train_loss": 3.4322595596313477, "lr": 0.00033140888718482614, "tps": 14515, "wall": 42842.3} {"step": 9489, "train_loss": 3.610419273376465, "lr": 0.00033139383910143593, "tps": 14515, "wall": 42847.3} {"step": 9490, "train_loss": 3.471620559692383, "lr": 0.00033137878975617036, "tps": 14515, "wall": 42852.2} {"step": 9491, "train_loss": 3.3790509700775146, "lr": 0.0003313637391491997, "tps": 14514, "wall": 42857.1} {"step": 9492, "train_loss": 3.5836994647979736, "lr": 0.00033134868728069457, "tps": 14514, "wall": 42862.1} {"step": 9493, "train_loss": 3.412863254547119, "lr": 0.00033133363415082555, "tps": 14514, "wall": 42867.0} {"step": 9494, "train_loss": 3.432305335998535, "lr": 0.0003313185797597631, "tps": 14514, "wall": 42872.0} {"step": 9495, "train_loss": 3.503173828125, "lr": 0.00033130352410767774, "tps": 14514, "wall": 42876.9} {"step": 9496, "train_loss": 3.5131454467773438, "lr": 0.0003312884671947401, "tps": 14514, "wall": 42881.9} {"step": 9497, "train_loss": 3.5048274993896484, "lr": 0.00033127340902112056, "tps": 14514, "wall": 42886.8} {"step": 9498, "train_loss": 3.460333824157715, "lr": 0.0003312583495869899, "tps": 14513, "wall": 42891.8} {"step": 9499, "train_loss": 3.4992775917053223, "lr": 0.00033124328889251863, "tps": 14513, "wall": 42896.8} {"step": 9500, "train_loss": 3.578408718109131, "lr": 0.0003312282269378774, "tps": 14513, "wall": 42901.7} {"step": 9501, "train_loss": 3.5033974647521973, "lr": 0.0003312131637232367, "tps": 14513, "wall": 42906.9} {"step": 9502, "train_loss": 3.534195899963379, "lr": 0.00033119809924876735, "tps": 14513, "wall": 42911.8} {"step": 9503, "train_loss": 3.4757750034332275, "lr": 0.0003311830335146399, "tps": 14513, "wall": 42916.8} {"step": 9504, "train_loss": 3.459191083908081, "lr": 0.00033116796652102494, "tps": 14512, "wall": 42921.7} {"step": 9505, "train_loss": 3.5286707878112793, "lr": 0.00033115289826809335, "tps": 14512, "wall": 42926.6} {"step": 9506, "train_loss": 3.5235681533813477, "lr": 0.0003311378287560157, "tps": 14512, "wall": 42931.6} {"step": 9507, "train_loss": 3.5371387004852295, "lr": 0.00033112275798496266, "tps": 14512, "wall": 42936.6} {"step": 9508, "train_loss": 3.501875638961792, "lr": 0.00033110768595510514, "tps": 14512, "wall": 42941.5} {"step": 9509, "train_loss": 3.5171918869018555, "lr": 0.0003310926126666136, "tps": 14512, "wall": 42946.5} {"step": 9510, "train_loss": 3.4510080814361572, "lr": 0.00033107753811965896, "tps": 14512, "wall": 42951.4} {"step": 9511, "train_loss": 3.5140857696533203, "lr": 0.000331062462314412, "tps": 14511, "wall": 42956.4} {"step": 9512, "train_loss": 3.6244664192199707, "lr": 0.0003310473852510434, "tps": 14511, "wall": 42961.4} {"step": 9513, "train_loss": 3.4507243633270264, "lr": 0.0003310323069297241, "tps": 14511, "wall": 42966.3} {"step": 9514, "train_loss": 3.5966906547546387, "lr": 0.0003310172273506248, "tps": 14511, "wall": 42971.3} {"step": 9515, "train_loss": 3.4656872749328613, "lr": 0.0003310021465139163, "tps": 14511, "wall": 42976.2} {"step": 9516, "train_loss": 3.3802385330200195, "lr": 0.00033098706441976947, "tps": 14511, "wall": 42981.1} {"step": 9517, "train_loss": 3.471957206726074, "lr": 0.0003309719810683552, "tps": 14511, "wall": 42986.1} {"step": 9518, "train_loss": 3.6345925331115723, "lr": 0.0003309568964598443, "tps": 14510, "wall": 42991.0} {"step": 9519, "train_loss": 3.4538493156433105, "lr": 0.00033094181059440775, "tps": 14510, "wall": 42996.0} {"step": 9520, "train_loss": 3.492060899734497, "lr": 0.00033092672347221627, "tps": 14510, "wall": 43001.0} {"step": 9521, "train_loss": 3.54628586769104, "lr": 0.00033091163509344087, "tps": 14510, "wall": 43005.9} {"step": 9522, "train_loss": 3.4159393310546875, "lr": 0.0003308965454582525, "tps": 14510, "wall": 43011.0} {"step": 9523, "train_loss": 3.461310386657715, "lr": 0.0003308814545668221, "tps": 14510, "wall": 43016.0} {"step": 9524, "train_loss": 3.4964427947998047, "lr": 0.00033086636241932055, "tps": 14509, "wall": 43021.1} {"step": 9525, "train_loss": 3.4622528553009033, "lr": 0.0003308512690159188, "tps": 14509, "wall": 43026.4} {"step": 9526, "train_loss": 3.5213747024536133, "lr": 0.00033083617435678795, "tps": 14509, "wall": 43031.3} {"step": 9527, "train_loss": 3.6013550758361816, "lr": 0.000330821078442099, "tps": 14509, "wall": 43036.4} {"step": 9528, "train_loss": 3.5244860649108887, "lr": 0.0003308059812720227, "tps": 14509, "wall": 43041.3} {"step": 9529, "train_loss": 3.4750757217407227, "lr": 0.0003307908828467303, "tps": 14508, "wall": 43046.3} {"step": 9530, "train_loss": 3.559176445007324, "lr": 0.00033077578316639285, "tps": 14508, "wall": 43051.3} {"step": 9531, "train_loss": 3.4751992225646973, "lr": 0.0003307606822311813, "tps": 14508, "wall": 43056.2} {"step": 9532, "train_loss": 3.4828577041625977, "lr": 0.0003307455800412667, "tps": 14508, "wall": 43061.2} {"step": 9533, "train_loss": 3.5927515029907227, "lr": 0.0003307304765968203, "tps": 14508, "wall": 43066.1} {"step": 9534, "train_loss": 3.4674594402313232, "lr": 0.00033071537189801296, "tps": 14508, "wall": 43071.1} {"step": 9535, "train_loss": 3.4903273582458496, "lr": 0.00033070026594501586, "tps": 14508, "wall": 43076.1} {"step": 9536, "train_loss": 3.5217323303222656, "lr": 0.0003306851587380003, "tps": 14507, "wall": 43081.0} {"step": 9537, "train_loss": 3.571882486343384, "lr": 0.0003306700502771372, "tps": 14507, "wall": 43086.0} {"step": 9538, "train_loss": 3.547868013381958, "lr": 0.0003306549405625978, "tps": 14507, "wall": 43090.9} {"step": 9539, "train_loss": 3.492978096008301, "lr": 0.0003306398295945532, "tps": 14507, "wall": 43095.9} {"step": 9540, "train_loss": 3.509594440460205, "lr": 0.00033062471737317466, "tps": 14507, "wall": 43100.8} {"step": 9541, "train_loss": 3.5993752479553223, "lr": 0.00033060960389863335, "tps": 14507, "wall": 43105.8} {"step": 9542, "train_loss": 3.5126218795776367, "lr": 0.00033059448917110046, "tps": 14507, "wall": 43110.7} {"step": 9543, "train_loss": 3.412944793701172, "lr": 0.0003305793731907472, "tps": 14506, "wall": 43115.7} {"step": 9544, "train_loss": 3.4939184188842773, "lr": 0.0003305642559577448, "tps": 14506, "wall": 43120.6} {"step": 9545, "train_loss": 3.4328036308288574, "lr": 0.00033054913747226455, "tps": 14506, "wall": 43125.6} {"step": 9546, "train_loss": 3.500277042388916, "lr": 0.0003305340177344777, "tps": 14506, "wall": 43130.5} {"step": 9547, "train_loss": 3.457615852355957, "lr": 0.00033051889674455553, "tps": 14506, "wall": 43135.6} {"step": 9548, "train_loss": 3.5585989952087402, "lr": 0.0003305037745026693, "tps": 14506, "wall": 43140.5} {"step": 9549, "train_loss": 3.5401694774627686, "lr": 0.0003304886510089903, "tps": 14506, "wall": 43145.5} {"step": 9550, "train_loss": 3.4575467109680176, "lr": 0.0003304735262636899, "tps": 14505, "wall": 43150.4} {"step": 9551, "train_loss": 3.6042184829711914, "lr": 0.00033045840026693944, "tps": 14505, "wall": 43155.4} {"step": 9552, "train_loss": 3.571545124053955, "lr": 0.00033044327301891025, "tps": 14505, "wall": 43160.3} {"step": 9553, "train_loss": 3.5437395572662354, "lr": 0.0003304281445197737, "tps": 14505, "wall": 43165.3} {"step": 9554, "train_loss": 3.540187358856201, "lr": 0.0003304130147697011, "tps": 14505, "wall": 43170.2} {"step": 9555, "train_loss": 3.6652393341064453, "lr": 0.00033039788376886393, "tps": 14505, "wall": 43175.2} {"step": 9556, "train_loss": 3.435032844543457, "lr": 0.00033038275151743357, "tps": 14504, "wall": 43180.1} {"step": 9557, "train_loss": 3.550966501235962, "lr": 0.0003303676180155814, "tps": 14504, "wall": 43185.5} {"step": 9558, "train_loss": 3.4663658142089844, "lr": 0.00033035248326347894, "tps": 14504, "wall": 43190.5} {"step": 9559, "train_loss": 3.524576425552368, "lr": 0.0003303373472612975, "tps": 14504, "wall": 43195.6} {"step": 9560, "train_loss": 3.581697702407837, "lr": 0.00033032221000920867, "tps": 14504, "wall": 43200.6} {"step": 9561, "train_loss": 3.5612988471984863, "lr": 0.0003303070715073839, "tps": 14504, "wall": 43205.6} {"step": 9562, "train_loss": 3.4538283348083496, "lr": 0.0003302919317559946, "tps": 14503, "wall": 43210.5} {"step": 9563, "train_loss": 3.5184898376464844, "lr": 0.00033027679075521235, "tps": 14503, "wall": 43215.4} {"step": 9564, "train_loss": 3.404928207397461, "lr": 0.00033026164850520867, "tps": 14503, "wall": 43220.4} {"step": 9565, "train_loss": 3.4629287719726562, "lr": 0.00033024650500615497, "tps": 14503, "wall": 43225.4} {"step": 9566, "train_loss": 3.600306987762451, "lr": 0.00033023136025822305, "tps": 14503, "wall": 43230.3} {"step": 9567, "train_loss": 3.4279770851135254, "lr": 0.00033021621426158426, "tps": 14503, "wall": 43235.0} {"step": 9568, "train_loss": 3.63430118560791, "lr": 0.0003302010670164102, "tps": 14503, "wall": 43239.8} {"step": 9569, "train_loss": 3.5711913108825684, "lr": 0.00033018591852287255, "tps": 14503, "wall": 43244.6} {"step": 9570, "train_loss": 3.5668814182281494, "lr": 0.00033017076878114277, "tps": 14502, "wall": 43249.3} {"step": 9571, "train_loss": 3.5292999744415283, "lr": 0.0003301556177913926, "tps": 14502, "wall": 43254.1} {"step": 9572, "train_loss": 3.4792470932006836, "lr": 0.0003301404655537937, "tps": 14502, "wall": 43259.0} {"step": 9573, "train_loss": 3.5387749671936035, "lr": 0.0003301253120685175, "tps": 14502, "wall": 43263.7} {"step": 9574, "train_loss": 3.5813279151916504, "lr": 0.0003301101573357359, "tps": 14502, "wall": 43268.5} {"step": 9575, "train_loss": 3.566556215286255, "lr": 0.0003300950013556205, "tps": 14502, "wall": 43273.3} {"step": 9576, "train_loss": 3.558940887451172, "lr": 0.00033007984412834296, "tps": 14502, "wall": 43278.1} {"step": 9577, "train_loss": 3.4970946311950684, "lr": 0.0003300646856540749, "tps": 14502, "wall": 43282.9} {"step": 9578, "train_loss": 3.536447048187256, "lr": 0.00033004952593298825, "tps": 14502, "wall": 43287.7} {"step": 9579, "train_loss": 3.491659164428711, "lr": 0.00033003436496525457, "tps": 14502, "wall": 43292.5} {"step": 9580, "train_loss": 3.3987739086151123, "lr": 0.00033001920275104563, "tps": 14502, "wall": 43297.2} {"step": 9581, "train_loss": 3.5753984451293945, "lr": 0.00033000403929053324, "tps": 14501, "wall": 43302.0} {"step": 9582, "train_loss": 3.508068799972534, "lr": 0.0003299888745838891, "tps": 14501, "wall": 43306.8} {"step": 9583, "train_loss": 3.4763076305389404, "lr": 0.0003299737086312851, "tps": 14501, "wall": 43311.6} {"step": 9584, "train_loss": 3.3941307067871094, "lr": 0.0003299585414328929, "tps": 14501, "wall": 43316.5} {"step": 9585, "train_loss": 3.5755324363708496, "lr": 0.0003299433729888845, "tps": 14501, "wall": 43321.2} {"step": 9586, "train_loss": 3.5230953693389893, "lr": 0.00032992820329943155, "tps": 14501, "wall": 43326.1} {"step": 9587, "train_loss": 3.4709043502807617, "lr": 0.000329913032364706, "tps": 14501, "wall": 43330.8} {"step": 9588, "train_loss": 3.451380491256714, "lr": 0.0003298978601848796, "tps": 14501, "wall": 43335.6} {"step": 9589, "train_loss": 3.6320581436157227, "lr": 0.00032988268676012434, "tps": 14501, "wall": 43340.4} {"step": 9590, "train_loss": 3.3944294452667236, "lr": 0.00032986751209061207, "tps": 14501, "wall": 43345.2} {"step": 9591, "train_loss": 3.4498510360717773, "lr": 0.0003298523361765147, "tps": 14501, "wall": 43350.0} {"step": 9592, "train_loss": 3.4969935417175293, "lr": 0.0003298371590180041, "tps": 14500, "wall": 43354.8} {"step": 9593, "train_loss": 3.512308120727539, "lr": 0.0003298219806152522, "tps": 14500, "wall": 43359.6} {"step": 9594, "train_loss": 3.4709835052490234, "lr": 0.000329806800968431, "tps": 14500, "wall": 43364.4} {"step": 9595, "train_loss": 3.3650426864624023, "lr": 0.0003297916200777124, "tps": 14500, "wall": 43369.2} {"step": 9596, "train_loss": 3.516796588897705, "lr": 0.00032977643794326834, "tps": 14500, "wall": 43374.0} {"step": 9597, "train_loss": 3.484924077987671, "lr": 0.00032976125456527097, "tps": 14500, "wall": 43378.8} {"step": 9598, "train_loss": 3.5082592964172363, "lr": 0.00032974606994389205, "tps": 14500, "wall": 43383.6} {"step": 9599, "train_loss": 3.533418655395508, "lr": 0.0003297308840793037, "tps": 14500, "wall": 43388.4} {"step": 9600, "train_loss": 3.520418643951416, "lr": 0.0003297156969716781, "tps": 14500, "wall": 43393.2} {"step": 9601, "train_loss": 3.4737114906311035, "lr": 0.00032970050862118704, "tps": 14500, "wall": 43398.0} {"step": 9602, "train_loss": 3.5426993370056152, "lr": 0.0003296853190280027, "tps": 14500, "wall": 43402.8} {"step": 9603, "train_loss": 3.4628095626831055, "lr": 0.00032967012819229717, "tps": 14499, "wall": 43407.6} {"step": 9604, "train_loss": 3.490962028503418, "lr": 0.0003296549361142424, "tps": 14499, "wall": 43412.4} {"step": 9605, "train_loss": 3.5224905014038086, "lr": 0.0003296397427940107, "tps": 14499, "wall": 43417.2} {"step": 9606, "train_loss": 3.457601547241211, "lr": 0.000329624548231774, "tps": 14499, "wall": 43422.0} {"step": 9607, "train_loss": 3.4997029304504395, "lr": 0.0003296093524277045, "tps": 14499, "wall": 43426.8} {"step": 9608, "train_loss": 3.525200843811035, "lr": 0.0003295941553819743, "tps": 14499, "wall": 43431.6} {"step": 9609, "train_loss": 3.563873291015625, "lr": 0.0003295789570947557, "tps": 14499, "wall": 43436.5} {"step": 9610, "train_loss": 3.612125873565674, "lr": 0.0003295637575662206, "tps": 14499, "wall": 43441.3} {"step": 9611, "train_loss": 3.529423236846924, "lr": 0.00032954855679654136, "tps": 14499, "wall": 43446.1} {"step": 9612, "train_loss": 3.4844298362731934, "lr": 0.0003295333547858902, "tps": 14499, "wall": 43450.9} {"step": 9613, "train_loss": 3.579453945159912, "lr": 0.00032951815153443924, "tps": 14498, "wall": 43455.7} {"step": 9614, "train_loss": 3.3915584087371826, "lr": 0.0003295029470423607, "tps": 14498, "wall": 43460.5} {"step": 9615, "train_loss": 3.5401411056518555, "lr": 0.0003294877413098269, "tps": 14498, "wall": 43465.3} {"step": 9616, "train_loss": 3.5595459938049316, "lr": 0.00032947253433701, "tps": 14498, "wall": 43470.1} {"step": 9617, "train_loss": 3.445237159729004, "lr": 0.00032945732612408234, "tps": 14498, "wall": 43474.9} {"step": 9618, "train_loss": 3.5622007846832275, "lr": 0.0003294421166712162, "tps": 14498, "wall": 43479.7} {"step": 9619, "train_loss": 3.4595561027526855, "lr": 0.0003294269059785838, "tps": 14498, "wall": 43484.5} {"step": 9620, "train_loss": 3.5001816749572754, "lr": 0.00032941169404635743, "tps": 14498, "wall": 43489.3} {"step": 9621, "train_loss": 3.6044647693634033, "lr": 0.00032939648087470955, "tps": 14498, "wall": 43494.1} {"step": 9622, "train_loss": 3.3750340938568115, "lr": 0.0003293812664638124, "tps": 14498, "wall": 43498.9} {"step": 9623, "train_loss": 3.400421142578125, "lr": 0.00032936605081383837, "tps": 14498, "wall": 43503.7} {"step": 9624, "train_loss": 3.444521427154541, "lr": 0.0003293508339249597, "tps": 14497, "wall": 43508.5} {"step": 9625, "train_loss": 3.478177070617676, "lr": 0.000329335615797349, "tps": 14497, "wall": 43513.3} {"step": 9626, "train_loss": 3.6134839057922363, "lr": 0.0003293203964311784, "tps": 14497, "wall": 43518.1} {"step": 9627, "train_loss": 3.4948372840881348, "lr": 0.0003293051758266206, "tps": 14497, "wall": 43522.9} {"step": 9628, "train_loss": 3.537773609161377, "lr": 0.00032928995398384767, "tps": 14497, "wall": 43527.6} {"step": 9629, "train_loss": 3.534252166748047, "lr": 0.00032927473090303233, "tps": 14497, "wall": 43532.4} {"step": 9630, "train_loss": 3.561307191848755, "lr": 0.0003292595065843469, "tps": 14497, "wall": 43537.2} {"step": 9631, "train_loss": 3.4593582153320312, "lr": 0.0003292442810279639, "tps": 14497, "wall": 43542.0} {"step": 9632, "train_loss": 3.4967353343963623, "lr": 0.0003292290542340558, "tps": 14497, "wall": 43546.8} {"step": 9633, "train_loss": 3.6597020626068115, "lr": 0.00032921382620279495, "tps": 14497, "wall": 43551.6} {"step": 9634, "train_loss": 3.4894371032714844, "lr": 0.00032919859693435405, "tps": 14497, "wall": 43556.4} {"step": 9635, "train_loss": 3.528369426727295, "lr": 0.00032918336642890554, "tps": 14496, "wall": 43561.2} {"step": 9636, "train_loss": 3.5483367443084717, "lr": 0.00032916813468662195, "tps": 14496, "wall": 43566.0} {"step": 9637, "train_loss": 3.570202589035034, "lr": 0.0003291529017076758, "tps": 14496, "wall": 43570.8} {"step": 9638, "train_loss": 3.6118998527526855, "lr": 0.00032913766749223967, "tps": 14496, "wall": 43575.6} {"step": 9639, "train_loss": 3.511411666870117, "lr": 0.00032912243204048623, "tps": 14496, "wall": 43580.4} {"step": 9640, "train_loss": 3.4758224487304688, "lr": 0.00032910719535258787, "tps": 14496, "wall": 43585.2} {"step": 9641, "train_loss": 3.5317327976226807, "lr": 0.0003290919574287173, "tps": 14496, "wall": 43590.0} {"step": 9642, "train_loss": 3.3964908123016357, "lr": 0.00032907671826904714, "tps": 14496, "wall": 43594.8} {"step": 9643, "train_loss": 3.580458879470825, "lr": 0.0003290614778737501, "tps": 14496, "wall": 43599.6} {"step": 9644, "train_loss": 3.601998805999756, "lr": 0.0003290462362429986, "tps": 14496, "wall": 43604.3} {"step": 9645, "train_loss": 3.5358047485351562, "lr": 0.00032903099337696555, "tps": 14496, "wall": 43609.2} {"step": 9646, "train_loss": 3.632862091064453, "lr": 0.0003290157492758235, "tps": 14495, "wall": 43614.0} {"step": 9647, "train_loss": 3.509493589401245, "lr": 0.00032900050393974505, "tps": 14495, "wall": 43618.8} {"step": 9648, "train_loss": 3.6096267700195312, "lr": 0.0003289852573689031, "tps": 14495, "wall": 43623.6} {"step": 9649, "train_loss": 3.5165977478027344, "lr": 0.00032897000956347023, "tps": 14495, "wall": 43628.4} {"step": 9650, "train_loss": 3.536210775375366, "lr": 0.0003289547605236192, "tps": 14495, "wall": 43633.2} {"step": 9651, "train_loss": 3.642568588256836, "lr": 0.00032893951024952274, "tps": 14495, "wall": 43638.0} {"step": 9652, "train_loss": 3.598632574081421, "lr": 0.0003289242587413536, "tps": 14495, "wall": 43642.8} {"step": 9653, "train_loss": 3.4827375411987305, "lr": 0.00032890900599928457, "tps": 14495, "wall": 43647.5} {"step": 9654, "train_loss": 3.543389320373535, "lr": 0.0003288937520234884, "tps": 14495, "wall": 43652.3} {"step": 9655, "train_loss": 3.563466787338257, "lr": 0.00032887849681413796, "tps": 14495, "wall": 43657.1} {"step": 9656, "train_loss": 3.3988120555877686, "lr": 0.00032886324037140603, "tps": 14495, "wall": 43661.9} {"step": 9657, "train_loss": 3.567354202270508, "lr": 0.00032884798269546537, "tps": 14494, "wall": 43666.7} {"step": 9658, "train_loss": 3.493246078491211, "lr": 0.0003288327237864889, "tps": 14494, "wall": 43671.5} {"step": 9659, "train_loss": 3.4635322093963623, "lr": 0.0003288174636446494, "tps": 14494, "wall": 43676.4} {"step": 9660, "train_loss": 3.5650603771209717, "lr": 0.00032880220227011987, "tps": 14494, "wall": 43681.2} {"step": 9661, "train_loss": 3.5346169471740723, "lr": 0.00032878693966307307, "tps": 14494, "wall": 43686.0} {"step": 9662, "train_loss": 3.4253365993499756, "lr": 0.00032877167582368196, "tps": 14494, "wall": 43690.7} {"step": 9663, "train_loss": 3.5949454307556152, "lr": 0.0003287564107521194, "tps": 14494, "wall": 43695.6} {"step": 9664, "train_loss": 3.4739813804626465, "lr": 0.00032874114444855833, "tps": 14494, "wall": 43700.3} {"step": 9665, "train_loss": 3.5801243782043457, "lr": 0.00032872587691317167, "tps": 14494, "wall": 43705.1} {"step": 9666, "train_loss": 3.377633571624756, "lr": 0.0003287106081461324, "tps": 14494, "wall": 43709.9} {"step": 9667, "train_loss": 3.508136510848999, "lr": 0.00032869533814761353, "tps": 14494, "wall": 43714.7} {"step": 9668, "train_loss": 3.5213708877563477, "lr": 0.00032868006691778797, "tps": 14493, "wall": 43719.5} {"step": 9669, "train_loss": 3.485945224761963, "lr": 0.00032866479445682866, "tps": 14493, "wall": 43724.3} {"step": 9670, "train_loss": 3.41188907623291, "lr": 0.00032864952076490877, "tps": 14493, "wall": 43729.1} {"step": 9671, "train_loss": 3.510641098022461, "lr": 0.0003286342458422012, "tps": 14493, "wall": 43733.9} {"step": 9672, "train_loss": 3.4511020183563232, "lr": 0.000328618969688879, "tps": 14493, "wall": 43738.7} {"step": 9673, "train_loss": 3.553839921951294, "lr": 0.00032860369230511526, "tps": 14493, "wall": 43743.5} {"step": 9674, "train_loss": 3.4740676879882812, "lr": 0.00032858841369108296, "tps": 14493, "wall": 43748.4} {"step": 9675, "train_loss": 3.4125823974609375, "lr": 0.0003285731338469553, "tps": 14493, "wall": 43753.2} {"step": 9676, "train_loss": 3.5128250122070312, "lr": 0.0003285578527729053, "tps": 14493, "wall": 43758.0} {"step": 9677, "train_loss": 3.5600593090057373, "lr": 0.00032854257046910606, "tps": 14493, "wall": 43762.8} {"step": 9678, "train_loss": 3.4398608207702637, "lr": 0.00032852728693573077, "tps": 14492, "wall": 43767.6} {"step": 9679, "train_loss": 3.6356348991394043, "lr": 0.0003285120021729524, "tps": 14492, "wall": 43772.4} {"step": 9680, "train_loss": 3.418130874633789, "lr": 0.00032849671618094425, "tps": 14492, "wall": 43777.2} {"step": 9681, "train_loss": 3.630197763442993, "lr": 0.0003284814289598793, "tps": 14492, "wall": 43782.0} {"step": 9682, "train_loss": 3.4928600788116455, "lr": 0.0003284661405099311, "tps": 14492, "wall": 43786.8} {"step": 9683, "train_loss": 3.5021872520446777, "lr": 0.00032845085083127245, "tps": 14492, "wall": 43791.6} {"step": 9684, "train_loss": 3.5228612422943115, "lr": 0.0003284355599240767, "tps": 14492, "wall": 43796.4} {"step": 9685, "train_loss": 3.486720085144043, "lr": 0.00032842026778851706, "tps": 14492, "wall": 43801.2} {"step": 9686, "train_loss": 3.482861280441284, "lr": 0.00032840497442476675, "tps": 14492, "wall": 43806.0} {"step": 9687, "train_loss": 3.521868944168091, "lr": 0.0003283896798329991, "tps": 14492, "wall": 43810.8} {"step": 9688, "train_loss": 3.55911922454834, "lr": 0.00032837438401338726, "tps": 14492, "wall": 43815.6} {"step": 9689, "train_loss": 3.411893844604492, "lr": 0.0003283590869661044, "tps": 14491, "wall": 43820.4} {"step": 9690, "train_loss": 3.5163800716400146, "lr": 0.00032834378869132415, "tps": 14491, "wall": 43825.2} {"step": 9691, "train_loss": 3.5117039680480957, "lr": 0.0003283284891892195, "tps": 14491, "wall": 43830.0} {"step": 9692, "train_loss": 3.456040859222412, "lr": 0.00032831318845996383, "tps": 14491, "wall": 43834.8} {"step": 9693, "train_loss": 3.420375347137451, "lr": 0.0003282978865037305, "tps": 14491, "wall": 43839.6} {"step": 9694, "train_loss": 3.479844093322754, "lr": 0.00032828258332069296, "tps": 14491, "wall": 43844.4} {"step": 9695, "train_loss": 3.4920573234558105, "lr": 0.0003282672789110244, "tps": 14491, "wall": 43849.2} {"step": 9696, "train_loss": 3.6330604553222656, "lr": 0.00032825197327489823, "tps": 14491, "wall": 43854.0} {"step": 9697, "train_loss": 3.521623134613037, "lr": 0.0003282366664124879, "tps": 14491, "wall": 43858.8} {"step": 9698, "train_loss": 3.4698431491851807, "lr": 0.0003282213583239667, "tps": 14491, "wall": 43863.6} {"step": 9699, "train_loss": 3.497159242630005, "lr": 0.0003282060490095081, "tps": 14491, "wall": 43868.4} {"step": 9700, "train_loss": 3.57834529876709, "lr": 0.0003281907384692855, "tps": 14490, "wall": 43873.2} {"step": 9701, "train_loss": 3.487144708633423, "lr": 0.00032817542670347246, "tps": 14490, "wall": 43878.0} {"step": 9702, "train_loss": 3.4440338611602783, "lr": 0.0003281601137122423, "tps": 14490, "wall": 43882.8} {"step": 9703, "train_loss": 3.450648307800293, "lr": 0.00032814479949576847, "tps": 14490, "wall": 43887.6} {"step": 9704, "train_loss": 3.489311456680298, "lr": 0.0003281294840542245, "tps": 14490, "wall": 43892.5} {"step": 9705, "train_loss": 3.412600517272949, "lr": 0.00032811416738778393, "tps": 14490, "wall": 43897.4} {"step": 9706, "train_loss": 3.534083843231201, "lr": 0.0003280988494966202, "tps": 14490, "wall": 43902.3} {"step": 9707, "train_loss": 3.4971649646759033, "lr": 0.0003280835303809069, "tps": 14490, "wall": 43907.3} {"step": 9708, "train_loss": 3.5961358547210693, "lr": 0.00032806821004081747, "tps": 14490, "wall": 43912.2} {"step": 9709, "train_loss": 3.4935669898986816, "lr": 0.00032805288847652554, "tps": 14489, "wall": 43917.3} {"step": 9710, "train_loss": 3.606269359588623, "lr": 0.0003280375656882046, "tps": 14489, "wall": 43922.3} {"step": 9711, "train_loss": 3.5567359924316406, "lr": 0.0003280222416760283, "tps": 14489, "wall": 43927.4} {"step": 9712, "train_loss": 3.512317657470703, "lr": 0.00032800691644017016, "tps": 14489, "wall": 43932.5} {"step": 9713, "train_loss": 3.5716333389282227, "lr": 0.0003279915899808039, "tps": 14489, "wall": 43937.5} {"step": 9714, "train_loss": 3.5707712173461914, "lr": 0.00032797626229810306, "tps": 14488, "wall": 43942.6} {"step": 9715, "train_loss": 3.569247007369995, "lr": 0.0003279609333922412, "tps": 14488, "wall": 43947.7} {"step": 9716, "train_loss": 3.5363917350769043, "lr": 0.0003279456032633921, "tps": 14488, "wall": 43952.7} {"step": 9717, "train_loss": 3.387482166290283, "lr": 0.00032793027191172934, "tps": 14488, "wall": 43957.8} {"step": 9718, "train_loss": 3.5894436836242676, "lr": 0.00032791493933742664, "tps": 14488, "wall": 43962.9} {"step": 9719, "train_loss": 3.4460768699645996, "lr": 0.0003278996055406577, "tps": 14488, "wall": 43967.9} {"step": 9720, "train_loss": 3.474806308746338, "lr": 0.00032788427052159614, "tps": 14487, "wall": 43973.0} {"step": 9721, "train_loss": 3.538274049758911, "lr": 0.0003278689342804158, "tps": 14487, "wall": 43978.2} {"step": 9722, "train_loss": 3.5169806480407715, "lr": 0.00032785359681729027, "tps": 14487, "wall": 43983.2} {"step": 9723, "train_loss": 3.509459972381592, "lr": 0.0003278382581323934, "tps": 14487, "wall": 43988.4} {"step": 9724, "train_loss": 3.5458414554595947, "lr": 0.0003278229182258989, "tps": 14487, "wall": 43993.4} {"step": 9725, "train_loss": 3.477102279663086, "lr": 0.0003278075770979805, "tps": 14486, "wall": 43998.5} {"step": 9726, "train_loss": 3.430232286453247, "lr": 0.0003277922347488121, "tps": 14486, "wall": 44003.6} {"step": 9727, "train_loss": 3.45271635055542, "lr": 0.00032777689117856736, "tps": 14486, "wall": 44008.7} {"step": 9728, "train_loss": 3.538968086242676, "lr": 0.00032776154638742026, "tps": 14486, "wall": 44013.8} {"step": 9729, "train_loss": 3.541656970977783, "lr": 0.00032774620037554446, "tps": 14486, "wall": 44018.9} {"step": 9730, "train_loss": 3.526322841644287, "lr": 0.0003277308531431139, "tps": 14485, "wall": 44024.0} {"step": 9731, "train_loss": 3.4859678745269775, "lr": 0.0003277155046903024, "tps": 14485, "wall": 44029.1} {"step": 9732, "train_loss": 3.5393106937408447, "lr": 0.0003277001550172839, "tps": 14485, "wall": 44034.2} {"step": 9733, "train_loss": 3.4994819164276123, "lr": 0.0003276848041242321, "tps": 14485, "wall": 44039.4} {"step": 9734, "train_loss": 3.4776864051818848, "lr": 0.0003276694520113211, "tps": 14485, "wall": 44044.4} {"step": 9735, "train_loss": 3.515068531036377, "lr": 0.0003276540986787247, "tps": 14485, "wall": 44049.5} {"step": 9736, "train_loss": 3.6191132068634033, "lr": 0.0003276387441266168, "tps": 14484, "wall": 44054.6} {"step": 9737, "train_loss": 3.527240753173828, "lr": 0.0003276233883551714, "tps": 14484, "wall": 44059.7} {"step": 9738, "train_loss": 3.4930226802825928, "lr": 0.0003276080313645625, "tps": 14484, "wall": 44064.8} {"step": 9739, "train_loss": 3.565793752670288, "lr": 0.00032759267315496393, "tps": 14484, "wall": 44069.9} {"step": 9740, "train_loss": 3.473454475402832, "lr": 0.00032757731372654974, "tps": 14484, "wall": 44075.0} {"step": 9741, "train_loss": 3.5592010021209717, "lr": 0.000327561953079494, "tps": 14483, "wall": 44080.1} {"step": 9742, "train_loss": 3.491034984588623, "lr": 0.00032754659121397053, "tps": 14483, "wall": 44085.2} {"step": 9743, "train_loss": 3.455065965652466, "lr": 0.00032753122813015354, "tps": 14483, "wall": 44090.3} {"step": 9744, "train_loss": 3.524641513824463, "lr": 0.0003275158638282169, "tps": 14483, "wall": 44095.5} {"step": 9745, "train_loss": 3.4957523345947266, "lr": 0.0003275004983083348, "tps": 14483, "wall": 44100.5} {"step": 9746, "train_loss": 3.539824962615967, "lr": 0.00032748513157068124, "tps": 14482, "wall": 44105.6} {"step": 9747, "train_loss": 3.319424629211426, "lr": 0.0003274697636154303, "tps": 14482, "wall": 44110.7} {"step": 9748, "train_loss": 3.5510315895080566, "lr": 0.00032745439444275604, "tps": 14482, "wall": 44115.8} {"step": 9749, "train_loss": 3.642298460006714, "lr": 0.0003274390240528326, "tps": 14482, "wall": 44120.9} {"step": 9750, "train_loss": 3.4489054679870605, "lr": 0.0003274236524458341, "tps": 14482, "wall": 44126.0} {"step": 9751, "train_loss": 3.5319392681121826, "lr": 0.0003274082796219346, "tps": 14482, "wall": 44131.1} {"step": 9752, "train_loss": 3.4630751609802246, "lr": 0.0003273929055813083, "tps": 14481, "wall": 44136.2} {"step": 9753, "train_loss": 3.4537150859832764, "lr": 0.0003273775303241294, "tps": 14481, "wall": 44141.3} {"step": 9754, "train_loss": 3.5410451889038086, "lr": 0.00032736215385057197, "tps": 14481, "wall": 44146.4} {"step": 9755, "train_loss": 3.4677677154541016, "lr": 0.0003273467761608103, "tps": 14481, "wall": 44151.5} {"step": 9756, "train_loss": 3.471445083618164, "lr": 0.0003273313972550185, "tps": 14481, "wall": 44156.6} {"step": 9757, "train_loss": 3.5479817390441895, "lr": 0.0003273160171333709, "tps": 14480, "wall": 44161.7} {"step": 9758, "train_loss": 3.5738577842712402, "lr": 0.00032730063579604167, "tps": 14480, "wall": 44166.9} {"step": 9759, "train_loss": 3.4758005142211914, "lr": 0.00032728525324320497, "tps": 14480, "wall": 44172.0} {"step": 9760, "train_loss": 3.574484348297119, "lr": 0.0003272698694750351, "tps": 14480, "wall": 44177.1} {"step": 9761, "train_loss": 3.587430477142334, "lr": 0.0003272544844917063, "tps": 14480, "wall": 44182.2} {"step": 9762, "train_loss": 3.5092852115631104, "lr": 0.000327239098293393, "tps": 14479, "wall": 44187.2} {"step": 9763, "train_loss": 3.502376079559326, "lr": 0.00032722371088026933, "tps": 14479, "wall": 44192.3} {"step": 9764, "train_loss": 3.6382155418395996, "lr": 0.0003272083222525097, "tps": 14479, "wall": 44197.4} {"step": 9765, "train_loss": 3.58848237991333, "lr": 0.00032719293241028843, "tps": 14479, "wall": 44202.5} {"step": 9766, "train_loss": 3.548959255218506, "lr": 0.00032717754135377973, "tps": 14479, "wall": 44207.6} {"step": 9767, "train_loss": 3.5008630752563477, "lr": 0.0003271621490831581, "tps": 14479, "wall": 44212.6} {"step": 9768, "train_loss": 3.631748676300049, "lr": 0.00032714675559859785, "tps": 14478, "wall": 44217.8} {"step": 9769, "train_loss": 3.4890122413635254, "lr": 0.00032713136090027335, "tps": 14478, "wall": 44222.9} {"step": 9770, "train_loss": 3.5301148891448975, "lr": 0.00032711596498835897, "tps": 14478, "wall": 44227.9} {"step": 9771, "train_loss": 3.5625171661376953, "lr": 0.0003271005678630292, "tps": 14478, "wall": 44233.0} {"step": 9772, "train_loss": 3.4920260906219482, "lr": 0.00032708516952445834, "tps": 14478, "wall": 44238.1} {"step": 9773, "train_loss": 3.643773078918457, "lr": 0.00032706976997282094, "tps": 14477, "wall": 44243.2} {"step": 9774, "train_loss": 3.5355918407440186, "lr": 0.0003270543692082914, "tps": 14477, "wall": 44248.3} {"step": 9775, "train_loss": 3.566993236541748, "lr": 0.0003270389672310441, "tps": 14477, "wall": 44253.4} {"step": 9776, "train_loss": 3.445950508117676, "lr": 0.00032702356404125366, "tps": 14477, "wall": 44258.4} {"step": 9777, "train_loss": 3.601221799850464, "lr": 0.0003270081596390944, "tps": 14477, "wall": 44263.5} {"step": 9778, "train_loss": 3.585038423538208, "lr": 0.000326992754024741, "tps": 14476, "wall": 44268.6} {"step": 9779, "train_loss": 3.3989124298095703, "lr": 0.00032697734719836787, "tps": 14476, "wall": 44273.7} {"step": 9780, "train_loss": 3.5311269760131836, "lr": 0.00032696193916014957, "tps": 14476, "wall": 44278.8} {"step": 9781, "train_loss": 3.5871002674102783, "lr": 0.0003269465299102607, "tps": 14476, "wall": 44284.0} {"step": 9782, "train_loss": 3.460456132888794, "lr": 0.0003269311194488756, "tps": 14476, "wall": 44289.1} {"step": 9783, "train_loss": 3.504380226135254, "lr": 0.00032691570777616916, "tps": 14476, "wall": 44294.2} {"step": 9784, "train_loss": 3.557823419570923, "lr": 0.00032690029489231573, "tps": 14475, "wall": 44299.3} {"step": 9785, "train_loss": 3.545731782913208, "lr": 0.00032688488079748995, "tps": 14475, "wall": 44304.4} {"step": 9786, "train_loss": 3.5583865642547607, "lr": 0.00032686946549186655, "tps": 14475, "wall": 44309.5} {"step": 9787, "train_loss": 3.463080406188965, "lr": 0.00032685404897561996, "tps": 14475, "wall": 44314.5} {"step": 9788, "train_loss": 3.4764294624328613, "lr": 0.0003268386312489249, "tps": 14475, "wall": 44319.6} {"step": 9789, "train_loss": 3.5093178749084473, "lr": 0.00032682321231195617, "tps": 14474, "wall": 44324.7} {"step": 9790, "train_loss": 3.5274577140808105, "lr": 0.00032680779216488824, "tps": 14474, "wall": 44329.8} {"step": 9791, "train_loss": 3.4649126529693604, "lr": 0.00032679237080789585, "tps": 14474, "wall": 44334.9} {"step": 9792, "train_loss": 3.4204137325286865, "lr": 0.0003267769482411537, "tps": 14474, "wall": 44340.0} {"step": 9793, "train_loss": 3.454836368560791, "lr": 0.00032676152446483653, "tps": 14474, "wall": 44345.1} {"step": 9794, "train_loss": 3.5834388732910156, "lr": 0.00032674609947911905, "tps": 14474, "wall": 44350.2} {"step": 9795, "train_loss": 3.513906478881836, "lr": 0.0003267306732841759, "tps": 14473, "wall": 44355.2} {"step": 9796, "train_loss": 3.5257863998413086, "lr": 0.000326715245880182, "tps": 14473, "wall": 44360.3} {"step": 9797, "train_loss": 3.547093629837036, "lr": 0.00032669981726731205, "tps": 14473, "wall": 44365.4} {"step": 9798, "train_loss": 3.5161898136138916, "lr": 0.00032668438744574074, "tps": 14473, "wall": 44370.4} {"step": 9799, "train_loss": 3.5829877853393555, "lr": 0.0003266689564156429, "tps": 14473, "wall": 44375.5} {"step": 9800, "train_loss": 3.527416467666626, "lr": 0.00032665352417719334, "tps": 14472, "wall": 44380.6} {"step": 9801, "train_loss": 3.556462287902832, "lr": 0.00032663809073056697, "tps": 14472, "wall": 44385.7} {"step": 9802, "train_loss": 3.4765355587005615, "lr": 0.00032662265607593847, "tps": 14472, "wall": 44390.7} {"step": 9803, "train_loss": 3.471951961517334, "lr": 0.0003266072202134828, "tps": 14472, "wall": 44395.9} {"step": 9804, "train_loss": 3.51680064201355, "lr": 0.0003265917831433747, "tps": 14472, "wall": 44401.0} {"step": 9805, "train_loss": 3.429063081741333, "lr": 0.00032657634486578916, "tps": 14472, "wall": 44406.0} {"step": 9806, "train_loss": 3.452672004699707, "lr": 0.000326560905380901, "tps": 14471, "wall": 44411.1} {"step": 9807, "train_loss": 3.431838035583496, "lr": 0.00032654546468888516, "tps": 14471, "wall": 44416.2} {"step": 9808, "train_loss": 3.436072826385498, "lr": 0.0003265300227899165, "tps": 14471, "wall": 44421.3} {"step": 9809, "train_loss": 3.5499207973480225, "lr": 0.00032651457968417005, "tps": 14471, "wall": 44426.4} {"step": 9810, "train_loss": 3.4199438095092773, "lr": 0.0003264991353718206, "tps": 14471, "wall": 44431.4} {"step": 9811, "train_loss": 3.5613865852355957, "lr": 0.00032648368985304326, "tps": 14470, "wall": 44436.5} {"step": 9812, "train_loss": 3.567521572113037, "lr": 0.00032646824312801285, "tps": 14470, "wall": 44441.6} {"step": 9813, "train_loss": 3.481773853302002, "lr": 0.00032645279519690444, "tps": 14470, "wall": 44446.6} {"step": 9814, "train_loss": 3.4602370262145996, "lr": 0.00032643734605989304, "tps": 14470, "wall": 44451.7} {"step": 9815, "train_loss": 3.484050989151001, "lr": 0.0003264218957171536, "tps": 14470, "wall": 44456.8} {"step": 9816, "train_loss": 3.59920072555542, "lr": 0.0003264064441688612, "tps": 14470, "wall": 44461.9} {"step": 9817, "train_loss": 3.592177629470825, "lr": 0.00032639099141519074, "tps": 14469, "wall": 44467.0} {"step": 9818, "train_loss": 3.4721922874450684, "lr": 0.0003263755374563175, "tps": 14469, "wall": 44472.1} {"step": 9819, "train_loss": 3.508829116821289, "lr": 0.00032636008229241636, "tps": 14469, "wall": 44477.2} {"step": 9820, "train_loss": 3.567370653152466, "lr": 0.00032634462592366246, "tps": 14469, "wall": 44482.2} {"step": 9821, "train_loss": 3.480077028274536, "lr": 0.00032632916835023093, "tps": 14469, "wall": 44487.3} {"step": 9822, "train_loss": 3.4397919178009033, "lr": 0.00032631370957229676, "tps": 14468, "wall": 44492.4} {"step": 9823, "train_loss": 3.4340145587921143, "lr": 0.00032629824959003515, "tps": 14468, "wall": 44497.5} {"step": 9824, "train_loss": 3.570028066635132, "lr": 0.00032628278840362126, "tps": 14468, "wall": 44502.6} {"step": 9825, "train_loss": 3.4553353786468506, "lr": 0.0003262673260132301, "tps": 14468, "wall": 44507.7} {"step": 9826, "train_loss": 3.3963255882263184, "lr": 0.00032625186241903696, "tps": 14468, "wall": 44512.7} {"step": 9827, "train_loss": 3.4805707931518555, "lr": 0.000326236397621217, "tps": 14468, "wall": 44517.9} {"step": 9828, "train_loss": 3.575383186340332, "lr": 0.00032622093161994536, "tps": 14467, "wall": 44522.9} {"step": 9829, "train_loss": 3.433928966522217, "lr": 0.0003262054644153973, "tps": 14467, "wall": 44528.0} {"step": 9830, "train_loss": 3.380549430847168, "lr": 0.000326189996007748, "tps": 14467, "wall": 44533.1} {"step": 9831, "train_loss": 3.504695415496826, "lr": 0.00032617452639717263, "tps": 14467, "wall": 44538.2} {"step": 9832, "train_loss": 3.5744285583496094, "lr": 0.0003261590555838465, "tps": 14467, "wall": 44543.2} {"step": 9833, "train_loss": 3.609628438949585, "lr": 0.0003261435835679449, "tps": 14467, "wall": 44548.3} {"step": 9834, "train_loss": 3.540691614151001, "lr": 0.0003261281103496429, "tps": 14466, "wall": 44553.4} {"step": 9835, "train_loss": 3.532169818878174, "lr": 0.00032611263592911605, "tps": 14466, "wall": 44558.5} {"step": 9836, "train_loss": 3.4691686630249023, "lr": 0.0003260971603065395, "tps": 14466, "wall": 44563.5} {"step": 9837, "train_loss": 3.4929494857788086, "lr": 0.0003260816834820885, "tps": 14466, "wall": 44568.6} {"step": 9838, "train_loss": 3.4888854026794434, "lr": 0.0003260662054559386, "tps": 14466, "wall": 44573.7} {"step": 9839, "train_loss": 3.5356974601745605, "lr": 0.00032605072622826485, "tps": 14465, "wall": 44578.8} {"step": 9840, "train_loss": 3.4873571395874023, "lr": 0.00032603524579924285, "tps": 14465, "wall": 44583.9} {"step": 9841, "train_loss": 3.4673402309417725, "lr": 0.00032601976416904774, "tps": 14465, "wall": 44589.0} {"step": 9842, "train_loss": 3.475512981414795, "lr": 0.0003260042813378551, "tps": 14465, "wall": 44594.1} {"step": 9843, "train_loss": 3.5149898529052734, "lr": 0.0003259887973058401, "tps": 14465, "wall": 44599.1} {"step": 9844, "train_loss": 3.542191743850708, "lr": 0.00032597331207317835, "tps": 14465, "wall": 44604.2} {"step": 9845, "train_loss": 3.586313247680664, "lr": 0.0003259578256400452, "tps": 14464, "wall": 44609.3} {"step": 9846, "train_loss": 3.4807863235473633, "lr": 0.00032594233800661604, "tps": 14464, "wall": 44614.3} {"step": 9847, "train_loss": 3.5589194297790527, "lr": 0.0003259268491730664, "tps": 14464, "wall": 44619.4} {"step": 9848, "train_loss": 3.505296230316162, "lr": 0.0003259113591395716, "tps": 14464, "wall": 44624.5} {"step": 9849, "train_loss": 3.5084643363952637, "lr": 0.00032589586790630724, "tps": 14464, "wall": 44629.6} {"step": 9850, "train_loss": 3.5751752853393555, "lr": 0.0003258803754734488, "tps": 14463, "wall": 44634.7} {"step": 9851, "train_loss": 3.563455820083618, "lr": 0.00032586488184117163, "tps": 14463, "wall": 44639.8} {"step": 9852, "train_loss": 3.4441754817962646, "lr": 0.00032584938700965145, "tps": 14463, "wall": 44644.9} {"step": 9853, "train_loss": 3.467489004135132, "lr": 0.0003258338909790637, "tps": 14463, "wall": 44650.0} {"step": 9854, "train_loss": 3.409332752227783, "lr": 0.0003258183937495838, "tps": 14463, "wall": 44655.1} {"step": 9855, "train_loss": 3.567884922027588, "lr": 0.00032580289532138743, "tps": 14463, "wall": 44660.1} {"step": 9856, "train_loss": 3.5541462898254395, "lr": 0.00032578739569465024, "tps": 14462, "wall": 44665.2} {"step": 9857, "train_loss": 3.576490879058838, "lr": 0.00032577189486954764, "tps": 14462, "wall": 44670.3} {"step": 9858, "train_loss": 3.4411869049072266, "lr": 0.00032575639284625527, "tps": 14462, "wall": 44675.3} {"step": 9859, "train_loss": 3.619919538497925, "lr": 0.0003257408896249488, "tps": 14462, "wall": 44680.4} {"step": 9860, "train_loss": 3.5533008575439453, "lr": 0.0003257253852058038, "tps": 14462, "wall": 44685.5} {"step": 9861, "train_loss": 3.455554485321045, "lr": 0.00032570987958899597, "tps": 14462, "wall": 44690.5} {"step": 9862, "train_loss": 3.405087947845459, "lr": 0.0003256943727747008, "tps": 14461, "wall": 44695.7} {"step": 9863, "train_loss": 3.5601806640625, "lr": 0.00032567886476309407, "tps": 14461, "wall": 44700.7} {"step": 9864, "train_loss": 3.555513858795166, "lr": 0.00032566335555435155, "tps": 14461, "wall": 44705.8} {"step": 9865, "train_loss": 3.5069663524627686, "lr": 0.0003256478451486487, "tps": 14461, "wall": 44710.9} {"step": 9866, "train_loss": 3.5809314250946045, "lr": 0.0003256323335461614, "tps": 14461, "wall": 44716.0} {"step": 9867, "train_loss": 3.497081756591797, "lr": 0.00032561682074706534, "tps": 14460, "wall": 44721.0} {"step": 9868, "train_loss": 3.409553050994873, "lr": 0.0003256013067515362, "tps": 14460, "wall": 44726.1} {"step": 9869, "train_loss": 3.4826197624206543, "lr": 0.0003255857915597497, "tps": 14460, "wall": 44731.1} {"step": 9870, "train_loss": 3.529294013977051, "lr": 0.0003255702751718817, "tps": 14460, "wall": 44736.2} {"step": 9871, "train_loss": 3.463557243347168, "lr": 0.00032555475758810784, "tps": 14460, "wall": 44741.3} {"step": 9872, "train_loss": 3.5122241973876953, "lr": 0.0003255392388086041, "tps": 14460, "wall": 44746.3} {"step": 9873, "train_loss": 3.571463108062744, "lr": 0.000325523718833546, "tps": 14459, "wall": 44751.4} {"step": 9874, "train_loss": 3.473306894302368, "lr": 0.00032550819766310964, "tps": 14459, "wall": 44756.5} {"step": 9875, "train_loss": 3.496689796447754, "lr": 0.00032549267529747065, "tps": 14459, "wall": 44761.6} {"step": 9876, "train_loss": 3.5677990913391113, "lr": 0.0003254771517368049, "tps": 14459, "wall": 44766.7} {"step": 9877, "train_loss": 3.4725918769836426, "lr": 0.00032546162698128826, "tps": 14459, "wall": 44771.8} {"step": 9878, "train_loss": 3.5618906021118164, "lr": 0.0003254461010310967, "tps": 14459, "wall": 44776.9} {"step": 9879, "train_loss": 3.408583641052246, "lr": 0.0003254305738864059, "tps": 14458, "wall": 44781.9} {"step": 9880, "train_loss": 3.5385420322418213, "lr": 0.0003254150455473919, "tps": 14458, "wall": 44787.0} {"step": 9881, "train_loss": 3.4133198261260986, "lr": 0.00032539951601423056, "tps": 14458, "wall": 44792.0} {"step": 9882, "train_loss": 3.438995361328125, "lr": 0.00032538398528709784, "tps": 14458, "wall": 44797.1} {"step": 9883, "train_loss": 3.448310375213623, "lr": 0.0003253684533661695, "tps": 14458, "wall": 44802.2} {"step": 9884, "train_loss": 3.4626858234405518, "lr": 0.00032535292025162176, "tps": 14457, "wall": 44807.3} {"step": 9885, "train_loss": 3.5071144104003906, "lr": 0.00032533738594363044, "tps": 14457, "wall": 44812.4} {"step": 9886, "train_loss": 3.4382622241973877, "lr": 0.00032532185044237147, "tps": 14457, "wall": 44817.5} {"step": 9887, "train_loss": 3.5447587966918945, "lr": 0.0003253063137480208, "tps": 14457, "wall": 44822.6} {"step": 9888, "train_loss": 3.5108909606933594, "lr": 0.0003252907758607546, "tps": 14457, "wall": 44827.7} {"step": 9889, "train_loss": 3.4528005123138428, "lr": 0.00032527523678074885, "tps": 14457, "wall": 44832.8} {"step": 9890, "train_loss": 3.6343064308166504, "lr": 0.0003252596965081794, "tps": 14456, "wall": 44837.9} {"step": 9891, "train_loss": 3.4434986114501953, "lr": 0.0003252441550432225, "tps": 14456, "wall": 44842.9} {"step": 9892, "train_loss": 3.53771710395813, "lr": 0.0003252286123860541, "tps": 14456, "wall": 44848.0} {"step": 9893, "train_loss": 3.5792341232299805, "lr": 0.00032521306853685027, "tps": 14456, "wall": 44853.1} {"step": 9894, "train_loss": 3.560328245162964, "lr": 0.0003251975234957871, "tps": 14456, "wall": 44858.1} {"step": 9895, "train_loss": 3.5703964233398438, "lr": 0.0003251819772630407, "tps": 14456, "wall": 44863.2} {"step": 9896, "train_loss": 3.6521918773651123, "lr": 0.0003251664298387872, "tps": 14455, "wall": 44868.2} {"step": 9897, "train_loss": 3.5200295448303223, "lr": 0.00032515088122320266, "tps": 14455, "wall": 44873.3} {"step": 9898, "train_loss": 3.5523457527160645, "lr": 0.0003251353314164633, "tps": 14455, "wall": 44878.4} {"step": 9899, "train_loss": 3.4898080825805664, "lr": 0.00032511978041874516, "tps": 14455, "wall": 44883.5} {"step": 9900, "train_loss": 3.3937582969665527, "lr": 0.0003251042282302245, "tps": 14455, "wall": 44888.6} {"step": 9901, "train_loss": 3.4522101879119873, "lr": 0.0003250886748510774, "tps": 14454, "wall": 44893.7} {"step": 9902, "train_loss": 3.545334815979004, "lr": 0.00032507312028148014, "tps": 14454, "wall": 44898.8} {"step": 9903, "train_loss": 3.548036813735962, "lr": 0.0003250575645216089, "tps": 14454, "wall": 44903.8} {"step": 9904, "train_loss": 3.6307544708251953, "lr": 0.0003250420075716398, "tps": 14454, "wall": 44908.9} {"step": 9905, "train_loss": 3.6423721313476562, "lr": 0.00032502644943174926, "tps": 14454, "wall": 44914.0} {"step": 9906, "train_loss": 3.5173394680023193, "lr": 0.00032501089010211336, "tps": 14454, "wall": 44919.1} {"step": 9907, "train_loss": 3.5319879055023193, "lr": 0.0003249953295829085, "tps": 14453, "wall": 44924.2} {"step": 9908, "train_loss": 3.561997890472412, "lr": 0.00032497976787431083, "tps": 14453, "wall": 44929.2} {"step": 9909, "train_loss": 3.4827425479888916, "lr": 0.0003249642049764966, "tps": 14453, "wall": 44934.3} {"step": 9910, "train_loss": 3.5229909420013428, "lr": 0.0003249486408896423, "tps": 14453, "wall": 44939.4} {"step": 9911, "train_loss": 3.5383691787719727, "lr": 0.000324933075613924, "tps": 14453, "wall": 44944.5} {"step": 9912, "train_loss": 3.360569477081299, "lr": 0.0003249175091495182, "tps": 14453, "wall": 44949.6} {"step": 9913, "train_loss": 3.516439437866211, "lr": 0.00032490194149660117, "tps": 14452, "wall": 44954.7} {"step": 9914, "train_loss": 3.5954208374023438, "lr": 0.0003248863726553492, "tps": 14452, "wall": 44959.7} {"step": 9915, "train_loss": 3.5280251502990723, "lr": 0.00032487080262593885, "tps": 14452, "wall": 44964.8} {"step": 9916, "train_loss": 3.535935401916504, "lr": 0.0003248552314085463, "tps": 14452, "wall": 44969.9} {"step": 9917, "train_loss": 3.4435977935791016, "lr": 0.0003248396590033481, "tps": 14452, "wall": 44975.0} {"step": 9918, "train_loss": 3.570119857788086, "lr": 0.00032482408541052043, "tps": 14451, "wall": 44980.1} {"step": 9919, "train_loss": 3.4722399711608887, "lr": 0.00032480851063023997, "tps": 14451, "wall": 44985.1} {"step": 9920, "train_loss": 3.5704710483551025, "lr": 0.000324792934662683, "tps": 14451, "wall": 44990.2} {"step": 9921, "train_loss": 3.5448966026306152, "lr": 0.00032477735750802595, "tps": 14451, "wall": 44995.4} {"step": 9922, "train_loss": 3.537924289703369, "lr": 0.00032476177916644536, "tps": 14451, "wall": 45000.4} {"step": 9923, "train_loss": 3.527474880218506, "lr": 0.00032474619963811767, "tps": 14451, "wall": 45005.5} {"step": 9924, "train_loss": 3.5196380615234375, "lr": 0.0003247306189232194, "tps": 14450, "wall": 45010.6} {"step": 9925, "train_loss": 3.5225231647491455, "lr": 0.00032471503702192697, "tps": 14450, "wall": 45015.7} {"step": 9926, "train_loss": 3.4545702934265137, "lr": 0.0003246994539344169, "tps": 14450, "wall": 45020.7} {"step": 9927, "train_loss": 3.45967435836792, "lr": 0.0003246838696608658, "tps": 14450, "wall": 45025.8} {"step": 9928, "train_loss": 3.523667335510254, "lr": 0.0003246682842014502, "tps": 14450, "wall": 45030.9} {"step": 9929, "train_loss": 3.5022921562194824, "lr": 0.0003246526975563465, "tps": 14450, "wall": 45036.0} {"step": 9930, "train_loss": 3.4301695823669434, "lr": 0.0003246371097257315, "tps": 14449, "wall": 45041.0} {"step": 9931, "train_loss": 3.381530523300171, "lr": 0.00032462152070978164, "tps": 14449, "wall": 45046.1} {"step": 9932, "train_loss": 3.3862414360046387, "lr": 0.0003246059305086735, "tps": 14449, "wall": 45051.1} {"step": 9933, "train_loss": 3.4856886863708496, "lr": 0.0003245903391225837, "tps": 14449, "wall": 45056.3} {"step": 9934, "train_loss": 3.4677371978759766, "lr": 0.00032457474655168896, "tps": 14449, "wall": 45061.4} {"step": 9935, "train_loss": 3.4899520874023438, "lr": 0.00032455915279616573, "tps": 14449, "wall": 45066.5} {"step": 9936, "train_loss": 3.4974093437194824, "lr": 0.0003245435578561908, "tps": 14448, "wall": 45071.5} {"step": 9937, "train_loss": 3.368987560272217, "lr": 0.0003245279617319408, "tps": 14448, "wall": 45076.6} {"step": 9938, "train_loss": 3.4973554611206055, "lr": 0.0003245123644235924, "tps": 14448, "wall": 45081.7} {"step": 9939, "train_loss": 3.3868560791015625, "lr": 0.0003244967659313223, "tps": 14448, "wall": 45086.7} {"step": 9940, "train_loss": 3.5407397747039795, "lr": 0.0003244811662553071, "tps": 14448, "wall": 45091.8} {"step": 9941, "train_loss": 3.404909372329712, "lr": 0.00032446556539572364, "tps": 14447, "wall": 45096.9} {"step": 9942, "train_loss": 3.5426506996154785, "lr": 0.00032444996335274863, "tps": 14447, "wall": 45101.9} {"step": 9943, "train_loss": 3.5527143478393555, "lr": 0.00032443436012655885, "tps": 14447, "wall": 45107.0} {"step": 9944, "train_loss": 3.446317672729492, "lr": 0.0003244187557173309, "tps": 14447, "wall": 45112.1} {"step": 9945, "train_loss": 3.4580554962158203, "lr": 0.00032440315012524163, "tps": 14447, "wall": 45117.2} {"step": 9946, "train_loss": 3.5163822174072266, "lr": 0.00032438754335046785, "tps": 14447, "wall": 45122.3} {"step": 9947, "train_loss": 3.5208864212036133, "lr": 0.0003243719353931863, "tps": 14446, "wall": 45127.4} {"step": 9948, "train_loss": 3.5079121589660645, "lr": 0.00032435632625357384, "tps": 14446, "wall": 45132.5} {"step": 9949, "train_loss": 3.573735237121582, "lr": 0.00032434071593180733, "tps": 14446, "wall": 45137.6} {"step": 9950, "train_loss": 3.5020389556884766, "lr": 0.00032432510442806346, "tps": 14446, "wall": 45142.7} {"step": 9951, "train_loss": 3.350834846496582, "lr": 0.00032430949174251916, "tps": 14446, "wall": 45147.8} {"step": 9952, "train_loss": 3.4735918045043945, "lr": 0.00032429387787535137, "tps": 14446, "wall": 45152.8} {"step": 9953, "train_loss": 3.542428493499756, "lr": 0.00032427826282673683, "tps": 14445, "wall": 45157.9} {"step": 9954, "train_loss": 3.4238977432250977, "lr": 0.0003242626465968525, "tps": 14445, "wall": 45163.0} {"step": 9955, "train_loss": 3.478165626525879, "lr": 0.0003242470291858753, "tps": 14445, "wall": 45168.0} {"step": 9956, "train_loss": 3.4680004119873047, "lr": 0.00032423141059398207, "tps": 14445, "wall": 45173.1} {"step": 9957, "train_loss": 3.6253209114074707, "lr": 0.0003242157908213498, "tps": 14445, "wall": 45178.2} {"step": 9958, "train_loss": 3.4396016597747803, "lr": 0.0003242001698681554, "tps": 14445, "wall": 45183.3} {"step": 9959, "train_loss": 3.558929920196533, "lr": 0.00032418454773457594, "tps": 14444, "wall": 45188.4} {"step": 9960, "train_loss": 3.531376361846924, "lr": 0.00032416892442078813, "tps": 14444, "wall": 45193.5} {"step": 9961, "train_loss": 3.466202735900879, "lr": 0.0003241532999269692, "tps": 14444, "wall": 45198.5} {"step": 9962, "train_loss": 3.5697097778320312, "lr": 0.000324137674253296, "tps": 14444, "wall": 45203.7} {"step": 9963, "train_loss": 3.5494303703308105, "lr": 0.0003241220473999456, "tps": 14444, "wall": 45208.7} {"step": 9964, "train_loss": 3.4769721031188965, "lr": 0.0003241064193670951, "tps": 14443, "wall": 45213.8} {"step": 9965, "train_loss": 3.437157154083252, "lr": 0.0003240907901549214, "tps": 14443, "wall": 45218.9} {"step": 9966, "train_loss": 3.498772621154785, "lr": 0.00032407515976360155, "tps": 14443, "wall": 45224.0} {"step": 9967, "train_loss": 3.4625139236450195, "lr": 0.00032405952819331273, "tps": 14443, "wall": 45229.0} {"step": 9968, "train_loss": 3.439148187637329, "lr": 0.0003240438954442319, "tps": 14443, "wall": 45234.1} {"step": 9969, "train_loss": 3.4507570266723633, "lr": 0.00032402826151653615, "tps": 14443, "wall": 45239.2} {"step": 9970, "train_loss": 3.4589600563049316, "lr": 0.00032401262641040276, "tps": 14442, "wall": 45244.3} {"step": 9971, "train_loss": 3.4835901260375977, "lr": 0.00032399699012600864, "tps": 14442, "wall": 45249.4} {"step": 9972, "train_loss": 3.5721435546875, "lr": 0.00032398135266353096, "tps": 14442, "wall": 45254.5} {"step": 9973, "train_loss": 3.4863474369049072, "lr": 0.00032396571402314693, "tps": 14442, "wall": 45259.6} {"step": 9974, "train_loss": 3.4328036308288574, "lr": 0.0003239500742050336, "tps": 14442, "wall": 45264.6} {"step": 9975, "train_loss": 3.5633246898651123, "lr": 0.00032393443320936823, "tps": 14442, "wall": 45269.7} {"step": 9976, "train_loss": 3.485522508621216, "lr": 0.00032391879103632805, "tps": 14441, "wall": 45274.8} {"step": 9977, "train_loss": 3.5318374633789062, "lr": 0.00032390314768609014, "tps": 14441, "wall": 45279.8} {"step": 9978, "train_loss": 3.459437370300293, "lr": 0.00032388750315883174, "tps": 14441, "wall": 45284.9} {"step": 9979, "train_loss": 3.4870545864105225, "lr": 0.0003238718574547301, "tps": 14441, "wall": 45290.0} {"step": 9980, "train_loss": 3.465094804763794, "lr": 0.0003238562105739624, "tps": 14441, "wall": 45295.1} {"step": 9981, "train_loss": 3.538266658782959, "lr": 0.000323840562516706, "tps": 14441, "wall": 45300.2} {"step": 9982, "train_loss": 3.4887242317199707, "lr": 0.00032382491328313803, "tps": 14440, "wall": 45305.3} {"step": 9983, "train_loss": 3.5235230922698975, "lr": 0.0003238092628734359, "tps": 14440, "wall": 45310.4} {"step": 9984, "train_loss": 3.524125814437866, "lr": 0.0003237936112877767, "tps": 14440, "wall": 45315.4} {"step": 9985, "train_loss": 3.5114240646362305, "lr": 0.0003237779585263379, "tps": 14440, "wall": 45320.5} {"step": 9986, "train_loss": 3.598311424255371, "lr": 0.0003237623045892969, "tps": 14440, "wall": 45325.5} {"step": 9987, "train_loss": 3.4113221168518066, "lr": 0.0003237466494768308, "tps": 14439, "wall": 45330.6} {"step": 9988, "train_loss": 3.4893457889556885, "lr": 0.000323730993189117, "tps": 14439, "wall": 45335.7} {"step": 9989, "train_loss": 3.4522042274475098, "lr": 0.0003237153357263329, "tps": 14439, "wall": 45340.7} {"step": 9990, "train_loss": 3.5444343090057373, "lr": 0.0003236996770886559, "tps": 14439, "wall": 45345.8} {"step": 9991, "train_loss": 3.4618735313415527, "lr": 0.0003236840172762634, "tps": 14439, "wall": 45350.9} {"step": 9992, "train_loss": 3.5053606033325195, "lr": 0.0003236683562893327, "tps": 14439, "wall": 45356.1} {"step": 9993, "train_loss": 3.522653818130493, "lr": 0.00032365269412804124, "tps": 14438, "wall": 45361.1} {"step": 9994, "train_loss": 3.4471793174743652, "lr": 0.00032363703079256646, "tps": 14438, "wall": 45366.2} {"step": 9995, "train_loss": 3.497371196746826, "lr": 0.0003236213662830858, "tps": 14438, "wall": 45371.2} {"step": 9996, "train_loss": 3.626009464263916, "lr": 0.0003236057005997767, "tps": 14438, "wall": 45376.3} {"step": 9997, "train_loss": 3.385033130645752, "lr": 0.00032359003374281655, "tps": 14438, "wall": 45381.4} {"step": 9998, "train_loss": 3.5067408084869385, "lr": 0.000323574365712383, "tps": 14438, "wall": 45386.5} {"step": 9999, "train_loss": 3.3855366706848145, "lr": 0.0003235586965086534, "tps": 14437, "wall": 45391.5} {"step": 10000, "train_loss": 3.5094106197357178, "lr": 0.00032354302613180525, "tps": 14437, "wall": 45396.6, "val_loss_monitor": 3.537727957250152, "val_loss_full": 3.553138615312463} {"step": 10001, "train_loss": 3.6016042232513428, "lr": 0.0003235273545820161, "tps": 14382, "wall": 45575.2} {"step": 10002, "train_loss": 3.4496099948883057, "lr": 0.0003235116818594635, "tps": 14382, "wall": 45580.3} {"step": 10003, "train_loss": 3.4186248779296875, "lr": 0.0003234960079643249, "tps": 14382, "wall": 45585.5} {"step": 10004, "train_loss": 3.4786903858184814, "lr": 0.000323480332896778, "tps": 14382, "wall": 45590.6} {"step": 10005, "train_loss": 3.4948010444641113, "lr": 0.0003234646566570003, "tps": 14381, "wall": 45595.7} {"step": 10006, "train_loss": 3.463167428970337, "lr": 0.00032344897924516927, "tps": 14381, "wall": 45600.8} {"step": 10007, "train_loss": 3.44720458984375, "lr": 0.0003234333006614627, "tps": 14381, "wall": 45605.9} {"step": 10008, "train_loss": 3.399437189102173, "lr": 0.0003234176209060581, "tps": 14381, "wall": 45611.0} {"step": 10009, "train_loss": 3.5110201835632324, "lr": 0.00032340193997913307, "tps": 14381, "wall": 45616.1} {"step": 10010, "train_loss": 3.4105935096740723, "lr": 0.0003233862578808653, "tps": 14381, "wall": 45621.2} {"step": 10011, "train_loss": 3.4707589149475098, "lr": 0.00032337057461143234, "tps": 14380, "wall": 45626.3} {"step": 10012, "train_loss": 3.535511016845703, "lr": 0.00032335489017101197, "tps": 14380, "wall": 45631.4} {"step": 10013, "train_loss": 3.5691118240356445, "lr": 0.0003233392045597819, "tps": 14380, "wall": 45636.4} {"step": 10014, "train_loss": 3.534139633178711, "lr": 0.0003233235177779196, "tps": 14380, "wall": 45641.5} {"step": 10015, "train_loss": 3.5962228775024414, "lr": 0.0003233078298256029, "tps": 14380, "wall": 45646.6} {"step": 10016, "train_loss": 3.622276544570923, "lr": 0.00032329214070300955, "tps": 14380, "wall": 45651.7} {"step": 10017, "train_loss": 3.472806215286255, "lr": 0.0003232764504103173, "tps": 14379, "wall": 45656.8} {"step": 10018, "train_loss": 3.464841365814209, "lr": 0.00032326075894770375, "tps": 14379, "wall": 45661.8} {"step": 10019, "train_loss": 3.5164031982421875, "lr": 0.00032324506631534677, "tps": 14379, "wall": 45666.9} {"step": 10020, "train_loss": 3.4787044525146484, "lr": 0.00032322937251342404, "tps": 14379, "wall": 45672.0} {"step": 10021, "train_loss": 3.530331611633301, "lr": 0.0003232136775421135, "tps": 14379, "wall": 45677.1} {"step": 10022, "train_loss": 3.459419012069702, "lr": 0.00032319798140159275, "tps": 14379, "wall": 45682.1} {"step": 10023, "train_loss": 3.499852418899536, "lr": 0.0003231822840920397, "tps": 14378, "wall": 45687.2} {"step": 10024, "train_loss": 3.6146903038024902, "lr": 0.00032316658561363213, "tps": 14378, "wall": 45692.3} {"step": 10025, "train_loss": 3.5156443119049072, "lr": 0.000323150885966548, "tps": 14378, "wall": 45697.3} {"step": 10026, "train_loss": 3.4956841468811035, "lr": 0.00032313518515096493, "tps": 14378, "wall": 45702.4} {"step": 10027, "train_loss": 3.4473187923431396, "lr": 0.00032311948316706096, "tps": 14378, "wall": 45707.5} {"step": 10028, "train_loss": 3.4621682167053223, "lr": 0.00032310378001501394, "tps": 14378, "wall": 45712.6} {"step": 10029, "train_loss": 3.538628578186035, "lr": 0.0003230880756950017, "tps": 14377, "wall": 45717.7} {"step": 10030, "train_loss": 3.536057949066162, "lr": 0.0003230723702072021, "tps": 14377, "wall": 45722.8} {"step": 10031, "train_loss": 3.5258736610412598, "lr": 0.0003230566635517932, "tps": 14377, "wall": 45727.8} {"step": 10032, "train_loss": 3.501695156097412, "lr": 0.00032304095572895276, "tps": 14377, "wall": 45732.9} {"step": 10033, "train_loss": 3.4632301330566406, "lr": 0.00032302524673885884, "tps": 14377, "wall": 45738.0} {"step": 10034, "train_loss": 3.4519453048706055, "lr": 0.00032300953658168937, "tps": 14377, "wall": 45743.0} {"step": 10035, "train_loss": 3.4838027954101562, "lr": 0.0003229938252576223, "tps": 14376, "wall": 45748.1} {"step": 10036, "train_loss": 3.534233808517456, "lr": 0.00032297811276683555, "tps": 14376, "wall": 45753.2} {"step": 10037, "train_loss": 3.524613380432129, "lr": 0.00032296239910950726, "tps": 14376, "wall": 45758.2} {"step": 10038, "train_loss": 3.518061399459839, "lr": 0.00032294668428581525, "tps": 14376, "wall": 45763.3} {"step": 10039, "train_loss": 3.5438232421875, "lr": 0.00032293096829593765, "tps": 14376, "wall": 45768.3} {"step": 10040, "train_loss": 3.349931001663208, "lr": 0.0003229152511400525, "tps": 14376, "wall": 45773.4} {"step": 10041, "train_loss": 3.450833320617676, "lr": 0.0003228995328183378, "tps": 14376, "wall": 45778.5} {"step": 10042, "train_loss": 3.5671606063842773, "lr": 0.0003228838133309717, "tps": 14375, "wall": 45783.6} {"step": 10043, "train_loss": 3.534135341644287, "lr": 0.00032286809267813207, "tps": 14375, "wall": 45788.7} {"step": 10044, "train_loss": 3.3649582862854004, "lr": 0.0003228523708599972, "tps": 14375, "wall": 45793.8} {"step": 10045, "train_loss": 3.543881416320801, "lr": 0.0003228366478767451, "tps": 14375, "wall": 45798.8} {"step": 10046, "train_loss": 3.4727914333343506, "lr": 0.00032282092372855386, "tps": 14375, "wall": 45803.9} {"step": 10047, "train_loss": 3.617255210876465, "lr": 0.00032280519841560167, "tps": 14375, "wall": 45809.0} {"step": 10048, "train_loss": 3.446932792663574, "lr": 0.00032278947193806656, "tps": 14374, "wall": 45814.1} {"step": 10049, "train_loss": 3.567416191101074, "lr": 0.00032277374429612684, "tps": 14374, "wall": 45819.1} {"step": 10050, "train_loss": 3.561079740524292, "lr": 0.0003227580154899606, "tps": 14374, "wall": 45824.2} {"step": 10051, "train_loss": 3.371342658996582, "lr": 0.0003227422855197459, "tps": 14374, "wall": 45829.3} {"step": 10052, "train_loss": 3.5852160453796387, "lr": 0.00032272655438566103, "tps": 14374, "wall": 45834.4} {"step": 10053, "train_loss": 3.43485164642334, "lr": 0.00032271082208788434, "tps": 14374, "wall": 45839.5} {"step": 10054, "train_loss": 3.4915804862976074, "lr": 0.0003226950886265938, "tps": 14373, "wall": 45844.6} {"step": 10055, "train_loss": 3.4805731773376465, "lr": 0.0003226793540019677, "tps": 14373, "wall": 45849.7} {"step": 10056, "train_loss": 3.5916004180908203, "lr": 0.0003226636182141844, "tps": 14373, "wall": 45854.8} {"step": 10057, "train_loss": 3.5387346744537354, "lr": 0.00032264788126342206, "tps": 14373, "wall": 45859.9} {"step": 10058, "train_loss": 3.4841744899749756, "lr": 0.0003226321431498589, "tps": 14373, "wall": 45864.9} {"step": 10059, "train_loss": 3.5571022033691406, "lr": 0.00032261640387367334, "tps": 14373, "wall": 45870.0} {"step": 10060, "train_loss": 3.3931150436401367, "lr": 0.00032260066343504364, "tps": 14372, "wall": 45875.1} {"step": 10061, "train_loss": 3.5660274028778076, "lr": 0.000322584921834148, "tps": 14372, "wall": 45880.1} {"step": 10062, "train_loss": 3.481654167175293, "lr": 0.00032256917907116483, "tps": 14372, "wall": 45885.2} {"step": 10063, "train_loss": 3.3768792152404785, "lr": 0.0003225534351462725, "tps": 14372, "wall": 45890.2} {"step": 10064, "train_loss": 3.54490327835083, "lr": 0.00032253769005964925, "tps": 14372, "wall": 45895.4} {"step": 10065, "train_loss": 3.4769463539123535, "lr": 0.0003225219438114735, "tps": 14372, "wall": 45900.4} {"step": 10066, "train_loss": 3.4676496982574463, "lr": 0.00032250619640192366, "tps": 14371, "wall": 45905.5} {"step": 10067, "train_loss": 3.5573570728302, "lr": 0.0003224904478311781, "tps": 14371, "wall": 45910.6} {"step": 10068, "train_loss": 3.652531147003174, "lr": 0.0003224746980994152, "tps": 14371, "wall": 45915.7} {"step": 10069, "train_loss": 3.526022434234619, "lr": 0.00032245894720681333, "tps": 14371, "wall": 45920.8} {"step": 10070, "train_loss": 3.484226942062378, "lr": 0.000322443195153551, "tps": 14371, "wall": 45925.8} {"step": 10071, "train_loss": 3.5156829357147217, "lr": 0.00032242744193980655, "tps": 14371, "wall": 45930.9} {"step": 10072, "train_loss": 3.5571465492248535, "lr": 0.00032241168756575855, "tps": 14370, "wall": 45936.0} {"step": 10073, "train_loss": 3.5523972511291504, "lr": 0.0003223959320315854, "tps": 14370, "wall": 45941.1} {"step": 10074, "train_loss": 3.53018856048584, "lr": 0.00032238017533746556, "tps": 14370, "wall": 45946.2} {"step": 10075, "train_loss": 3.5303783416748047, "lr": 0.0003223644174835776, "tps": 14370, "wall": 45951.2} {"step": 10076, "train_loss": 3.4861764907836914, "lr": 0.0003223486584701, "tps": 14370, "wall": 45956.4} {"step": 10077, "train_loss": 3.4427785873413086, "lr": 0.0003223328982972112, "tps": 14370, "wall": 45961.5} {"step": 10078, "train_loss": 3.507302761077881, "lr": 0.00032231713696508985, "tps": 14369, "wall": 45966.5} {"step": 10079, "train_loss": 3.4876201152801514, "lr": 0.0003223013744739144, "tps": 14369, "wall": 45971.7} {"step": 10080, "train_loss": 3.5245437622070312, "lr": 0.00032228561082386345, "tps": 14369, "wall": 45976.7} {"step": 10081, "train_loss": 3.34220552444458, "lr": 0.0003222698460151155, "tps": 14369, "wall": 45981.8} {"step": 10082, "train_loss": 3.495073080062866, "lr": 0.0003222540800478493, "tps": 14369, "wall": 45986.8} {"step": 10083, "train_loss": 3.5003280639648438, "lr": 0.0003222383129222434, "tps": 14369, "wall": 45991.9} {"step": 10084, "train_loss": 3.538555860519409, "lr": 0.0003222225446384762, "tps": 14369, "wall": 45997.0} {"step": 10085, "train_loss": 3.40651798248291, "lr": 0.0003222067751967266, "tps": 14368, "wall": 46002.0} {"step": 10086, "train_loss": 3.389850616455078, "lr": 0.0003221910045971731, "tps": 14368, "wall": 46007.1} {"step": 10087, "train_loss": 3.512739658355713, "lr": 0.00032217523283999437, "tps": 14368, "wall": 46012.1} {"step": 10088, "train_loss": 3.513942241668701, "lr": 0.00032215945992536903, "tps": 14368, "wall": 46017.3} {"step": 10089, "train_loss": 3.3656234741210938, "lr": 0.00032214368585347584, "tps": 14368, "wall": 46022.3} {"step": 10090, "train_loss": 3.5601320266723633, "lr": 0.0003221279106244934, "tps": 14368, "wall": 46027.4} {"step": 10091, "train_loss": 3.4958558082580566, "lr": 0.00032211213423860054, "tps": 14367, "wall": 46032.5} {"step": 10092, "train_loss": 3.480587959289551, "lr": 0.0003220963566959759, "tps": 14367, "wall": 46037.6} {"step": 10093, "train_loss": 3.4586944580078125, "lr": 0.0003220805779967982, "tps": 14367, "wall": 46042.7} {"step": 10094, "train_loss": 3.5182442665100098, "lr": 0.0003220647981412461, "tps": 14367, "wall": 46047.7} {"step": 10095, "train_loss": 3.5212182998657227, "lr": 0.00032204901712949854, "tps": 14367, "wall": 46052.8} {"step": 10096, "train_loss": 3.4615979194641113, "lr": 0.0003220332349617342, "tps": 14367, "wall": 46057.9} {"step": 10097, "train_loss": 3.484020233154297, "lr": 0.0003220174516381318, "tps": 14366, "wall": 46062.9} {"step": 10098, "train_loss": 3.4926443099975586, "lr": 0.0003220016671588702, "tps": 14366, "wall": 46068.0} {"step": 10099, "train_loss": 3.5000405311584473, "lr": 0.0003219858815241282, "tps": 14366, "wall": 46073.0} {"step": 10100, "train_loss": 3.4905691146850586, "lr": 0.00032197009473408465, "tps": 14366, "wall": 46078.2} {"step": 10101, "train_loss": 3.5036559104919434, "lr": 0.0003219543067889183, "tps": 14366, "wall": 46083.2} {"step": 10102, "train_loss": 3.5569591522216797, "lr": 0.0003219385176888081, "tps": 14366, "wall": 46088.3} {"step": 10103, "train_loss": 3.5031092166900635, "lr": 0.0003219227274339328, "tps": 14365, "wall": 46093.4} {"step": 10104, "train_loss": 3.476350784301758, "lr": 0.00032190693602447137, "tps": 14365, "wall": 46098.5} {"step": 10105, "train_loss": 3.507528066635132, "lr": 0.00032189114346060265, "tps": 14365, "wall": 46103.8} {"step": 10106, "train_loss": 3.5509629249572754, "lr": 0.0003218753497425055, "tps": 14365, "wall": 46108.9} {"step": 10107, "train_loss": 3.462481737136841, "lr": 0.00032185955487035894, "tps": 14365, "wall": 46113.9} {"step": 10108, "train_loss": 3.4248206615448, "lr": 0.0003218437588443418, "tps": 14365, "wall": 46119.0} {"step": 10109, "train_loss": 3.5485048294067383, "lr": 0.000321827961664633, "tps": 14364, "wall": 46124.1} {"step": 10110, "train_loss": 3.597633123397827, "lr": 0.0003218121633314116, "tps": 14364, "wall": 46129.1} {"step": 10111, "train_loss": 3.5386672019958496, "lr": 0.00032179636384485654, "tps": 14364, "wall": 46134.2} {"step": 10112, "train_loss": 3.553661823272705, "lr": 0.0003217805632051467, "tps": 14364, "wall": 46139.3} {"step": 10113, "train_loss": 3.5381128787994385, "lr": 0.0003217647614124612, "tps": 14364, "wall": 46144.4} {"step": 10114, "train_loss": 3.545427083969116, "lr": 0.0003217489584669789, "tps": 14364, "wall": 46149.5} {"step": 10115, "train_loss": 3.4063918590545654, "lr": 0.00032173315436887894, "tps": 14363, "wall": 46154.6} {"step": 10116, "train_loss": 3.51039457321167, "lr": 0.00032171734911834026, "tps": 14363, "wall": 46159.6} {"step": 10117, "train_loss": 3.524658679962158, "lr": 0.000321701542715542, "tps": 14363, "wall": 46164.7} {"step": 10118, "train_loss": 3.432435989379883, "lr": 0.00032168573516066313, "tps": 14363, "wall": 46169.8} {"step": 10119, "train_loss": 3.4478800296783447, "lr": 0.00032166992645388275, "tps": 14363, "wall": 46174.8} {"step": 10120, "train_loss": 3.5392048358917236, "lr": 0.00032165411659538, "tps": 14363, "wall": 46179.9} {"step": 10121, "train_loss": 3.5054287910461426, "lr": 0.00032163830558533385, "tps": 14363, "wall": 46185.0} {"step": 10122, "train_loss": 3.5679197311401367, "lr": 0.00032162249342392355, "tps": 14362, "wall": 46190.1} {"step": 10123, "train_loss": 3.4873597621917725, "lr": 0.0003216066801113281, "tps": 14362, "wall": 46195.2} {"step": 10124, "train_loss": 3.4832561016082764, "lr": 0.0003215908656477267, "tps": 14362, "wall": 46200.3} {"step": 10125, "train_loss": 3.5280165672302246, "lr": 0.0003215750500332984, "tps": 14362, "wall": 46205.3} {"step": 10126, "train_loss": 3.5405712127685547, "lr": 0.0003215592332682225, "tps": 14362, "wall": 46210.4} {"step": 10127, "train_loss": 3.4510324001312256, "lr": 0.00032154341535267807, "tps": 14362, "wall": 46215.5} {"step": 10128, "train_loss": 3.493637800216675, "lr": 0.0003215275962868444, "tps": 14361, "wall": 46220.5} {"step": 10129, "train_loss": 3.548473834991455, "lr": 0.00032151177607090065, "tps": 14361, "wall": 46225.6} {"step": 10130, "train_loss": 3.5268714427948, "lr": 0.00032149595470502596, "tps": 14361, "wall": 46230.7} {"step": 10131, "train_loss": 3.3781425952911377, "lr": 0.0003214801321893996, "tps": 14361, "wall": 46235.8} {"step": 10132, "train_loss": 3.5327210426330566, "lr": 0.0003214643085242008, "tps": 14361, "wall": 46240.8} {"step": 10133, "train_loss": 3.4917502403259277, "lr": 0.0003214484837096088, "tps": 14361, "wall": 46245.9} {"step": 10134, "train_loss": 3.396711587905884, "lr": 0.00032143265774580294, "tps": 14360, "wall": 46251.0} {"step": 10135, "train_loss": 3.5203700065612793, "lr": 0.0003214168306329624, "tps": 14360, "wall": 46256.1} {"step": 10136, "train_loss": 3.5359272956848145, "lr": 0.00032140100237126656, "tps": 14360, "wall": 46261.2} {"step": 10137, "train_loss": 3.54007887840271, "lr": 0.00032138517296089467, "tps": 14360, "wall": 46266.3} {"step": 10138, "train_loss": 3.546856164932251, "lr": 0.0003213693424020261, "tps": 14360, "wall": 46271.4} {"step": 10139, "train_loss": 3.4771156311035156, "lr": 0.00032135351069484007, "tps": 14360, "wall": 46276.4} {"step": 10140, "train_loss": 3.518392562866211, "lr": 0.000321337677839516, "tps": 14359, "wall": 46281.5} {"step": 10141, "train_loss": 3.47564697265625, "lr": 0.0003213218438362332, "tps": 14359, "wall": 46286.5} {"step": 10142, "train_loss": 3.451127529144287, "lr": 0.00032130600868517117, "tps": 14359, "wall": 46291.6} {"step": 10143, "train_loss": 3.4745888710021973, "lr": 0.0003212901723865091, "tps": 14359, "wall": 46296.7} {"step": 10144, "train_loss": 3.52541446685791, "lr": 0.00032127433494042655, "tps": 14359, "wall": 46301.7} {"step": 10145, "train_loss": 3.490262508392334, "lr": 0.0003212584963471028, "tps": 14359, "wall": 46306.8} {"step": 10146, "train_loss": 3.4907960891723633, "lr": 0.00032124265660671736, "tps": 14359, "wall": 46311.8} {"step": 10147, "train_loss": 3.451986312866211, "lr": 0.0003212268157194496, "tps": 14358, "wall": 46316.9} {"step": 10148, "train_loss": 3.42643404006958, "lr": 0.00032121097368547903, "tps": 14358, "wall": 46321.9} {"step": 10149, "train_loss": 3.5882065296173096, "lr": 0.00032119513050498505, "tps": 14358, "wall": 46327.0} {"step": 10150, "train_loss": 3.5934746265411377, "lr": 0.00032117928617814715, "tps": 14358, "wall": 46332.0} {"step": 10151, "train_loss": 3.539134979248047, "lr": 0.0003211634407051448, "tps": 14358, "wall": 46337.1} {"step": 10152, "train_loss": 3.496910572052002, "lr": 0.0003211475940861576, "tps": 14358, "wall": 46342.1} {"step": 10153, "train_loss": 3.5246386528015137, "lr": 0.0003211317463213649, "tps": 14358, "wall": 46347.1} {"step": 10154, "train_loss": 3.5012006759643555, "lr": 0.00032111589741094635, "tps": 14357, "wall": 46352.2} {"step": 10155, "train_loss": 3.4930763244628906, "lr": 0.00032110004735508144, "tps": 14357, "wall": 46357.3} {"step": 10156, "train_loss": 3.5805768966674805, "lr": 0.0003210841961539497, "tps": 14357, "wall": 46362.3} {"step": 10157, "train_loss": 3.5374207496643066, "lr": 0.00032106834380773075, "tps": 14357, "wall": 46367.3} {"step": 10158, "train_loss": 3.544288158416748, "lr": 0.0003210524903166041, "tps": 14357, "wall": 46372.4} {"step": 10159, "train_loss": 3.556389093399048, "lr": 0.0003210366356807494, "tps": 14357, "wall": 46377.5} {"step": 10160, "train_loss": 3.557404041290283, "lr": 0.0003210207799003463, "tps": 14356, "wall": 46382.5} {"step": 10161, "train_loss": 3.552978515625, "lr": 0.00032100492297557423, "tps": 14356, "wall": 46387.6} {"step": 10162, "train_loss": 3.5604043006896973, "lr": 0.00032098906490661295, "tps": 14356, "wall": 46392.6} {"step": 10163, "train_loss": 3.465379476547241, "lr": 0.0003209732056936421, "tps": 14356, "wall": 46397.6} {"step": 10164, "train_loss": 3.6410446166992188, "lr": 0.00032095734533684123, "tps": 14356, "wall": 46402.7} {"step": 10165, "train_loss": 3.4012653827667236, "lr": 0.00032094148383639016, "tps": 14356, "wall": 46407.7} {"step": 10166, "train_loss": 3.5263938903808594, "lr": 0.0003209256211924685, "tps": 14356, "wall": 46412.8} {"step": 10167, "train_loss": 3.401024341583252, "lr": 0.000320909757405256, "tps": 14355, "wall": 46417.8} {"step": 10168, "train_loss": 3.583486557006836, "lr": 0.0003208938924749322, "tps": 14355, "wall": 46422.9} {"step": 10169, "train_loss": 3.4036917686462402, "lr": 0.000320878026401677, "tps": 14355, "wall": 46427.9} {"step": 10170, "train_loss": 3.4642069339752197, "lr": 0.00032086215918567, "tps": 14355, "wall": 46432.9} {"step": 10171, "train_loss": 3.536862373352051, "lr": 0.00032084629082709104, "tps": 14355, "wall": 46438.0} {"step": 10172, "train_loss": 3.6190240383148193, "lr": 0.0003208304213261199, "tps": 14355, "wall": 46443.1} {"step": 10173, "train_loss": 3.4136862754821777, "lr": 0.00032081455068293626, "tps": 14355, "wall": 46448.1} {"step": 10174, "train_loss": 3.3847978115081787, "lr": 0.0003207986788977199, "tps": 14354, "wall": 46453.1} {"step": 10175, "train_loss": 3.527480125427246, "lr": 0.0003207828059706506, "tps": 14354, "wall": 46458.2} {"step": 10176, "train_loss": 3.4381375312805176, "lr": 0.00032076693190190834, "tps": 14354, "wall": 46463.2} {"step": 10177, "train_loss": 3.4949936866760254, "lr": 0.00032075105669167277, "tps": 14354, "wall": 46468.2} {"step": 10178, "train_loss": 3.534742832183838, "lr": 0.00032073518034012375, "tps": 14354, "wall": 46473.3} {"step": 10179, "train_loss": 3.5960464477539062, "lr": 0.00032071930284744115, "tps": 14354, "wall": 46478.3} {"step": 10180, "train_loss": 3.486910820007324, "lr": 0.0003207034242138049, "tps": 14354, "wall": 46483.3} {"step": 10181, "train_loss": 3.562251329421997, "lr": 0.00032068754443939483, "tps": 14353, "wall": 46488.3} {"step": 10182, "train_loss": 3.507965087890625, "lr": 0.0003206716635243908, "tps": 14353, "wall": 46493.3} {"step": 10183, "train_loss": 3.4423723220825195, "lr": 0.00032065578146897263, "tps": 14353, "wall": 46498.4} {"step": 10184, "train_loss": 3.470994710922241, "lr": 0.00032063989827332037, "tps": 14353, "wall": 46503.4} {"step": 10185, "train_loss": 3.398015260696411, "lr": 0.00032062401393761396, "tps": 14353, "wall": 46508.4} {"step": 10186, "train_loss": 3.6082143783569336, "lr": 0.0003206081284620332, "tps": 14353, "wall": 46513.5} {"step": 10187, "train_loss": 3.5261120796203613, "lr": 0.0003205922418467582, "tps": 14353, "wall": 46518.4} {"step": 10188, "train_loss": 3.451068162918091, "lr": 0.00032057635409196873, "tps": 14352, "wall": 46523.4} {"step": 10189, "train_loss": 3.4842734336853027, "lr": 0.00032056046519784493, "tps": 14352, "wall": 46528.5} {"step": 10190, "train_loss": 3.453317165374756, "lr": 0.0003205445751645667, "tps": 14352, "wall": 46533.4} {"step": 10191, "train_loss": 3.409968614578247, "lr": 0.00032052868399231417, "tps": 14352, "wall": 46538.4} {"step": 10192, "train_loss": 3.3925230503082275, "lr": 0.0003205127916812672, "tps": 14352, "wall": 46543.4} {"step": 10193, "train_loss": 3.524296522140503, "lr": 0.00032049689823160593, "tps": 14352, "wall": 46548.4} {"step": 10194, "train_loss": 3.4861862659454346, "lr": 0.0003204810036435103, "tps": 14352, "wall": 46553.4} {"step": 10195, "train_loss": 3.4179327487945557, "lr": 0.00032046510791716053, "tps": 14351, "wall": 46558.4} {"step": 10196, "train_loss": 3.4276769161224365, "lr": 0.00032044921105273653, "tps": 14351, "wall": 46563.5} {"step": 10197, "train_loss": 3.3947865962982178, "lr": 0.0003204333130504184, "tps": 14351, "wall": 46568.4} {"step": 10198, "train_loss": 3.456756114959717, "lr": 0.0003204174139103863, "tps": 14351, "wall": 46573.4} {"step": 10199, "train_loss": 3.500006675720215, "lr": 0.00032040151363282025, "tps": 14351, "wall": 46578.4} {"step": 10200, "train_loss": 3.606959342956543, "lr": 0.0003203856122179005, "tps": 14351, "wall": 46583.4} {"step": 10201, "train_loss": 3.509472608566284, "lr": 0.00032036970966580706, "tps": 14351, "wall": 46588.3} {"step": 10202, "train_loss": 3.5495054721832275, "lr": 0.00032035380597672015, "tps": 14351, "wall": 46593.3} {"step": 10203, "train_loss": 3.471691846847534, "lr": 0.00032033790115081984, "tps": 14350, "wall": 46598.3} {"step": 10204, "train_loss": 3.3898098468780518, "lr": 0.0003203219951882864, "tps": 14350, "wall": 46603.3} {"step": 10205, "train_loss": 3.448045492172241, "lr": 0.0003203060880893, "tps": 14350, "wall": 46608.3} {"step": 10206, "train_loss": 3.604353427886963, "lr": 0.00032029017985404077, "tps": 14350, "wall": 46613.2} {"step": 10207, "train_loss": 3.5856282711029053, "lr": 0.000320274270482689, "tps": 14350, "wall": 46618.3} {"step": 10208, "train_loss": 3.4485814571380615, "lr": 0.0003202583599754248, "tps": 14350, "wall": 46623.3} {"step": 10209, "train_loss": 3.501424789428711, "lr": 0.0003202424483324285, "tps": 14350, "wall": 46628.2} {"step": 10210, "train_loss": 3.3777027130126953, "lr": 0.00032022653555388033, "tps": 14350, "wall": 46633.2} {"step": 10211, "train_loss": 3.4785397052764893, "lr": 0.00032021062163996056, "tps": 14349, "wall": 46638.2} {"step": 10212, "train_loss": 3.5343942642211914, "lr": 0.0003201947065908494, "tps": 14349, "wall": 46643.1} {"step": 10213, "train_loss": 3.4974186420440674, "lr": 0.0003201787904067272, "tps": 14349, "wall": 46648.1} {"step": 10214, "train_loss": 3.4939522743225098, "lr": 0.00032016287308777425, "tps": 14349, "wall": 46653.1} {"step": 10215, "train_loss": 3.5025010108947754, "lr": 0.00032014695463417086, "tps": 14349, "wall": 46658.0} {"step": 10216, "train_loss": 3.507488250732422, "lr": 0.00032013103504609735, "tps": 14349, "wall": 46663.0} {"step": 10217, "train_loss": 3.510484218597412, "lr": 0.00032011511432373407, "tps": 14349, "wall": 46668.0} {"step": 10218, "train_loss": 3.5332725048065186, "lr": 0.0003200991924672613, "tps": 14349, "wall": 46672.9} {"step": 10219, "train_loss": 3.4386916160583496, "lr": 0.0003200832694768595, "tps": 14348, "wall": 46677.9} {"step": 10220, "train_loss": 3.4330248832702637, "lr": 0.000320067345352709, "tps": 14348, "wall": 46682.9} {"step": 10221, "train_loss": 3.457184314727783, "lr": 0.0003200514200949902, "tps": 14348, "wall": 46687.9} {"step": 10222, "train_loss": 3.5269973278045654, "lr": 0.0003200354937038836, "tps": 14348, "wall": 46692.9} {"step": 10223, "train_loss": 3.458643913269043, "lr": 0.0003200195661795694, "tps": 14348, "wall": 46697.8} {"step": 10224, "train_loss": 3.5022132396698, "lr": 0.00032000363752222817, "tps": 14348, "wall": 46702.7} {"step": 10225, "train_loss": 3.5678610801696777, "lr": 0.0003199877077320403, "tps": 14348, "wall": 46707.7} {"step": 10226, "train_loss": 3.46917462348938, "lr": 0.00031997177680918626, "tps": 14348, "wall": 46712.6} {"step": 10227, "train_loss": 3.4395928382873535, "lr": 0.00031995584475384665, "tps": 14347, "wall": 46717.6} {"step": 10228, "train_loss": 3.6269638538360596, "lr": 0.0003199399115662017, "tps": 14347, "wall": 46722.6} {"step": 10229, "train_loss": 3.4612884521484375, "lr": 0.00031992397724643206, "tps": 14347, "wall": 46727.5} {"step": 10230, "train_loss": 3.5689897537231445, "lr": 0.00031990804179471817, "tps": 14347, "wall": 46732.5} {"step": 10231, "train_loss": 3.5855088233947754, "lr": 0.0003198921052112406, "tps": 14347, "wall": 46737.5} {"step": 10232, "train_loss": 3.427551746368408, "lr": 0.0003198761674961798, "tps": 14347, "wall": 46742.4} {"step": 10233, "train_loss": 3.455188512802124, "lr": 0.0003198602286497165, "tps": 14347, "wall": 46747.4} {"step": 10234, "train_loss": 3.532315731048584, "lr": 0.00031984428867203106, "tps": 14347, "wall": 46752.4} {"step": 10235, "train_loss": 3.4908294677734375, "lr": 0.0003198283475633042, "tps": 14346, "wall": 46757.3} {"step": 10236, "train_loss": 3.4845428466796875, "lr": 0.00031981240532371626, "tps": 14346, "wall": 46762.3} {"step": 10237, "train_loss": 3.477612257003784, "lr": 0.0003197964619534481, "tps": 14346, "wall": 46767.3} {"step": 10238, "train_loss": 3.6127474308013916, "lr": 0.0003197805174526802, "tps": 14346, "wall": 46772.2} {"step": 10239, "train_loss": 3.5147247314453125, "lr": 0.00031976457182159317, "tps": 14346, "wall": 46777.2} {"step": 10240, "train_loss": 3.398737907409668, "lr": 0.00031974862506036774, "tps": 14346, "wall": 46782.1} {"step": 10241, "train_loss": 3.4103405475616455, "lr": 0.00031973267716918437, "tps": 14346, "wall": 46787.1} {"step": 10242, "train_loss": 3.49072265625, "lr": 0.00031971672814822395, "tps": 14346, "wall": 46792.1} {"step": 10243, "train_loss": 3.5896010398864746, "lr": 0.00031970077799766696, "tps": 14345, "wall": 46797.1} {"step": 10244, "train_loss": 3.4267396926879883, "lr": 0.00031968482671769423, "tps": 14345, "wall": 46802.0} {"step": 10245, "train_loss": 3.6682705879211426, "lr": 0.00031966887430848634, "tps": 14345, "wall": 46807.0} {"step": 10246, "train_loss": 3.577465534210205, "lr": 0.0003196529207702241, "tps": 14345, "wall": 46812.0} {"step": 10247, "train_loss": 3.3740673065185547, "lr": 0.0003196369661030881, "tps": 14345, "wall": 46816.9} {"step": 10248, "train_loss": 3.38155460357666, "lr": 0.00031962101030725925, "tps": 14345, "wall": 46821.9} {"step": 10249, "train_loss": 3.576671838760376, "lr": 0.0003196050533829181, "tps": 14345, "wall": 46826.9} {"step": 10250, "train_loss": 3.512277841567993, "lr": 0.0003195890953302456, "tps": 14345, "wall": 46831.9} {"step": 10251, "train_loss": 3.4353699684143066, "lr": 0.00031957313614942244, "tps": 14345, "wall": 46836.8} {"step": 10252, "train_loss": 3.5062146186828613, "lr": 0.00031955717584062943, "tps": 14344, "wall": 46841.8} {"step": 10253, "train_loss": 3.5167059898376465, "lr": 0.00031954121440404726, "tps": 14344, "wall": 46846.7} {"step": 10254, "train_loss": 3.5206918716430664, "lr": 0.0003195252518398569, "tps": 14344, "wall": 46851.7} {"step": 10255, "train_loss": 3.5490334033966064, "lr": 0.00031950928814823904, "tps": 14344, "wall": 46856.8} {"step": 10256, "train_loss": 3.5821030139923096, "lr": 0.0003194933233293746, "tps": 14344, "wall": 46861.7} {"step": 10257, "train_loss": 3.6024081707000732, "lr": 0.0003194773573834445, "tps": 14344, "wall": 46866.7} {"step": 10258, "train_loss": 3.487131118774414, "lr": 0.0003194613903106294, "tps": 14344, "wall": 46871.7} {"step": 10259, "train_loss": 3.5331082344055176, "lr": 0.00031944542211111035, "tps": 14344, "wall": 46876.7} {"step": 10260, "train_loss": 3.5336050987243652, "lr": 0.00031942945278506815, "tps": 14343, "wall": 46881.6} {"step": 10261, "train_loss": 3.4857707023620605, "lr": 0.0003194134823326838, "tps": 14343, "wall": 46886.6} {"step": 10262, "train_loss": 3.545562267303467, "lr": 0.00031939751075413806, "tps": 14343, "wall": 46891.6} {"step": 10263, "train_loss": 3.4885311126708984, "lr": 0.0003193815380496119, "tps": 14343, "wall": 46896.5} {"step": 10264, "train_loss": 3.4408106803894043, "lr": 0.0003193655642192864, "tps": 14343, "wall": 46901.5} {"step": 10265, "train_loss": 3.498018264770508, "lr": 0.00031934958926334235, "tps": 14343, "wall": 46906.5} {"step": 10266, "train_loss": 3.5597288608551025, "lr": 0.0003193336131819608, "tps": 14343, "wall": 46911.5} {"step": 10267, "train_loss": 3.4788854122161865, "lr": 0.00031931763597532276, "tps": 14343, "wall": 46916.5} {"step": 10268, "train_loss": 3.413666009902954, "lr": 0.0003193016576436091, "tps": 14342, "wall": 46921.5} {"step": 10269, "train_loss": 3.4314565658569336, "lr": 0.0003192856781870009, "tps": 14342, "wall": 46926.4} {"step": 10270, "train_loss": 3.4793384075164795, "lr": 0.00031926969760567923, "tps": 14342, "wall": 46931.4} {"step": 10271, "train_loss": 3.531717538833618, "lr": 0.000319253715899825, "tps": 14342, "wall": 46936.4} {"step": 10272, "train_loss": 3.5876264572143555, "lr": 0.00031923773306961927, "tps": 14342, "wall": 46941.3} {"step": 10273, "train_loss": 3.5615108013153076, "lr": 0.0003192217491152432, "tps": 14342, "wall": 46946.3} {"step": 10274, "train_loss": 3.460470199584961, "lr": 0.00031920576403687774, "tps": 14342, "wall": 46951.3} {"step": 10275, "train_loss": 3.498730421066284, "lr": 0.00031918977783470403, "tps": 14342, "wall": 46956.2} {"step": 10276, "train_loss": 3.465770721435547, "lr": 0.00031917379050890314, "tps": 14341, "wall": 46961.2} {"step": 10277, "train_loss": 3.5525717735290527, "lr": 0.0003191578020596562, "tps": 14341, "wall": 46966.2} {"step": 10278, "train_loss": 3.569746494293213, "lr": 0.0003191418124871443, "tps": 14341, "wall": 46971.1} {"step": 10279, "train_loss": 3.5361685752868652, "lr": 0.0003191258217915487, "tps": 14341, "wall": 46976.1} {"step": 10280, "train_loss": 3.5443692207336426, "lr": 0.00031910982997305023, "tps": 14341, "wall": 46981.1} {"step": 10281, "train_loss": 3.504412889480591, "lr": 0.00031909383703183035, "tps": 14341, "wall": 46986.0} {"step": 10282, "train_loss": 3.3682503700256348, "lr": 0.00031907784296807015, "tps": 14341, "wall": 46991.0} {"step": 10283, "train_loss": 3.5607080459594727, "lr": 0.0003190618477819507, "tps": 14341, "wall": 46996.0} {"step": 10284, "train_loss": 3.439511775970459, "lr": 0.0003190458514736534, "tps": 14340, "wall": 47001.0} {"step": 10285, "train_loss": 3.4973978996276855, "lr": 0.0003190298540433593, "tps": 14340, "wall": 47005.9} {"step": 10286, "train_loss": 3.4919559955596924, "lr": 0.00031901385549124955, "tps": 14340, "wall": 47010.9} {"step": 10287, "train_loss": 3.5852742195129395, "lr": 0.0003189978558175056, "tps": 14340, "wall": 47015.9} {"step": 10288, "train_loss": 3.4337539672851562, "lr": 0.00031898185502230846, "tps": 14340, "wall": 47020.9} {"step": 10289, "train_loss": 3.4675683975219727, "lr": 0.00031896585310583965, "tps": 14340, "wall": 47025.8} {"step": 10290, "train_loss": 3.4315414428710938, "lr": 0.0003189498500682802, "tps": 14340, "wall": 47030.8} {"step": 10291, "train_loss": 3.5576157569885254, "lr": 0.0003189338459098116, "tps": 14340, "wall": 47035.8} {"step": 10292, "train_loss": 3.4941554069519043, "lr": 0.0003189178406306149, "tps": 14339, "wall": 47040.8} {"step": 10293, "train_loss": 3.464289665222168, "lr": 0.0003189018342308717, "tps": 14339, "wall": 47045.8} {"step": 10294, "train_loss": 3.5091333389282227, "lr": 0.0003188858267107631, "tps": 14339, "wall": 47050.7} {"step": 10295, "train_loss": 3.5362050533294678, "lr": 0.00031886981807047047, "tps": 14339, "wall": 47055.7} {"step": 10296, "train_loss": 3.5146431922912598, "lr": 0.0003188538083101753, "tps": 14339, "wall": 47060.7} {"step": 10297, "train_loss": 3.4717164039611816, "lr": 0.00031883779743005876, "tps": 14339, "wall": 47065.6} {"step": 10298, "train_loss": 3.415437698364258, "lr": 0.00031882178543030234, "tps": 14339, "wall": 47070.6} {"step": 10299, "train_loss": 3.5103087425231934, "lr": 0.00031880577231108734, "tps": 14339, "wall": 47075.6} {"step": 10300, "train_loss": 3.547213077545166, "lr": 0.00031878975807259524, "tps": 14338, "wall": 47080.6} {"step": 10301, "train_loss": 3.489996910095215, "lr": 0.00031877374271500745, "tps": 14338, "wall": 47085.6} {"step": 10302, "train_loss": 3.4736804962158203, "lr": 0.0003187577262385053, "tps": 14338, "wall": 47090.5} {"step": 10303, "train_loss": 3.47525954246521, "lr": 0.0003187417086432703, "tps": 14338, "wall": 47095.6} {"step": 10304, "train_loss": 3.5162806510925293, "lr": 0.0003187256899294839, "tps": 14338, "wall": 47100.6} {"step": 10305, "train_loss": 3.516738176345825, "lr": 0.0003187096700973275, "tps": 14338, "wall": 47105.5} {"step": 10306, "train_loss": 3.5538477897644043, "lr": 0.00031869364914698263, "tps": 14338, "wall": 47110.5} {"step": 10307, "train_loss": 3.5694406032562256, "lr": 0.00031867762707863084, "tps": 14338, "wall": 47115.5} {"step": 10308, "train_loss": 3.5035719871520996, "lr": 0.0003186616038924534, "tps": 14337, "wall": 47120.4} {"step": 10309, "train_loss": 3.4175665378570557, "lr": 0.00031864557958863213, "tps": 14337, "wall": 47125.4} {"step": 10310, "train_loss": 3.5226309299468994, "lr": 0.0003186295541673483, "tps": 14337, "wall": 47130.4} {"step": 10311, "train_loss": 3.591421604156494, "lr": 0.0003186135276287836, "tps": 14337, "wall": 47135.3} {"step": 10312, "train_loss": 3.5048677921295166, "lr": 0.00031859749997311944, "tps": 14337, "wall": 47140.3} {"step": 10313, "train_loss": 3.516617774963379, "lr": 0.0003185814712005376, "tps": 14337, "wall": 47145.3} {"step": 10314, "train_loss": 3.5284056663513184, "lr": 0.00031856544131121943, "tps": 14337, "wall": 47150.3} {"step": 10315, "train_loss": 3.486905097961426, "lr": 0.0003185494103053466, "tps": 14337, "wall": 47155.3} {"step": 10316, "train_loss": 3.4821083545684814, "lr": 0.00031853337818310074, "tps": 14336, "wall": 47160.3} {"step": 10317, "train_loss": 3.484793186187744, "lr": 0.0003185173449446635, "tps": 14336, "wall": 47165.2} {"step": 10318, "train_loss": 3.473287582397461, "lr": 0.0003185013105902163, "tps": 14336, "wall": 47170.2} {"step": 10319, "train_loss": 3.460017681121826, "lr": 0.0003184852751199411, "tps": 14336, "wall": 47175.2} {"step": 10320, "train_loss": 3.5402140617370605, "lr": 0.0003184692385340193, "tps": 14336, "wall": 47180.2} {"step": 10321, "train_loss": 3.3871898651123047, "lr": 0.0003184532008326326, "tps": 14336, "wall": 47185.1} {"step": 10322, "train_loss": 3.4541079998016357, "lr": 0.0003184371620159628, "tps": 14336, "wall": 47190.1} {"step": 10323, "train_loss": 3.5123915672302246, "lr": 0.00031842112208419144, "tps": 14336, "wall": 47195.0} {"step": 10324, "train_loss": 3.581528425216675, "lr": 0.0003184050810375003, "tps": 14335, "wall": 47200.0} {"step": 10325, "train_loss": 3.5862178802490234, "lr": 0.00031838903887607107, "tps": 14335, "wall": 47205.0} {"step": 10326, "train_loss": 3.4928927421569824, "lr": 0.0003183729956000854, "tps": 14335, "wall": 47210.0} {"step": 10327, "train_loss": 3.5180492401123047, "lr": 0.00031835695120972524, "tps": 14335, "wall": 47214.9} {"step": 10328, "train_loss": 3.5199320316314697, "lr": 0.0003183409057051722, "tps": 14335, "wall": 47220.0} {"step": 10329, "train_loss": 3.5737507343292236, "lr": 0.00031832485908660804, "tps": 14335, "wall": 47224.9} {"step": 10330, "train_loss": 3.543679714202881, "lr": 0.00031830881135421456, "tps": 14335, "wall": 47229.9} {"step": 10331, "train_loss": 3.451922655105591, "lr": 0.00031829276250817354, "tps": 14335, "wall": 47234.9} {"step": 10332, "train_loss": 3.466538667678833, "lr": 0.00031827671254866687, "tps": 14335, "wall": 47239.8} {"step": 10333, "train_loss": 3.483755111694336, "lr": 0.00031826066147587614, "tps": 14334, "wall": 47244.8} {"step": 10334, "train_loss": 3.512930393218994, "lr": 0.0003182446092899834, "tps": 14334, "wall": 47249.8} {"step": 10335, "train_loss": 3.568321704864502, "lr": 0.00031822855599117036, "tps": 14334, "wall": 47254.7} {"step": 10336, "train_loss": 3.395608901977539, "lr": 0.000318212501579619, "tps": 14334, "wall": 47259.7} {"step": 10337, "train_loss": 3.4783096313476562, "lr": 0.000318196446055511, "tps": 14334, "wall": 47264.7} {"step": 10338, "train_loss": 3.448028564453125, "lr": 0.00031818038941902843, "tps": 14334, "wall": 47269.6} {"step": 10339, "train_loss": 3.566251277923584, "lr": 0.00031816433167035314, "tps": 14334, "wall": 47274.6} {"step": 10340, "train_loss": 3.5274300575256348, "lr": 0.0003181482728096669, "tps": 14334, "wall": 47279.6} {"step": 10341, "train_loss": 3.5648250579833984, "lr": 0.0003181322128371517, "tps": 14333, "wall": 47284.6} {"step": 10342, "train_loss": 3.491067886352539, "lr": 0.00031811615175298953, "tps": 14333, "wall": 47289.6} {"step": 10343, "train_loss": 3.485626220703125, "lr": 0.0003181000895573623, "tps": 14333, "wall": 47294.5} {"step": 10344, "train_loss": 3.59867262840271, "lr": 0.00031808402625045195, "tps": 14333, "wall": 47299.5} {"step": 10345, "train_loss": 3.5168051719665527, "lr": 0.0003180679618324404, "tps": 14333, "wall": 47304.5} {"step": 10346, "train_loss": 3.499964714050293, "lr": 0.00031805189630350973, "tps": 14333, "wall": 47309.5} {"step": 10347, "train_loss": 3.538792848587036, "lr": 0.0003180358296638419, "tps": 14333, "wall": 47314.4} {"step": 10348, "train_loss": 3.497100353240967, "lr": 0.0003180197619136188, "tps": 14333, "wall": 47319.4} {"step": 10349, "train_loss": 3.5237882137298584, "lr": 0.0003180036930530226, "tps": 14332, "wall": 47324.4} {"step": 10350, "train_loss": 3.4746367931365967, "lr": 0.0003179876230822352, "tps": 14332, "wall": 47329.3} {"step": 10351, "train_loss": 3.5016937255859375, "lr": 0.00031797155200143876, "tps": 14332, "wall": 47334.3} {"step": 10352, "train_loss": 3.566610097885132, "lr": 0.00031795547981081524, "tps": 14332, "wall": 47339.3} {"step": 10353, "train_loss": 3.550564765930176, "lr": 0.0003179394065105468, "tps": 14332, "wall": 47344.3} {"step": 10354, "train_loss": 3.478233814239502, "lr": 0.0003179233321008154, "tps": 14332, "wall": 47349.3} {"step": 10355, "train_loss": 3.41687273979187, "lr": 0.0003179072565818032, "tps": 14332, "wall": 47354.2} {"step": 10356, "train_loss": 3.3795042037963867, "lr": 0.00031789117995369235, "tps": 14332, "wall": 47359.2} {"step": 10357, "train_loss": 3.463944911956787, "lr": 0.0003178751022166649, "tps": 14331, "wall": 47364.1} {"step": 10358, "train_loss": 3.6631500720977783, "lr": 0.000317859023370903, "tps": 14331, "wall": 47369.1} {"step": 10359, "train_loss": 3.5247232913970947, "lr": 0.00031784294341658876, "tps": 14331, "wall": 47374.1} {"step": 10360, "train_loss": 3.4866385459899902, "lr": 0.00031782686235390443, "tps": 14331, "wall": 47379.0} {"step": 10361, "train_loss": 3.532909870147705, "lr": 0.00031781078018303197, "tps": 14331, "wall": 47384.0} {"step": 10362, "train_loss": 3.494096279144287, "lr": 0.00031779469690415384, "tps": 14331, "wall": 47389.0} {"step": 10363, "train_loss": 3.490649938583374, "lr": 0.000317778612517452, "tps": 14331, "wall": 47393.9} {"step": 10364, "train_loss": 3.5474014282226562, "lr": 0.0003177625270231089, "tps": 14331, "wall": 47399.0} {"step": 10365, "train_loss": 3.4238102436065674, "lr": 0.0003177464404213064, "tps": 14331, "wall": 47404.0} {"step": 10366, "train_loss": 3.5157997608184814, "lr": 0.00031773035271222706, "tps": 14330, "wall": 47408.9} {"step": 10367, "train_loss": 3.515011787414551, "lr": 0.00031771426389605293, "tps": 14330, "wall": 47413.9} {"step": 10368, "train_loss": 3.4654510021209717, "lr": 0.00031769817397296645, "tps": 14330, "wall": 47418.9} {"step": 10369, "train_loss": 3.456439971923828, "lr": 0.00031768208294314965, "tps": 14330, "wall": 47423.8} {"step": 10370, "train_loss": 3.4440183639526367, "lr": 0.000317665990806785, "tps": 14330, "wall": 47428.8} {"step": 10371, "train_loss": 3.4309229850769043, "lr": 0.0003176498975640547, "tps": 14330, "wall": 47433.8} {"step": 10372, "train_loss": 3.4855453968048096, "lr": 0.00031763380321514105, "tps": 14330, "wall": 47438.7} {"step": 10373, "train_loss": 3.4975666999816895, "lr": 0.0003176177077602264, "tps": 14330, "wall": 47443.7} {"step": 10374, "train_loss": 3.5606913566589355, "lr": 0.0003176016111994931, "tps": 14329, "wall": 47448.6} {"step": 10375, "train_loss": 3.5198912620544434, "lr": 0.00031758551353312347, "tps": 14329, "wall": 47453.6} {"step": 10376, "train_loss": 3.4302122592926025, "lr": 0.0003175694147612998, "tps": 14329, "wall": 47458.6} {"step": 10377, "train_loss": 3.6812267303466797, "lr": 0.00031755331488420464, "tps": 14329, "wall": 47463.6} {"step": 10378, "train_loss": 3.5344905853271484, "lr": 0.0003175372139020202, "tps": 14329, "wall": 47468.5} {"step": 10379, "train_loss": 3.4288012981414795, "lr": 0.00031752111181492887, "tps": 14329, "wall": 47473.5} {"step": 10380, "train_loss": 3.557846784591675, "lr": 0.0003175050086231131, "tps": 14329, "wall": 47478.4} {"step": 10381, "train_loss": 3.5139665603637695, "lr": 0.0003174889043267555, "tps": 14329, "wall": 47483.4} {"step": 10382, "train_loss": 3.46014142036438, "lr": 0.0003174727989260382, "tps": 14328, "wall": 47488.4} {"step": 10383, "train_loss": 3.453907012939453, "lr": 0.0003174566924211437, "tps": 14328, "wall": 47493.3} {"step": 10384, "train_loss": 3.512305974960327, "lr": 0.00031744058481225455, "tps": 14328, "wall": 47498.3} {"step": 10385, "train_loss": 3.5533978939056396, "lr": 0.0003174244760995532, "tps": 14328, "wall": 47503.3} {"step": 10386, "train_loss": 3.532724380493164, "lr": 0.0003174083662832221, "tps": 14328, "wall": 47508.3} {"step": 10387, "train_loss": 3.4364919662475586, "lr": 0.00031739225536344377, "tps": 14328, "wall": 47513.2} {"step": 10388, "train_loss": 3.566741466522217, "lr": 0.0003173761433404007, "tps": 14328, "wall": 47518.2} {"step": 10389, "train_loss": 3.513935089111328, "lr": 0.00031736003021427546, "tps": 14328, "wall": 47523.2} {"step": 10390, "train_loss": 3.4335391521453857, "lr": 0.0003173439159852504, "tps": 14328, "wall": 47528.1} {"step": 10391, "train_loss": 3.545339345932007, "lr": 0.0003173278006535083, "tps": 14327, "wall": 47533.1} {"step": 10392, "train_loss": 3.4293789863586426, "lr": 0.0003173116842192316, "tps": 14327, "wall": 47538.1} {"step": 10393, "train_loss": 3.450871467590332, "lr": 0.00031729556668260285, "tps": 14327, "wall": 47543.0} {"step": 10394, "train_loss": 3.5197601318359375, "lr": 0.0003172794480438047, "tps": 14327, "wall": 47548.0} {"step": 10395, "train_loss": 3.364678382873535, "lr": 0.00031726332830301967, "tps": 14327, "wall": 47553.0} {"step": 10396, "train_loss": 3.520340919494629, "lr": 0.0003172472074604304, "tps": 14327, "wall": 47557.9} {"step": 10397, "train_loss": 3.5191824436187744, "lr": 0.00031723108551621944, "tps": 14327, "wall": 47562.9} {"step": 10398, "train_loss": 3.4608917236328125, "lr": 0.00031721496247056957, "tps": 14327, "wall": 47567.9} {"step": 10399, "train_loss": 3.443103313446045, "lr": 0.0003171988383236633, "tps": 14326, "wall": 47572.8} {"step": 10400, "train_loss": 3.5451817512512207, "lr": 0.00031718271307568335, "tps": 14326, "wall": 47577.8} {"step": 10401, "train_loss": 3.474494457244873, "lr": 0.0003171665867268124, "tps": 14326, "wall": 47582.8} {"step": 10402, "train_loss": 3.4273509979248047, "lr": 0.00031715045927723304, "tps": 14326, "wall": 47587.8} {"step": 10403, "train_loss": 3.405893087387085, "lr": 0.00031713433072712803, "tps": 14326, "wall": 47592.7} {"step": 10404, "train_loss": 3.526577949523926, "lr": 0.00031711820107668007, "tps": 14326, "wall": 47597.7} {"step": 10405, "train_loss": 3.48020601272583, "lr": 0.00031710207032607194, "tps": 14326, "wall": 47602.7} {"step": 10406, "train_loss": 3.5673985481262207, "lr": 0.0003170859384754863, "tps": 14326, "wall": 47607.6} {"step": 10407, "train_loss": 3.5172979831695557, "lr": 0.0003170698055251058, "tps": 14326, "wall": 47612.6} {"step": 10408, "train_loss": 3.3330845832824707, "lr": 0.0003170536714751133, "tps": 14325, "wall": 47617.6} {"step": 10409, "train_loss": 3.3958864212036133, "lr": 0.00031703753632569164, "tps": 14325, "wall": 47622.6} {"step": 10410, "train_loss": 3.518099784851074, "lr": 0.0003170214000770235, "tps": 14325, "wall": 47627.5} {"step": 10411, "train_loss": 3.414329767227173, "lr": 0.0003170052627292916, "tps": 14325, "wall": 47632.5} {"step": 10412, "train_loss": 3.5304489135742188, "lr": 0.00031698912428267887, "tps": 14325, "wall": 47637.5} {"step": 10413, "train_loss": 3.4794468879699707, "lr": 0.0003169729847373682, "tps": 14325, "wall": 47642.5} {"step": 10414, "train_loss": 3.430034637451172, "lr": 0.0003169568440935422, "tps": 14325, "wall": 47647.4} {"step": 10415, "train_loss": 3.4685678482055664, "lr": 0.00031694070235138385, "tps": 14325, "wall": 47652.4} {"step": 10416, "train_loss": 3.4774701595306396, "lr": 0.00031692455951107604, "tps": 14324, "wall": 47657.4} {"step": 10417, "train_loss": 3.602266311645508, "lr": 0.0003169084155728015, "tps": 14324, "wall": 47662.3} {"step": 10418, "train_loss": 3.535040855407715, "lr": 0.0003168922705367432, "tps": 14324, "wall": 47667.3} {"step": 10419, "train_loss": 3.5146944522857666, "lr": 0.0003168761244030841, "tps": 14324, "wall": 47672.3} {"step": 10420, "train_loss": 3.576415538787842, "lr": 0.00031685997717200695, "tps": 14324, "wall": 47677.2} {"step": 10421, "train_loss": 3.4199254512786865, "lr": 0.0003168438288436947, "tps": 14324, "wall": 47682.2} {"step": 10422, "train_loss": 3.462704658508301, "lr": 0.0003168276794183304, "tps": 14324, "wall": 47687.1} {"step": 10423, "train_loss": 3.5145809650421143, "lr": 0.0003168115288960969, "tps": 14324, "wall": 47692.1} {"step": 10424, "train_loss": 3.4468178749084473, "lr": 0.0003167953772771771, "tps": 14323, "wall": 47697.1} {"step": 10425, "train_loss": 3.4272048473358154, "lr": 0.00031677922456175406, "tps": 14323, "wall": 47702.1} {"step": 10426, "train_loss": 3.4998393058776855, "lr": 0.0003167630707500107, "tps": 14323, "wall": 47707.0} {"step": 10427, "train_loss": 3.516352653503418, "lr": 0.00031674691584213007, "tps": 14323, "wall": 47712.0} {"step": 10428, "train_loss": 3.493694543838501, "lr": 0.00031673075983829513, "tps": 14323, "wall": 47717.0} {"step": 10429, "train_loss": 3.507211208343506, "lr": 0.00031671460273868893, "tps": 14323, "wall": 47721.9} {"step": 10430, "train_loss": 3.4331092834472656, "lr": 0.0003166984445434945, "tps": 14323, "wall": 47726.9} {"step": 10431, "train_loss": 3.435457706451416, "lr": 0.0003166822852528948, "tps": 14323, "wall": 47731.8} {"step": 10432, "train_loss": 3.46974515914917, "lr": 0.000316666124867073, "tps": 14323, "wall": 47736.8} {"step": 10433, "train_loss": 3.5194034576416016, "lr": 0.0003166499633862121, "tps": 14322, "wall": 47741.8} {"step": 10434, "train_loss": 3.454709053039551, "lr": 0.00031663380081049515, "tps": 14322, "wall": 47746.7} {"step": 10435, "train_loss": 3.4776978492736816, "lr": 0.00031661763714010526, "tps": 14322, "wall": 47751.7} {"step": 10436, "train_loss": 3.4545629024505615, "lr": 0.00031660147237522565, "tps": 14322, "wall": 47756.7} {"step": 10437, "train_loss": 3.4679512977600098, "lr": 0.00031658530651603925, "tps": 14322, "wall": 47761.7} {"step": 10438, "train_loss": 3.442077159881592, "lr": 0.00031656913956272926, "tps": 14322, "wall": 47766.6} {"step": 10439, "train_loss": 3.495144844055176, "lr": 0.00031655297151547885, "tps": 14322, "wall": 47771.6} {"step": 10440, "train_loss": 3.5222866535186768, "lr": 0.0003165368023744712, "tps": 14322, "wall": 47776.6} {"step": 10441, "train_loss": 3.600576400756836, "lr": 0.0003165206321398894, "tps": 14322, "wall": 47781.5} {"step": 10442, "train_loss": 3.507577657699585, "lr": 0.0003165044608119166, "tps": 14321, "wall": 47786.5} {"step": 10443, "train_loss": 3.4822447299957275, "lr": 0.0003164882883907362, "tps": 14321, "wall": 47791.4} {"step": 10444, "train_loss": 3.427781581878662, "lr": 0.00031647211487653113, "tps": 14321, "wall": 47796.4} {"step": 10445, "train_loss": 3.604987621307373, "lr": 0.0003164559402694847, "tps": 14321, "wall": 47801.4} {"step": 10446, "train_loss": 3.483872652053833, "lr": 0.0003164397645697803, "tps": 14321, "wall": 47806.3} {"step": 10447, "train_loss": 3.4737648963928223, "lr": 0.00031642358777760087, "tps": 14321, "wall": 47811.3} {"step": 10448, "train_loss": 3.390350341796875, "lr": 0.0003164074098931299, "tps": 14321, "wall": 47816.3} {"step": 10449, "train_loss": 3.404208183288574, "lr": 0.00031639123091655054, "tps": 14321, "wall": 47821.3} {"step": 10450, "train_loss": 3.4743854999542236, "lr": 0.00031637505084804613, "tps": 14320, "wall": 47826.2} {"step": 10451, "train_loss": 3.452033042907715, "lr": 0.00031635886968779995, "tps": 14320, "wall": 47831.2} {"step": 10452, "train_loss": 3.498265504837036, "lr": 0.00031634268743599523, "tps": 14320, "wall": 47836.1} {"step": 10453, "train_loss": 3.541722536087036, "lr": 0.0003163265040928154, "tps": 14320, "wall": 47841.1} {"step": 10454, "train_loss": 3.3841207027435303, "lr": 0.00031631031965844363, "tps": 14320, "wall": 47846.1} {"step": 10455, "train_loss": 3.5362653732299805, "lr": 0.00031629413413306344, "tps": 14320, "wall": 47851.1} {"step": 10456, "train_loss": 3.4948079586029053, "lr": 0.00031627794751685806, "tps": 14320, "wall": 47856.0} {"step": 10457, "train_loss": 3.505758762359619, "lr": 0.0003162617598100109, "tps": 14320, "wall": 47861.0} {"step": 10458, "train_loss": 3.441831111907959, "lr": 0.00031624557101270526, "tps": 14320, "wall": 47866.0} {"step": 10459, "train_loss": 3.5843558311462402, "lr": 0.0003162293811251246, "tps": 14319, "wall": 47870.9} {"step": 10460, "train_loss": 3.4945168495178223, "lr": 0.00031621319014745234, "tps": 14319, "wall": 47876.0} {"step": 10461, "train_loss": 3.4818460941314697, "lr": 0.0003161969980798718, "tps": 14319, "wall": 47880.9} {"step": 10462, "train_loss": 3.6205127239227295, "lr": 0.0003161808049225665, "tps": 14319, "wall": 47885.9} {"step": 10463, "train_loss": 3.428753137588501, "lr": 0.00031616461067571986, "tps": 14319, "wall": 47890.9} {"step": 10464, "train_loss": 3.4452600479125977, "lr": 0.00031614841533951526, "tps": 14319, "wall": 47895.9} {"step": 10465, "train_loss": 3.582545280456543, "lr": 0.0003161322189141362, "tps": 14319, "wall": 47900.9} {"step": 10466, "train_loss": 3.4862751960754395, "lr": 0.0003161160213997662, "tps": 14319, "wall": 47905.8} {"step": 10467, "train_loss": 3.502232074737549, "lr": 0.00031609982279658875, "tps": 14318, "wall": 47910.8} {"step": 10468, "train_loss": 3.4680285453796387, "lr": 0.00031608362310478727, "tps": 14318, "wall": 47915.8} {"step": 10469, "train_loss": 3.506836414337158, "lr": 0.00031606742232454524, "tps": 14318, "wall": 47920.8} {"step": 10470, "train_loss": 3.5013539791107178, "lr": 0.0003160512204560464, "tps": 14318, "wall": 47925.7} {"step": 10471, "train_loss": 3.306546688079834, "lr": 0.000316035017499474, "tps": 14318, "wall": 47930.7} {"step": 10472, "train_loss": 3.5422797203063965, "lr": 0.0003160188134550118, "tps": 14318, "wall": 47935.7} {"step": 10473, "train_loss": 3.4212777614593506, "lr": 0.0003160026083228433, "tps": 14318, "wall": 47940.7} {"step": 10474, "train_loss": 3.486464023590088, "lr": 0.000315986402103152, "tps": 14318, "wall": 47945.7} {"step": 10475, "train_loss": 3.463228940963745, "lr": 0.0003159701947961216, "tps": 14317, "wall": 47950.6} {"step": 10476, "train_loss": 3.527317523956299, "lr": 0.0003159539864019356, "tps": 14317, "wall": 47955.6} {"step": 10477, "train_loss": 3.268925189971924, "lr": 0.0003159377769207776, "tps": 14317, "wall": 47960.5} {"step": 10478, "train_loss": 3.682124137878418, "lr": 0.00031592156635283137, "tps": 14317, "wall": 47965.5} {"step": 10479, "train_loss": 3.496671199798584, "lr": 0.0003159053546982804, "tps": 14317, "wall": 47970.5} {"step": 10480, "train_loss": 3.532553195953369, "lr": 0.00031588914195730845, "tps": 14317, "wall": 47975.4} {"step": 10481, "train_loss": 3.561455488204956, "lr": 0.000315872928130099, "tps": 14317, "wall": 47980.3} {"step": 10482, "train_loss": 3.427945137023926, "lr": 0.0003158567132168359, "tps": 14317, "wall": 47985.3} {"step": 10483, "train_loss": 3.513209819793701, "lr": 0.00031584049721770273, "tps": 14317, "wall": 47990.3} {"step": 10484, "train_loss": 3.4466679096221924, "lr": 0.00031582428013288334, "tps": 14316, "wall": 47995.3} {"step": 10485, "train_loss": 3.422271728515625, "lr": 0.00031580806196256116, "tps": 14316, "wall": 48000.2} {"step": 10486, "train_loss": 3.554516553878784, "lr": 0.00031579184270692014, "tps": 14316, "wall": 48005.2} {"step": 10487, "train_loss": 3.5652220249176025, "lr": 0.00031577562236614404, "tps": 14316, "wall": 48010.2} {"step": 10488, "train_loss": 3.4818060398101807, "lr": 0.0003157594009404164, "tps": 14316, "wall": 48015.2} {"step": 10489, "train_loss": 3.4482812881469727, "lr": 0.00031574317842992107, "tps": 14316, "wall": 48020.1} {"step": 10490, "train_loss": 3.4355316162109375, "lr": 0.0003157269548348419, "tps": 14316, "wall": 48025.1} {"step": 10491, "train_loss": 3.4473907947540283, "lr": 0.0003157107301553626, "tps": 14316, "wall": 48030.0} {"step": 10492, "train_loss": 3.6107301712036133, "lr": 0.0003156945043916669, "tps": 14316, "wall": 48035.0} {"step": 10493, "train_loss": 3.479346990585327, "lr": 0.0003156782775439388, "tps": 14315, "wall": 48040.0} {"step": 10494, "train_loss": 3.4851696491241455, "lr": 0.00031566204961236183, "tps": 14315, "wall": 48044.9} {"step": 10495, "train_loss": 3.414895534515381, "lr": 0.0003156458205971201, "tps": 14315, "wall": 48049.9} {"step": 10496, "train_loss": 3.540060043334961, "lr": 0.00031562959049839735, "tps": 14315, "wall": 48054.9} {"step": 10497, "train_loss": 3.474182605743408, "lr": 0.00031561335931637734, "tps": 14315, "wall": 48059.9} {"step": 10498, "train_loss": 3.411740303039551, "lr": 0.00031559712705124407, "tps": 14315, "wall": 48064.8} {"step": 10499, "train_loss": 3.522235631942749, "lr": 0.0003155808937031814, "tps": 14315, "wall": 48069.8} {"step": 10500, "train_loss": 3.458062171936035, "lr": 0.0003155646592723732, "tps": 14315, "wall": 48074.8} {"step": 10501, "train_loss": 3.4787139892578125, "lr": 0.00031554842375900333, "tps": 14314, "wall": 48079.9} {"step": 10502, "train_loss": 3.386220932006836, "lr": 0.00031553218716325575, "tps": 14314, "wall": 48084.9} {"step": 10503, "train_loss": 3.466763973236084, "lr": 0.00031551594948531436, "tps": 14314, "wall": 48089.9} {"step": 10504, "train_loss": 3.4801716804504395, "lr": 0.0003154997107253632, "tps": 14314, "wall": 48094.9} {"step": 10505, "train_loss": 3.4984683990478516, "lr": 0.0003154834708835861, "tps": 14314, "wall": 48099.8} {"step": 10506, "train_loss": 3.4286835193634033, "lr": 0.0003154672299601671, "tps": 14314, "wall": 48104.8} {"step": 10507, "train_loss": 3.4626567363739014, "lr": 0.0003154509879552901, "tps": 14314, "wall": 48109.8} {"step": 10508, "train_loss": 3.3927605152130127, "lr": 0.0003154347448691392, "tps": 14314, "wall": 48114.7} {"step": 10509, "train_loss": 3.5410194396972656, "lr": 0.0003154185007018984, "tps": 14313, "wall": 48119.8} {"step": 10510, "train_loss": 3.407649278640747, "lr": 0.0003154022554537515, "tps": 14313, "wall": 48124.7} {"step": 10511, "train_loss": 3.500570297241211, "lr": 0.00031538600912488283, "tps": 14313, "wall": 48129.7} {"step": 10512, "train_loss": 3.523132562637329, "lr": 0.00031536976171547625, "tps": 14313, "wall": 48134.7} {"step": 10513, "train_loss": 3.540689468383789, "lr": 0.0003153535132257158, "tps": 14313, "wall": 48139.7} {"step": 10514, "train_loss": 3.5233798027038574, "lr": 0.00031533726365578563, "tps": 14313, "wall": 48144.6} {"step": 10515, "train_loss": 3.4881153106689453, "lr": 0.00031532101300586984, "tps": 14313, "wall": 48149.6} {"step": 10516, "train_loss": 3.4309871196746826, "lr": 0.0003153047612761524, "tps": 14313, "wall": 48154.6} {"step": 10517, "train_loss": 3.545827627182007, "lr": 0.0003152885084668174, "tps": 14313, "wall": 48159.5} {"step": 10518, "train_loss": 3.4906458854675293, "lr": 0.00031527225457804914, "tps": 14312, "wall": 48164.5} {"step": 10519, "train_loss": 3.459521770477295, "lr": 0.00031525599961003165, "tps": 14312, "wall": 48169.4} {"step": 10520, "train_loss": 3.496338129043579, "lr": 0.00031523974356294893, "tps": 14312, "wall": 48174.4} {"step": 10521, "train_loss": 3.53263521194458, "lr": 0.00031522348643698526, "tps": 14312, "wall": 48179.4} {"step": 10522, "train_loss": 3.5095794200897217, "lr": 0.0003152072282323248, "tps": 14312, "wall": 48184.4} {"step": 10523, "train_loss": 3.4367496967315674, "lr": 0.0003151909689491518, "tps": 14312, "wall": 48189.4} {"step": 10524, "train_loss": 3.5374412536621094, "lr": 0.0003151747085876502, "tps": 14312, "wall": 48194.3} {"step": 10525, "train_loss": 3.6191327571868896, "lr": 0.00031515844714800445, "tps": 14312, "wall": 48199.3} {"step": 10526, "train_loss": 3.478362798690796, "lr": 0.0003151421846303986, "tps": 14311, "wall": 48204.2} {"step": 10527, "train_loss": 3.4799273014068604, "lr": 0.000315125921035017, "tps": 14311, "wall": 48209.2} {"step": 10528, "train_loss": 3.5265908241271973, "lr": 0.0003151096563620438, "tps": 14311, "wall": 48214.1} {"step": 10529, "train_loss": 3.37837553024292, "lr": 0.00031509339061166325, "tps": 14311, "wall": 48219.1} {"step": 10530, "train_loss": 3.469400405883789, "lr": 0.0003150771237840596, "tps": 14311, "wall": 48224.1} {"step": 10531, "train_loss": 3.554485321044922, "lr": 0.00031506085587941723, "tps": 14311, "wall": 48229.0} {"step": 10532, "train_loss": 3.4836654663085938, "lr": 0.0003150445868979203, "tps": 14311, "wall": 48234.0} {"step": 10533, "train_loss": 3.42692232131958, "lr": 0.00031502831683975313, "tps": 14311, "wall": 48239.0} {"step": 10534, "train_loss": 3.5008041858673096, "lr": 0.0003150120457051, "tps": 14311, "wall": 48244.0} {"step": 10535, "train_loss": 3.514042615890503, "lr": 0.0003149957734941454, "tps": 14310, "wall": 48248.9} {"step": 10536, "train_loss": 3.5737369060516357, "lr": 0.00031497950020707347, "tps": 14310, "wall": 48253.9} {"step": 10537, "train_loss": 3.5427982807159424, "lr": 0.00031496322584406857, "tps": 14310, "wall": 48258.9} {"step": 10538, "train_loss": 3.525928497314453, "lr": 0.0003149469504053152, "tps": 14310, "wall": 48263.8} {"step": 10539, "train_loss": 3.4669320583343506, "lr": 0.00031493067389099763, "tps": 14310, "wall": 48268.8} {"step": 10540, "train_loss": 3.509885787963867, "lr": 0.0003149143963013002, "tps": 14310, "wall": 48273.7} {"step": 10541, "train_loss": 3.466089963912964, "lr": 0.0003148981176364074, "tps": 14310, "wall": 48278.7} {"step": 10542, "train_loss": 3.5524518489837646, "lr": 0.0003148818378965035, "tps": 14310, "wall": 48283.6} {"step": 10543, "train_loss": 3.5245702266693115, "lr": 0.00031486555708177313, "tps": 14310, "wall": 48288.6} {"step": 10544, "train_loss": 3.4165351390838623, "lr": 0.00031484927519240057, "tps": 14309, "wall": 48293.5} {"step": 10545, "train_loss": 3.527763843536377, "lr": 0.0003148329922285703, "tps": 14309, "wall": 48298.6} {"step": 10546, "train_loss": 3.51641845703125, "lr": 0.0003148167081904667, "tps": 14309, "wall": 48303.5} {"step": 10547, "train_loss": 3.6008501052856445, "lr": 0.0003148004230782743, "tps": 14309, "wall": 48308.5} {"step": 10548, "train_loss": 3.4564599990844727, "lr": 0.00031478413689217763, "tps": 14309, "wall": 48313.4} {"step": 10549, "train_loss": 3.532712697982788, "lr": 0.0003147678496323611, "tps": 14309, "wall": 48318.4} {"step": 10550, "train_loss": 3.4290337562561035, "lr": 0.0003147515612990092, "tps": 14309, "wall": 48323.3} {"step": 10551, "train_loss": 3.5198817253112793, "lr": 0.00031473527189230664, "tps": 14309, "wall": 48328.3} {"step": 10552, "train_loss": 3.4886577129364014, "lr": 0.00031471898141243766, "tps": 14309, "wall": 48333.2} {"step": 10553, "train_loss": 3.517211437225342, "lr": 0.0003147026898595869, "tps": 14308, "wall": 48338.2} {"step": 10554, "train_loss": 3.498704433441162, "lr": 0.00031468639723393905, "tps": 14308, "wall": 48343.1} {"step": 10555, "train_loss": 3.4831695556640625, "lr": 0.0003146701035356786, "tps": 14308, "wall": 48348.1} {"step": 10556, "train_loss": 3.548232078552246, "lr": 0.00031465380876499, "tps": 14308, "wall": 48353.1} {"step": 10557, "train_loss": 3.5215163230895996, "lr": 0.0003146375129220579, "tps": 14308, "wall": 48358.1} {"step": 10558, "train_loss": 3.4326980113983154, "lr": 0.00031462121600706706, "tps": 14308, "wall": 48363.1} {"step": 10559, "train_loss": 3.511522054672241, "lr": 0.0003146049180202019, "tps": 14308, "wall": 48368.0} {"step": 10560, "train_loss": 3.568624258041382, "lr": 0.00031458861896164705, "tps": 14308, "wall": 48373.0} {"step": 10561, "train_loss": 3.418336868286133, "lr": 0.00031457231883158727, "tps": 14307, "wall": 48378.0} {"step": 10562, "train_loss": 3.4389891624450684, "lr": 0.0003145560176302072, "tps": 14307, "wall": 48382.9} {"step": 10563, "train_loss": 3.51572322845459, "lr": 0.00031453971535769134, "tps": 14307, "wall": 48387.9} {"step": 10564, "train_loss": 3.5789847373962402, "lr": 0.00031452341201422453, "tps": 14307, "wall": 48392.8} {"step": 10565, "train_loss": 3.6023683547973633, "lr": 0.0003145071075999914, "tps": 14307, "wall": 48397.7} {"step": 10566, "train_loss": 3.5305333137512207, "lr": 0.00031449080211517664, "tps": 14307, "wall": 48402.7} {"step": 10567, "train_loss": 3.4215731620788574, "lr": 0.00031447449555996494, "tps": 14307, "wall": 48407.6} {"step": 10568, "train_loss": 3.5461509227752686, "lr": 0.0003144581879345411, "tps": 14307, "wall": 48412.6} {"step": 10569, "train_loss": 3.499354362487793, "lr": 0.0003144418792390897, "tps": 14307, "wall": 48417.6} {"step": 10570, "train_loss": 3.467264175415039, "lr": 0.00031442556947379566, "tps": 14306, "wall": 48422.6} {"step": 10571, "train_loss": 3.479597568511963, "lr": 0.0003144092586388436, "tps": 14306, "wall": 48427.5} {"step": 10572, "train_loss": 3.504331588745117, "lr": 0.00031439294673441844, "tps": 14306, "wall": 48432.4} {"step": 10573, "train_loss": 3.5892186164855957, "lr": 0.00031437663376070483, "tps": 14306, "wall": 48437.4} {"step": 10574, "train_loss": 3.530277729034424, "lr": 0.0003143603197178876, "tps": 14306, "wall": 48442.3} {"step": 10575, "train_loss": 3.5459256172180176, "lr": 0.00031434400460615154, "tps": 14306, "wall": 48447.3} {"step": 10576, "train_loss": 3.547091484069824, "lr": 0.0003143276884256815, "tps": 14306, "wall": 48452.2} {"step": 10577, "train_loss": 3.4251646995544434, "lr": 0.00031431137117666233, "tps": 14306, "wall": 48457.2} {"step": 10578, "train_loss": 3.4213664531707764, "lr": 0.00031429505285927883, "tps": 14306, "wall": 48462.1} {"step": 10579, "train_loss": 3.514669179916382, "lr": 0.00031427873347371593, "tps": 14306, "wall": 48467.1} {"step": 10580, "train_loss": 3.458620309829712, "lr": 0.0003142624130201583, "tps": 14305, "wall": 48472.0} {"step": 10581, "train_loss": 3.405139923095703, "lr": 0.00031424609149879103, "tps": 14305, "wall": 48477.0} {"step": 10582, "train_loss": 3.3745267391204834, "lr": 0.0003142297689097989, "tps": 14305, "wall": 48482.0} {"step": 10583, "train_loss": 3.638195514678955, "lr": 0.0003142134452533669, "tps": 14305, "wall": 48486.9} {"step": 10584, "train_loss": 3.5190248489379883, "lr": 0.00031419712052967993, "tps": 14305, "wall": 48491.9} {"step": 10585, "train_loss": 3.414825439453125, "lr": 0.0003141807947389228, "tps": 14305, "wall": 48496.8} {"step": 10586, "train_loss": 3.398045063018799, "lr": 0.0003141644678812806, "tps": 14305, "wall": 48501.7} {"step": 10587, "train_loss": 3.4613733291625977, "lr": 0.00031414813995693817, "tps": 14305, "wall": 48506.7} {"step": 10588, "train_loss": 3.40054988861084, "lr": 0.0003141318109660805, "tps": 14305, "wall": 48511.6} {"step": 10589, "train_loss": 3.447462558746338, "lr": 0.00031411548090889263, "tps": 14304, "wall": 48516.6} {"step": 10590, "train_loss": 3.4667282104492188, "lr": 0.0003140991497855595, "tps": 14304, "wall": 48521.5} {"step": 10591, "train_loss": 3.4735231399536133, "lr": 0.0003140828175962661, "tps": 14304, "wall": 48526.5} {"step": 10592, "train_loss": 3.4319567680358887, "lr": 0.0003140664843411974, "tps": 14304, "wall": 48531.4} {"step": 10593, "train_loss": 3.47855281829834, "lr": 0.00031405015002053854, "tps": 14304, "wall": 48536.4} {"step": 10594, "train_loss": 3.5330467224121094, "lr": 0.0003140338146344745, "tps": 14304, "wall": 48541.4} {"step": 10595, "train_loss": 3.42086124420166, "lr": 0.0003140174781831903, "tps": 14304, "wall": 48546.3} {"step": 10596, "train_loss": 3.398080825805664, "lr": 0.000314001140666871, "tps": 14304, "wall": 48551.3} {"step": 10597, "train_loss": 3.5369598865509033, "lr": 0.00031398480208570174, "tps": 14304, "wall": 48556.2} {"step": 10598, "train_loss": 3.435044288635254, "lr": 0.0003139684624398675, "tps": 14303, "wall": 48561.2} {"step": 10599, "train_loss": 3.5158309936523438, "lr": 0.00031395212172955346, "tps": 14303, "wall": 48566.1} {"step": 10600, "train_loss": 3.5179011821746826, "lr": 0.0003139357799549447, "tps": 14303, "wall": 48571.1} {"step": 10601, "train_loss": 3.545414924621582, "lr": 0.00031391943711622637, "tps": 14303, "wall": 48576.0} {"step": 10602, "train_loss": 3.47837495803833, "lr": 0.00031390309321358353, "tps": 14303, "wall": 48581.0} {"step": 10603, "train_loss": 3.6077821254730225, "lr": 0.0003138867482472014, "tps": 14303, "wall": 48586.0} {"step": 10604, "train_loss": 3.4986534118652344, "lr": 0.00031387040221726514, "tps": 14303, "wall": 48590.9} {"step": 10605, "train_loss": 3.463660478591919, "lr": 0.0003138540551239598, "tps": 14303, "wall": 48595.9} {"step": 10606, "train_loss": 3.5124239921569824, "lr": 0.0003138377069674707, "tps": 14303, "wall": 48600.9} {"step": 10607, "train_loss": 3.412644147872925, "lr": 0.0003138213577479829, "tps": 14302, "wall": 48605.9} {"step": 10608, "train_loss": 3.6096465587615967, "lr": 0.00031380500746568184, "tps": 14302, "wall": 48610.8} {"step": 10609, "train_loss": 3.464294195175171, "lr": 0.00031378865612075247, "tps": 14302, "wall": 48615.8} {"step": 10610, "train_loss": 3.535971164703369, "lr": 0.00031377230371338016, "tps": 14302, "wall": 48620.8} {"step": 10611, "train_loss": 3.5601892471313477, "lr": 0.00031375595024375004, "tps": 14302, "wall": 48625.7} {"step": 10612, "train_loss": 3.577247381210327, "lr": 0.00031373959571204756, "tps": 14302, "wall": 48630.7} {"step": 10613, "train_loss": 3.5042057037353516, "lr": 0.00031372324011845785, "tps": 14302, "wall": 48635.7} {"step": 10614, "train_loss": 3.368323802947998, "lr": 0.0003137068834631662, "tps": 14302, "wall": 48640.7} {"step": 10615, "train_loss": 3.4591784477233887, "lr": 0.00031369052574635784, "tps": 14301, "wall": 48645.7} {"step": 10616, "train_loss": 3.6054916381835938, "lr": 0.00031367416696821823, "tps": 14301, "wall": 48650.7} {"step": 10617, "train_loss": 3.413577079772949, "lr": 0.00031365780712893255, "tps": 14301, "wall": 48655.7} {"step": 10618, "train_loss": 3.5971221923828125, "lr": 0.00031364144622868614, "tps": 14301, "wall": 48660.7} {"step": 10619, "train_loss": 3.5420000553131104, "lr": 0.00031362508426766435, "tps": 14301, "wall": 48665.7} {"step": 10620, "train_loss": 3.4475460052490234, "lr": 0.0003136087212460526, "tps": 14301, "wall": 48670.7} {"step": 10621, "train_loss": 3.542088508605957, "lr": 0.00031359235716403616, "tps": 14301, "wall": 48675.7} {"step": 10622, "train_loss": 3.549820899963379, "lr": 0.0003135759920218004, "tps": 14301, "wall": 48680.6} {"step": 10623, "train_loss": 3.4470252990722656, "lr": 0.0003135596258195308, "tps": 14301, "wall": 48685.6} {"step": 10624, "train_loss": 3.4112133979797363, "lr": 0.0003135432585574126, "tps": 14300, "wall": 48690.6} {"step": 10625, "train_loss": 3.5445685386657715, "lr": 0.0003135268902356314, "tps": 14300, "wall": 48695.5} {"step": 10626, "train_loss": 3.465564727783203, "lr": 0.0003135105208543725, "tps": 14300, "wall": 48700.5} {"step": 10627, "train_loss": 3.521078109741211, "lr": 0.0003134941504138214, "tps": 14300, "wall": 48705.5} {"step": 10628, "train_loss": 3.5924243927001953, "lr": 0.00031347777891416347, "tps": 14300, "wall": 48710.5} {"step": 10629, "train_loss": 3.392270088195801, "lr": 0.00031346140635558423, "tps": 14300, "wall": 48715.6} {"step": 10630, "train_loss": 3.6296582221984863, "lr": 0.0003134450327382691, "tps": 14300, "wall": 48720.5} {"step": 10631, "train_loss": 3.5521905422210693, "lr": 0.00031342865806240354, "tps": 14300, "wall": 48725.6} {"step": 10632, "train_loss": 3.44110107421875, "lr": 0.00031341228232817316, "tps": 14299, "wall": 48730.6} {"step": 10633, "train_loss": 3.3898258209228516, "lr": 0.00031339590553576335, "tps": 14299, "wall": 48735.6} {"step": 10634, "train_loss": 3.463230609893799, "lr": 0.0003133795276853597, "tps": 14299, "wall": 48740.6} {"step": 10635, "train_loss": 3.422739267349243, "lr": 0.0003133631487771476, "tps": 14299, "wall": 48745.6} {"step": 10636, "train_loss": 3.4544484615325928, "lr": 0.0003133467688113128, "tps": 14299, "wall": 48750.6} {"step": 10637, "train_loss": 3.443033456802368, "lr": 0.00031333038778804084, "tps": 14299, "wall": 48755.6} {"step": 10638, "train_loss": 3.5291905403137207, "lr": 0.00031331400570751706, "tps": 14299, "wall": 48760.6} {"step": 10639, "train_loss": 3.624408483505249, "lr": 0.0003132976225699272, "tps": 14299, "wall": 48765.6} {"step": 10640, "train_loss": 3.46916127204895, "lr": 0.0003132812383754568, "tps": 14298, "wall": 48770.6} {"step": 10641, "train_loss": 3.597761392593384, "lr": 0.00031326485312429154, "tps": 14298, "wall": 48775.7} {"step": 10642, "train_loss": 3.6666531562805176, "lr": 0.000313248466816617, "tps": 14298, "wall": 48780.7} {"step": 10643, "train_loss": 3.514294147491455, "lr": 0.0003132320794526187, "tps": 14298, "wall": 48785.7} {"step": 10644, "train_loss": 3.3231687545776367, "lr": 0.0003132156910324824, "tps": 14298, "wall": 48790.7} {"step": 10645, "train_loss": 3.543670654296875, "lr": 0.00031319930155639374, "tps": 14298, "wall": 48795.8} {"step": 10646, "train_loss": 3.4721474647521973, "lr": 0.0003131829110245383, "tps": 14298, "wall": 48800.8} {"step": 10647, "train_loss": 3.4765453338623047, "lr": 0.00031316651943710187, "tps": 14298, "wall": 48805.9} {"step": 10648, "train_loss": 3.5627920627593994, "lr": 0.00031315012679426996, "tps": 14297, "wall": 48810.9} {"step": 10649, "train_loss": 3.433562755584717, "lr": 0.00031313373309622847, "tps": 14297, "wall": 48815.9} {"step": 10650, "train_loss": 3.469660758972168, "lr": 0.00031311733834316297, "tps": 14297, "wall": 48820.9} {"step": 10651, "train_loss": 3.54276442527771, "lr": 0.0003131009425352593, "tps": 14297, "wall": 48826.0} {"step": 10652, "train_loss": 3.448512554168701, "lr": 0.000313084545672703, "tps": 14297, "wall": 48831.0} {"step": 10653, "train_loss": 3.5964083671569824, "lr": 0.00031306814775568, "tps": 14297, "wall": 48836.1} {"step": 10654, "train_loss": 3.483839511871338, "lr": 0.00031305174878437593, "tps": 14297, "wall": 48841.1} {"step": 10655, "train_loss": 3.4548959732055664, "lr": 0.0003130353487589767, "tps": 14296, "wall": 48846.1} {"step": 10656, "train_loss": 3.4705588817596436, "lr": 0.00031301894767966795, "tps": 14296, "wall": 48851.1} {"step": 10657, "train_loss": 3.5689749717712402, "lr": 0.0003130025455466356, "tps": 14296, "wall": 48856.2} {"step": 10658, "train_loss": 3.5335562229156494, "lr": 0.0003129861423600653, "tps": 14296, "wall": 48861.2} {"step": 10659, "train_loss": 3.4482688903808594, "lr": 0.000312969738120143, "tps": 14296, "wall": 48866.3} {"step": 10660, "train_loss": 3.4402003288269043, "lr": 0.0003129533328270544, "tps": 14296, "wall": 48871.3} {"step": 10661, "train_loss": 3.5000762939453125, "lr": 0.0003129369264809855, "tps": 14296, "wall": 48876.4} {"step": 10662, "train_loss": 3.5532875061035156, "lr": 0.00031292051908212207, "tps": 14296, "wall": 48881.4} {"step": 10663, "train_loss": 3.494518518447876, "lr": 0.00031290411063064985, "tps": 14295, "wall": 48886.4} {"step": 10664, "train_loss": 3.618445634841919, "lr": 0.00031288770112675494, "tps": 14295, "wall": 48891.5} {"step": 10665, "train_loss": 3.4626946449279785, "lr": 0.0003128712905706231, "tps": 14295, "wall": 48896.6} {"step": 10666, "train_loss": 3.442664623260498, "lr": 0.00031285487896244026, "tps": 14295, "wall": 48901.7} {"step": 10667, "train_loss": 3.456149101257324, "lr": 0.00031283846630239233, "tps": 14295, "wall": 48906.7} {"step": 10668, "train_loss": 3.46090030670166, "lr": 0.00031282205259066526, "tps": 14295, "wall": 48911.8} {"step": 10669, "train_loss": 3.4722416400909424, "lr": 0.000312805637827445, "tps": 14295, "wall": 48916.8} {"step": 10670, "train_loss": 3.5597519874572754, "lr": 0.00031278922201291733, "tps": 14294, "wall": 48921.8} {"step": 10671, "train_loss": 3.4671053886413574, "lr": 0.00031277280514726836, "tps": 14294, "wall": 48926.9} {"step": 10672, "train_loss": 3.588399887084961, "lr": 0.0003127563872306841, "tps": 14294, "wall": 48931.9} {"step": 10673, "train_loss": 3.4762730598449707, "lr": 0.0003127399682633504, "tps": 14294, "wall": 48937.0} {"step": 10674, "train_loss": 3.527562141418457, "lr": 0.0003127235482454534, "tps": 14294, "wall": 48942.0} {"step": 10675, "train_loss": 3.437621831893921, "lr": 0.00031270712717717907, "tps": 14294, "wall": 48947.1} {"step": 10676, "train_loss": 3.59700870513916, "lr": 0.0003126907050587132, "tps": 14294, "wall": 48952.1} {"step": 10677, "train_loss": 3.493912935256958, "lr": 0.00031267428189024214, "tps": 14293, "wall": 48957.2} {"step": 10678, "train_loss": 3.479024887084961, "lr": 0.0003126578576719518, "tps": 14293, "wall": 48962.3} {"step": 10679, "train_loss": 3.459364891052246, "lr": 0.00031264143240402817, "tps": 14293, "wall": 48967.3} {"step": 10680, "train_loss": 3.503891944885254, "lr": 0.00031262500608665746, "tps": 14293, "wall": 48972.4} {"step": 10681, "train_loss": 3.505380868911743, "lr": 0.0003126085787200256, "tps": 14293, "wall": 48977.4} {"step": 10682, "train_loss": 3.504606008529663, "lr": 0.0003125921503043188, "tps": 14293, "wall": 48982.5} {"step": 10683, "train_loss": 3.5061147212982178, "lr": 0.00031257572083972303, "tps": 14293, "wall": 48987.5} {"step": 10684, "train_loss": 3.5400075912475586, "lr": 0.0003125592903264246, "tps": 14293, "wall": 48992.6} {"step": 10685, "train_loss": 3.592916965484619, "lr": 0.00031254285876460946, "tps": 14292, "wall": 48997.7} {"step": 10686, "train_loss": 3.445972204208374, "lr": 0.0003125264261544638, "tps": 14292, "wall": 49002.7} {"step": 10687, "train_loss": 3.5339879989624023, "lr": 0.00031250999249617383, "tps": 14292, "wall": 49007.8} {"step": 10688, "train_loss": 3.5236291885375977, "lr": 0.00031249355778992564, "tps": 14292, "wall": 49012.8} {"step": 10689, "train_loss": 3.511803388595581, "lr": 0.0003124771220359054, "tps": 14292, "wall": 49018.0} {"step": 10690, "train_loss": 3.523782253265381, "lr": 0.00031246068523429934, "tps": 14292, "wall": 49023.0} {"step": 10691, "train_loss": 3.549018144607544, "lr": 0.0003124442473852936, "tps": 14292, "wall": 49028.1} {"step": 10692, "train_loss": 3.5252394676208496, "lr": 0.0003124278084890745, "tps": 14291, "wall": 49033.2} {"step": 10693, "train_loss": 3.475485324859619, "lr": 0.00031241136854582815, "tps": 14291, "wall": 49038.3} {"step": 10694, "train_loss": 3.4805407524108887, "lr": 0.0003123949275557408, "tps": 14291, "wall": 49043.4} {"step": 10695, "train_loss": 3.4796030521392822, "lr": 0.0003123784855189987, "tps": 14291, "wall": 49048.4} {"step": 10696, "train_loss": 3.4775571823120117, "lr": 0.0003123620424357881, "tps": 14291, "wall": 49053.5} {"step": 10697, "train_loss": 3.430835723876953, "lr": 0.00031234559830629535, "tps": 14291, "wall": 49058.6} {"step": 10698, "train_loss": 3.452866554260254, "lr": 0.0003123291531307067, "tps": 14291, "wall": 49063.7} {"step": 10699, "train_loss": 3.5607335567474365, "lr": 0.0003123127069092083, "tps": 14290, "wall": 49068.7} {"step": 10700, "train_loss": 3.4879989624023438, "lr": 0.0003122962596419866, "tps": 14290, "wall": 49073.8} {"step": 10701, "train_loss": 3.4936575889587402, "lr": 0.00031227981132922786, "tps": 14290, "wall": 49079.0} {"step": 10702, "train_loss": 3.66029691696167, "lr": 0.00031226336197111846, "tps": 14290, "wall": 49084.0} {"step": 10703, "train_loss": 3.468986988067627, "lr": 0.0003122469115678447, "tps": 14290, "wall": 49089.1} {"step": 10704, "train_loss": 3.447988510131836, "lr": 0.0003122304601195929, "tps": 14290, "wall": 49094.2} {"step": 10705, "train_loss": 3.545736789703369, "lr": 0.0003122140076265495, "tps": 14289, "wall": 49099.3} {"step": 10706, "train_loss": 3.520946502685547, "lr": 0.00031219755408890085, "tps": 14289, "wall": 49104.4} {"step": 10707, "train_loss": 3.414477586746216, "lr": 0.0003121810995068333, "tps": 14289, "wall": 49109.5} {"step": 10708, "train_loss": 3.487529993057251, "lr": 0.00031216464388053323, "tps": 14289, "wall": 49114.6} {"step": 10709, "train_loss": 3.480623245239258, "lr": 0.0003121481872101871, "tps": 14289, "wall": 49119.7} {"step": 10710, "train_loss": 3.536639928817749, "lr": 0.00031213172949598136, "tps": 14289, "wall": 49124.8} {"step": 10711, "train_loss": 3.579047679901123, "lr": 0.00031211527073810236, "tps": 14289, "wall": 49129.9} {"step": 10712, "train_loss": 3.57999324798584, "lr": 0.00031209881093673667, "tps": 14288, "wall": 49134.9} {"step": 10713, "train_loss": 3.546621322631836, "lr": 0.0003120823500920706, "tps": 14288, "wall": 49140.1} {"step": 10714, "train_loss": 3.438920021057129, "lr": 0.0003120658882042907, "tps": 14288, "wall": 49145.2} {"step": 10715, "train_loss": 3.5715110301971436, "lr": 0.00031204942527358345, "tps": 14288, "wall": 49150.3} {"step": 10716, "train_loss": 3.3515610694885254, "lr": 0.0003120329613001353, "tps": 14288, "wall": 49155.4} {"step": 10717, "train_loss": 3.4972195625305176, "lr": 0.00031201649628413274, "tps": 14288, "wall": 49160.5} {"step": 10718, "train_loss": 3.387272357940674, "lr": 0.0003120000302257624, "tps": 14288, "wall": 49165.5} {"step": 10719, "train_loss": 3.4700849056243896, "lr": 0.0003119835631252108, "tps": 14287, "wall": 49170.6} {"step": 10720, "train_loss": 3.424304485321045, "lr": 0.00031196709498266433, "tps": 14287, "wall": 49175.7} {"step": 10721, "train_loss": 3.4533309936523438, "lr": 0.0003119506257983097, "tps": 14287, "wall": 49180.8} {"step": 10722, "train_loss": 3.4827585220336914, "lr": 0.0003119341555723333, "tps": 14287, "wall": 49185.9} {"step": 10723, "train_loss": 3.5767126083374023, "lr": 0.00031191768430492185, "tps": 14287, "wall": 49191.0} {"step": 10724, "train_loss": 3.5264201164245605, "lr": 0.00031190121199626197, "tps": 14287, "wall": 49196.1} {"step": 10725, "train_loss": 3.568819284439087, "lr": 0.00031188473864654016, "tps": 14287, "wall": 49201.2} {"step": 10726, "train_loss": 3.4373841285705566, "lr": 0.00031186826425594306, "tps": 14286, "wall": 49206.3} {"step": 10727, "train_loss": 3.512524366378784, "lr": 0.0003118517888246572, "tps": 14286, "wall": 49211.4} {"step": 10728, "train_loss": 3.521082878112793, "lr": 0.0003118353123528694, "tps": 14286, "wall": 49216.4} {"step": 10729, "train_loss": 3.350492477416992, "lr": 0.0003118188348407662, "tps": 14286, "wall": 49221.5} {"step": 10730, "train_loss": 3.4353528022766113, "lr": 0.00031180235628853423, "tps": 14286, "wall": 49226.6} {"step": 10731, "train_loss": 3.535869836807251, "lr": 0.0003117858766963603, "tps": 14286, "wall": 49231.7} {"step": 10732, "train_loss": 3.540365695953369, "lr": 0.00031176939606443097, "tps": 14286, "wall": 49236.8} {"step": 10733, "train_loss": 3.4460182189941406, "lr": 0.0003117529143929329, "tps": 14285, "wall": 49241.9} {"step": 10734, "train_loss": 3.564682960510254, "lr": 0.00031173643168205285, "tps": 14285, "wall": 49247.0} {"step": 10735, "train_loss": 3.346324920654297, "lr": 0.00031171994793197756, "tps": 14285, "wall": 49252.1} {"step": 10736, "train_loss": 3.4463894367218018, "lr": 0.0003117034631428937, "tps": 14285, "wall": 49257.2} {"step": 10737, "train_loss": 3.4591739177703857, "lr": 0.0003116869773149881, "tps": 14285, "wall": 49262.3} {"step": 10738, "train_loss": 3.481799364089966, "lr": 0.00031167049044844743, "tps": 14285, "wall": 49267.4} {"step": 10739, "train_loss": 3.487182855606079, "lr": 0.0003116540025434585, "tps": 14284, "wall": 49272.5} {"step": 10740, "train_loss": 3.5034449100494385, "lr": 0.0003116375136002081, "tps": 14284, "wall": 49277.6} {"step": 10741, "train_loss": 3.53935170173645, "lr": 0.000311621023618883, "tps": 14284, "wall": 49282.6} {"step": 10742, "train_loss": 3.4875941276550293, "lr": 0.0003116045325996699, "tps": 14284, "wall": 49287.8} {"step": 10743, "train_loss": 3.4501850605010986, "lr": 0.0003115880405427558, "tps": 14284, "wall": 49292.8} {"step": 10744, "train_loss": 3.3489696979522705, "lr": 0.0003115715474483274, "tps": 14284, "wall": 49297.9} {"step": 10745, "train_loss": 3.4999728202819824, "lr": 0.00031155505331657146, "tps": 14284, "wall": 49303.0} {"step": 10746, "train_loss": 3.581976890563965, "lr": 0.0003115385581476751, "tps": 14283, "wall": 49308.1} {"step": 10747, "train_loss": 3.450763463973999, "lr": 0.00031152206194182483, "tps": 14283, "wall": 49313.1} {"step": 10748, "train_loss": 3.464141845703125, "lr": 0.00031150556469920776, "tps": 14283, "wall": 49318.3} {"step": 10749, "train_loss": 3.442620277404785, "lr": 0.00031148906642001063, "tps": 14283, "wall": 49323.3} {"step": 10750, "train_loss": 3.538572311401367, "lr": 0.00031147256710442053, "tps": 14283, "wall": 49328.4} {"step": 10751, "train_loss": 3.623319149017334, "lr": 0.0003114560667526242, "tps": 14283, "wall": 49333.5} {"step": 10752, "train_loss": 3.5506930351257324, "lr": 0.0003114395653648085, "tps": 14283, "wall": 49338.6} {"step": 10753, "train_loss": 3.523334503173828, "lr": 0.00031142306294116055, "tps": 14282, "wall": 49343.7} {"step": 10754, "train_loss": 3.5309553146362305, "lr": 0.0003114065594818672, "tps": 14282, "wall": 49348.7} {"step": 10755, "train_loss": 3.5953776836395264, "lr": 0.0003113900549871154, "tps": 14282, "wall": 49353.8} {"step": 10756, "train_loss": 3.398407459259033, "lr": 0.0003113735494570921, "tps": 14282, "wall": 49358.9} {"step": 10757, "train_loss": 3.465127944946289, "lr": 0.00031135704289198424, "tps": 14282, "wall": 49363.9} {"step": 10758, "train_loss": 3.342451333999634, "lr": 0.00031134053529197894, "tps": 14282, "wall": 49369.0} {"step": 10759, "train_loss": 3.5290932655334473, "lr": 0.00031132402665726307, "tps": 14282, "wall": 49374.1} {"step": 10760, "train_loss": 3.414712905883789, "lr": 0.0003113075169880237, "tps": 14281, "wall": 49379.3} {"step": 10761, "train_loss": 3.4200332164764404, "lr": 0.00031129100628444784, "tps": 14281, "wall": 49384.3} {"step": 10762, "train_loss": 3.520780324935913, "lr": 0.0003112744945467225, "tps": 14281, "wall": 49389.4} {"step": 10763, "train_loss": 3.496333122253418, "lr": 0.00031125798177503476, "tps": 14281, "wall": 49394.5} {"step": 10764, "train_loss": 3.5173470973968506, "lr": 0.00031124146796957165, "tps": 14281, "wall": 49399.6} {"step": 10765, "train_loss": 3.5882582664489746, "lr": 0.00031122495313052023, "tps": 14281, "wall": 49404.7} {"step": 10766, "train_loss": 3.636577606201172, "lr": 0.0003112084372580677, "tps": 14281, "wall": 49409.8} {"step": 10767, "train_loss": 3.5683813095092773, "lr": 0.000311191920352401, "tps": 14280, "wall": 49414.9} {"step": 10768, "train_loss": 3.4349660873413086, "lr": 0.0003111754024137073, "tps": 14280, "wall": 49420.0} {"step": 10769, "train_loss": 3.5292434692382812, "lr": 0.00031115888344217366, "tps": 14280, "wall": 49425.0} {"step": 10770, "train_loss": 3.4860970973968506, "lr": 0.00031114236343798737, "tps": 14280, "wall": 49430.1} {"step": 10771, "train_loss": 3.458578586578369, "lr": 0.00031112584240133536, "tps": 14280, "wall": 49435.2} {"step": 10772, "train_loss": 3.5665643215179443, "lr": 0.00031110932033240487, "tps": 14280, "wall": 49440.3} {"step": 10773, "train_loss": 3.5390682220458984, "lr": 0.00031109279723138313, "tps": 14280, "wall": 49445.4} {"step": 10774, "train_loss": 3.4590229988098145, "lr": 0.00031107627309845723, "tps": 14279, "wall": 49450.5} {"step": 10775, "train_loss": 3.401022434234619, "lr": 0.00031105974793381436, "tps": 14279, "wall": 49455.6} {"step": 10776, "train_loss": 3.4860293865203857, "lr": 0.00031104322173764175, "tps": 14279, "wall": 49460.7} {"step": 10777, "train_loss": 3.415567636489868, "lr": 0.00031102669451012665, "tps": 14279, "wall": 49465.7} {"step": 10778, "train_loss": 3.4833788871765137, "lr": 0.0003110101662514562, "tps": 14279, "wall": 49470.8} {"step": 10779, "train_loss": 3.4902243614196777, "lr": 0.0003109936369618176, "tps": 14279, "wall": 49475.9} {"step": 10780, "train_loss": 3.500877857208252, "lr": 0.00031097710664139823, "tps": 14279, "wall": 49481.0} {"step": 10781, "train_loss": 3.4198877811431885, "lr": 0.0003109605752903853, "tps": 14278, "wall": 49486.1} {"step": 10782, "train_loss": 3.562476396560669, "lr": 0.00031094404290896594, "tps": 14278, "wall": 49491.2} {"step": 10783, "train_loss": 3.451681613922119, "lr": 0.0003109275094973277, "tps": 14278, "wall": 49496.3} {"step": 10784, "train_loss": 3.3698835372924805, "lr": 0.00031091097505565754, "tps": 14278, "wall": 49501.4} {"step": 10785, "train_loss": 3.553025245666504, "lr": 0.00031089443958414305, "tps": 14278, "wall": 49506.5} {"step": 10786, "train_loss": 3.4860243797302246, "lr": 0.0003108779030829714, "tps": 14278, "wall": 49511.5} {"step": 10787, "train_loss": 3.5042905807495117, "lr": 0.00031086136555232995, "tps": 14278, "wall": 49516.6} {"step": 10788, "train_loss": 3.552227258682251, "lr": 0.00031084482699240604, "tps": 14277, "wall": 49521.7} {"step": 10789, "train_loss": 3.5269570350646973, "lr": 0.00031082828740338703, "tps": 14277, "wall": 49526.8} {"step": 10790, "train_loss": 3.4947025775909424, "lr": 0.0003108117467854602, "tps": 14277, "wall": 49531.8} {"step": 10791, "train_loss": 3.4761252403259277, "lr": 0.00031079520513881305, "tps": 14277, "wall": 49536.9} {"step": 10792, "train_loss": 3.511540174484253, "lr": 0.0003107786624636329, "tps": 14277, "wall": 49542.0} {"step": 10793, "train_loss": 3.429250955581665, "lr": 0.0003107621187601072, "tps": 14277, "wall": 49547.0} {"step": 10794, "train_loss": 3.511207103729248, "lr": 0.0003107455740284232, "tps": 14277, "wall": 49552.1} {"step": 10795, "train_loss": 3.4130239486694336, "lr": 0.00031072902826876844, "tps": 14276, "wall": 49557.2} {"step": 10796, "train_loss": 3.557211399078369, "lr": 0.0003107124814813304, "tps": 14276, "wall": 49562.3} {"step": 10797, "train_loss": 3.4184064865112305, "lr": 0.00031069593366629645, "tps": 14276, "wall": 49567.4} {"step": 10798, "train_loss": 3.4529361724853516, "lr": 0.000310679384823854, "tps": 14276, "wall": 49572.5} {"step": 10799, "train_loss": 3.3775439262390137, "lr": 0.00031066283495419065, "tps": 14276, "wall": 49577.6} {"step": 10800, "train_loss": 3.562943458557129, "lr": 0.00031064628405749376, "tps": 14276, "wall": 49582.6} {"step": 10801, "train_loss": 3.393695831298828, "lr": 0.0003106297321339509, "tps": 14276, "wall": 49587.7} {"step": 10802, "train_loss": 3.457695960998535, "lr": 0.0003106131791837495, "tps": 14275, "wall": 49592.8} {"step": 10803, "train_loss": 3.4318127632141113, "lr": 0.0003105966252070771, "tps": 14275, "wall": 49597.9} {"step": 10804, "train_loss": 3.466939926147461, "lr": 0.00031058007020412124, "tps": 14275, "wall": 49602.9} {"step": 10805, "train_loss": 3.4605612754821777, "lr": 0.0003105635141750694, "tps": 14275, "wall": 49608.0} {"step": 10806, "train_loss": 3.4862353801727295, "lr": 0.00031054695712010917, "tps": 14275, "wall": 49613.1} {"step": 10807, "train_loss": 3.487846851348877, "lr": 0.0003105303990394282, "tps": 14275, "wall": 49618.2} {"step": 10808, "train_loss": 3.4977993965148926, "lr": 0.00031051383993321386, "tps": 14275, "wall": 49623.3} {"step": 10809, "train_loss": 3.5436713695526123, "lr": 0.0003104972798016539, "tps": 14274, "wall": 49628.4} {"step": 10810, "train_loss": 3.4142441749572754, "lr": 0.00031048071864493595, "tps": 14274, "wall": 49633.5} {"step": 10811, "train_loss": 3.545413017272949, "lr": 0.0003104641564632474, "tps": 14274, "wall": 49638.6} {"step": 10812, "train_loss": 3.535419464111328, "lr": 0.000310447593256776, "tps": 14274, "wall": 49643.6} {"step": 10813, "train_loss": 3.4837770462036133, "lr": 0.0003104310290257094, "tps": 14274, "wall": 49648.7} {"step": 10814, "train_loss": 3.5641026496887207, "lr": 0.0003104144637702353, "tps": 14274, "wall": 49653.8} {"step": 10815, "train_loss": 3.473261833190918, "lr": 0.00031039789749054116, "tps": 14274, "wall": 49658.9} {"step": 10816, "train_loss": 3.526174783706665, "lr": 0.0003103813301868147, "tps": 14274, "wall": 49663.9} {"step": 10817, "train_loss": 3.5454938411712646, "lr": 0.0003103647618592438, "tps": 14273, "wall": 49669.0} {"step": 10818, "train_loss": 3.5073606967926025, "lr": 0.0003103481925080158, "tps": 14273, "wall": 49674.1} {"step": 10819, "train_loss": 3.4807963371276855, "lr": 0.0003103316221333187, "tps": 14273, "wall": 49679.2} {"step": 10820, "train_loss": 3.4716076850891113, "lr": 0.0003103150507353401, "tps": 14273, "wall": 49684.3} {"step": 10821, "train_loss": 3.5048294067382812, "lr": 0.00031029847831426767, "tps": 14273, "wall": 49689.4} {"step": 10822, "train_loss": 3.5331509113311768, "lr": 0.00031028190487028925, "tps": 14273, "wall": 49694.4} {"step": 10823, "train_loss": 3.4322705268859863, "lr": 0.00031026533040359245, "tps": 14272, "wall": 49699.6} {"step": 10824, "train_loss": 3.501796007156372, "lr": 0.0003102487549143652, "tps": 14272, "wall": 49704.7} {"step": 10825, "train_loss": 3.4881038665771484, "lr": 0.00031023217840279516, "tps": 14272, "wall": 49709.8} {"step": 10826, "train_loss": 3.491316795349121, "lr": 0.0003102156008690701, "tps": 14272, "wall": 49714.8} {"step": 10827, "train_loss": 3.484773635864258, "lr": 0.00031019902231337775, "tps": 14272, "wall": 49719.9} {"step": 10828, "train_loss": 3.4291610717773438, "lr": 0.0003101824427359061, "tps": 14272, "wall": 49725.0} {"step": 10829, "train_loss": 3.357877731323242, "lr": 0.0003101658621368428, "tps": 14272, "wall": 49730.0} {"step": 10830, "train_loss": 3.46958327293396, "lr": 0.00031014928051637577, "tps": 14272, "wall": 49735.1} {"step": 10831, "train_loss": 3.3968327045440674, "lr": 0.00031013269787469284, "tps": 14271, "wall": 49740.2} {"step": 10832, "train_loss": 3.4676434993743896, "lr": 0.00031011611421198176, "tps": 14271, "wall": 49745.3} {"step": 10833, "train_loss": 3.5681145191192627, "lr": 0.0003100995295284305, "tps": 14271, "wall": 49750.4} {"step": 10834, "train_loss": 3.3975870609283447, "lr": 0.0003100829438242269, "tps": 14271, "wall": 49755.5} {"step": 10835, "train_loss": 3.4903690814971924, "lr": 0.00031006635709955886, "tps": 14271, "wall": 49760.5} {"step": 10836, "train_loss": 3.506829261779785, "lr": 0.0003100497693546142, "tps": 14271, "wall": 49765.6} {"step": 10837, "train_loss": 3.4929208755493164, "lr": 0.00031003318058958086, "tps": 14271, "wall": 49770.7} {"step": 10838, "train_loss": 3.386260509490967, "lr": 0.0003100165908046469, "tps": 14270, "wall": 49775.7} {"step": 10839, "train_loss": 3.468337059020996, "lr": 0.00031, "tps": 14270, "wall": 49780.8} {"step": 10840, "train_loss": 3.5554282665252686, "lr": 0.0003099834081758283, "tps": 14270, "wall": 49785.9} {"step": 10841, "train_loss": 3.4920806884765625, "lr": 0.0003099668153323197, "tps": 14270, "wall": 49791.0} {"step": 10842, "train_loss": 3.447206974029541, "lr": 0.00030995022146966213, "tps": 14270, "wall": 49796.2} {"step": 10843, "train_loss": 3.5309643745422363, "lr": 0.0003099336265880435, "tps": 14270, "wall": 49801.2} {"step": 10844, "train_loss": 3.5520381927490234, "lr": 0.000309917030687652, "tps": 14270, "wall": 49806.3} {"step": 10845, "train_loss": 3.548243761062622, "lr": 0.0003099004337686755, "tps": 14269, "wall": 49811.3} {"step": 10846, "train_loss": 3.475794792175293, "lr": 0.00030988383583130196, "tps": 14269, "wall": 49816.4} {"step": 10847, "train_loss": 3.3830068111419678, "lr": 0.00030986723687571947, "tps": 14269, "wall": 49821.5} {"step": 10848, "train_loss": 3.51821231842041, "lr": 0.0003098506369021162, "tps": 14269, "wall": 49826.5} {"step": 10849, "train_loss": 3.581782341003418, "lr": 0.00030983403591067985, "tps": 14269, "wall": 49831.6} {"step": 10850, "train_loss": 3.5180444717407227, "lr": 0.0003098174339015988, "tps": 14269, "wall": 49836.7} {"step": 10851, "train_loss": 3.455284595489502, "lr": 0.00030980083087506097, "tps": 14269, "wall": 49841.8} {"step": 10852, "train_loss": 3.418492317199707, "lr": 0.0003097842268312545, "tps": 14268, "wall": 49846.9} {"step": 10853, "train_loss": 3.4926390647888184, "lr": 0.00030976762177036736, "tps": 14268, "wall": 49851.9} {"step": 10854, "train_loss": 3.478590965270996, "lr": 0.00030975101569258784, "tps": 14268, "wall": 49857.1} {"step": 10855, "train_loss": 3.3510704040527344, "lr": 0.00030973440859810396, "tps": 14268, "wall": 49862.1} {"step": 10856, "train_loss": 3.48170804977417, "lr": 0.0003097178004871038, "tps": 14268, "wall": 49867.2} {"step": 10857, "train_loss": 3.532585382461548, "lr": 0.00030970119135977553, "tps": 14268, "wall": 49872.3} {"step": 10858, "train_loss": 3.5858800411224365, "lr": 0.00030968458121630735, "tps": 14268, "wall": 49877.4} {"step": 10859, "train_loss": 3.4794929027557373, "lr": 0.00030966797005688737, "tps": 14267, "wall": 49882.4} {"step": 10860, "train_loss": 3.426877498626709, "lr": 0.00030965135788170374, "tps": 14267, "wall": 49887.5} {"step": 10861, "train_loss": 3.532021999359131, "lr": 0.0003096347446909447, "tps": 14267, "wall": 49892.6} {"step": 10862, "train_loss": 3.5379700660705566, "lr": 0.0003096181304847985, "tps": 14267, "wall": 49897.6} {"step": 10863, "train_loss": 3.542480707168579, "lr": 0.0003096015152634531, "tps": 14267, "wall": 49902.7} {"step": 10864, "train_loss": 3.524860382080078, "lr": 0.000309584899027097, "tps": 14267, "wall": 49907.8} {"step": 10865, "train_loss": 3.489905834197998, "lr": 0.0003095682817759184, "tps": 14267, "wall": 49912.9} {"step": 10866, "train_loss": 3.490654945373535, "lr": 0.00030955166351010534, "tps": 14266, "wall": 49918.1} {"step": 10867, "train_loss": 3.5367350578308105, "lr": 0.0003095350442298462, "tps": 14266, "wall": 49923.1} {"step": 10868, "train_loss": 3.3707497119903564, "lr": 0.0003095184239353293, "tps": 14266, "wall": 49928.3} {"step": 10869, "train_loss": 3.5531563758850098, "lr": 0.00030950180262674274, "tps": 14266, "wall": 49933.3} {"step": 10870, "train_loss": 3.5289058685302734, "lr": 0.000309485180304275, "tps": 14266, "wall": 49938.4} {"step": 10871, "train_loss": 3.5495786666870117, "lr": 0.00030946855696811423, "tps": 14266, "wall": 49943.5} {"step": 10872, "train_loss": 3.414803981781006, "lr": 0.0003094519326184489, "tps": 14266, "wall": 49948.6} {"step": 10873, "train_loss": 3.4460668563842773, "lr": 0.0003094353072554672, "tps": 14265, "wall": 49953.7} {"step": 10874, "train_loss": 3.463444709777832, "lr": 0.0003094186808793575, "tps": 14265, "wall": 49958.8} {"step": 10875, "train_loss": 3.5092430114746094, "lr": 0.0003094020534903082, "tps": 14265, "wall": 49963.8} {"step": 10876, "train_loss": 3.571171283721924, "lr": 0.0003093854250885075, "tps": 14265, "wall": 49968.9} {"step": 10877, "train_loss": 3.477509021759033, "lr": 0.0003093687956741439, "tps": 14265, "wall": 49974.0} {"step": 10878, "train_loss": 3.596560001373291, "lr": 0.0003093521652474057, "tps": 14265, "wall": 49979.1} {"step": 10879, "train_loss": 3.4464809894561768, "lr": 0.00030933553380848146, "tps": 14265, "wall": 49984.2} {"step": 10880, "train_loss": 3.454561710357666, "lr": 0.0003093189013575594, "tps": 14264, "wall": 49989.3} {"step": 10881, "train_loss": 3.4612128734588623, "lr": 0.0003093022678948279, "tps": 14264, "wall": 49994.4} {"step": 10882, "train_loss": 3.474445343017578, "lr": 0.00030928563342047565, "tps": 14264, "wall": 49999.5} {"step": 10883, "train_loss": 3.4648332595825195, "lr": 0.0003092689979346908, "tps": 14264, "wall": 50004.5} {"step": 10884, "train_loss": 3.531546115875244, "lr": 0.00030925236143766196, "tps": 14264, "wall": 50009.6} {"step": 10885, "train_loss": 3.4627490043640137, "lr": 0.0003092357239295775, "tps": 14264, "wall": 50014.7} {"step": 10886, "train_loss": 3.456191062927246, "lr": 0.00030921908541062595, "tps": 14264, "wall": 50019.8} {"step": 10887, "train_loss": 3.446514844894409, "lr": 0.0003092024458809958, "tps": 14264, "wall": 50024.9} {"step": 10888, "train_loss": 3.635408878326416, "lr": 0.0003091858053408755, "tps": 14263, "wall": 50029.9} {"step": 10889, "train_loss": 3.5267205238342285, "lr": 0.00030916916379045357, "tps": 14263, "wall": 50035.0} {"step": 10890, "train_loss": 3.382432460784912, "lr": 0.00030915252122991853, "tps": 14263, "wall": 50040.1} {"step": 10891, "train_loss": 3.4797651767730713, "lr": 0.0003091358776594589, "tps": 14263, "wall": 50045.2} {"step": 10892, "train_loss": 3.4625325202941895, "lr": 0.00030911923307926325, "tps": 14263, "wall": 50050.3} {"step": 10893, "train_loss": 3.448493003845215, "lr": 0.00030910258748952004, "tps": 14263, "wall": 50055.4} {"step": 10894, "train_loss": 3.5061392784118652, "lr": 0.00030908594089041795, "tps": 14263, "wall": 50060.5} {"step": 10895, "train_loss": 3.4240028858184814, "lr": 0.0003090692932821455, "tps": 14262, "wall": 50065.5} {"step": 10896, "train_loss": 3.598111629486084, "lr": 0.0003090526446648913, "tps": 14262, "wall": 50070.6} {"step": 10897, "train_loss": 3.5849623680114746, "lr": 0.0003090359950388439, "tps": 14262, "wall": 50075.7} {"step": 10898, "train_loss": 3.492823600769043, "lr": 0.0003090193444041919, "tps": 14262, "wall": 50080.7} {"step": 10899, "train_loss": 3.4294896125793457, "lr": 0.000309002692761124, "tps": 14262, "wall": 50085.8} {"step": 10900, "train_loss": 3.4597790241241455, "lr": 0.00030898604010982873, "tps": 14262, "wall": 50090.9} {"step": 10901, "train_loss": 3.6386525630950928, "lr": 0.00030896938645049484, "tps": 14262, "wall": 50096.1} {"step": 10902, "train_loss": 3.504007339477539, "lr": 0.0003089527317833109, "tps": 14261, "wall": 50101.1} {"step": 10903, "train_loss": 3.430274486541748, "lr": 0.0003089360761084656, "tps": 14261, "wall": 50106.2} {"step": 10904, "train_loss": 3.499309539794922, "lr": 0.0003089194194261476, "tps": 14261, "wall": 50111.3} {"step": 10905, "train_loss": 3.5453786849975586, "lr": 0.0003089027617365456, "tps": 14261, "wall": 50116.4} {"step": 10906, "train_loss": 3.476768732070923, "lr": 0.0003088861030398484, "tps": 14261, "wall": 50121.5} {"step": 10907, "train_loss": 3.459409713745117, "lr": 0.00030886944333624453, "tps": 14261, "wall": 50126.5} {"step": 10908, "train_loss": 3.551076889038086, "lr": 0.0003088527826259228, "tps": 14261, "wall": 50131.6} {"step": 10909, "train_loss": 3.482232093811035, "lr": 0.00030883612090907203, "tps": 14260, "wall": 50136.7} {"step": 10910, "train_loss": 3.529171943664551, "lr": 0.0003088194581858808, "tps": 14260, "wall": 50141.7} {"step": 10911, "train_loss": 3.4537370204925537, "lr": 0.00030880279445653794, "tps": 14260, "wall": 50146.8} {"step": 10912, "train_loss": 3.5424160957336426, "lr": 0.0003087861297212322, "tps": 14260, "wall": 50151.9} {"step": 10913, "train_loss": 3.460426092147827, "lr": 0.00030876946398015245, "tps": 14260, "wall": 50157.0} {"step": 10914, "train_loss": 3.5155386924743652, "lr": 0.00030875279723348737, "tps": 14260, "wall": 50162.2} {"step": 10915, "train_loss": 3.456244468688965, "lr": 0.0003087361294814258, "tps": 14260, "wall": 50167.2} {"step": 10916, "train_loss": 3.4698970317840576, "lr": 0.0003087194607241565, "tps": 14259, "wall": 50172.3} {"step": 10917, "train_loss": 3.4808239936828613, "lr": 0.00030870279096186843, "tps": 14259, "wall": 50177.4} {"step": 10918, "train_loss": 3.5284199714660645, "lr": 0.0003086861201947504, "tps": 14259, "wall": 50182.5} {"step": 10919, "train_loss": 3.512711524963379, "lr": 0.00030866944842299104, "tps": 14259, "wall": 50187.6} {"step": 10920, "train_loss": 3.5651495456695557, "lr": 0.0003086527756467795, "tps": 14259, "wall": 50192.7} {"step": 10921, "train_loss": 3.394378423690796, "lr": 0.0003086361018663045, "tps": 14259, "wall": 50197.8} {"step": 10922, "train_loss": 3.5390512943267822, "lr": 0.00030861942708175483, "tps": 14259, "wall": 50202.9} {"step": 10923, "train_loss": 3.4685468673706055, "lr": 0.0003086027512933196, "tps": 14259, "wall": 50207.9} {"step": 10924, "train_loss": 3.5208685398101807, "lr": 0.0003085860745011876, "tps": 14258, "wall": 50213.0} {"step": 10925, "train_loss": 3.3987107276916504, "lr": 0.00030856939670554777, "tps": 14258, "wall": 50218.2} {"step": 10926, "train_loss": 3.5182223320007324, "lr": 0.00030855271790658896, "tps": 14258, "wall": 50223.3} {"step": 10927, "train_loss": 3.5930657386779785, "lr": 0.00030853603810450023, "tps": 14258, "wall": 50228.4} {"step": 10928, "train_loss": 3.4452693462371826, "lr": 0.00030851935729947044, "tps": 14258, "wall": 50233.4} {"step": 10929, "train_loss": 3.4330410957336426, "lr": 0.0003085026754916886, "tps": 14258, "wall": 50238.6} {"step": 10930, "train_loss": 3.543571710586548, "lr": 0.0003084859926813437, "tps": 14257, "wall": 50243.7} {"step": 10931, "train_loss": 3.4415974617004395, "lr": 0.0003084693088686246, "tps": 14257, "wall": 50248.8} {"step": 10932, "train_loss": 3.4158153533935547, "lr": 0.00030845262405372045, "tps": 14257, "wall": 50253.8} {"step": 10933, "train_loss": 3.5101118087768555, "lr": 0.0003084359382368202, "tps": 14257, "wall": 50258.9} {"step": 10934, "train_loss": 3.3750557899475098, "lr": 0.0003084192514181128, "tps": 14257, "wall": 50264.0} {"step": 10935, "train_loss": 3.4720184803009033, "lr": 0.0003084025635977873, "tps": 14257, "wall": 50269.0} {"step": 10936, "train_loss": 3.5634357929229736, "lr": 0.00030838587477603286, "tps": 14257, "wall": 50274.1} {"step": 10937, "train_loss": 3.466705799102783, "lr": 0.00030836918495303847, "tps": 14257, "wall": 50279.2} {"step": 10938, "train_loss": 3.4260332584381104, "lr": 0.0003083524941289931, "tps": 14256, "wall": 50284.3} {"step": 10939, "train_loss": 3.403585195541382, "lr": 0.000308335802304086, "tps": 14256, "wall": 50289.4} {"step": 10940, "train_loss": 3.5955183506011963, "lr": 0.00030831910947850605, "tps": 14256, "wall": 50294.5} {"step": 10941, "train_loss": 3.559227466583252, "lr": 0.00030830241565244247, "tps": 14256, "wall": 50299.5} {"step": 10942, "train_loss": 3.445204496383667, "lr": 0.00030828572082608436, "tps": 14256, "wall": 50304.6} {"step": 10943, "train_loss": 3.4590237140655518, "lr": 0.0003082690249996208, "tps": 14256, "wall": 50309.7} {"step": 10944, "train_loss": 3.5373082160949707, "lr": 0.000308252328173241, "tps": 14256, "wall": 50314.8} {"step": 10945, "train_loss": 3.5313291549682617, "lr": 0.00030823563034713405, "tps": 14255, "wall": 50319.9} {"step": 10946, "train_loss": 3.418487548828125, "lr": 0.0003082189315214891, "tps": 14255, "wall": 50324.9} {"step": 10947, "train_loss": 3.4712893962860107, "lr": 0.0003082022316964953, "tps": 14255, "wall": 50330.0} {"step": 10948, "train_loss": 3.484405040740967, "lr": 0.00030818553087234185, "tps": 14255, "wall": 50335.1} {"step": 10949, "train_loss": 3.355513095855713, "lr": 0.0003081688290492179, "tps": 14255, "wall": 50340.2} {"step": 10950, "train_loss": 3.4268131256103516, "lr": 0.00030815212622731274, "tps": 14255, "wall": 50345.3} {"step": 10951, "train_loss": 3.534571409225464, "lr": 0.0003081354224068155, "tps": 14255, "wall": 50350.4} {"step": 10952, "train_loss": 3.58420467376709, "lr": 0.00030811871758791543, "tps": 14254, "wall": 50355.5} {"step": 10953, "train_loss": 3.450011968612671, "lr": 0.0003081020117708018, "tps": 14254, "wall": 50360.6} {"step": 10954, "train_loss": 3.462642192840576, "lr": 0.0003080853049556638, "tps": 14254, "wall": 50365.6} {"step": 10955, "train_loss": 3.4511232376098633, "lr": 0.00030806859714269065, "tps": 14254, "wall": 50370.7} {"step": 10956, "train_loss": 3.5130786895751953, "lr": 0.0003080518883320717, "tps": 14254, "wall": 50375.7} {"step": 10957, "train_loss": 3.6910152435302734, "lr": 0.0003080351785239962, "tps": 14254, "wall": 50380.8} {"step": 10958, "train_loss": 3.427145004272461, "lr": 0.0003080184677186534, "tps": 14254, "wall": 50385.9} {"step": 10959, "train_loss": 3.5381743907928467, "lr": 0.0003080017559162327, "tps": 14254, "wall": 50391.0} {"step": 10960, "train_loss": 3.5850133895874023, "lr": 0.0003079850431169233, "tps": 14253, "wall": 50396.1} {"step": 10961, "train_loss": 3.44096040725708, "lr": 0.00030796832932091455, "tps": 14253, "wall": 50401.2} {"step": 10962, "train_loss": 3.4229440689086914, "lr": 0.0003079516145283959, "tps": 14253, "wall": 50406.3} {"step": 10963, "train_loss": 3.56065034866333, "lr": 0.0003079348987395565, "tps": 14253, "wall": 50411.4} {"step": 10964, "train_loss": 3.502049446105957, "lr": 0.00030791818195458585, "tps": 14253, "wall": 50416.5} {"step": 10965, "train_loss": 3.5113871097564697, "lr": 0.00030790146417367326, "tps": 14253, "wall": 50421.6} {"step": 10966, "train_loss": 3.4730730056762695, "lr": 0.0003078847453970082, "tps": 14253, "wall": 50426.7} {"step": 10967, "train_loss": 3.5101375579833984, "lr": 0.00030786802562477995, "tps": 14252, "wall": 50431.7} {"step": 10968, "train_loss": 3.4618544578552246, "lr": 0.0003078513048571779, "tps": 14252, "wall": 50436.8} {"step": 10969, "train_loss": 3.5098607540130615, "lr": 0.0003078345830943915, "tps": 14252, "wall": 50441.9} {"step": 10970, "train_loss": 3.511002779006958, "lr": 0.00030781786033661033, "tps": 14252, "wall": 50447.0} {"step": 10971, "train_loss": 3.4650542736053467, "lr": 0.0003078011365840236, "tps": 14252, "wall": 50452.0} {"step": 10972, "train_loss": 3.4036474227905273, "lr": 0.00030778441183682085, "tps": 14252, "wall": 50457.1} {"step": 10973, "train_loss": 3.4874839782714844, "lr": 0.00030776768609519153, "tps": 14252, "wall": 50462.2} {"step": 10974, "train_loss": 3.4534645080566406, "lr": 0.00030775095935932513, "tps": 14251, "wall": 50467.3} {"step": 10975, "train_loss": 3.5005428791046143, "lr": 0.00030773423162941106, "tps": 14251, "wall": 50472.4} {"step": 10976, "train_loss": 3.4265265464782715, "lr": 0.00030771750290563895, "tps": 14251, "wall": 50477.5} {"step": 10977, "train_loss": 3.520529270172119, "lr": 0.00030770077318819814, "tps": 14251, "wall": 50482.6} {"step": 10978, "train_loss": 3.5382940769195557, "lr": 0.0003076840424772783, "tps": 14251, "wall": 50487.6} {"step": 10979, "train_loss": 3.3722357749938965, "lr": 0.00030766731077306887, "tps": 14251, "wall": 50492.7} {"step": 10980, "train_loss": 3.425978660583496, "lr": 0.0003076505780757594, "tps": 14251, "wall": 50497.8} {"step": 10981, "train_loss": 3.416069984436035, "lr": 0.0003076338443855394, "tps": 14250, "wall": 50502.9} {"step": 10982, "train_loss": 3.4232680797576904, "lr": 0.00030761710970259845, "tps": 14250, "wall": 50508.0} {"step": 10983, "train_loss": 3.42301607131958, "lr": 0.00030760037402712616, "tps": 14250, "wall": 50513.0} {"step": 10984, "train_loss": 3.5284714698791504, "lr": 0.0003075836373593122, "tps": 14250, "wall": 50518.1} {"step": 10985, "train_loss": 3.48712158203125, "lr": 0.00030756689969934595, "tps": 14250, "wall": 50523.2} {"step": 10986, "train_loss": 3.47347092628479, "lr": 0.0003075501610474171, "tps": 14250, "wall": 50528.3} {"step": 10987, "train_loss": 3.5032143592834473, "lr": 0.00030753342140371544, "tps": 14250, "wall": 50533.4} {"step": 10988, "train_loss": 3.483870029449463, "lr": 0.0003075166807684303, "tps": 14250, "wall": 50538.5} {"step": 10989, "train_loss": 3.4974074363708496, "lr": 0.0003074999391417515, "tps": 14249, "wall": 50543.6} {"step": 10990, "train_loss": 3.5326781272888184, "lr": 0.0003074831965238687, "tps": 14249, "wall": 50548.6} {"step": 10991, "train_loss": 3.4450697898864746, "lr": 0.0003074664529149714, "tps": 14249, "wall": 50553.7} {"step": 10992, "train_loss": 3.4909889698028564, "lr": 0.0003074497083152495, "tps": 14249, "wall": 50558.8} {"step": 10993, "train_loss": 3.4619693756103516, "lr": 0.0003074329627248926, "tps": 14249, "wall": 50563.9} {"step": 10994, "train_loss": 3.4877102375030518, "lr": 0.0003074162161440903, "tps": 14249, "wall": 50569.0} {"step": 10995, "train_loss": 3.4822402000427246, "lr": 0.0003073994685730324, "tps": 14249, "wall": 50574.1} {"step": 10996, "train_loss": 3.5459494590759277, "lr": 0.0003073827200119086, "tps": 14248, "wall": 50579.2} {"step": 10997, "train_loss": 3.6450979709625244, "lr": 0.00030736597046090856, "tps": 14248, "wall": 50584.3} {"step": 10998, "train_loss": 3.506666660308838, "lr": 0.0003073492199202221, "tps": 14248, "wall": 50589.4} {"step": 10999, "train_loss": 3.504117965698242, "lr": 0.000307332468390039, "tps": 14248, "wall": 50594.5} {"step": 11000, "train_loss": 3.484938383102417, "lr": 0.00030731571587054894, "tps": 14248, "wall": 50599.6, "val_loss_monitor": 3.51584625878622} {"step": 11001, "train_loss": 3.4525763988494873, "lr": 0.0003072989623619418, "tps": 14234, "wall": 50654.4} {"step": 11002, "train_loss": 3.5277366638183594, "lr": 0.0003072822078644072, "tps": 14234, "wall": 50659.6} {"step": 11003, "train_loss": 3.4746172428131104, "lr": 0.00030726545237813504, "tps": 14233, "wall": 50664.7} {"step": 11004, "train_loss": 3.497504234313965, "lr": 0.0003072486959033151, "tps": 14233, "wall": 50669.8} {"step": 11005, "train_loss": 3.3957571983337402, "lr": 0.00030723193844013727, "tps": 14233, "wall": 50674.9} {"step": 11006, "train_loss": 3.3931190967559814, "lr": 0.0003072151799887913, "tps": 14233, "wall": 50680.0} {"step": 11007, "train_loss": 3.587092161178589, "lr": 0.000307198420549467, "tps": 14233, "wall": 50685.1} {"step": 11008, "train_loss": 3.5821022987365723, "lr": 0.00030718166012235436, "tps": 14233, "wall": 50690.2} {"step": 11009, "train_loss": 3.465492010116577, "lr": 0.00030716489870764304, "tps": 14233, "wall": 50695.3} {"step": 11010, "train_loss": 3.4581503868103027, "lr": 0.0003071481363055231, "tps": 14232, "wall": 50700.5} {"step": 11011, "train_loss": 3.424510955810547, "lr": 0.00030713137291618446, "tps": 14232, "wall": 50705.6} {"step": 11012, "train_loss": 3.4852280616760254, "lr": 0.0003071146085398168, "tps": 14232, "wall": 50710.7} {"step": 11013, "train_loss": 3.4539568424224854, "lr": 0.0003070978431766101, "tps": 14232, "wall": 50715.8} {"step": 11014, "train_loss": 3.5708885192871094, "lr": 0.00030708107682675444, "tps": 14232, "wall": 50720.9} {"step": 11015, "train_loss": 3.4958763122558594, "lr": 0.0003070643094904396, "tps": 14232, "wall": 50726.0} {"step": 11016, "train_loss": 3.5210165977478027, "lr": 0.0003070475411678555, "tps": 14232, "wall": 50731.1} {"step": 11017, "train_loss": 3.407505512237549, "lr": 0.00030703077185919214, "tps": 14231, "wall": 50736.1} {"step": 11018, "train_loss": 3.4860405921936035, "lr": 0.00030701400156463957, "tps": 14231, "wall": 50741.2} {"step": 11019, "train_loss": 3.417536973953247, "lr": 0.0003069972302843876, "tps": 14231, "wall": 50746.3} {"step": 11020, "train_loss": 3.537148952484131, "lr": 0.0003069804580186263, "tps": 14231, "wall": 50751.3} {"step": 11021, "train_loss": 3.4797263145446777, "lr": 0.0003069636847675457, "tps": 14231, "wall": 50756.5} {"step": 11022, "train_loss": 3.551997423171997, "lr": 0.0003069469105313358, "tps": 14231, "wall": 50761.6} {"step": 11023, "train_loss": 3.441655158996582, "lr": 0.0003069301353101866, "tps": 14231, "wall": 50766.7} {"step": 11024, "train_loss": 3.4817211627960205, "lr": 0.00030691335910428805, "tps": 14231, "wall": 50771.8} {"step": 11025, "train_loss": 3.4568405151367188, "lr": 0.0003068965819138303, "tps": 14230, "wall": 50776.8} {"step": 11026, "train_loss": 3.439716339111328, "lr": 0.0003068798037390034, "tps": 14230, "wall": 50781.9} {"step": 11027, "train_loss": 3.414177417755127, "lr": 0.0003068630245799973, "tps": 14230, "wall": 50787.0} {"step": 11028, "train_loss": 3.4806809425354004, "lr": 0.00030684624443700226, "tps": 14230, "wall": 50792.1} {"step": 11029, "train_loss": 3.416250705718994, "lr": 0.00030682946331020823, "tps": 14230, "wall": 50797.2} {"step": 11030, "train_loss": 3.46110463142395, "lr": 0.0003068126811998053, "tps": 14230, "wall": 50802.3} {"step": 11031, "train_loss": 3.518035888671875, "lr": 0.00030679589810598363, "tps": 14230, "wall": 50807.3} {"step": 11032, "train_loss": 3.519709587097168, "lr": 0.0003067791140289334, "tps": 14229, "wall": 50812.4} {"step": 11033, "train_loss": 3.540274143218994, "lr": 0.0003067623289688446, "tps": 14229, "wall": 50817.6} {"step": 11034, "train_loss": 3.5522403717041016, "lr": 0.00030674554292590744, "tps": 14229, "wall": 50822.7} {"step": 11035, "train_loss": 3.4226624965667725, "lr": 0.00030672875590031216, "tps": 14229, "wall": 50827.8} {"step": 11036, "train_loss": 3.516019105911255, "lr": 0.00030671196789224876, "tps": 14229, "wall": 50832.9} {"step": 11037, "train_loss": 3.381317615509033, "lr": 0.0003066951789019075, "tps": 14229, "wall": 50837.9} {"step": 11038, "train_loss": 3.4149932861328125, "lr": 0.00030667838892947853, "tps": 14229, "wall": 50843.0} {"step": 11039, "train_loss": 3.4991049766540527, "lr": 0.00030666159797515226, "tps": 14229, "wall": 50848.1} {"step": 11040, "train_loss": 3.4444546699523926, "lr": 0.00030664480603911855, "tps": 14228, "wall": 50853.2} {"step": 11041, "train_loss": 3.453913688659668, "lr": 0.00030662801312156783, "tps": 14228, "wall": 50858.2} {"step": 11042, "train_loss": 3.5332539081573486, "lr": 0.0003066112192226903, "tps": 14228, "wall": 50863.3} {"step": 11043, "train_loss": 3.4859838485717773, "lr": 0.0003065944243426762, "tps": 14228, "wall": 50868.4} {"step": 11044, "train_loss": 3.315431594848633, "lr": 0.00030657762848171577, "tps": 14228, "wall": 50873.5} {"step": 11045, "train_loss": 3.479745626449585, "lr": 0.00030656083163999926, "tps": 14228, "wall": 50878.6} {"step": 11046, "train_loss": 3.4515700340270996, "lr": 0.000306544033817717, "tps": 14228, "wall": 50883.7} {"step": 11047, "train_loss": 3.4676756858825684, "lr": 0.0003065272350150592, "tps": 14227, "wall": 50888.8} {"step": 11048, "train_loss": 3.521791934967041, "lr": 0.0003065104352322162, "tps": 14227, "wall": 50893.9} {"step": 11049, "train_loss": 3.542346715927124, "lr": 0.00030649363446937837, "tps": 14227, "wall": 50899.0} {"step": 11050, "train_loss": 3.4600374698638916, "lr": 0.0003064768327267359, "tps": 14227, "wall": 50904.0} {"step": 11051, "train_loss": 3.618391513824463, "lr": 0.00030646003000447925, "tps": 14227, "wall": 50909.1} {"step": 11052, "train_loss": 3.5413777828216553, "lr": 0.0003064432263027987, "tps": 14227, "wall": 50914.2} {"step": 11053, "train_loss": 3.4393177032470703, "lr": 0.0003064264216218846, "tps": 14227, "wall": 50919.3} {"step": 11054, "train_loss": 3.4689979553222656, "lr": 0.0003064096159619273, "tps": 14226, "wall": 50924.4} {"step": 11055, "train_loss": 3.4774744510650635, "lr": 0.0003063928093231172, "tps": 14226, "wall": 50929.5} {"step": 11056, "train_loss": 3.45475435256958, "lr": 0.0003063760017056447, "tps": 14226, "wall": 50934.5} {"step": 11057, "train_loss": 3.499537944793701, "lr": 0.00030635919310970013, "tps": 14226, "wall": 50939.7} {"step": 11058, "train_loss": 3.4302711486816406, "lr": 0.00030634238353547397, "tps": 14226, "wall": 50944.8} {"step": 11059, "train_loss": 3.408968448638916, "lr": 0.00030632557298315667, "tps": 14226, "wall": 50949.9} {"step": 11060, "train_loss": 3.4981589317321777, "lr": 0.00030630876145293855, "tps": 14226, "wall": 50955.0} {"step": 11061, "train_loss": 3.514557361602783, "lr": 0.0003062919489450101, "tps": 14226, "wall": 50960.1} {"step": 11062, "train_loss": 3.5318942070007324, "lr": 0.00030627513545956187, "tps": 14225, "wall": 50965.1} {"step": 11063, "train_loss": 3.511942148208618, "lr": 0.0003062583209967842, "tps": 14225, "wall": 50970.2} {"step": 11064, "train_loss": 3.430582046508789, "lr": 0.00030624150555686754, "tps": 14225, "wall": 50975.3} {"step": 11065, "train_loss": 3.5851454734802246, "lr": 0.00030622468914000246, "tps": 14225, "wall": 50980.4} {"step": 11066, "train_loss": 3.5792152881622314, "lr": 0.00030620787174637953, "tps": 14225, "wall": 50985.5} {"step": 11067, "train_loss": 3.4900145530700684, "lr": 0.00030619105337618903, "tps": 14225, "wall": 50990.6} {"step": 11068, "train_loss": 3.4428255558013916, "lr": 0.0003061742340296217, "tps": 14225, "wall": 50995.7} {"step": 11069, "train_loss": 3.420619010925293, "lr": 0.000306157413706868, "tps": 14224, "wall": 51000.8} {"step": 11070, "train_loss": 3.482835292816162, "lr": 0.0003061405924081184, "tps": 14224, "wall": 51005.9} {"step": 11071, "train_loss": 3.4995956420898438, "lr": 0.0003061237701335635, "tps": 14224, "wall": 51011.0} {"step": 11072, "train_loss": 3.397480010986328, "lr": 0.0003061069468833939, "tps": 14224, "wall": 51016.1} {"step": 11073, "train_loss": 3.44252872467041, "lr": 0.0003060901226578002, "tps": 14224, "wall": 51021.1} {"step": 11074, "train_loss": 3.460646629333496, "lr": 0.00030607329745697287, "tps": 14224, "wall": 51026.2} {"step": 11075, "train_loss": 3.536540985107422, "lr": 0.0003060564712811026, "tps": 14224, "wall": 51031.3} {"step": 11076, "train_loss": 3.588535785675049, "lr": 0.00030603964413038, "tps": 14224, "wall": 51036.4} {"step": 11077, "train_loss": 3.382652521133423, "lr": 0.00030602281600499554, "tps": 14223, "wall": 51041.5} {"step": 11078, "train_loss": 3.488129138946533, "lr": 0.00030600598690514006, "tps": 14223, "wall": 51046.6} {"step": 11079, "train_loss": 3.561800956726074, "lr": 0.0003059891568310041, "tps": 14223, "wall": 51051.6} {"step": 11080, "train_loss": 3.608752727508545, "lr": 0.0003059723257827783, "tps": 14223, "wall": 51056.8} {"step": 11081, "train_loss": 3.512448787689209, "lr": 0.00030595549376065336, "tps": 14223, "wall": 51061.9} {"step": 11082, "train_loss": 3.574892997741699, "lr": 0.00030593866076481993, "tps": 14223, "wall": 51067.0} {"step": 11083, "train_loss": 3.4741759300231934, "lr": 0.0003059218267954687, "tps": 14223, "wall": 51072.0} {"step": 11084, "train_loss": 3.5283970832824707, "lr": 0.00030590499185279035, "tps": 14222, "wall": 51077.1} {"step": 11085, "train_loss": 3.439528465270996, "lr": 0.0003058881559369756, "tps": 14222, "wall": 51082.2} {"step": 11086, "train_loss": 3.4799628257751465, "lr": 0.0003058713190482152, "tps": 14222, "wall": 51087.3} {"step": 11087, "train_loss": 3.4705615043640137, "lr": 0.0003058544811866998, "tps": 14222, "wall": 51092.3} {"step": 11088, "train_loss": 3.3812527656555176, "lr": 0.0003058376423526203, "tps": 14222, "wall": 51097.4} {"step": 11089, "train_loss": 3.410470962524414, "lr": 0.00030582080254616727, "tps": 14222, "wall": 51102.5} {"step": 11090, "train_loss": 3.411301612854004, "lr": 0.00030580396176753155, "tps": 14222, "wall": 51107.6} {"step": 11091, "train_loss": 3.400005340576172, "lr": 0.00030578712001690393, "tps": 14222, "wall": 51112.6} {"step": 11092, "train_loss": 3.447622776031494, "lr": 0.0003057702772944751, "tps": 14221, "wall": 51117.8} {"step": 11093, "train_loss": 3.541926860809326, "lr": 0.00030575343360043607, "tps": 14221, "wall": 51122.9} {"step": 11094, "train_loss": 3.4935061931610107, "lr": 0.00030573658893497737, "tps": 14221, "wall": 51127.9} {"step": 11095, "train_loss": 3.4825119972229004, "lr": 0.00030571974329829, "tps": 14221, "wall": 51133.0} {"step": 11096, "train_loss": 3.474842071533203, "lr": 0.0003057028966905647, "tps": 14221, "wall": 51138.1} {"step": 11097, "train_loss": 3.411426067352295, "lr": 0.0003056860491119924, "tps": 14221, "wall": 51143.1} {"step": 11098, "train_loss": 3.4599685668945312, "lr": 0.00030566920056276394, "tps": 14221, "wall": 51148.2} {"step": 11099, "train_loss": 3.4769721031188965, "lr": 0.0003056523510430701, "tps": 14220, "wall": 51153.3} {"step": 11100, "train_loss": 3.557097911834717, "lr": 0.0003056355005531018, "tps": 14220, "wall": 51158.4} {"step": 11101, "train_loss": 3.417823553085327, "lr": 0.0003056186490930499, "tps": 14220, "wall": 51163.4} {"step": 11102, "train_loss": 3.5449869632720947, "lr": 0.0003056017966631053, "tps": 14220, "wall": 51168.5} {"step": 11103, "train_loss": 3.4410881996154785, "lr": 0.00030558494326345895, "tps": 14220, "wall": 51173.5} {"step": 11104, "train_loss": 3.4249770641326904, "lr": 0.0003055680888943017, "tps": 14220, "wall": 51178.6} {"step": 11105, "train_loss": 3.565105676651001, "lr": 0.0003055512335558245, "tps": 14220, "wall": 51183.7} {"step": 11106, "train_loss": 3.579576253890991, "lr": 0.0003055343772482183, "tps": 14220, "wall": 51188.7} {"step": 11107, "train_loss": 3.492579460144043, "lr": 0.00030551751997167406, "tps": 14219, "wall": 51193.8} {"step": 11108, "train_loss": 3.4666671752929688, "lr": 0.0003055006617263828, "tps": 14219, "wall": 51198.8} {"step": 11109, "train_loss": 3.5386931896209717, "lr": 0.0003054838025125353, "tps": 14219, "wall": 51203.8} {"step": 11110, "train_loss": 3.418221950531006, "lr": 0.0003054669423303228, "tps": 14219, "wall": 51208.9} {"step": 11111, "train_loss": 3.49371600151062, "lr": 0.000305450081179936, "tps": 14219, "wall": 51213.9} {"step": 11112, "train_loss": 3.351659059524536, "lr": 0.00030543321906156617, "tps": 14219, "wall": 51219.0} {"step": 11113, "train_loss": 3.4242680072784424, "lr": 0.00030541635597540413, "tps": 14219, "wall": 51224.0} {"step": 11114, "train_loss": 3.476032257080078, "lr": 0.00030539949192164104, "tps": 14219, "wall": 51229.1} {"step": 11115, "train_loss": 3.4365930557250977, "lr": 0.0003053826269004679, "tps": 14219, "wall": 51234.1} {"step": 11116, "train_loss": 3.5309250354766846, "lr": 0.0003053657609120757, "tps": 14218, "wall": 51239.2} {"step": 11117, "train_loss": 3.6501078605651855, "lr": 0.00030534889395665555, "tps": 14218, "wall": 51244.3} {"step": 11118, "train_loss": 3.4367098808288574, "lr": 0.00030533202603439855, "tps": 14218, "wall": 51249.3} {"step": 11119, "train_loss": 3.4364535808563232, "lr": 0.0003053151571454957, "tps": 14218, "wall": 51254.3} {"step": 11120, "train_loss": 3.551403522491455, "lr": 0.00030529828729013815, "tps": 14218, "wall": 51259.4} {"step": 11121, "train_loss": 3.5619442462921143, "lr": 0.000305281416468517, "tps": 14218, "wall": 51264.4} {"step": 11122, "train_loss": 3.6021575927734375, "lr": 0.0003052645446808233, "tps": 14218, "wall": 51269.4} {"step": 11123, "train_loss": 3.5182747840881348, "lr": 0.0003052476719272483, "tps": 14218, "wall": 51274.5} {"step": 11124, "train_loss": 3.573326826095581, "lr": 0.000305230798207983, "tps": 14217, "wall": 51279.6} {"step": 11125, "train_loss": 3.4275197982788086, "lr": 0.0003052139235232186, "tps": 14217, "wall": 51284.6} {"step": 11126, "train_loss": 3.4130687713623047, "lr": 0.0003051970478731463, "tps": 14217, "wall": 51289.6} {"step": 11127, "train_loss": 3.437248706817627, "lr": 0.00030518017125795725, "tps": 14217, "wall": 51294.7} {"step": 11128, "train_loss": 3.5566015243530273, "lr": 0.00030516329367784263, "tps": 14217, "wall": 51299.8} {"step": 11129, "train_loss": 3.5461323261260986, "lr": 0.00030514641513299353, "tps": 14217, "wall": 51304.8} {"step": 11130, "train_loss": 3.651729106903076, "lr": 0.0003051295356236013, "tps": 14217, "wall": 51309.8} {"step": 11131, "train_loss": 3.5469560623168945, "lr": 0.00030511265514985707, "tps": 14217, "wall": 51314.8} {"step": 11132, "train_loss": 3.371169090270996, "lr": 0.00030509577371195206, "tps": 14216, "wall": 51319.9} {"step": 11133, "train_loss": 3.4979536533355713, "lr": 0.00030507889131007747, "tps": 14216, "wall": 51324.9} {"step": 11134, "train_loss": 3.4220643043518066, "lr": 0.00030506200794442473, "tps": 14216, "wall": 51329.9} {"step": 11135, "train_loss": 3.480099678039551, "lr": 0.00030504512361518486, "tps": 14216, "wall": 51334.9} {"step": 11136, "train_loss": 3.402782440185547, "lr": 0.00030502823832254924, "tps": 14216, "wall": 51339.9} {"step": 11137, "train_loss": 3.554708480834961, "lr": 0.00030501135206670917, "tps": 14216, "wall": 51345.0} {"step": 11138, "train_loss": 3.4822583198547363, "lr": 0.0003049944648478559, "tps": 14216, "wall": 51350.0} {"step": 11139, "train_loss": 3.5518712997436523, "lr": 0.0003049775766661807, "tps": 14216, "wall": 51355.0} {"step": 11140, "train_loss": 3.3993618488311768, "lr": 0.0003049606875218749, "tps": 14216, "wall": 51360.0} {"step": 11141, "train_loss": 3.474323272705078, "lr": 0.0003049437974151299, "tps": 14215, "wall": 51365.0} {"step": 11142, "train_loss": 3.4535725116729736, "lr": 0.000304926906346137, "tps": 14215, "wall": 51370.0} {"step": 11143, "train_loss": 3.368741989135742, "lr": 0.0003049100143150874, "tps": 14215, "wall": 51375.1} {"step": 11144, "train_loss": 3.5603833198547363, "lr": 0.0003048931213221726, "tps": 14215, "wall": 51380.1} {"step": 11145, "train_loss": 3.4651682376861572, "lr": 0.000304876227367584, "tps": 14215, "wall": 51385.1} {"step": 11146, "train_loss": 3.4950602054595947, "lr": 0.00030485933245151276, "tps": 14215, "wall": 51390.1} {"step": 11147, "train_loss": 3.3750534057617188, "lr": 0.0003048424365741505, "tps": 14215, "wall": 51395.1} {"step": 11148, "train_loss": 3.547443389892578, "lr": 0.0003048255397356886, "tps": 14215, "wall": 51400.1} {"step": 11149, "train_loss": 3.4159204959869385, "lr": 0.0003048086419363183, "tps": 14215, "wall": 51405.1} {"step": 11150, "train_loss": 3.498112678527832, "lr": 0.0003047917431762311, "tps": 14214, "wall": 51410.1} {"step": 11151, "train_loss": 3.4547812938690186, "lr": 0.0003047748434556185, "tps": 14214, "wall": 51415.1} {"step": 11152, "train_loss": 3.5978341102600098, "lr": 0.00030475794277467187, "tps": 14214, "wall": 51420.1} {"step": 11153, "train_loss": 3.5583901405334473, "lr": 0.0003047410411335827, "tps": 14214, "wall": 51425.1} {"step": 11154, "train_loss": 3.3861489295959473, "lr": 0.0003047241385325424, "tps": 14214, "wall": 51430.1} {"step": 11155, "train_loss": 3.5112338066101074, "lr": 0.0003047072349717425, "tps": 14214, "wall": 51435.1} {"step": 11156, "train_loss": 3.583296537399292, "lr": 0.0003046903304513745, "tps": 14214, "wall": 51440.0} {"step": 11157, "train_loss": 3.416001796722412, "lr": 0.00030467342497162976, "tps": 14214, "wall": 51445.0} {"step": 11158, "train_loss": 3.448207378387451, "lr": 0.0003046565185326999, "tps": 14214, "wall": 51450.0} {"step": 11159, "train_loss": 3.5545127391815186, "lr": 0.00030463961113477646, "tps": 14214, "wall": 51455.0} {"step": 11160, "train_loss": 3.5913078784942627, "lr": 0.0003046227027780509, "tps": 14213, "wall": 51459.9} {"step": 11161, "train_loss": 3.465604066848755, "lr": 0.0003046057934627148, "tps": 14213, "wall": 51464.9} {"step": 11162, "train_loss": 3.402538776397705, "lr": 0.0003045888831889597, "tps": 14213, "wall": 51469.9} {"step": 11163, "train_loss": 3.6145894527435303, "lr": 0.00030457197195697715, "tps": 14213, "wall": 51474.9} {"step": 11164, "train_loss": 3.4247264862060547, "lr": 0.0003045550597669587, "tps": 14213, "wall": 51479.9} {"step": 11165, "train_loss": 3.455799102783203, "lr": 0.000304538146619096, "tps": 14213, "wall": 51484.9} {"step": 11166, "train_loss": 3.4175164699554443, "lr": 0.0003045212325135806, "tps": 14213, "wall": 51489.8} {"step": 11167, "train_loss": 3.5343008041381836, "lr": 0.00030450431745060404, "tps": 14213, "wall": 51494.8} {"step": 11168, "train_loss": 3.5512213706970215, "lr": 0.0003044874014303581, "tps": 14213, "wall": 51499.9} {"step": 11169, "train_loss": 3.4240214824676514, "lr": 0.00030447048445303427, "tps": 14212, "wall": 51504.8} {"step": 11170, "train_loss": 3.453362464904785, "lr": 0.0003044535665188242, "tps": 14212, "wall": 51509.8} {"step": 11171, "train_loss": 3.566485643386841, "lr": 0.00030443664762791955, "tps": 14212, "wall": 51514.8} {"step": 11172, "train_loss": 3.4628865718841553, "lr": 0.000304419727780512, "tps": 14212, "wall": 51519.8} {"step": 11173, "train_loss": 3.4901294708251953, "lr": 0.00030440280697679317, "tps": 14212, "wall": 51524.8} {"step": 11174, "train_loss": 3.4263155460357666, "lr": 0.00030438588521695487, "tps": 14212, "wall": 51529.8} {"step": 11175, "train_loss": 3.4267044067382812, "lr": 0.0003043689625011886, "tps": 14212, "wall": 51534.7} {"step": 11176, "train_loss": 3.5202226638793945, "lr": 0.0003043520388296862, "tps": 14212, "wall": 51539.8} {"step": 11177, "train_loss": 3.5346696376800537, "lr": 0.00030433511420263935, "tps": 14212, "wall": 51544.7} {"step": 11178, "train_loss": 3.4984214305877686, "lr": 0.0003043181886202398, "tps": 14212, "wall": 51549.7} {"step": 11179, "train_loss": 3.4583213329315186, "lr": 0.00030430126208267917, "tps": 14211, "wall": 51554.7} {"step": 11180, "train_loss": 3.4632930755615234, "lr": 0.00030428433459014936, "tps": 14211, "wall": 51559.7} {"step": 11181, "train_loss": 3.3977181911468506, "lr": 0.00030426740614284195, "tps": 14211, "wall": 51564.6} {"step": 11182, "train_loss": 3.4577064514160156, "lr": 0.00030425047674094885, "tps": 14211, "wall": 51569.6} {"step": 11183, "train_loss": 3.4356255531311035, "lr": 0.0003042335463846618, "tps": 14211, "wall": 51574.6} {"step": 11184, "train_loss": 3.4283790588378906, "lr": 0.0003042166150741726, "tps": 14211, "wall": 51579.6} {"step": 11185, "train_loss": 3.562833786010742, "lr": 0.000304199682809673, "tps": 14211, "wall": 51584.5} {"step": 11186, "train_loss": 3.5257768630981445, "lr": 0.00030418274959135487, "tps": 14211, "wall": 51589.5} {"step": 11187, "train_loss": 3.4102654457092285, "lr": 0.00030416581541940996, "tps": 14211, "wall": 51594.5} {"step": 11188, "train_loss": 3.496446132659912, "lr": 0.0003041488802940302, "tps": 14211, "wall": 51599.5} {"step": 11189, "train_loss": 3.5949575901031494, "lr": 0.00030413194421540727, "tps": 14210, "wall": 51604.6} {"step": 11190, "train_loss": 3.42673921585083, "lr": 0.00030411500718373314, "tps": 14210, "wall": 51609.6} {"step": 11191, "train_loss": 3.370267152786255, "lr": 0.00030409806919919974, "tps": 14210, "wall": 51614.5} {"step": 11192, "train_loss": 3.4341702461242676, "lr": 0.0003040811302619988, "tps": 14210, "wall": 51619.5} {"step": 11193, "train_loss": 3.5160155296325684, "lr": 0.0003040641903723223, "tps": 14210, "wall": 51624.5} {"step": 11194, "train_loss": 3.485518455505371, "lr": 0.0003040472495303621, "tps": 14210, "wall": 51629.5} {"step": 11195, "train_loss": 3.406536102294922, "lr": 0.0003040303077363101, "tps": 14210, "wall": 51634.5} {"step": 11196, "train_loss": 3.604585886001587, "lr": 0.0003040133649903582, "tps": 14210, "wall": 51639.5} {"step": 11197, "train_loss": 3.5116400718688965, "lr": 0.00030399642129269843, "tps": 14210, "wall": 51644.5} {"step": 11198, "train_loss": 3.4946300983428955, "lr": 0.0003039794766435225, "tps": 14209, "wall": 51649.5} {"step": 11199, "train_loss": 3.4145305156707764, "lr": 0.0003039625310430227, "tps": 14209, "wall": 51654.5} {"step": 11200, "train_loss": 3.4336605072021484, "lr": 0.00030394558449139074, "tps": 14209, "wall": 51659.5} {"step": 11201, "train_loss": 3.4617209434509277, "lr": 0.00030392863698881865, "tps": 14209, "wall": 51664.5} {"step": 11202, "train_loss": 3.514028787612915, "lr": 0.00030391168853549844, "tps": 14209, "wall": 51669.5} {"step": 11203, "train_loss": 3.4779903888702393, "lr": 0.00030389473913162204, "tps": 14209, "wall": 51674.5} {"step": 11204, "train_loss": 3.492539405822754, "lr": 0.0003038777887773815, "tps": 14209, "wall": 51679.4} {"step": 11205, "train_loss": 3.4664907455444336, "lr": 0.0003038608374729689, "tps": 14209, "wall": 51684.4} {"step": 11206, "train_loss": 3.437959671020508, "lr": 0.00030384388521857616, "tps": 14209, "wall": 51689.4} {"step": 11207, "train_loss": 3.4339420795440674, "lr": 0.0003038269320143953, "tps": 14209, "wall": 51694.4} {"step": 11208, "train_loss": 3.4413466453552246, "lr": 0.0003038099778606184, "tps": 14208, "wall": 51699.4} {"step": 11209, "train_loss": 3.568655252456665, "lr": 0.00030379302275743765, "tps": 14208, "wall": 51704.3} {"step": 11210, "train_loss": 3.4681291580200195, "lr": 0.000303776066705045, "tps": 14208, "wall": 51709.3} {"step": 11211, "train_loss": 3.5111336708068848, "lr": 0.0003037591097036324, "tps": 14208, "wall": 51714.3} {"step": 11212, "train_loss": 3.344561815261841, "lr": 0.00030374215175339215, "tps": 14208, "wall": 51719.3} {"step": 11213, "train_loss": 3.5336899757385254, "lr": 0.00030372519285451634, "tps": 14208, "wall": 51724.3} {"step": 11214, "train_loss": 3.3581817150115967, "lr": 0.00030370823300719695, "tps": 14208, "wall": 51729.3} {"step": 11215, "train_loss": 3.5207738876342773, "lr": 0.0003036912722116262, "tps": 14208, "wall": 51734.3} {"step": 11216, "train_loss": 3.5073022842407227, "lr": 0.0003036743104679962, "tps": 14208, "wall": 51739.3} {"step": 11217, "train_loss": 3.4797871112823486, "lr": 0.000303657347776499, "tps": 14208, "wall": 51744.3} {"step": 11218, "train_loss": 3.509573221206665, "lr": 0.0003036403841373269, "tps": 14207, "wall": 51749.3} {"step": 11219, "train_loss": 3.4427621364593506, "lr": 0.000303623419550672, "tps": 14207, "wall": 51754.3} {"step": 11220, "train_loss": 3.402724266052246, "lr": 0.00030360645401672644, "tps": 14207, "wall": 51759.2} {"step": 11221, "train_loss": 3.413196563720703, "lr": 0.0003035894875356825, "tps": 14207, "wall": 51764.2} {"step": 11222, "train_loss": 3.5019114017486572, "lr": 0.00030357252010773233, "tps": 14207, "wall": 51769.2} {"step": 11223, "train_loss": 3.456235408782959, "lr": 0.0003035555517330681, "tps": 14207, "wall": 51774.1} {"step": 11224, "train_loss": 3.445978879928589, "lr": 0.0003035385824118821, "tps": 14207, "wall": 51779.2} {"step": 11225, "train_loss": 3.5226426124572754, "lr": 0.00030352161214436646, "tps": 14207, "wall": 51784.2} {"step": 11226, "train_loss": 3.3775694370269775, "lr": 0.00030350464093071346, "tps": 14207, "wall": 51789.2} {"step": 11227, "train_loss": 3.4237968921661377, "lr": 0.00030348766877111543, "tps": 14206, "wall": 51794.1} {"step": 11228, "train_loss": 3.344376802444458, "lr": 0.0003034706956657645, "tps": 14206, "wall": 51799.1} {"step": 11229, "train_loss": 3.4598171710968018, "lr": 0.00030345372161485313, "tps": 14206, "wall": 51804.1} {"step": 11230, "train_loss": 3.4827232360839844, "lr": 0.00030343674661857336, "tps": 14206, "wall": 51809.1} {"step": 11231, "train_loss": 3.548520088195801, "lr": 0.0003034197706771177, "tps": 14206, "wall": 51814.1} {"step": 11232, "train_loss": 3.5670077800750732, "lr": 0.0003034027937906784, "tps": 14206, "wall": 51819.1} {"step": 11233, "train_loss": 3.5320065021514893, "lr": 0.0003033858159594476, "tps": 14206, "wall": 51824.1} {"step": 11234, "train_loss": 3.4921069145202637, "lr": 0.0003033688371836179, "tps": 14206, "wall": 51829.0} {"step": 11235, "train_loss": 3.405989170074463, "lr": 0.0003033518574633814, "tps": 14206, "wall": 51834.0} {"step": 11236, "train_loss": 3.571101665496826, "lr": 0.00030333487679893065, "tps": 14206, "wall": 51839.1} {"step": 11237, "train_loss": 3.5107762813568115, "lr": 0.0003033178951904578, "tps": 14205, "wall": 51844.1} {"step": 11238, "train_loss": 3.4798076152801514, "lr": 0.00030330091263815537, "tps": 14205, "wall": 51849.1} {"step": 11239, "train_loss": 3.3688836097717285, "lr": 0.00030328392914221575, "tps": 14205, "wall": 51854.0} {"step": 11240, "train_loss": 3.4339957237243652, "lr": 0.0003032669447028312, "tps": 14205, "wall": 51859.0} {"step": 11241, "train_loss": 3.5524942874908447, "lr": 0.00030324995932019426, "tps": 14205, "wall": 51864.0} {"step": 11242, "train_loss": 3.376751661300659, "lr": 0.00030323297299449727, "tps": 14205, "wall": 51869.0} {"step": 11243, "train_loss": 3.480565309524536, "lr": 0.0003032159857259326, "tps": 14205, "wall": 51873.9} {"step": 11244, "train_loss": 3.5344226360321045, "lr": 0.0003031989975146928, "tps": 14205, "wall": 51878.9} {"step": 11245, "train_loss": 3.4642255306243896, "lr": 0.00030318200836097016, "tps": 14205, "wall": 51883.9} {"step": 11246, "train_loss": 3.3968632221221924, "lr": 0.00030316501826495735, "tps": 14205, "wall": 51888.9} {"step": 11247, "train_loss": 3.4812707901000977, "lr": 0.0003031480272268467, "tps": 14204, "wall": 51893.9} {"step": 11248, "train_loss": 3.4166760444641113, "lr": 0.0003031310352468306, "tps": 14204, "wall": 51898.9} {"step": 11249, "train_loss": 3.643031597137451, "lr": 0.0003031140423251017, "tps": 14204, "wall": 51904.0} {"step": 11250, "train_loss": 3.566253662109375, "lr": 0.0003030970484618525, "tps": 14204, "wall": 51909.0} {"step": 11251, "train_loss": 3.506737232208252, "lr": 0.0003030800536572753, "tps": 14204, "wall": 51913.9} {"step": 11252, "train_loss": 3.4806718826293945, "lr": 0.0003030630579115628, "tps": 14204, "wall": 51918.9} {"step": 11253, "train_loss": 3.4126036167144775, "lr": 0.0003030460612249076, "tps": 14204, "wall": 51923.9} {"step": 11254, "train_loss": 3.590897560119629, "lr": 0.000303029063597502, "tps": 14204, "wall": 51928.9} {"step": 11255, "train_loss": 3.51023006439209, "lr": 0.00030301206502953874, "tps": 14204, "wall": 51933.9} {"step": 11256, "train_loss": 3.486380100250244, "lr": 0.0003029950655212102, "tps": 14203, "wall": 51938.8} {"step": 11257, "train_loss": 3.5324580669403076, "lr": 0.00030297806507270924, "tps": 14203, "wall": 51943.8} {"step": 11258, "train_loss": 3.3907413482666016, "lr": 0.00030296106368422817, "tps": 14203, "wall": 51948.8} {"step": 11259, "train_loss": 3.552455425262451, "lr": 0.0003029440613559597, "tps": 14203, "wall": 51953.8} {"step": 11260, "train_loss": 3.491295099258423, "lr": 0.00030292705808809643, "tps": 14203, "wall": 51958.8} {"step": 11261, "train_loss": 3.515338897705078, "lr": 0.00030291005388083093, "tps": 14203, "wall": 51963.8} {"step": 11262, "train_loss": 3.4856371879577637, "lr": 0.00030289304873435584, "tps": 14203, "wall": 51968.8} {"step": 11263, "train_loss": 3.436458110809326, "lr": 0.00030287604264886387, "tps": 14203, "wall": 51973.8} {"step": 11264, "train_loss": 3.5534400939941406, "lr": 0.0003028590356245476, "tps": 14203, "wall": 51978.8} {"step": 11265, "train_loss": 3.4193809032440186, "lr": 0.0003028420276615996, "tps": 14203, "wall": 51983.7} {"step": 11266, "train_loss": 3.4652373790740967, "lr": 0.00030282501876021273, "tps": 14202, "wall": 51988.7} {"step": 11267, "train_loss": 3.4447450637817383, "lr": 0.00030280800892057956, "tps": 14202, "wall": 51993.7} {"step": 11268, "train_loss": 3.377936840057373, "lr": 0.0003027909981428927, "tps": 14202, "wall": 51998.7} {"step": 11269, "train_loss": 3.503290891647339, "lr": 0.00030277398642734497, "tps": 14202, "wall": 52003.6} {"step": 11270, "train_loss": 3.4464101791381836, "lr": 0.00030275697377412915, "tps": 14202, "wall": 52008.6} {"step": 11271, "train_loss": 3.4606642723083496, "lr": 0.0003027399601834377, "tps": 14202, "wall": 52013.6} {"step": 11272, "train_loss": 3.5095081329345703, "lr": 0.00030272294565546356, "tps": 14202, "wall": 52018.7} {"step": 11273, "train_loss": 3.511850357055664, "lr": 0.00030270593019039943, "tps": 14202, "wall": 52023.6} {"step": 11274, "train_loss": 3.4682486057281494, "lr": 0.0003026889137884381, "tps": 14202, "wall": 52028.6} {"step": 11275, "train_loss": 3.488192081451416, "lr": 0.00030267189644977223, "tps": 14202, "wall": 52033.6} {"step": 11276, "train_loss": 3.4910383224487305, "lr": 0.00030265487817459464, "tps": 14201, "wall": 52038.6} {"step": 11277, "train_loss": 3.4472804069519043, "lr": 0.00030263785896309816, "tps": 14201, "wall": 52043.5} {"step": 11278, "train_loss": 3.593536853790283, "lr": 0.0003026208388154755, "tps": 14201, "wall": 52048.5} {"step": 11279, "train_loss": 3.5034291744232178, "lr": 0.0003026038177319194, "tps": 14201, "wall": 52053.5} {"step": 11280, "train_loss": 3.383870840072632, "lr": 0.000302586795712623, "tps": 14201, "wall": 52058.5} {"step": 11281, "train_loss": 3.4469780921936035, "lr": 0.0003025697727577788, "tps": 14201, "wall": 52063.5} {"step": 11282, "train_loss": 3.37038516998291, "lr": 0.00030255274886757975, "tps": 14201, "wall": 52068.4} {"step": 11283, "train_loss": 3.4651777744293213, "lr": 0.0003025357240422187, "tps": 14201, "wall": 52073.4} {"step": 11284, "train_loss": 3.5555763244628906, "lr": 0.0003025186982818885, "tps": 14201, "wall": 52078.5} {"step": 11285, "train_loss": 3.3563289642333984, "lr": 0.000302501671586782, "tps": 14201, "wall": 52083.5} {"step": 11286, "train_loss": 3.4747226238250732, "lr": 0.00030248464395709213, "tps": 14200, "wall": 52088.4} {"step": 11287, "train_loss": 3.543806552886963, "lr": 0.0003024676153930118, "tps": 14200, "wall": 52093.4} {"step": 11288, "train_loss": 3.4143872261047363, "lr": 0.0003024505858947338, "tps": 14200, "wall": 52098.4} {"step": 11289, "train_loss": 3.4834094047546387, "lr": 0.00030243355546245106, "tps": 14200, "wall": 52103.4} {"step": 11290, "train_loss": 3.4978365898132324, "lr": 0.00030241652409635666, "tps": 14200, "wall": 52108.4} {"step": 11291, "train_loss": 3.4693803787231445, "lr": 0.00030239949179664336, "tps": 14200, "wall": 52113.3} {"step": 11292, "train_loss": 3.3608102798461914, "lr": 0.00030238245856350414, "tps": 14200, "wall": 52118.3} {"step": 11293, "train_loss": 3.4320316314697266, "lr": 0.00030236542439713194, "tps": 14200, "wall": 52123.3} {"step": 11294, "train_loss": 3.373109817504883, "lr": 0.00030234838929771985, "tps": 14200, "wall": 52128.3} {"step": 11295, "train_loss": 3.4649834632873535, "lr": 0.0003023313532654607, "tps": 14200, "wall": 52133.3} {"step": 11296, "train_loss": 3.437849521636963, "lr": 0.0003023143163005475, "tps": 14199, "wall": 52138.3} {"step": 11297, "train_loss": 3.5434134006500244, "lr": 0.00030229727840317333, "tps": 14199, "wall": 52143.3} {"step": 11298, "train_loss": 3.5140464305877686, "lr": 0.00030228023957353103, "tps": 14199, "wall": 52148.3} {"step": 11299, "train_loss": 3.4590790271759033, "lr": 0.00030226319981181384, "tps": 14199, "wall": 52153.3} {"step": 11300, "train_loss": 3.40431547164917, "lr": 0.00030224615911821464, "tps": 14199, "wall": 52158.2} {"step": 11301, "train_loss": 3.441042900085449, "lr": 0.0003022291174929265, "tps": 14199, "wall": 52163.2} {"step": 11302, "train_loss": 3.523603916168213, "lr": 0.0003022120749361424, "tps": 14199, "wall": 52168.2} {"step": 11303, "train_loss": 3.5892086029052734, "lr": 0.00030219503144805553, "tps": 14199, "wall": 52173.2} {"step": 11304, "train_loss": 3.5506553649902344, "lr": 0.00030217798702885897, "tps": 14199, "wall": 52178.1} {"step": 11305, "train_loss": 3.4804632663726807, "lr": 0.00030216094167874566, "tps": 14199, "wall": 52183.1} {"step": 11306, "train_loss": 3.4154207706451416, "lr": 0.0003021438953979087, "tps": 14198, "wall": 52188.1} {"step": 11307, "train_loss": 3.4912328720092773, "lr": 0.00030212684818654135, "tps": 14198, "wall": 52193.1} {"step": 11308, "train_loss": 3.380439519882202, "lr": 0.0003021098000448366, "tps": 14198, "wall": 52198.1} {"step": 11309, "train_loss": 3.4336752891540527, "lr": 0.0003020927509729875, "tps": 14198, "wall": 52203.1} {"step": 11310, "train_loss": 3.4583518505096436, "lr": 0.00030207570097118736, "tps": 14198, "wall": 52208.1} {"step": 11311, "train_loss": 3.3871002197265625, "lr": 0.00030205865003962923, "tps": 14198, "wall": 52213.1} {"step": 11312, "train_loss": 3.4745123386383057, "lr": 0.00030204159817850626, "tps": 14198, "wall": 52218.1} {"step": 11313, "train_loss": 3.564077138900757, "lr": 0.0003020245453880116, "tps": 14198, "wall": 52223.1} {"step": 11314, "train_loss": 3.5408430099487305, "lr": 0.00030200749166833855, "tps": 14198, "wall": 52228.0} {"step": 11315, "train_loss": 3.5819482803344727, "lr": 0.0003019904370196801, "tps": 14198, "wall": 52233.0} {"step": 11316, "train_loss": 3.50748348236084, "lr": 0.00030197338144222956, "tps": 14197, "wall": 52238.0} {"step": 11317, "train_loss": 3.4933247566223145, "lr": 0.00030195632493618016, "tps": 14197, "wall": 52243.0} {"step": 11318, "train_loss": 3.3468759059906006, "lr": 0.00030193926750172507, "tps": 14197, "wall": 52248.0} {"step": 11319, "train_loss": 3.399528980255127, "lr": 0.00030192220913905746, "tps": 14197, "wall": 52253.0} {"step": 11320, "train_loss": 3.449418783187866, "lr": 0.0003019051498483707, "tps": 14197, "wall": 52258.0} {"step": 11321, "train_loss": 3.4913434982299805, "lr": 0.000301888089629858, "tps": 14197, "wall": 52263.0} {"step": 11322, "train_loss": 3.492828607559204, "lr": 0.00030187102848371246, "tps": 14197, "wall": 52268.0} {"step": 11323, "train_loss": 3.398709297180176, "lr": 0.0003018539664101276, "tps": 14197, "wall": 52272.9} {"step": 11324, "train_loss": 3.5090653896331787, "lr": 0.0003018369034092965, "tps": 14197, "wall": 52277.9} {"step": 11325, "train_loss": 3.423521041870117, "lr": 0.0003018198394814126, "tps": 14197, "wall": 52282.9} {"step": 11326, "train_loss": 3.426699638366699, "lr": 0.00030180277462666906, "tps": 14196, "wall": 52287.9} {"step": 11327, "train_loss": 3.375462532043457, "lr": 0.00030178570884525934, "tps": 14196, "wall": 52292.8} {"step": 11328, "train_loss": 3.443635940551758, "lr": 0.00030176864213737664, "tps": 14196, "wall": 52297.8} {"step": 11329, "train_loss": 3.3919529914855957, "lr": 0.0003017515745032144, "tps": 14196, "wall": 52302.8} {"step": 11330, "train_loss": 3.453263282775879, "lr": 0.00030173450594296586, "tps": 14196, "wall": 52307.8} {"step": 11331, "train_loss": 3.5277233123779297, "lr": 0.0003017174364568244, "tps": 14196, "wall": 52312.8} {"step": 11332, "train_loss": 3.452958583831787, "lr": 0.00030170036604498346, "tps": 14196, "wall": 52317.8} {"step": 11333, "train_loss": 3.607231616973877, "lr": 0.0003016832947076363, "tps": 14196, "wall": 52322.8} {"step": 11334, "train_loss": 3.4731285572052, "lr": 0.0003016662224449763, "tps": 14196, "wall": 52327.8} {"step": 11335, "train_loss": 3.5227773189544678, "lr": 0.000301649149257197, "tps": 14195, "wall": 52332.8} {"step": 11336, "train_loss": 3.4734973907470703, "lr": 0.0003016320751444917, "tps": 14195, "wall": 52337.8} {"step": 11337, "train_loss": 3.3575711250305176, "lr": 0.00030161500010705383, "tps": 14195, "wall": 52342.8} {"step": 11338, "train_loss": 3.3675103187561035, "lr": 0.00030159792414507684, "tps": 14195, "wall": 52347.8} {"step": 11339, "train_loss": 3.4506278038024902, "lr": 0.0003015808472587541, "tps": 14195, "wall": 52352.8} {"step": 11340, "train_loss": 3.3665881156921387, "lr": 0.00030156376944827915, "tps": 14195, "wall": 52357.7} {"step": 11341, "train_loss": 3.406181812286377, "lr": 0.00030154669071384536, "tps": 14195, "wall": 52362.7} {"step": 11342, "train_loss": 3.453795909881592, "lr": 0.00030152961105564633, "tps": 14195, "wall": 52367.7} {"step": 11343, "train_loss": 3.3528642654418945, "lr": 0.0003015125304738754, "tps": 14195, "wall": 52372.7} {"step": 11344, "train_loss": 3.3698134422302246, "lr": 0.00030149544896872617, "tps": 14195, "wall": 52377.8} {"step": 11345, "train_loss": 3.4698424339294434, "lr": 0.000301478366540392, "tps": 14194, "wall": 52382.8} {"step": 11346, "train_loss": 3.440028429031372, "lr": 0.00030146128318906654, "tps": 14194, "wall": 52387.7} {"step": 11347, "train_loss": 3.630563735961914, "lr": 0.00030144419891494327, "tps": 14194, "wall": 52392.7} {"step": 11348, "train_loss": 3.628866195678711, "lr": 0.0003014271137182156, "tps": 14194, "wall": 52397.7} {"step": 11349, "train_loss": 3.457273483276367, "lr": 0.0003014100275990773, "tps": 14194, "wall": 52402.8} {"step": 11350, "train_loss": 3.489243507385254, "lr": 0.00030139294055772176, "tps": 14194, "wall": 52407.8} {"step": 11351, "train_loss": 3.505539894104004, "lr": 0.00030137585259434267, "tps": 14194, "wall": 52412.8} {"step": 11352, "train_loss": 3.4593920707702637, "lr": 0.0003013587637091334, "tps": 14194, "wall": 52417.7} {"step": 11353, "train_loss": 3.4572548866271973, "lr": 0.0003013416739022877, "tps": 14194, "wall": 52422.7} {"step": 11354, "train_loss": 3.454573631286621, "lr": 0.0003013245831739991, "tps": 14194, "wall": 52427.7} {"step": 11355, "train_loss": 3.4562389850616455, "lr": 0.0003013074915244613, "tps": 14193, "wall": 52432.7} {"step": 11356, "train_loss": 3.478832960128784, "lr": 0.00030129039895386773, "tps": 14193, "wall": 52437.7} {"step": 11357, "train_loss": 3.4332685470581055, "lr": 0.00030127330546241216, "tps": 14193, "wall": 52442.7} {"step": 11358, "train_loss": 3.3528990745544434, "lr": 0.0003012562110502882, "tps": 14193, "wall": 52447.7} {"step": 11359, "train_loss": 3.5134170055389404, "lr": 0.0003012391157176895, "tps": 14193, "wall": 52452.7} {"step": 11360, "train_loss": 3.4052584171295166, "lr": 0.00030122201946480967, "tps": 14193, "wall": 52457.6} {"step": 11361, "train_loss": 3.4130260944366455, "lr": 0.00030120492229184246, "tps": 14193, "wall": 52462.6} {"step": 11362, "train_loss": 3.4385523796081543, "lr": 0.00030118782419898143, "tps": 14193, "wall": 52467.6} {"step": 11363, "train_loss": 3.411008358001709, "lr": 0.00030117072518642037, "tps": 14193, "wall": 52472.6} {"step": 11364, "train_loss": 3.427424430847168, "lr": 0.0003011536252543529, "tps": 14193, "wall": 52477.6} {"step": 11365, "train_loss": 3.469484329223633, "lr": 0.00030113652440297284, "tps": 14192, "wall": 52482.5} {"step": 11366, "train_loss": 3.4375181198120117, "lr": 0.00030111942263247386, "tps": 14192, "wall": 52487.5} {"step": 11367, "train_loss": 3.5344078540802, "lr": 0.00030110231994304957, "tps": 14192, "wall": 52492.5} {"step": 11368, "train_loss": 3.429640531539917, "lr": 0.0003010852163348939, "tps": 14192, "wall": 52497.5} {"step": 11369, "train_loss": 3.4549028873443604, "lr": 0.0003010681118082005, "tps": 14192, "wall": 52502.5} {"step": 11370, "train_loss": 3.437896728515625, "lr": 0.0003010510063631631, "tps": 14192, "wall": 52507.5} {"step": 11371, "train_loss": 3.4637866020202637, "lr": 0.0003010338999999755, "tps": 14192, "wall": 52512.5} {"step": 11372, "train_loss": 3.49867582321167, "lr": 0.0003010167927188316, "tps": 14192, "wall": 52517.5} {"step": 11373, "train_loss": 3.5147433280944824, "lr": 0.00030099968451992505, "tps": 14192, "wall": 52522.5} {"step": 11374, "train_loss": 3.5083703994750977, "lr": 0.0003009825754034496, "tps": 14192, "wall": 52527.4} {"step": 11375, "train_loss": 3.4729487895965576, "lr": 0.00030096546536959924, "tps": 14191, "wall": 52532.4} {"step": 11376, "train_loss": 3.459542989730835, "lr": 0.00030094835441856773, "tps": 14191, "wall": 52537.4} {"step": 11377, "train_loss": 3.4471559524536133, "lr": 0.00030093124255054876, "tps": 14191, "wall": 52542.4} {"step": 11378, "train_loss": 3.471360206604004, "lr": 0.0003009141297657364, "tps": 14191, "wall": 52547.3} {"step": 11379, "train_loss": 3.504793167114258, "lr": 0.0003008970160643244, "tps": 14191, "wall": 52552.3} {"step": 11380, "train_loss": 3.4152493476867676, "lr": 0.00030087990144650657, "tps": 14191, "wall": 52557.3} {"step": 11381, "train_loss": 3.4535939693450928, "lr": 0.0003008627859124769, "tps": 14191, "wall": 52562.3} {"step": 11382, "train_loss": 3.438276767730713, "lr": 0.00030084566946242923, "tps": 14191, "wall": 52567.3} {"step": 11383, "train_loss": 3.3785314559936523, "lr": 0.0003008285520965574, "tps": 14191, "wall": 52572.3} {"step": 11384, "train_loss": 3.423884868621826, "lr": 0.00030081143381505533, "tps": 14191, "wall": 52577.3} {"step": 11385, "train_loss": 3.4533557891845703, "lr": 0.000300794314618117, "tps": 14190, "wall": 52582.3} {"step": 11386, "train_loss": 3.4783153533935547, "lr": 0.0003007771945059363, "tps": 14190, "wall": 52587.2} {"step": 11387, "train_loss": 3.3530759811401367, "lr": 0.0003007600734787072, "tps": 14190, "wall": 52592.2} {"step": 11388, "train_loss": 3.466813564300537, "lr": 0.0003007429515366236, "tps": 14190, "wall": 52597.2} {"step": 11389, "train_loss": 3.5448386669158936, "lr": 0.0003007258286798795, "tps": 14190, "wall": 52602.2} {"step": 11390, "train_loss": 3.5399885177612305, "lr": 0.00030070870490866877, "tps": 14190, "wall": 52607.1} {"step": 11391, "train_loss": 3.4848878383636475, "lr": 0.00030069158022318554, "tps": 14190, "wall": 52612.1} {"step": 11392, "train_loss": 3.605649709701538, "lr": 0.0003006744546236237, "tps": 14190, "wall": 52617.2} {"step": 11393, "train_loss": 3.4762871265411377, "lr": 0.00030065732811017723, "tps": 14190, "wall": 52622.2} {"step": 11394, "train_loss": 3.520508289337158, "lr": 0.0003006402006830402, "tps": 14190, "wall": 52627.2} {"step": 11395, "train_loss": 3.376521110534668, "lr": 0.00030062307234240667, "tps": 14189, "wall": 52632.1} {"step": 11396, "train_loss": 3.5442605018615723, "lr": 0.0003006059430884706, "tps": 14189, "wall": 52637.1} {"step": 11397, "train_loss": 3.4540581703186035, "lr": 0.000300588812921426, "tps": 14189, "wall": 52642.1} {"step": 11398, "train_loss": 3.4316368103027344, "lr": 0.000300571681841467, "tps": 14189, "wall": 52647.1} {"step": 11399, "train_loss": 3.3914425373077393, "lr": 0.0003005545498487876, "tps": 14189, "wall": 52652.1} {"step": 11400, "train_loss": 3.4946279525756836, "lr": 0.00030053741694358195, "tps": 14189, "wall": 52657.0} {"step": 11401, "train_loss": 3.586880683898926, "lr": 0.000300520283126044, "tps": 14189, "wall": 52662.0} {"step": 11402, "train_loss": 3.4993700981140137, "lr": 0.00030050314839636804, "tps": 14189, "wall": 52667.0} {"step": 11403, "train_loss": 3.376713514328003, "lr": 0.00030048601275474803, "tps": 14189, "wall": 52672.0} {"step": 11404, "train_loss": 3.4697909355163574, "lr": 0.000300468876201378, "tps": 14189, "wall": 52677.0} {"step": 11405, "train_loss": 3.473708152770996, "lr": 0.0003004517387364523, "tps": 14188, "wall": 52682.0} {"step": 11406, "train_loss": 3.4344208240509033, "lr": 0.000300434600360165, "tps": 14188, "wall": 52687.0} {"step": 11407, "train_loss": 3.361321210861206, "lr": 0.0003004174610727101, "tps": 14188, "wall": 52692.0} {"step": 11408, "train_loss": 3.4680562019348145, "lr": 0.0003004003208742818, "tps": 14188, "wall": 52696.9} {"step": 11409, "train_loss": 3.4609124660491943, "lr": 0.00030038317976507445, "tps": 14188, "wall": 52701.9} {"step": 11410, "train_loss": 3.4681921005249023, "lr": 0.00030036603774528204, "tps": 14188, "wall": 52706.9} {"step": 11411, "train_loss": 3.5227456092834473, "lr": 0.00030034889481509873, "tps": 14188, "wall": 52711.9} {"step": 11412, "train_loss": 3.453648567199707, "lr": 0.00030033175097471886, "tps": 14188, "wall": 52716.9} {"step": 11413, "train_loss": 3.3786168098449707, "lr": 0.00030031460622433656, "tps": 14188, "wall": 52721.9} {"step": 11414, "train_loss": 3.485867977142334, "lr": 0.0003002974605641461, "tps": 14188, "wall": 52726.8} {"step": 11415, "train_loss": 3.5411856174468994, "lr": 0.00030028031399434164, "tps": 14187, "wall": 52731.8} {"step": 11416, "train_loss": 3.5302553176879883, "lr": 0.00030026316651511744, "tps": 14187, "wall": 52736.9} {"step": 11417, "train_loss": 3.4404778480529785, "lr": 0.00030024601812666775, "tps": 14187, "wall": 52741.8} {"step": 11418, "train_loss": 3.3614301681518555, "lr": 0.00030022886882918675, "tps": 14187, "wall": 52746.8} {"step": 11419, "train_loss": 3.4964115619659424, "lr": 0.0003002117186228689, "tps": 14187, "wall": 52751.8} {"step": 11420, "train_loss": 3.4507017135620117, "lr": 0.00030019456750790834, "tps": 14187, "wall": 52756.8} {"step": 11421, "train_loss": 3.5525076389312744, "lr": 0.00030017741548449934, "tps": 14187, "wall": 52761.8} {"step": 11422, "train_loss": 3.524860382080078, "lr": 0.00030016026255283624, "tps": 14187, "wall": 52766.7} {"step": 11423, "train_loss": 3.439136028289795, "lr": 0.00030014310871311333, "tps": 14187, "wall": 52771.7} {"step": 11424, "train_loss": 3.413149118423462, "lr": 0.00030012595396552495, "tps": 14187, "wall": 52776.7} {"step": 11425, "train_loss": 3.4342355728149414, "lr": 0.00030010879831026543, "tps": 14187, "wall": 52781.7} {"step": 11426, "train_loss": 3.4773736000061035, "lr": 0.00030009164174752914, "tps": 14186, "wall": 52786.6} {"step": 11427, "train_loss": 3.4175658226013184, "lr": 0.0003000744842775104, "tps": 14186, "wall": 52791.6} {"step": 11428, "train_loss": 3.504209518432617, "lr": 0.00030005732590040356, "tps": 14186, "wall": 52796.7} {"step": 11429, "train_loss": 3.5871894359588623, "lr": 0.000300040166616403, "tps": 14186, "wall": 52801.7} {"step": 11430, "train_loss": 3.474078893661499, "lr": 0.00030002300642570313, "tps": 14186, "wall": 52806.7} {"step": 11431, "train_loss": 3.482470989227295, "lr": 0.0003000058453284983, "tps": 14186, "wall": 52811.6} {"step": 11432, "train_loss": 3.4505419731140137, "lr": 0.00029998868332498286, "tps": 14186, "wall": 52816.6} {"step": 11433, "train_loss": 3.4560341835021973, "lr": 0.00029997152041535133, "tps": 14186, "wall": 52821.6} {"step": 11434, "train_loss": 3.3372817039489746, "lr": 0.00029995435659979815, "tps": 14186, "wall": 52826.6} {"step": 11435, "train_loss": 3.377906322479248, "lr": 0.0002999371918785176, "tps": 14186, "wall": 52831.6} {"step": 11436, "train_loss": 3.506073236465454, "lr": 0.0002999200262517043, "tps": 14185, "wall": 52836.5} {"step": 11437, "train_loss": 3.4770984649658203, "lr": 0.0002999028597195526, "tps": 14185, "wall": 52841.5} {"step": 11438, "train_loss": 3.470398187637329, "lr": 0.0002998856922822569, "tps": 14185, "wall": 52846.5} {"step": 11439, "train_loss": 3.435004234313965, "lr": 0.0002998685239400119, "tps": 14185, "wall": 52851.5} {"step": 11440, "train_loss": 3.427677869796753, "lr": 0.00029985135469301185, "tps": 14185, "wall": 52856.5} {"step": 11441, "train_loss": 3.5089967250823975, "lr": 0.0002998341845414513, "tps": 14185, "wall": 52861.5} {"step": 11442, "train_loss": 3.521618366241455, "lr": 0.00029981701348552484, "tps": 14185, "wall": 52866.5} {"step": 11443, "train_loss": 3.3600873947143555, "lr": 0.00029979984152542693, "tps": 14185, "wall": 52871.5} {"step": 11444, "train_loss": 3.5162553787231445, "lr": 0.0002997826686613521, "tps": 14185, "wall": 52876.5} {"step": 11445, "train_loss": 3.4804344177246094, "lr": 0.00029976549489349485, "tps": 14185, "wall": 52881.4} {"step": 11446, "train_loss": 3.4872994422912598, "lr": 0.0002997483202220498, "tps": 14184, "wall": 52886.4} {"step": 11447, "train_loss": 3.4483606815338135, "lr": 0.00029973114464721144, "tps": 14184, "wall": 52891.4} {"step": 11448, "train_loss": 3.515108585357666, "lr": 0.00029971396816917434, "tps": 14184, "wall": 52896.4} {"step": 11449, "train_loss": 3.4733433723449707, "lr": 0.0002996967907881331, "tps": 14184, "wall": 52901.4} {"step": 11450, "train_loss": 3.473520278930664, "lr": 0.0002996796125042824, "tps": 14184, "wall": 52906.4} {"step": 11451, "train_loss": 3.415419101715088, "lr": 0.00029966243331781665, "tps": 14184, "wall": 52911.3} {"step": 11452, "train_loss": 3.531606435775757, "lr": 0.0002996452532289306, "tps": 14184, "wall": 52916.4} {"step": 11453, "train_loss": 3.483795404434204, "lr": 0.0002996280722378187, "tps": 14184, "wall": 52921.4} {"step": 11454, "train_loss": 3.4220261573791504, "lr": 0.0002996108903446758, "tps": 14184, "wall": 52926.4} {"step": 11455, "train_loss": 3.4203858375549316, "lr": 0.0002995937075496964, "tps": 14184, "wall": 52931.4} {"step": 11456, "train_loss": 3.459977865219116, "lr": 0.00029957652385307514, "tps": 14183, "wall": 52936.4} {"step": 11457, "train_loss": 3.432786464691162, "lr": 0.00029955933925500676, "tps": 14183, "wall": 52941.3} {"step": 11458, "train_loss": 3.5860073566436768, "lr": 0.00029954215375568584, "tps": 14183, "wall": 52946.3} {"step": 11459, "train_loss": 3.4404983520507812, "lr": 0.00029952496735530715, "tps": 14183, "wall": 52951.3} {"step": 11460, "train_loss": 3.4569156169891357, "lr": 0.0002995077800540653, "tps": 14183, "wall": 52956.3} {"step": 11461, "train_loss": 3.488424062728882, "lr": 0.00029949059185215503, "tps": 14183, "wall": 52961.3} {"step": 11462, "train_loss": 3.3975045680999756, "lr": 0.000299473402749771, "tps": 14183, "wall": 52966.3} {"step": 11463, "train_loss": 3.523963689804077, "lr": 0.000299456212747108, "tps": 14183, "wall": 52971.2} {"step": 11464, "train_loss": 3.557570457458496, "lr": 0.0002994390218443607, "tps": 14183, "wall": 52976.3} {"step": 11465, "train_loss": 3.4608116149902344, "lr": 0.00029942183004172385, "tps": 14183, "wall": 52981.3} {"step": 11466, "train_loss": 3.508302688598633, "lr": 0.0002994046373393922, "tps": 14182, "wall": 52986.2} {"step": 11467, "train_loss": 3.3106141090393066, "lr": 0.0002993874437375606, "tps": 14182, "wall": 52991.2} {"step": 11468, "train_loss": 3.4715576171875, "lr": 0.0002993702492364237, "tps": 14182, "wall": 52996.2} {"step": 11469, "train_loss": 3.523216724395752, "lr": 0.00029935305383617627, "tps": 14182, "wall": 53001.2} {"step": 11470, "train_loss": 3.45389986038208, "lr": 0.0002993358575370132, "tps": 14182, "wall": 53006.2} {"step": 11471, "train_loss": 3.4979867935180664, "lr": 0.00029931866033912927, "tps": 14182, "wall": 53011.1} {"step": 11472, "train_loss": 3.4775071144104004, "lr": 0.0002993014622427193, "tps": 14182, "wall": 53016.1} {"step": 11473, "train_loss": 3.7008862495422363, "lr": 0.00029928426324797797, "tps": 14182, "wall": 53021.1} {"step": 11474, "train_loss": 3.4029383659362793, "lr": 0.0002992670633551003, "tps": 14182, "wall": 53026.1} {"step": 11475, "train_loss": 3.517099618911743, "lr": 0.000299249862564281, "tps": 14182, "wall": 53031.0} {"step": 11476, "train_loss": 3.4232177734375, "lr": 0.0002992326608757149, "tps": 14181, "wall": 53036.1} {"step": 11477, "train_loss": 3.4186887741088867, "lr": 0.0002992154582895971, "tps": 14181, "wall": 53041.1} {"step": 11478, "train_loss": 3.5100488662719727, "lr": 0.0002991982548061222, "tps": 14181, "wall": 53046.0} {"step": 11479, "train_loss": 3.411501169204712, "lr": 0.00029918105042548517, "tps": 14181, "wall": 53051.0} {"step": 11480, "train_loss": 3.39286732673645, "lr": 0.00029916384514788095, "tps": 14181, "wall": 53056.0} {"step": 11481, "train_loss": 3.4676849842071533, "lr": 0.00029914663897350445, "tps": 14181, "wall": 53061.0} {"step": 11482, "train_loss": 3.4602761268615723, "lr": 0.0002991294319025505, "tps": 14181, "wall": 53065.9} {"step": 11483, "train_loss": 3.473743200302124, "lr": 0.00029911222393521405, "tps": 14181, "wall": 53070.9} {"step": 11484, "train_loss": 3.4251868724823, "lr": 0.0002990950150716901, "tps": 14181, "wall": 53075.9} {"step": 11485, "train_loss": 3.445843458175659, "lr": 0.00029907780531217347, "tps": 14181, "wall": 53080.9} {"step": 11486, "train_loss": 3.463120460510254, "lr": 0.00029906059465685915, "tps": 14181, "wall": 53085.9} {"step": 11487, "train_loss": 3.4563260078430176, "lr": 0.00029904338310594224, "tps": 14180, "wall": 53090.9} {"step": 11488, "train_loss": 3.440183639526367, "lr": 0.0002990261706596176, "tps": 14180, "wall": 53095.9} {"step": 11489, "train_loss": 3.4641623497009277, "lr": 0.00029900895731808014, "tps": 14180, "wall": 53100.9} {"step": 11490, "train_loss": 3.410702705383301, "lr": 0.00029899174308152505, "tps": 14180, "wall": 53105.9} {"step": 11491, "train_loss": 3.5850579738616943, "lr": 0.00029897452795014717, "tps": 14180, "wall": 53110.9} {"step": 11492, "train_loss": 3.5090808868408203, "lr": 0.0002989573119241415, "tps": 14180, "wall": 53115.8} {"step": 11493, "train_loss": 3.5664823055267334, "lr": 0.00029894009500370324, "tps": 14180, "wall": 53120.8} {"step": 11494, "train_loss": 3.5355372428894043, "lr": 0.0002989228771890273, "tps": 14180, "wall": 53125.8} {"step": 11495, "train_loss": 3.4989490509033203, "lr": 0.0002989056584803086, "tps": 14180, "wall": 53130.8} {"step": 11496, "train_loss": 3.4329276084899902, "lr": 0.00029888843887774245, "tps": 14180, "wall": 53135.7} {"step": 11497, "train_loss": 3.4688072204589844, "lr": 0.0002988712183815237, "tps": 14179, "wall": 53140.7} {"step": 11498, "train_loss": 3.4216134548187256, "lr": 0.0002988539969918477, "tps": 14179, "wall": 53145.7} {"step": 11499, "train_loss": 3.4759955406188965, "lr": 0.00029883677470890924, "tps": 14179, "wall": 53150.7} {"step": 11500, "train_loss": 3.525789737701416, "lr": 0.0002988195515329036, "tps": 14179, "wall": 53155.7} {"step": 11501, "train_loss": 3.5129754543304443, "lr": 0.0002988023274640257, "tps": 14179, "wall": 53160.8} {"step": 11502, "train_loss": 3.4811105728149414, "lr": 0.00029878510250247085, "tps": 14179, "wall": 53165.8} {"step": 11503, "train_loss": 3.4758353233337402, "lr": 0.0002987678766484341, "tps": 14179, "wall": 53170.8} {"step": 11504, "train_loss": 3.4257850646972656, "lr": 0.0002987506499021105, "tps": 14179, "wall": 53175.8} {"step": 11505, "train_loss": 3.3801510334014893, "lr": 0.0002987334222636954, "tps": 14179, "wall": 53180.8} {"step": 11506, "train_loss": 3.5085768699645996, "lr": 0.00029871619373338375, "tps": 14179, "wall": 53185.8} {"step": 11507, "train_loss": 3.427183151245117, "lr": 0.0002986989643113708, "tps": 14178, "wall": 53190.7} {"step": 11508, "train_loss": 3.5849251747131348, "lr": 0.0002986817339978517, "tps": 14178, "wall": 53195.7} {"step": 11509, "train_loss": 3.423164129257202, "lr": 0.0002986645027930218, "tps": 14178, "wall": 53200.7} {"step": 11510, "train_loss": 3.435030221939087, "lr": 0.00029864727069707606, "tps": 14178, "wall": 53205.7} {"step": 11511, "train_loss": 3.5397255420684814, "lr": 0.0002986300377102097, "tps": 14178, "wall": 53210.6} {"step": 11512, "train_loss": 3.5285959243774414, "lr": 0.00029861280383261816, "tps": 14178, "wall": 53215.6} {"step": 11513, "train_loss": 3.400493860244751, "lr": 0.00029859556906449645, "tps": 14178, "wall": 53220.6} {"step": 11514, "train_loss": 3.539210557937622, "lr": 0.0002985783334060399, "tps": 14178, "wall": 53225.6} {"step": 11515, "train_loss": 3.4454121589660645, "lr": 0.0002985610968574438, "tps": 14178, "wall": 53230.6} {"step": 11516, "train_loss": 3.3699450492858887, "lr": 0.00029854385941890325, "tps": 14178, "wall": 53235.6} {"step": 11517, "train_loss": 3.41899037361145, "lr": 0.00029852662109061364, "tps": 14177, "wall": 53240.6} {"step": 11518, "train_loss": 3.4831252098083496, "lr": 0.00029850938187277025, "tps": 14177, "wall": 53245.5} {"step": 11519, "train_loss": 3.414668083190918, "lr": 0.0002984921417655683, "tps": 14177, "wall": 53250.5} {"step": 11520, "train_loss": 3.5125510692596436, "lr": 0.0002984749007692031, "tps": 14177, "wall": 53255.5} {"step": 11521, "train_loss": 3.5156359672546387, "lr": 0.00029845765888387, "tps": 14177, "wall": 53260.5} {"step": 11522, "train_loss": 3.484229326248169, "lr": 0.00029844041610976434, "tps": 14177, "wall": 53265.5} {"step": 11523, "train_loss": 3.4884867668151855, "lr": 0.0002984231724470814, "tps": 14177, "wall": 53270.5} {"step": 11524, "train_loss": 3.392395496368408, "lr": 0.0002984059278960165, "tps": 14177, "wall": 53275.5} {"step": 11525, "train_loss": 3.428399085998535, "lr": 0.000298388682456765, "tps": 14177, "wall": 53280.5} {"step": 11526, "train_loss": 3.5264434814453125, "lr": 0.00029837143612952217, "tps": 14177, "wall": 53285.5} {"step": 11527, "train_loss": 3.505683422088623, "lr": 0.0002983541889144836, "tps": 14176, "wall": 53290.5} {"step": 11528, "train_loss": 3.409745693206787, "lr": 0.00029833694081184446, "tps": 14176, "wall": 53295.5} {"step": 11529, "train_loss": 3.490785598754883, "lr": 0.00029831969182180033, "tps": 14176, "wall": 53300.5} {"step": 11530, "train_loss": 3.6234230995178223, "lr": 0.00029830244194454635, "tps": 14176, "wall": 53305.4} {"step": 11531, "train_loss": 3.485675573348999, "lr": 0.0002982851911802782, "tps": 14176, "wall": 53310.4} {"step": 11532, "train_loss": 3.499514102935791, "lr": 0.0002982679395291911, "tps": 14176, "wall": 53315.4} {"step": 11533, "train_loss": 3.4698078632354736, "lr": 0.00029825068699148053, "tps": 14176, "wall": 53320.4} {"step": 11534, "train_loss": 3.4687976837158203, "lr": 0.000298233433567342, "tps": 14176, "wall": 53325.4} {"step": 11535, "train_loss": 3.430288076400757, "lr": 0.00029821617925697083, "tps": 14176, "wall": 53330.4} {"step": 11536, "train_loss": 3.4758522510528564, "lr": 0.0002981989240605626, "tps": 14176, "wall": 53335.3} {"step": 11537, "train_loss": 3.4393327236175537, "lr": 0.00029818166797831276, "tps": 14176, "wall": 53340.4} {"step": 11538, "train_loss": 3.581939220428467, "lr": 0.00029816441101041663, "tps": 14175, "wall": 53345.3} {"step": 11539, "train_loss": 3.5614945888519287, "lr": 0.00029814715315707, "tps": 14175, "wall": 53350.3} {"step": 11540, "train_loss": 3.4881508350372314, "lr": 0.0002981298944184681, "tps": 14175, "wall": 53355.3} {"step": 11541, "train_loss": 3.435988426208496, "lr": 0.00029811263479480646, "tps": 14175, "wall": 53360.3} {"step": 11542, "train_loss": 3.414660930633545, "lr": 0.0002980953742862808, "tps": 14175, "wall": 53365.2} {"step": 11543, "train_loss": 3.3780431747436523, "lr": 0.00029807811289308644, "tps": 14175, "wall": 53370.2} {"step": 11544, "train_loss": 3.362632989883423, "lr": 0.00029806085061541903, "tps": 14175, "wall": 53375.2} {"step": 11545, "train_loss": 3.5525193214416504, "lr": 0.000298043587453474, "tps": 14175, "wall": 53380.2} {"step": 11546, "train_loss": 3.457461357116699, "lr": 0.0002980263234074471, "tps": 14175, "wall": 53385.2} {"step": 11547, "train_loss": 3.511000871658325, "lr": 0.00029800905847753375, "tps": 14175, "wall": 53390.2} {"step": 11548, "train_loss": 3.476790189743042, "lr": 0.0002979917926639295, "tps": 14174, "wall": 53395.2} {"step": 11549, "train_loss": 3.4199776649475098, "lr": 0.0002979745259668301, "tps": 14174, "wall": 53400.2} {"step": 11550, "train_loss": 3.445136547088623, "lr": 0.000297957258386431, "tps": 14174, "wall": 53405.2} {"step": 11551, "train_loss": 3.452568769454956, "lr": 0.00029793998992292786, "tps": 14174, "wall": 53410.1} {"step": 11552, "train_loss": 3.5950989723205566, "lr": 0.0002979227205765163, "tps": 14174, "wall": 53415.1} {"step": 11553, "train_loss": 3.381702423095703, "lr": 0.0002979054503473919, "tps": 14174, "wall": 53420.1} {"step": 11554, "train_loss": 3.4341955184936523, "lr": 0.00029788817923575043, "tps": 14174, "wall": 53425.1} {"step": 11555, "train_loss": 3.4665768146514893, "lr": 0.00029787090724178744, "tps": 14174, "wall": 53430.1} {"step": 11556, "train_loss": 3.472341299057007, "lr": 0.0002978536343656986, "tps": 14174, "wall": 53435.0} {"step": 11557, "train_loss": 3.5053658485412598, "lr": 0.0002978363606076795, "tps": 14174, "wall": 53440.0} {"step": 11558, "train_loss": 3.4693775177001953, "lr": 0.000297819085967926, "tps": 14174, "wall": 53445.0} {"step": 11559, "train_loss": 3.4520044326782227, "lr": 0.00029780181044663357, "tps": 14173, "wall": 53450.0} {"step": 11560, "train_loss": 3.3079452514648438, "lr": 0.0002977845340439981, "tps": 14173, "wall": 53455.0} {"step": 11561, "train_loss": 3.419339179992676, "lr": 0.00029776725676021525, "tps": 14173, "wall": 53460.0} {"step": 11562, "train_loss": 3.4238739013671875, "lr": 0.0002977499785954806, "tps": 14173, "wall": 53465.0} {"step": 11563, "train_loss": 3.5061302185058594, "lr": 0.0002977326995499901, "tps": 14173, "wall": 53470.0} {"step": 11564, "train_loss": 3.4654152393341064, "lr": 0.0002977154196239393, "tps": 14173, "wall": 53475.0} {"step": 11565, "train_loss": 3.4062023162841797, "lr": 0.00029769813881752404, "tps": 14173, "wall": 53479.9} {"step": 11566, "train_loss": 3.5339417457580566, "lr": 0.0002976808571309401, "tps": 14173, "wall": 53484.9} {"step": 11567, "train_loss": 3.5306291580200195, "lr": 0.00029766357456438314, "tps": 14173, "wall": 53489.9} {"step": 11568, "train_loss": 3.47343111038208, "lr": 0.00029764629111804904, "tps": 14173, "wall": 53494.9} {"step": 11569, "train_loss": 3.5500874519348145, "lr": 0.0002976290067921335, "tps": 14172, "wall": 53499.9} {"step": 11570, "train_loss": 3.4237987995147705, "lr": 0.00029761172158683253, "tps": 14172, "wall": 53504.8} {"step": 11571, "train_loss": 3.5246613025665283, "lr": 0.00029759443550234164, "tps": 14172, "wall": 53509.8} {"step": 11572, "train_loss": 3.6074838638305664, "lr": 0.00029757714853885677, "tps": 14172, "wall": 53514.8} {"step": 11573, "train_loss": 3.578420400619507, "lr": 0.00029755986069657383, "tps": 14172, "wall": 53519.8} {"step": 11574, "train_loss": 3.541904926300049, "lr": 0.0002975425719756886, "tps": 14172, "wall": 53524.8} {"step": 11575, "train_loss": 3.4907257556915283, "lr": 0.0002975252823763969, "tps": 14172, "wall": 53529.8} {"step": 11576, "train_loss": 3.4000766277313232, "lr": 0.0002975079918988946, "tps": 14172, "wall": 53534.8} {"step": 11577, "train_loss": 3.452500581741333, "lr": 0.00029749070054337757, "tps": 14172, "wall": 53539.8} {"step": 11578, "train_loss": 3.5077271461486816, "lr": 0.00029747340831004173, "tps": 14172, "wall": 53544.7} {"step": 11579, "train_loss": 3.51039981842041, "lr": 0.00029745611519908295, "tps": 14172, "wall": 53549.7} {"step": 11580, "train_loss": 3.532155752182007, "lr": 0.000297438821210697, "tps": 14171, "wall": 53554.7} {"step": 11581, "train_loss": 3.401149272918701, "lr": 0.00029742152634507996, "tps": 14171, "wall": 53559.6} {"step": 11582, "train_loss": 3.5115549564361572, "lr": 0.0002974042306024276, "tps": 14171, "wall": 53564.6} {"step": 11583, "train_loss": 3.3590383529663086, "lr": 0.00029738693398293604, "tps": 14171, "wall": 53569.6} {"step": 11584, "train_loss": 3.467142105102539, "lr": 0.0002973696364868011, "tps": 14171, "wall": 53574.6} {"step": 11585, "train_loss": 3.477963447570801, "lr": 0.0002973523381142187, "tps": 14171, "wall": 53579.6} {"step": 11586, "train_loss": 3.5486552715301514, "lr": 0.00029733503886538484, "tps": 14171, "wall": 53584.6} {"step": 11587, "train_loss": 3.4961507320404053, "lr": 0.0002973177387404955, "tps": 14171, "wall": 53589.6} {"step": 11588, "train_loss": 3.442497968673706, "lr": 0.00029730043773974654, "tps": 14171, "wall": 53594.5} {"step": 11589, "train_loss": 3.4439518451690674, "lr": 0.0002972831358633341, "tps": 14171, "wall": 53599.5} {"step": 11590, "train_loss": 3.455606460571289, "lr": 0.0002972658331114541, "tps": 14170, "wall": 53604.5} {"step": 11591, "train_loss": 3.476991653442383, "lr": 0.0002972485294843026, "tps": 14170, "wall": 53609.4} {"step": 11592, "train_loss": 3.4590048789978027, "lr": 0.0002972312249820755, "tps": 14170, "wall": 53614.4} {"step": 11593, "train_loss": 3.4207310676574707, "lr": 0.000297213919604969, "tps": 14170, "wall": 53619.4} {"step": 11594, "train_loss": 3.412541627883911, "lr": 0.000297196613353179, "tps": 14170, "wall": 53624.4} {"step": 11595, "train_loss": 3.475733995437622, "lr": 0.0002971793062269016, "tps": 14170, "wall": 53629.3} {"step": 11596, "train_loss": 3.3945233821868896, "lr": 0.0002971619982263328, "tps": 14170, "wall": 53634.3} {"step": 11597, "train_loss": 3.481720209121704, "lr": 0.0002971446893516688, "tps": 14170, "wall": 53639.4} {"step": 11598, "train_loss": 3.4500250816345215, "lr": 0.0002971273796031055, "tps": 14170, "wall": 53644.4} {"step": 11599, "train_loss": 3.4402008056640625, "lr": 0.00029711006898083906, "tps": 14170, "wall": 53649.4} {"step": 11600, "train_loss": 3.4745116233825684, "lr": 0.00029709275748506566, "tps": 14170, "wall": 53654.3} {"step": 11601, "train_loss": 3.566375494003296, "lr": 0.0002970754451159813, "tps": 14169, "wall": 53659.3} {"step": 11602, "train_loss": 3.4978673458099365, "lr": 0.0002970581318737821, "tps": 14169, "wall": 53664.3} {"step": 11603, "train_loss": 3.403277635574341, "lr": 0.0002970408177586642, "tps": 14169, "wall": 53669.3} {"step": 11604, "train_loss": 3.4066529273986816, "lr": 0.0002970235027708239, "tps": 14169, "wall": 53674.3} {"step": 11605, "train_loss": 3.375369071960449, "lr": 0.00029700618691045705, "tps": 14169, "wall": 53679.2} {"step": 11606, "train_loss": 3.4527060985565186, "lr": 0.00029698887017775996, "tps": 14169, "wall": 53684.2} {"step": 11607, "train_loss": 3.3787245750427246, "lr": 0.0002969715525729288, "tps": 14169, "wall": 53689.2} {"step": 11608, "train_loss": 3.3845584392547607, "lr": 0.00029695423409615976, "tps": 14169, "wall": 53694.2} {"step": 11609, "train_loss": 3.3993475437164307, "lr": 0.0002969369147476489, "tps": 14169, "wall": 53699.2} {"step": 11610, "train_loss": 3.4374961853027344, "lr": 0.0002969195945275926, "tps": 14169, "wall": 53704.2} {"step": 11611, "train_loss": 3.381279706954956, "lr": 0.0002969022734361869, "tps": 14168, "wall": 53709.2} {"step": 11612, "train_loss": 3.455021858215332, "lr": 0.00029688495147362816, "tps": 14168, "wall": 53714.2} {"step": 11613, "train_loss": 3.5319037437438965, "lr": 0.0002968676286401125, "tps": 14168, "wall": 53719.2} {"step": 11614, "train_loss": 3.5058155059814453, "lr": 0.0002968503049358362, "tps": 14168, "wall": 53724.2} {"step": 11615, "train_loss": 3.359976291656494, "lr": 0.0002968329803609955, "tps": 14168, "wall": 53729.2} {"step": 11616, "train_loss": 3.5190155506134033, "lr": 0.0002968156549157866, "tps": 14168, "wall": 53734.2} {"step": 11617, "train_loss": 3.4173688888549805, "lr": 0.0002967983286004058, "tps": 14168, "wall": 53739.2} {"step": 11618, "train_loss": 3.5027337074279785, "lr": 0.0002967810014150494, "tps": 14168, "wall": 53744.2} {"step": 11619, "train_loss": 3.4628758430480957, "lr": 0.0002967636733599137, "tps": 14168, "wall": 53749.2} {"step": 11620, "train_loss": 3.491020441055298, "lr": 0.00029674634443519485, "tps": 14168, "wall": 53754.2} {"step": 11621, "train_loss": 3.44857120513916, "lr": 0.0002967290146410894, "tps": 14167, "wall": 53759.3} {"step": 11622, "train_loss": 3.445308208465576, "lr": 0.00029671168397779336, "tps": 14167, "wall": 53764.3} {"step": 11623, "train_loss": 3.504035711288452, "lr": 0.00029669435244550335, "tps": 14167, "wall": 53769.3} {"step": 11624, "train_loss": 3.5063276290893555, "lr": 0.00029667702004441553, "tps": 14167, "wall": 53774.3} {"step": 11625, "train_loss": 3.49100923538208, "lr": 0.0002966596867747263, "tps": 14167, "wall": 53779.3} {"step": 11626, "train_loss": 3.3918962478637695, "lr": 0.00029664235263663193, "tps": 14167, "wall": 53784.4} {"step": 11627, "train_loss": 3.3946402072906494, "lr": 0.00029662501763032885, "tps": 14167, "wall": 53789.4} {"step": 11628, "train_loss": 3.354292154312134, "lr": 0.00029660768175601346, "tps": 14167, "wall": 53794.4} {"step": 11629, "train_loss": 3.560375213623047, "lr": 0.00029659034501388205, "tps": 14167, "wall": 53799.4} {"step": 11630, "train_loss": 3.469252824783325, "lr": 0.00029657300740413114, "tps": 14167, "wall": 53804.5} {"step": 11631, "train_loss": 3.4755616188049316, "lr": 0.000296555668926957, "tps": 14166, "wall": 53809.5} {"step": 11632, "train_loss": 3.4858782291412354, "lr": 0.0002965383295825562, "tps": 14166, "wall": 53814.5} {"step": 11633, "train_loss": 3.3849117755889893, "lr": 0.00029652098937112494, "tps": 14166, "wall": 53819.6} {"step": 11634, "train_loss": 3.521336793899536, "lr": 0.0002965036482928598, "tps": 14166, "wall": 53824.6} {"step": 11635, "train_loss": 3.389939069747925, "lr": 0.00029648630634795725, "tps": 14166, "wall": 53829.7} {"step": 11636, "train_loss": 3.4152278900146484, "lr": 0.0002964689635366136, "tps": 14166, "wall": 53834.7} {"step": 11637, "train_loss": 3.58681058883667, "lr": 0.00029645161985902553, "tps": 14166, "wall": 53839.7} {"step": 11638, "train_loss": 3.4238953590393066, "lr": 0.00029643427531538924, "tps": 14166, "wall": 53844.8} {"step": 11639, "train_loss": 3.371540069580078, "lr": 0.0002964169299059014, "tps": 14166, "wall": 53849.8} {"step": 11640, "train_loss": 3.509777307510376, "lr": 0.00029639958363075845, "tps": 14165, "wall": 53854.8} {"step": 11641, "train_loss": 3.5167884826660156, "lr": 0.0002963822364901569, "tps": 14165, "wall": 53859.8} {"step": 11642, "train_loss": 3.397834300994873, "lr": 0.0002963648884842932, "tps": 14165, "wall": 53864.8} {"step": 11643, "train_loss": 3.4289257526397705, "lr": 0.0002963475396133639, "tps": 14165, "wall": 53869.8} {"step": 11644, "train_loss": 3.4295713901519775, "lr": 0.0002963301898775656, "tps": 14165, "wall": 53874.9} {"step": 11645, "train_loss": 3.5140252113342285, "lr": 0.0002963128392770947, "tps": 14165, "wall": 53880.0} {"step": 11646, "train_loss": 3.5119268894195557, "lr": 0.00029629548781214785, "tps": 14165, "wall": 53885.1} {"step": 11647, "train_loss": 3.501277446746826, "lr": 0.0002962781354829217, "tps": 14165, "wall": 53890.1} {"step": 11648, "train_loss": 3.4504554271698, "lr": 0.0002962607822896126, "tps": 14165, "wall": 53895.1} {"step": 11649, "train_loss": 3.4822332859039307, "lr": 0.0002962434282324172, "tps": 14164, "wall": 53900.1} {"step": 11650, "train_loss": 3.388953924179077, "lr": 0.0002962260733115322, "tps": 14164, "wall": 53905.2} {"step": 11651, "train_loss": 3.5156960487365723, "lr": 0.0002962087175271541, "tps": 14164, "wall": 53910.2} {"step": 11652, "train_loss": 3.4863121509552, "lr": 0.00029619136087947947, "tps": 14164, "wall": 53915.3} {"step": 11653, "train_loss": 3.5978951454162598, "lr": 0.00029617400336870507, "tps": 14164, "wall": 53920.3} {"step": 11654, "train_loss": 3.514810085296631, "lr": 0.0002961566449950274, "tps": 14164, "wall": 53925.4} {"step": 11655, "train_loss": 3.4451045989990234, "lr": 0.00029613928575864315, "tps": 14164, "wall": 53930.4} {"step": 11656, "train_loss": 3.4705970287323, "lr": 0.0002961219256597489, "tps": 14164, "wall": 53935.5} {"step": 11657, "train_loss": 3.353720188140869, "lr": 0.00029610456469854134, "tps": 14164, "wall": 53940.6} {"step": 11658, "train_loss": 3.4198620319366455, "lr": 0.0002960872028752173, "tps": 14163, "wall": 53945.6} {"step": 11659, "train_loss": 3.4730522632598877, "lr": 0.0002960698401899732, "tps": 14163, "wall": 53950.7} {"step": 11660, "train_loss": 3.4821012020111084, "lr": 0.00029605247664300576, "tps": 14163, "wall": 53955.7} {"step": 11661, "train_loss": 3.4674084186553955, "lr": 0.0002960351122345119, "tps": 14163, "wall": 53960.8} {"step": 11662, "train_loss": 3.4324445724487305, "lr": 0.0002960177469646881, "tps": 14163, "wall": 53965.8} {"step": 11663, "train_loss": 3.33925199508667, "lr": 0.0002960003808337311, "tps": 14163, "wall": 53970.9} {"step": 11664, "train_loss": 3.4232780933380127, "lr": 0.0002959830138418378, "tps": 14163, "wall": 53975.9} {"step": 11665, "train_loss": 3.4150900840759277, "lr": 0.0002959656459892047, "tps": 14163, "wall": 53981.0} {"step": 11666, "train_loss": 3.4444079399108887, "lr": 0.0002959482772760287, "tps": 14163, "wall": 53986.0} {"step": 11667, "train_loss": 3.484426498413086, "lr": 0.00029593090770250655, "tps": 14162, "wall": 53991.1} {"step": 11668, "train_loss": 3.4453115463256836, "lr": 0.0002959135372688349, "tps": 14162, "wall": 53996.2} {"step": 11669, "train_loss": 3.5391592979431152, "lr": 0.00029589616597521065, "tps": 14162, "wall": 54001.2} {"step": 11670, "train_loss": 3.4251961708068848, "lr": 0.0002958787938218305, "tps": 14162, "wall": 54006.3} {"step": 11671, "train_loss": 3.464571952819824, "lr": 0.0002958614208088912, "tps": 14162, "wall": 54011.4} {"step": 11672, "train_loss": 3.3986265659332275, "lr": 0.00029584404693658973, "tps": 14162, "wall": 54016.4} {"step": 11673, "train_loss": 3.5179011821746826, "lr": 0.00029582667220512274, "tps": 14162, "wall": 54021.5} {"step": 11674, "train_loss": 3.5499765872955322, "lr": 0.0002958092966146871, "tps": 14162, "wall": 54026.5} {"step": 11675, "train_loss": 3.4224648475646973, "lr": 0.0002957919201654797, "tps": 14162, "wall": 54031.6} {"step": 11676, "train_loss": 3.47422456741333, "lr": 0.0002957745428576972, "tps": 14161, "wall": 54036.6} {"step": 11677, "train_loss": 3.5015058517456055, "lr": 0.00029575716469153673, "tps": 14161, "wall": 54041.7} {"step": 11678, "train_loss": 3.489990711212158, "lr": 0.0002957397856671949, "tps": 14161, "wall": 54046.8} {"step": 11679, "train_loss": 3.4464027881622314, "lr": 0.00029572240578486876, "tps": 14161, "wall": 54051.8} {"step": 11680, "train_loss": 3.3855183124542236, "lr": 0.00029570502504475506, "tps": 14161, "wall": 54057.0} {"step": 11681, "train_loss": 3.4249651432037354, "lr": 0.00029568764344705073, "tps": 14161, "wall": 54062.0} {"step": 11682, "train_loss": 3.467102527618408, "lr": 0.0002956702609919527, "tps": 14161, "wall": 54067.1} {"step": 11683, "train_loss": 3.5762784481048584, "lr": 0.00029565287767965783, "tps": 14161, "wall": 54072.1} {"step": 11684, "train_loss": 3.454256057739258, "lr": 0.00029563549351036315, "tps": 14161, "wall": 54077.2} {"step": 11685, "train_loss": 3.4530844688415527, "lr": 0.00029561810848426545, "tps": 14160, "wall": 54082.3} {"step": 11686, "train_loss": 3.4793529510498047, "lr": 0.00029560072260156173, "tps": 14160, "wall": 54087.4} {"step": 11687, "train_loss": 3.3772261142730713, "lr": 0.0002955833358624489, "tps": 14160, "wall": 54092.5} {"step": 11688, "train_loss": 3.4379494190216064, "lr": 0.00029556594826712397, "tps": 14160, "wall": 54097.5} {"step": 11689, "train_loss": 3.5466713905334473, "lr": 0.0002955485598157839, "tps": 14160, "wall": 54102.6} {"step": 11690, "train_loss": 3.4607465267181396, "lr": 0.0002955311705086257, "tps": 14160, "wall": 54107.7} {"step": 11691, "train_loss": 3.492887020111084, "lr": 0.0002955137803458463, "tps": 14160, "wall": 54112.8} {"step": 11692, "train_loss": 3.443704605102539, "lr": 0.0002954963893276427, "tps": 14160, "wall": 54117.9} {"step": 11693, "train_loss": 3.5123610496520996, "lr": 0.00029547899745421184, "tps": 14159, "wall": 54123.0} {"step": 11694, "train_loss": 3.550405502319336, "lr": 0.00029546160472575093, "tps": 14159, "wall": 54128.1} {"step": 11695, "train_loss": 3.458437919616699, "lr": 0.00029544421114245683, "tps": 14159, "wall": 54133.2} {"step": 11696, "train_loss": 3.5219836235046387, "lr": 0.0002954268167045266, "tps": 14159, "wall": 54138.3} {"step": 11697, "train_loss": 3.449951171875, "lr": 0.00029540942141215734, "tps": 14159, "wall": 54143.4} {"step": 11698, "train_loss": 3.3700613975524902, "lr": 0.000295392025265546, "tps": 14159, "wall": 54148.5} {"step": 11699, "train_loss": 3.416807174682617, "lr": 0.00029537462826488987, "tps": 14159, "wall": 54153.5} {"step": 11700, "train_loss": 3.3703951835632324, "lr": 0.00029535723041038576, "tps": 14159, "wall": 54158.6} {"step": 11701, "train_loss": 3.5117132663726807, "lr": 0.0002953398317022309, "tps": 14158, "wall": 54163.7} {"step": 11702, "train_loss": 3.481912851333618, "lr": 0.0002953224321406224, "tps": 14158, "wall": 54168.8} {"step": 11703, "train_loss": 3.443942070007324, "lr": 0.00029530503172575727, "tps": 14158, "wall": 54173.9} {"step": 11704, "train_loss": 3.4148168563842773, "lr": 0.0002952876304578326, "tps": 14158, "wall": 54179.0} {"step": 11705, "train_loss": 3.53275990486145, "lr": 0.0002952702283370456, "tps": 14158, "wall": 54184.1} {"step": 11706, "train_loss": 3.4942502975463867, "lr": 0.0002952528253635935, "tps": 14158, "wall": 54189.2} {"step": 11707, "train_loss": 3.4848387241363525, "lr": 0.00029523542153767323, "tps": 14158, "wall": 54194.3} {"step": 11708, "train_loss": 3.52554988861084, "lr": 0.00029521801685948205, "tps": 14158, "wall": 54199.4} {"step": 11709, "train_loss": 3.4490113258361816, "lr": 0.00029520061132921714, "tps": 14157, "wall": 54204.5} {"step": 11710, "train_loss": 3.528451442718506, "lr": 0.0002951832049470755, "tps": 14157, "wall": 54209.5} {"step": 11711, "train_loss": 3.432826280593872, "lr": 0.0002951657977132546, "tps": 14157, "wall": 54214.6} {"step": 11712, "train_loss": 3.4939520359039307, "lr": 0.00029514838962795144, "tps": 14157, "wall": 54219.7} {"step": 11713, "train_loss": 3.3968889713287354, "lr": 0.00029513098069136324, "tps": 14157, "wall": 54224.8} {"step": 11714, "train_loss": 3.368180990219116, "lr": 0.00029511357090368723, "tps": 14157, "wall": 54229.9} {"step": 11715, "train_loss": 3.499450206756592, "lr": 0.0002950961602651206, "tps": 14157, "wall": 54234.9} {"step": 11716, "train_loss": 3.4973032474517822, "lr": 0.00029507874877586065, "tps": 14157, "wall": 54240.1} {"step": 11717, "train_loss": 3.5373659133911133, "lr": 0.0002950613364361045, "tps": 14157, "wall": 54245.2} {"step": 11718, "train_loss": 3.436568260192871, "lr": 0.0002950439232460496, "tps": 14156, "wall": 54250.2} {"step": 11719, "train_loss": 3.5155601501464844, "lr": 0.000295026509205893, "tps": 14156, "wall": 54255.3} {"step": 11720, "train_loss": 3.474501132965088, "lr": 0.000295009094315832, "tps": 14156, "wall": 54260.3} {"step": 11721, "train_loss": 3.497406482696533, "lr": 0.0002949916785760639, "tps": 14156, "wall": 54265.5} {"step": 11722, "train_loss": 3.426767349243164, "lr": 0.0002949742619867861, "tps": 14156, "wall": 54270.5} {"step": 11723, "train_loss": 3.4328384399414062, "lr": 0.0002949568445481958, "tps": 14156, "wall": 54275.6} {"step": 11724, "train_loss": 3.484640598297119, "lr": 0.00029493942626049026, "tps": 14156, "wall": 54280.6} {"step": 11725, "train_loss": 3.477861166000366, "lr": 0.0002949220071238669, "tps": 14156, "wall": 54285.7} {"step": 11726, "train_loss": 3.4470040798187256, "lr": 0.00029490458713852293, "tps": 14156, "wall": 54290.8} {"step": 11727, "train_loss": 3.514772653579712, "lr": 0.0002948871663046558, "tps": 14155, "wall": 54295.9} {"step": 11728, "train_loss": 3.476618766784668, "lr": 0.0002948697446224627, "tps": 14155, "wall": 54301.0} {"step": 11729, "train_loss": 3.4926137924194336, "lr": 0.0002948523220921413, "tps": 14155, "wall": 54306.1} {"step": 11730, "train_loss": 3.4643256664276123, "lr": 0.0002948348987138885, "tps": 14155, "wall": 54311.1} {"step": 11731, "train_loss": 3.4205315113067627, "lr": 0.00029481747448790205, "tps": 14155, "wall": 54316.2} {"step": 11732, "train_loss": 3.5216164588928223, "lr": 0.0002948000494143791, "tps": 14155, "wall": 54321.3} {"step": 11733, "train_loss": 3.4791650772094727, "lr": 0.0002947826234935173, "tps": 14155, "wall": 54326.4} {"step": 11734, "train_loss": 3.3992559909820557, "lr": 0.0002947651967255138, "tps": 14155, "wall": 54331.4} {"step": 11735, "train_loss": 3.4301321506500244, "lr": 0.00029474776911056613, "tps": 14154, "wall": 54336.5} {"step": 11736, "train_loss": 3.3397727012634277, "lr": 0.0002947303406488717, "tps": 14154, "wall": 54341.6} {"step": 11737, "train_loss": 3.4538326263427734, "lr": 0.0002947129113406279, "tps": 14154, "wall": 54346.6} {"step": 11738, "train_loss": 3.490452766418457, "lr": 0.00029469548118603214, "tps": 14154, "wall": 54351.7} {"step": 11739, "train_loss": 3.39699125289917, "lr": 0.000294678050185282, "tps": 14154, "wall": 54356.9} {"step": 11740, "train_loss": 3.381944179534912, "lr": 0.0002946606183385749, "tps": 14154, "wall": 54362.0} {"step": 11741, "train_loss": 3.532480239868164, "lr": 0.0002946431856461082, "tps": 14154, "wall": 54367.0} {"step": 11742, "train_loss": 3.4552531242370605, "lr": 0.0002946257521080795, "tps": 14154, "wall": 54372.1} {"step": 11743, "train_loss": 3.4812421798706055, "lr": 0.00029460831772468626, "tps": 14154, "wall": 54377.1} {"step": 11744, "train_loss": 3.546278715133667, "lr": 0.00029459088249612594, "tps": 14153, "wall": 54382.2} {"step": 11745, "train_loss": 3.4926915168762207, "lr": 0.000294573446422596, "tps": 14153, "wall": 54387.3} {"step": 11746, "train_loss": 3.548621654510498, "lr": 0.0002945560095042941, "tps": 14153, "wall": 54392.4} {"step": 11747, "train_loss": 3.459653377532959, "lr": 0.0002945385717414177, "tps": 14153, "wall": 54397.4} {"step": 11748, "train_loss": 3.4780502319335938, "lr": 0.0002945211331341643, "tps": 14153, "wall": 54402.5} {"step": 11749, "train_loss": 3.500016450881958, "lr": 0.0002945036936827314, "tps": 14153, "wall": 54407.6} {"step": 11750, "train_loss": 3.501399040222168, "lr": 0.00029448625338731677, "tps": 14153, "wall": 54412.7} {"step": 11751, "train_loss": 3.431396484375, "lr": 0.00029446881224811776, "tps": 14153, "wall": 54417.8} {"step": 11752, "train_loss": 3.469003200531006, "lr": 0.000294451370265332, "tps": 14152, "wall": 54422.8} {"step": 11753, "train_loss": 3.4006919860839844, "lr": 0.00029443392743915713, "tps": 14152, "wall": 54427.9} {"step": 11754, "train_loss": 3.445517063140869, "lr": 0.0002944164837697907, "tps": 14152, "wall": 54433.0} {"step": 11755, "train_loss": 3.435795545578003, "lr": 0.00029439903925743035, "tps": 14152, "wall": 54438.0} {"step": 11756, "train_loss": 3.484464645385742, "lr": 0.0002943815939022736, "tps": 14152, "wall": 54443.1} {"step": 11757, "train_loss": 3.4742093086242676, "lr": 0.00029436414770451813, "tps": 14152, "wall": 54448.2} {"step": 11758, "train_loss": 3.5040578842163086, "lr": 0.0002943467006643616, "tps": 14152, "wall": 54453.2} {"step": 11759, "train_loss": 3.356417655944824, "lr": 0.0002943292527820015, "tps": 14152, "wall": 54458.3} {"step": 11760, "train_loss": 3.3606619834899902, "lr": 0.00029431180405763575, "tps": 14152, "wall": 54463.4} {"step": 11761, "train_loss": 3.5063045024871826, "lr": 0.00029429435449146186, "tps": 14151, "wall": 54468.4} {"step": 11762, "train_loss": 3.5182831287384033, "lr": 0.00029427690408367744, "tps": 14151, "wall": 54473.5} {"step": 11763, "train_loss": 3.482686996459961, "lr": 0.00029425945283448026, "tps": 14151, "wall": 54478.7} {"step": 11764, "train_loss": 3.3798270225524902, "lr": 0.000294242000744068, "tps": 14151, "wall": 54483.7} {"step": 11765, "train_loss": 3.463107109069824, "lr": 0.00029422454781263834, "tps": 14151, "wall": 54488.8} {"step": 11766, "train_loss": 3.4305922985076904, "lr": 0.00029420709404038886, "tps": 14151, "wall": 54493.9} {"step": 11767, "train_loss": 3.4244496822357178, "lr": 0.0002941896394275176, "tps": 14151, "wall": 54498.9} {"step": 11768, "train_loss": 3.5072789192199707, "lr": 0.00029417218397422197, "tps": 14151, "wall": 54504.0} {"step": 11769, "train_loss": 3.4345593452453613, "lr": 0.00029415472768069985, "tps": 14150, "wall": 54509.1} {"step": 11770, "train_loss": 3.473607301712036, "lr": 0.0002941372705471489, "tps": 14150, "wall": 54514.2} {"step": 11771, "train_loss": 3.56329345703125, "lr": 0.0002941198125737671, "tps": 14150, "wall": 54519.3} {"step": 11772, "train_loss": 3.4101500511169434, "lr": 0.0002941023537607519, "tps": 14150, "wall": 54524.3} {"step": 11773, "train_loss": 3.482282876968384, "lr": 0.0002940848941083013, "tps": 14150, "wall": 54529.4} {"step": 11774, "train_loss": 3.504887104034424, "lr": 0.00029406743361661306, "tps": 14150, "wall": 54534.4} {"step": 11775, "train_loss": 3.459372043609619, "lr": 0.00029404997228588484, "tps": 14150, "wall": 54539.6} {"step": 11776, "train_loss": 3.448946714401245, "lr": 0.00029403251011631454, "tps": 14150, "wall": 54544.7} {"step": 11777, "train_loss": 3.4896020889282227, "lr": 0.0002940150471081, "tps": 14150, "wall": 54549.8} {"step": 11778, "train_loss": 3.497119188308716, "lr": 0.000293997583261439, "tps": 14149, "wall": 54554.8} {"step": 11779, "train_loss": 3.5254013538360596, "lr": 0.0002939801185765293, "tps": 14149, "wall": 54559.9} {"step": 11780, "train_loss": 3.404341697692871, "lr": 0.00029396265305356884, "tps": 14149, "wall": 54565.0} {"step": 11781, "train_loss": 3.395432233810425, "lr": 0.0002939451866927555, "tps": 14149, "wall": 54570.0} {"step": 11782, "train_loss": 3.3800344467163086, "lr": 0.000293927719494287, "tps": 14149, "wall": 54575.1} {"step": 11783, "train_loss": 3.4106388092041016, "lr": 0.0002939102514583614, "tps": 14149, "wall": 54580.2} {"step": 11784, "train_loss": 3.4604618549346924, "lr": 0.00029389278258517643, "tps": 14149, "wall": 54585.2} {"step": 11785, "train_loss": 3.4247357845306396, "lr": 0.00029387531287492993, "tps": 14149, "wall": 54590.3} {"step": 11786, "train_loss": 3.56740665435791, "lr": 0.00029385784232782, "tps": 14149, "wall": 54595.4} {"step": 11787, "train_loss": 3.5076634883880615, "lr": 0.00029384037094404443, "tps": 14148, "wall": 54600.6} {"step": 11788, "train_loss": 3.4609618186950684, "lr": 0.0002938228987238011, "tps": 14148, "wall": 54605.6} {"step": 11789, "train_loss": 3.431495428085327, "lr": 0.000293805425667288, "tps": 14148, "wall": 54610.7} {"step": 11790, "train_loss": 3.446563243865967, "lr": 0.00029378795177470305, "tps": 14148, "wall": 54615.8} {"step": 11791, "train_loss": 3.542160987854004, "lr": 0.0002937704770462442, "tps": 14148, "wall": 54620.9} {"step": 11792, "train_loss": 3.3605494499206543, "lr": 0.00029375300148210936, "tps": 14148, "wall": 54626.0} {"step": 11793, "train_loss": 3.447462320327759, "lr": 0.00029373552508249657, "tps": 14148, "wall": 54631.0} {"step": 11794, "train_loss": 3.389801025390625, "lr": 0.00029371804784760375, "tps": 14148, "wall": 54636.1} {"step": 11795, "train_loss": 3.4729650020599365, "lr": 0.00029370056977762887, "tps": 14147, "wall": 54641.2} {"step": 11796, "train_loss": 3.503293514251709, "lr": 0.00029368309087276996, "tps": 14147, "wall": 54646.2} {"step": 11797, "train_loss": 3.4749560356140137, "lr": 0.00029366561113322505, "tps": 14147, "wall": 54651.3} {"step": 11798, "train_loss": 3.37424898147583, "lr": 0.00029364813055919207, "tps": 14147, "wall": 54656.4} {"step": 11799, "train_loss": 3.5362658500671387, "lr": 0.00029363064915086904, "tps": 14147, "wall": 54661.5} {"step": 11800, "train_loss": 3.4851441383361816, "lr": 0.00029361316690845415, "tps": 14147, "wall": 54666.6} {"step": 11801, "train_loss": 3.63283634185791, "lr": 0.0002935956838321452, "tps": 14147, "wall": 54671.7} {"step": 11802, "train_loss": 3.4858105182647705, "lr": 0.0002935781999221405, "tps": 14147, "wall": 54676.7} {"step": 11803, "train_loss": 3.4469761848449707, "lr": 0.00029356071517863783, "tps": 14147, "wall": 54681.8} {"step": 11804, "train_loss": 3.354802131652832, "lr": 0.0002935432296018355, "tps": 14146, "wall": 54686.8} {"step": 11805, "train_loss": 3.4665756225585938, "lr": 0.00029352574319193144, "tps": 14146, "wall": 54691.9} {"step": 11806, "train_loss": 3.4009504318237305, "lr": 0.0002935082559491238, "tps": 14146, "wall": 54697.0} {"step": 11807, "train_loss": 3.3912672996520996, "lr": 0.00029349076787361055, "tps": 14146, "wall": 54702.0} {"step": 11808, "train_loss": 3.3449816703796387, "lr": 0.0002934732789655901, "tps": 14146, "wall": 54707.1} {"step": 11809, "train_loss": 3.5475237369537354, "lr": 0.00029345578922526026, "tps": 14146, "wall": 54712.2} {"step": 11810, "train_loss": 3.4689245223999023, "lr": 0.00029343829865281925, "tps": 14146, "wall": 54717.3} {"step": 11811, "train_loss": 3.4117212295532227, "lr": 0.0002934208072484653, "tps": 14146, "wall": 54722.4} {"step": 11812, "train_loss": 3.5206923484802246, "lr": 0.0002934033150123964, "tps": 14146, "wall": 54727.5} {"step": 11813, "train_loss": 3.5215840339660645, "lr": 0.0002933858219448108, "tps": 14145, "wall": 54732.6} {"step": 11814, "train_loss": 3.408684015274048, "lr": 0.00029336832804590664, "tps": 14145, "wall": 54737.6} {"step": 11815, "train_loss": 3.44442081451416, "lr": 0.00029335083331588207, "tps": 14145, "wall": 54742.7} {"step": 11816, "train_loss": 3.5261216163635254, "lr": 0.0002933333377549353, "tps": 14145, "wall": 54747.8} {"step": 11817, "train_loss": 3.387836217880249, "lr": 0.0002933158413632646, "tps": 14145, "wall": 54752.9} {"step": 11818, "train_loss": 3.4422426223754883, "lr": 0.00029329834414106796, "tps": 14145, "wall": 54758.0} {"step": 11819, "train_loss": 3.396493434906006, "lr": 0.0002932808460885438, "tps": 14145, "wall": 54763.0} {"step": 11820, "train_loss": 3.410104274749756, "lr": 0.00029326334720589017, "tps": 14145, "wall": 54768.1} {"step": 11821, "train_loss": 3.4978179931640625, "lr": 0.00029324584749330543, "tps": 14144, "wall": 54773.2} {"step": 11822, "train_loss": 3.345625400543213, "lr": 0.0002932283469509877, "tps": 14144, "wall": 54778.3} {"step": 11823, "train_loss": 3.493281841278076, "lr": 0.00029321084557913543, "tps": 14144, "wall": 54783.4} {"step": 11824, "train_loss": 3.3358407020568848, "lr": 0.0002931933433779466, "tps": 14144, "wall": 54788.5} {"step": 11825, "train_loss": 3.5133988857269287, "lr": 0.0002931758403476197, "tps": 14144, "wall": 54793.5} {"step": 11826, "train_loss": 3.4748122692108154, "lr": 0.00029315833648835293, "tps": 14144, "wall": 54798.6} {"step": 11827, "train_loss": 3.459681987762451, "lr": 0.00029314083180034453, "tps": 14144, "wall": 54803.7} {"step": 11828, "train_loss": 3.5436694622039795, "lr": 0.00029312332628379285, "tps": 14144, "wall": 54808.7} {"step": 11829, "train_loss": 3.5871524810791016, "lr": 0.0002931058199388961, "tps": 14144, "wall": 54813.8} {"step": 11830, "train_loss": 3.4148452281951904, "lr": 0.00029308831276585276, "tps": 14143, "wall": 54818.9} {"step": 11831, "train_loss": 3.511772871017456, "lr": 0.00029307080476486107, "tps": 14143, "wall": 54823.9} {"step": 11832, "train_loss": 3.377113103866577, "lr": 0.0002930532959361193, "tps": 14143, "wall": 54829.0} {"step": 11833, "train_loss": 3.4965872764587402, "lr": 0.00029303578627982584, "tps": 14143, "wall": 54834.0} {"step": 11834, "train_loss": 3.545912504196167, "lr": 0.00029301827579617906, "tps": 14143, "wall": 54839.2} {"step": 11835, "train_loss": 3.547633409500122, "lr": 0.00029300076448537726, "tps": 14143, "wall": 54844.2} {"step": 11836, "train_loss": 3.4329757690429688, "lr": 0.00029298325234761895, "tps": 14143, "wall": 54849.3} {"step": 11837, "train_loss": 3.3571982383728027, "lr": 0.00029296573938310234, "tps": 14143, "wall": 54854.4} {"step": 11838, "train_loss": 3.427806854248047, "lr": 0.0002929482255920258, "tps": 14143, "wall": 54859.5} {"step": 11839, "train_loss": 3.3380022048950195, "lr": 0.00029293071097458796, "tps": 14142, "wall": 54864.5} {"step": 11840, "train_loss": 3.3838143348693848, "lr": 0.000292913195530987, "tps": 14142, "wall": 54869.6} {"step": 11841, "train_loss": 3.4590320587158203, "lr": 0.00029289567926142146, "tps": 14142, "wall": 54874.7} {"step": 11842, "train_loss": 3.561969518661499, "lr": 0.00029287816216608974, "tps": 14142, "wall": 54879.7} {"step": 11843, "train_loss": 3.4133198261260986, "lr": 0.00029286064424519017, "tps": 14142, "wall": 54884.8} {"step": 11844, "train_loss": 3.4633607864379883, "lr": 0.0002928431254989213, "tps": 14142, "wall": 54889.9} {"step": 11845, "train_loss": 3.474168539047241, "lr": 0.00029282560592748167, "tps": 14142, "wall": 54894.9} {"step": 11846, "train_loss": 3.40109920501709, "lr": 0.00029280808553106956, "tps": 14142, "wall": 54900.1} {"step": 11847, "train_loss": 3.3792176246643066, "lr": 0.0002927905643098835, "tps": 14142, "wall": 54905.2} {"step": 11848, "train_loss": 3.4398486614227295, "lr": 0.00029277304226412197, "tps": 14141, "wall": 54910.2} {"step": 11849, "train_loss": 3.468493938446045, "lr": 0.00029275551939398356, "tps": 14141, "wall": 54915.3} {"step": 11850, "train_loss": 3.3532443046569824, "lr": 0.00029273799569966665, "tps": 14141, "wall": 54920.3} {"step": 11851, "train_loss": 3.438547134399414, "lr": 0.00029272047118136975, "tps": 14141, "wall": 54925.4} {"step": 11852, "train_loss": 3.4490294456481934, "lr": 0.0002927029458392915, "tps": 14141, "wall": 54930.5} {"step": 11853, "train_loss": 3.4367570877075195, "lr": 0.0002926854196736303, "tps": 14141, "wall": 54935.5} {"step": 11854, "train_loss": 3.3851616382598877, "lr": 0.0002926678926845847, "tps": 14141, "wall": 54940.6} {"step": 11855, "train_loss": 3.480038642883301, "lr": 0.0002926503648723533, "tps": 14141, "wall": 54945.7} {"step": 11856, "train_loss": 3.5167884826660156, "lr": 0.0002926328362371347, "tps": 14141, "wall": 54950.7} {"step": 11857, "train_loss": 3.5833396911621094, "lr": 0.00029261530677912736, "tps": 14140, "wall": 54955.8} {"step": 11858, "train_loss": 3.4596686363220215, "lr": 0.0002925977764985299, "tps": 14140, "wall": 54960.9} {"step": 11859, "train_loss": 3.4045352935791016, "lr": 0.0002925802453955409, "tps": 14140, "wall": 54966.0} {"step": 11860, "train_loss": 3.389235496520996, "lr": 0.0002925627134703589, "tps": 14140, "wall": 54971.1} {"step": 11861, "train_loss": 3.4386227130889893, "lr": 0.00029254518072318263, "tps": 14140, "wall": 54976.2} {"step": 11862, "train_loss": 3.4760656356811523, "lr": 0.0002925276471542106, "tps": 14140, "wall": 54981.4} {"step": 11863, "train_loss": 3.3802876472473145, "lr": 0.00029251011276364147, "tps": 14140, "wall": 54986.8} {"step": 11864, "train_loss": 3.446115493774414, "lr": 0.0002924925775516738, "tps": 14139, "wall": 54992.1} {"step": 11865, "train_loss": 3.3872551918029785, "lr": 0.00029247504151850635, "tps": 14139, "wall": 54997.5} {"step": 11866, "train_loss": 3.3525753021240234, "lr": 0.0002924575046643377, "tps": 14139, "wall": 55003.0} {"step": 11867, "train_loss": 3.49605131149292, "lr": 0.00029243996698936653, "tps": 14139, "wall": 55008.4} {"step": 11868, "train_loss": 3.475581169128418, "lr": 0.0002924224284937914, "tps": 14139, "wall": 55014.0} {"step": 11869, "train_loss": 3.50455641746521, "lr": 0.00029240488917781126, "tps": 14138, "wall": 55019.7} {"step": 11870, "train_loss": 3.4816718101501465, "lr": 0.0002923873490416245, "tps": 14138, "wall": 55025.3} {"step": 11871, "train_loss": 3.41904878616333, "lr": 0.00029236980808542996, "tps": 14138, "wall": 55031.0} {"step": 11872, "train_loss": 3.5146594047546387, "lr": 0.00029235226630942634, "tps": 14138, "wall": 55036.6} {"step": 11873, "train_loss": 3.464010715484619, "lr": 0.0002923347237138123, "tps": 14137, "wall": 55042.3} {"step": 11874, "train_loss": 3.394240140914917, "lr": 0.0002923171802987866, "tps": 14137, "wall": 55048.1} {"step": 11875, "train_loss": 3.434959888458252, "lr": 0.0002922996360645479, "tps": 14137, "wall": 55054.0} {"step": 11876, "train_loss": 3.4828639030456543, "lr": 0.00029228209101129517, "tps": 14136, "wall": 55059.8} {"step": 11877, "train_loss": 3.38576602935791, "lr": 0.0002922645451392268, "tps": 14136, "wall": 55065.6} {"step": 11878, "train_loss": 3.3906893730163574, "lr": 0.00029224699844854196, "tps": 14136, "wall": 55071.6} {"step": 11879, "train_loss": 3.316317081451416, "lr": 0.00029222945093943913, "tps": 14135, "wall": 55077.6} {"step": 11880, "train_loss": 3.435849189758301, "lr": 0.00029221190261211717, "tps": 14135, "wall": 55083.6} {"step": 11881, "train_loss": 3.4701271057128906, "lr": 0.0002921943534667748, "tps": 14135, "wall": 55089.6} {"step": 11882, "train_loss": 3.4369678497314453, "lr": 0.0002921768035036109, "tps": 14134, "wall": 55095.7} {"step": 11883, "train_loss": 3.2561216354370117, "lr": 0.00029215925272282444, "tps": 14134, "wall": 55101.9} {"step": 11884, "train_loss": 3.5092270374298096, "lr": 0.00029214170112461387, "tps": 14133, "wall": 55108.1} {"step": 11885, "train_loss": 3.427917242050171, "lr": 0.00029212414870917827, "tps": 14133, "wall": 55114.3} {"step": 11886, "train_loss": 3.40999698638916, "lr": 0.0002921065954767165, "tps": 14133, "wall": 55120.6} {"step": 11887, "train_loss": 3.4167771339416504, "lr": 0.0002920890414274272, "tps": 14132, "wall": 55126.9} {"step": 11888, "train_loss": 3.322300672531128, "lr": 0.0002920714865615093, "tps": 14132, "wall": 55133.4} {"step": 11889, "train_loss": 3.4697866439819336, "lr": 0.00029205393087916186, "tps": 14131, "wall": 55139.9} {"step": 11890, "train_loss": 3.4047224521636963, "lr": 0.00029203637438058347, "tps": 14131, "wall": 55146.4} {"step": 11891, "train_loss": 3.4734559059143066, "lr": 0.00029201881706597316, "tps": 14130, "wall": 55152.8} {"step": 11892, "train_loss": 3.477609872817993, "lr": 0.0002920012589355298, "tps": 14130, "wall": 55159.4} {"step": 11893, "train_loss": 3.39736270904541, "lr": 0.00029198369998945236, "tps": 14129, "wall": 55166.0} {"step": 11894, "train_loss": 3.501978635787964, "lr": 0.0002919661402279395, "tps": 14129, "wall": 55172.6} {"step": 11895, "train_loss": 3.4369685649871826, "lr": 0.0002919485796511904, "tps": 14128, "wall": 55179.2} {"step": 11896, "train_loss": 3.5152063369750977, "lr": 0.00029193101825940397, "tps": 14128, "wall": 55186.0} {"step": 11897, "train_loss": 3.401723623275757, "lr": 0.000291913456052779, "tps": 14127, "wall": 55192.7} {"step": 11898, "train_loss": 3.4439849853515625, "lr": 0.00029189589303151454, "tps": 14127, "wall": 55199.6} {"step": 11899, "train_loss": 3.390916347503662, "lr": 0.00029187832919580953, "tps": 14126, "wall": 55206.4} {"step": 11900, "train_loss": 3.6033034324645996, "lr": 0.0002918607645458629, "tps": 14126, "wall": 55213.3} {"step": 11901, "train_loss": 3.387458324432373, "lr": 0.00029184319908187356, "tps": 14125, "wall": 55220.2} {"step": 11902, "train_loss": 3.480921506881714, "lr": 0.0002918256328040406, "tps": 14124, "wall": 55227.2} {"step": 11903, "train_loss": 3.3759782314300537, "lr": 0.00029180806571256306, "tps": 14124, "wall": 55234.2} {"step": 11904, "train_loss": 3.354642629623413, "lr": 0.00029179049780763983, "tps": 14123, "wall": 55241.2} {"step": 11905, "train_loss": 3.511556625366211, "lr": 0.00029177292908946995, "tps": 14123, "wall": 55248.2} {"step": 11906, "train_loss": 3.4620699882507324, "lr": 0.00029175535955825246, "tps": 14122, "wall": 55255.3} {"step": 11907, "train_loss": 3.407078266143799, "lr": 0.0002917377892141864, "tps": 14121, "wall": 55262.5} {"step": 11908, "train_loss": 3.358013868331909, "lr": 0.0002917202180574707, "tps": 14121, "wall": 55269.6} {"step": 11909, "train_loss": 3.4570231437683105, "lr": 0.0002917026460883046, "tps": 14120, "wall": 55276.8} {"step": 11910, "train_loss": 3.4231321811676025, "lr": 0.000291685073306887, "tps": 14120, "wall": 55282.9} {"step": 11911, "train_loss": 3.424098014831543, "lr": 0.000291667499713417, "tps": 14119, "wall": 55288.5} {"step": 11912, "train_loss": 3.529632091522217, "lr": 0.00029164992530809365, "tps": 14119, "wall": 55293.8} {"step": 11913, "train_loss": 3.4728729724884033, "lr": 0.00029163235009111615, "tps": 14119, "wall": 55299.0} {"step": 11914, "train_loss": 3.4418694972991943, "lr": 0.0002916147740626834, "tps": 14119, "wall": 55304.2} {"step": 11915, "train_loss": 3.405073642730713, "lr": 0.0002915971972229947, "tps": 14119, "wall": 55309.2} {"step": 11916, "train_loss": 3.490450859069824, "lr": 0.0002915796195722491, "tps": 14119, "wall": 55314.2} {"step": 11917, "train_loss": 3.495664596557617, "lr": 0.0002915620411106457, "tps": 14119, "wall": 55319.3} {"step": 11918, "train_loss": 3.4464855194091797, "lr": 0.0002915444618383835, "tps": 14119, "wall": 55324.3} {"step": 11919, "train_loss": 3.449793577194214, "lr": 0.0002915268817556619, "tps": 14118, "wall": 55329.2} {"step": 11920, "train_loss": 3.4746954441070557, "lr": 0.0002915093008626799, "tps": 14118, "wall": 55334.1} {"step": 11921, "train_loss": 3.4235341548919678, "lr": 0.0002914917191596366, "tps": 14118, "wall": 55339.1} {"step": 11922, "train_loss": 3.372044086456299, "lr": 0.00029147413664673126, "tps": 14118, "wall": 55344.0} {"step": 11923, "train_loss": 3.38560152053833, "lr": 0.00029145655332416307, "tps": 14118, "wall": 55348.9} {"step": 11924, "train_loss": 3.441476345062256, "lr": 0.0002914389691921312, "tps": 14118, "wall": 55353.8} {"step": 11925, "train_loss": 3.414198398590088, "lr": 0.0002914213842508347, "tps": 14118, "wall": 55358.7} {"step": 11926, "train_loss": 3.424673557281494, "lr": 0.00029140379850047297, "tps": 14118, "wall": 55363.6} {"step": 11927, "train_loss": 3.485520601272583, "lr": 0.0002913862119412452, "tps": 14118, "wall": 55368.6} {"step": 11928, "train_loss": 3.45772385597229, "lr": 0.0002913686245733505, "tps": 14118, "wall": 55373.5} {"step": 11929, "train_loss": 3.4665796756744385, "lr": 0.00029135103639698815, "tps": 14118, "wall": 55378.4} {"step": 11930, "train_loss": 3.4400269985198975, "lr": 0.00029133344741235744, "tps": 14118, "wall": 55383.3} {"step": 11931, "train_loss": 3.460602283477783, "lr": 0.0002913158576196576, "tps": 14118, "wall": 55388.2} {"step": 11932, "train_loss": 3.443282127380371, "lr": 0.0002912982670190878, "tps": 14118, "wall": 55393.1} {"step": 11933, "train_loss": 3.3433034420013428, "lr": 0.00029128067561084737, "tps": 14117, "wall": 55398.1} {"step": 11934, "train_loss": 3.4752371311187744, "lr": 0.0002912630833951357, "tps": 14117, "wall": 55403.0} {"step": 11935, "train_loss": 3.448838472366333, "lr": 0.00029124549037215183, "tps": 14117, "wall": 55407.9} {"step": 11936, "train_loss": 3.579763174057007, "lr": 0.0002912278965420952, "tps": 14117, "wall": 55412.8} {"step": 11937, "train_loss": 3.4522736072540283, "lr": 0.0002912103019051652, "tps": 14117, "wall": 55417.7} {"step": 11938, "train_loss": 3.4902215003967285, "lr": 0.000291192706461561, "tps": 14117, "wall": 55422.6} {"step": 11939, "train_loss": 3.487257719039917, "lr": 0.00029117511021148194, "tps": 14117, "wall": 55427.5} {"step": 11940, "train_loss": 3.417570114135742, "lr": 0.0002911575131551274, "tps": 14117, "wall": 55432.5} {"step": 11941, "train_loss": 3.4609947204589844, "lr": 0.00029113991529269677, "tps": 14117, "wall": 55437.5} {"step": 11942, "train_loss": 3.523616313934326, "lr": 0.00029112231662438925, "tps": 14117, "wall": 55442.4} {"step": 11943, "train_loss": 3.510643482208252, "lr": 0.00029110471715040426, "tps": 14117, "wall": 55447.3} {"step": 11944, "train_loss": 3.411984920501709, "lr": 0.00029108711687094124, "tps": 14117, "wall": 55452.2} {"step": 11945, "train_loss": 3.3743669986724854, "lr": 0.00029106951578619953, "tps": 14117, "wall": 55457.1} {"step": 11946, "train_loss": 3.439612865447998, "lr": 0.00029105191389637846, "tps": 14117, "wall": 55462.1} {"step": 11947, "train_loss": 3.494112253189087, "lr": 0.00029103431120167746, "tps": 14116, "wall": 55467.0} {"step": 11948, "train_loss": 3.3380348682403564, "lr": 0.000291016707702296, "tps": 14116, "wall": 55471.9} {"step": 11949, "train_loss": 3.468045473098755, "lr": 0.0002909991033984333, "tps": 14116, "wall": 55476.9} {"step": 11950, "train_loss": 3.423689365386963, "lr": 0.0002909814982902891, "tps": 14116, "wall": 55481.8} {"step": 11951, "train_loss": 3.3882484436035156, "lr": 0.00029096389237806254, "tps": 14116, "wall": 55486.7} {"step": 11952, "train_loss": 3.425699234008789, "lr": 0.0002909462856619532, "tps": 14116, "wall": 55491.6} {"step": 11953, "train_loss": 3.415663957595825, "lr": 0.0002909286781421604, "tps": 14116, "wall": 55496.6} {"step": 11954, "train_loss": 3.4480233192443848, "lr": 0.00029091106981888384, "tps": 14116, "wall": 55501.6} {"step": 11955, "train_loss": 3.4076688289642334, "lr": 0.0002908934606923228, "tps": 14116, "wall": 55506.5} {"step": 11956, "train_loss": 3.46100115776062, "lr": 0.00029087585076267673, "tps": 14116, "wall": 55511.4} {"step": 11957, "train_loss": 3.6444928646087646, "lr": 0.0002908582400301452, "tps": 14116, "wall": 55516.4} {"step": 11958, "train_loss": 3.4679794311523438, "lr": 0.0002908406284949278, "tps": 14116, "wall": 55521.3} {"step": 11959, "train_loss": 3.45011568069458, "lr": 0.0002908230161572239, "tps": 14116, "wall": 55526.2} {"step": 11960, "train_loss": 3.502795934677124, "lr": 0.00029080540301723297, "tps": 14115, "wall": 55531.2} {"step": 11961, "train_loss": 3.392829418182373, "lr": 0.00029078778907515464, "tps": 14115, "wall": 55536.1} {"step": 11962, "train_loss": 3.455519199371338, "lr": 0.0002907701743311884, "tps": 14115, "wall": 55541.0} {"step": 11963, "train_loss": 3.4696896076202393, "lr": 0.0002907525587855338, "tps": 14115, "wall": 55546.0} {"step": 11964, "train_loss": 3.4347095489501953, "lr": 0.0002907349424383904, "tps": 14115, "wall": 55550.9} {"step": 11965, "train_loss": 3.429501533508301, "lr": 0.00029071732528995775, "tps": 14115, "wall": 55555.8} {"step": 11966, "train_loss": 3.3361763954162598, "lr": 0.0002906997073404354, "tps": 14115, "wall": 55560.9} {"step": 11967, "train_loss": 3.4562840461730957, "lr": 0.0002906820885900229, "tps": 14115, "wall": 55565.8} {"step": 11968, "train_loss": 3.4090967178344727, "lr": 0.00029066446903891995, "tps": 14115, "wall": 55570.7} {"step": 11969, "train_loss": 3.398186445236206, "lr": 0.000290646848687326, "tps": 14115, "wall": 55575.7} {"step": 11970, "train_loss": 3.464406728744507, "lr": 0.0002906292275354408, "tps": 14115, "wall": 55580.6} {"step": 11971, "train_loss": 3.375910758972168, "lr": 0.0002906116055834639, "tps": 14115, "wall": 55585.6} {"step": 11972, "train_loss": 3.469116449356079, "lr": 0.0002905939828315948, "tps": 14115, "wall": 55590.5} {"step": 11973, "train_loss": 3.4432427883148193, "lr": 0.00029057635928003326, "tps": 14114, "wall": 55595.5} {"step": 11974, "train_loss": 3.5500636100769043, "lr": 0.000290558734928979, "tps": 14114, "wall": 55600.4} {"step": 11975, "train_loss": 3.499494791030884, "lr": 0.0002905411097786315, "tps": 14114, "wall": 55605.3} {"step": 11976, "train_loss": 3.5172924995422363, "lr": 0.0002905234838291905, "tps": 14114, "wall": 55610.3} {"step": 11977, "train_loss": 3.470442771911621, "lr": 0.00029050585708085576, "tps": 14114, "wall": 55615.2} {"step": 11978, "train_loss": 3.638277053833008, "lr": 0.0002904882295338268, "tps": 14114, "wall": 55620.2} {"step": 11979, "train_loss": 3.5220444202423096, "lr": 0.00029047060118830327, "tps": 14114, "wall": 55625.2} {"step": 11980, "train_loss": 3.419070243835449, "lr": 0.000290452972044485, "tps": 14114, "wall": 55630.1} {"step": 11981, "train_loss": 3.5825576782226562, "lr": 0.0002904353421025717, "tps": 14114, "wall": 55635.1} {"step": 11982, "train_loss": 3.4604198932647705, "lr": 0.00029041771136276303, "tps": 14114, "wall": 55640.0} {"step": 11983, "train_loss": 3.4895193576812744, "lr": 0.00029040007982525866, "tps": 14114, "wall": 55645.0} {"step": 11984, "train_loss": 3.388798713684082, "lr": 0.0002903824474902584, "tps": 14114, "wall": 55649.9} {"step": 11985, "train_loss": 3.4140396118164062, "lr": 0.000290364814357962, "tps": 14114, "wall": 55654.9} {"step": 11986, "train_loss": 3.4649248123168945, "lr": 0.00029034718042856916, "tps": 14113, "wall": 55659.9} {"step": 11987, "train_loss": 3.4484663009643555, "lr": 0.0002903295457022797, "tps": 14113, "wall": 55664.8} {"step": 11988, "train_loss": 3.430002212524414, "lr": 0.0002903119101792933, "tps": 14113, "wall": 55669.8} {"step": 11989, "train_loss": 3.3795204162597656, "lr": 0.00029029427385980974, "tps": 14113, "wall": 55674.7} {"step": 11990, "train_loss": 3.451587438583374, "lr": 0.0002902766367440288, "tps": 14113, "wall": 55679.7} {"step": 11991, "train_loss": 3.4092695713043213, "lr": 0.00029025899883215045, "tps": 14113, "wall": 55684.7} {"step": 11992, "train_loss": 3.4849917888641357, "lr": 0.00029024136012437433, "tps": 14113, "wall": 55689.6} {"step": 11993, "train_loss": 3.386383056640625, "lr": 0.0002902237206209002, "tps": 14113, "wall": 55694.5} {"step": 11994, "train_loss": 3.483393430709839, "lr": 0.00029020608032192803, "tps": 14113, "wall": 55699.5} {"step": 11995, "train_loss": 3.4271929264068604, "lr": 0.0002901884392276576, "tps": 14113, "wall": 55704.4} {"step": 11996, "train_loss": 3.492637872695923, "lr": 0.0002901707973382887, "tps": 14113, "wall": 55709.4} {"step": 11997, "train_loss": 3.418384552001953, "lr": 0.00029015315465402117, "tps": 14113, "wall": 55714.3} {"step": 11998, "train_loss": 3.392658233642578, "lr": 0.00029013551117505493, "tps": 14113, "wall": 55719.3} {"step": 11999, "train_loss": 3.3452792167663574, "lr": 0.00029011786690158985, "tps": 14112, "wall": 55724.2} {"step": 12000, "train_loss": 3.4152109622955322, "lr": 0.0002901002218338258, "tps": 14112, "wall": 55729.2, "val_loss_monitor": 3.486335449599439} {"step": 12001, "train_loss": 3.406801223754883, "lr": 0.00029008257597196266, "tps": 14100, "wall": 55782.5} {"step": 12002, "train_loss": 3.392777919769287, "lr": 0.00029006492931620025, "tps": 14100, "wall": 55787.4} {"step": 12003, "train_loss": 3.4013237953186035, "lr": 0.0002900472818667386, "tps": 14100, "wall": 55792.4} {"step": 12004, "train_loss": 3.5194802284240723, "lr": 0.00029002963362377744, "tps": 14100, "wall": 55797.5} {"step": 12005, "train_loss": 3.5299105644226074, "lr": 0.00029001198458751694, "tps": 14100, "wall": 55802.4} {"step": 12006, "train_loss": 3.4460110664367676, "lr": 0.0002899943347581568, "tps": 14100, "wall": 55807.4} {"step": 12007, "train_loss": 3.40771222114563, "lr": 0.0002899766841358971, "tps": 14100, "wall": 55812.3} {"step": 12008, "train_loss": 3.468994617462158, "lr": 0.0002899590327209377, "tps": 14099, "wall": 55817.3} {"step": 12009, "train_loss": 3.406552791595459, "lr": 0.0002899413805134786, "tps": 14099, "wall": 55822.2} {"step": 12010, "train_loss": 3.4063868522644043, "lr": 0.00028992372751371977, "tps": 14099, "wall": 55827.2} {"step": 12011, "train_loss": 3.3437447547912598, "lr": 0.00028990607372186107, "tps": 14099, "wall": 55832.2} {"step": 12012, "train_loss": 3.289598226547241, "lr": 0.00028988841913810267, "tps": 14099, "wall": 55837.1} {"step": 12013, "train_loss": 3.4725847244262695, "lr": 0.0002898707637626445, "tps": 14099, "wall": 55842.1} {"step": 12014, "train_loss": 3.5266664028167725, "lr": 0.0002898531075956865, "tps": 14099, "wall": 55847.0} {"step": 12015, "train_loss": 3.4582760334014893, "lr": 0.00028983545063742875, "tps": 14099, "wall": 55852.0} {"step": 12016, "train_loss": 3.4322469234466553, "lr": 0.0002898177928880713, "tps": 14099, "wall": 55857.0} {"step": 12017, "train_loss": 3.400330066680908, "lr": 0.00028980013434781396, "tps": 14099, "wall": 55862.0} {"step": 12018, "train_loss": 3.3761510848999023, "lr": 0.000289782475016857, "tps": 14099, "wall": 55866.9} {"step": 12019, "train_loss": 3.442810535430908, "lr": 0.0002897648148954004, "tps": 14099, "wall": 55871.9} {"step": 12020, "train_loss": 3.436575412750244, "lr": 0.00028974715398364417, "tps": 14099, "wall": 55876.8} {"step": 12021, "train_loss": 3.562927722930908, "lr": 0.00028972949228178843, "tps": 14098, "wall": 55881.8} {"step": 12022, "train_loss": 3.4687113761901855, "lr": 0.00028971182979003324, "tps": 14098, "wall": 55886.7} {"step": 12023, "train_loss": 3.3790574073791504, "lr": 0.00028969416650857863, "tps": 14098, "wall": 55891.6} {"step": 12024, "train_loss": 3.506875514984131, "lr": 0.00028967650243762476, "tps": 14098, "wall": 55896.6} {"step": 12025, "train_loss": 3.386610984802246, "lr": 0.0002896588375773717, "tps": 14098, "wall": 55901.5} {"step": 12026, "train_loss": 3.4731311798095703, "lr": 0.00028964117192801955, "tps": 14098, "wall": 55906.5} {"step": 12027, "train_loss": 3.439720869064331, "lr": 0.00028962350548976845, "tps": 14098, "wall": 55911.4} {"step": 12028, "train_loss": 3.5248661041259766, "lr": 0.0002896058382628185, "tps": 14098, "wall": 55916.5} {"step": 12029, "train_loss": 3.475346088409424, "lr": 0.0002895881702473699, "tps": 14098, "wall": 55921.5} {"step": 12030, "train_loss": 3.4965178966522217, "lr": 0.00028957050144362263, "tps": 14098, "wall": 55926.4} {"step": 12031, "train_loss": 3.4971494674682617, "lr": 0.00028955283185177707, "tps": 14098, "wall": 55931.4} {"step": 12032, "train_loss": 3.5026702880859375, "lr": 0.00028953516147203317, "tps": 14098, "wall": 55936.3} {"step": 12033, "train_loss": 3.500922679901123, "lr": 0.0002895174903045913, "tps": 14098, "wall": 55941.3} {"step": 12034, "train_loss": 3.540452241897583, "lr": 0.00028949981834965147, "tps": 14097, "wall": 55946.2} {"step": 12035, "train_loss": 3.39341402053833, "lr": 0.00028948214560741396, "tps": 14097, "wall": 55951.2} {"step": 12036, "train_loss": 3.4772918224334717, "lr": 0.00028946447207807896, "tps": 14097, "wall": 55956.1} {"step": 12037, "train_loss": 3.381417751312256, "lr": 0.00028944679776184666, "tps": 14097, "wall": 55961.1} {"step": 12038, "train_loss": 3.4447216987609863, "lr": 0.0002894291226589172, "tps": 14097, "wall": 55966.1} {"step": 12039, "train_loss": 3.3854641914367676, "lr": 0.000289411446769491, "tps": 14097, "wall": 55971.0} {"step": 12040, "train_loss": 3.5538251399993896, "lr": 0.0002893937700937681, "tps": 14097, "wall": 55976.0} {"step": 12041, "train_loss": 3.3934078216552734, "lr": 0.0002893760926319488, "tps": 14097, "wall": 55981.0} {"step": 12042, "train_loss": 3.434058666229248, "lr": 0.00028935841438423345, "tps": 14097, "wall": 55985.9} {"step": 12043, "train_loss": 3.4486327171325684, "lr": 0.0002893407353508222, "tps": 14097, "wall": 55990.9} {"step": 12044, "train_loss": 3.465181350708008, "lr": 0.0002893230555319153, "tps": 14097, "wall": 55995.8} {"step": 12045, "train_loss": 3.5396604537963867, "lr": 0.0002893053749277131, "tps": 14097, "wall": 56000.8} {"step": 12046, "train_loss": 3.463306427001953, "lr": 0.00028928769353841593, "tps": 14096, "wall": 56005.8} {"step": 12047, "train_loss": 3.523106098175049, "lr": 0.00028927001136422396, "tps": 14096, "wall": 56010.7} {"step": 12048, "train_loss": 3.596139430999756, "lr": 0.0002892523284053375, "tps": 14096, "wall": 56015.7} {"step": 12049, "train_loss": 3.400306224822998, "lr": 0.00028923464466195704, "tps": 14096, "wall": 56020.7} {"step": 12050, "train_loss": 3.4544849395751953, "lr": 0.0002892169601342827, "tps": 14096, "wall": 56025.6} {"step": 12051, "train_loss": 3.4714508056640625, "lr": 0.00028919927482251486, "tps": 14096, "wall": 56030.5} {"step": 12052, "train_loss": 3.4414379596710205, "lr": 0.000289181588726854, "tps": 14096, "wall": 56035.5} {"step": 12053, "train_loss": 3.4452641010284424, "lr": 0.0002891639018475003, "tps": 14096, "wall": 56040.5} {"step": 12054, "train_loss": 3.449542760848999, "lr": 0.00028914621418465417, "tps": 14096, "wall": 56045.5} {"step": 12055, "train_loss": 3.4469523429870605, "lr": 0.00028912852573851597, "tps": 14096, "wall": 56050.4} {"step": 12056, "train_loss": 3.431485891342163, "lr": 0.0002891108365092862, "tps": 14096, "wall": 56055.4} {"step": 12057, "train_loss": 3.3375027179718018, "lr": 0.000289093146497165, "tps": 14096, "wall": 56060.3} {"step": 12058, "train_loss": 3.526881456375122, "lr": 0.0002890754557023529, "tps": 14096, "wall": 56065.3} {"step": 12059, "train_loss": 3.4124228954315186, "lr": 0.00028905776412505046, "tps": 14095, "wall": 56070.3} {"step": 12060, "train_loss": 3.408634901046753, "lr": 0.0002890400717654578, "tps": 14095, "wall": 56075.2} {"step": 12061, "train_loss": 3.5549144744873047, "lr": 0.00028902237862377545, "tps": 14095, "wall": 56080.2} {"step": 12062, "train_loss": 3.4575679302215576, "lr": 0.00028900468470020386, "tps": 14095, "wall": 56085.2} {"step": 12063, "train_loss": 3.523052453994751, "lr": 0.0002889869899949436, "tps": 14095, "wall": 56090.1} {"step": 12064, "train_loss": 3.4859766960144043, "lr": 0.0002889692945081949, "tps": 14095, "wall": 56095.0} {"step": 12065, "train_loss": 3.357877492904663, "lr": 0.0002889515982401582, "tps": 14095, "wall": 56100.1} {"step": 12066, "train_loss": 3.3864407539367676, "lr": 0.00028893390119103424, "tps": 14095, "wall": 56105.0} {"step": 12067, "train_loss": 3.49320650100708, "lr": 0.00028891620336102324, "tps": 14095, "wall": 56110.0} {"step": 12068, "train_loss": 3.4232892990112305, "lr": 0.0002888985047503257, "tps": 14095, "wall": 56114.9} {"step": 12069, "train_loss": 3.4937331676483154, "lr": 0.0002888808053591422, "tps": 14095, "wall": 56119.9} {"step": 12070, "train_loss": 3.413928985595703, "lr": 0.0002888631051876733, "tps": 14095, "wall": 56124.8} {"step": 12071, "train_loss": 3.403916835784912, "lr": 0.0002888454042361194, "tps": 14095, "wall": 56129.7} {"step": 12072, "train_loss": 3.6055567264556885, "lr": 0.0002888277025046809, "tps": 14094, "wall": 56134.7} {"step": 12073, "train_loss": 3.4153285026550293, "lr": 0.00028880999999355867, "tps": 14094, "wall": 56139.7} {"step": 12074, "train_loss": 3.3621106147766113, "lr": 0.00028879229670295285, "tps": 14094, "wall": 56144.6} {"step": 12075, "train_loss": 3.480717897415161, "lr": 0.00028877459263306426, "tps": 14094, "wall": 56149.6} {"step": 12076, "train_loss": 3.3822813034057617, "lr": 0.0002887568877840934, "tps": 14094, "wall": 56154.5} {"step": 12077, "train_loss": 3.4627087116241455, "lr": 0.00028873918215624076, "tps": 14094, "wall": 56159.6} {"step": 12078, "train_loss": 3.322549819946289, "lr": 0.0002887214757497069, "tps": 14094, "wall": 56164.5} {"step": 12079, "train_loss": 3.3796486854553223, "lr": 0.0002887037685646925, "tps": 14094, "wall": 56169.4} {"step": 12080, "train_loss": 3.3735783100128174, "lr": 0.0002886860606013981, "tps": 14094, "wall": 56174.4} {"step": 12081, "train_loss": 3.4705255031585693, "lr": 0.0002886683518600242, "tps": 14094, "wall": 56179.3} {"step": 12082, "train_loss": 3.4038820266723633, "lr": 0.00028865064234077155, "tps": 14094, "wall": 56184.3} {"step": 12083, "train_loss": 3.4562747478485107, "lr": 0.00028863293204384074, "tps": 14094, "wall": 56189.3} {"step": 12084, "train_loss": 3.4072763919830322, "lr": 0.00028861522096943235, "tps": 14094, "wall": 56194.2} {"step": 12085, "train_loss": 3.420689105987549, "lr": 0.000288597509117747, "tps": 14093, "wall": 56199.2} {"step": 12086, "train_loss": 3.5323712825775146, "lr": 0.00028857979648898535, "tps": 14093, "wall": 56204.1} {"step": 12087, "train_loss": 3.5253024101257324, "lr": 0.0002885620830833481, "tps": 14093, "wall": 56209.1} {"step": 12088, "train_loss": 3.4728665351867676, "lr": 0.00028854436890103587, "tps": 14093, "wall": 56214.0} {"step": 12089, "train_loss": 3.5809519290924072, "lr": 0.00028852665394224925, "tps": 14093, "wall": 56219.0} {"step": 12090, "train_loss": 3.4409303665161133, "lr": 0.00028850893820718906, "tps": 14093, "wall": 56224.0} {"step": 12091, "train_loss": 3.5848779678344727, "lr": 0.00028849122169605587, "tps": 14093, "wall": 56228.9} {"step": 12092, "train_loss": 3.540858745574951, "lr": 0.0002884735044090504, "tps": 14093, "wall": 56233.9} {"step": 12093, "train_loss": 3.3838205337524414, "lr": 0.0002884557863463734, "tps": 14093, "wall": 56238.8} {"step": 12094, "train_loss": 3.505620002746582, "lr": 0.0002884380675082256, "tps": 14093, "wall": 56243.8} {"step": 12095, "train_loss": 3.432612419128418, "lr": 0.0002884203478948076, "tps": 14093, "wall": 56248.7} {"step": 12096, "train_loss": 3.4848949909210205, "lr": 0.00028840262750632023, "tps": 14093, "wall": 56253.7} {"step": 12097, "train_loss": 3.4101266860961914, "lr": 0.0002883849063429642, "tps": 14093, "wall": 56258.6} {"step": 12098, "train_loss": 3.479050397872925, "lr": 0.0002883671844049402, "tps": 14092, "wall": 56263.6} {"step": 12099, "train_loss": 3.549133062362671, "lr": 0.000288349461692449, "tps": 14092, "wall": 56268.5} {"step": 12100, "train_loss": 3.468026876449585, "lr": 0.00028833173820569147, "tps": 14092, "wall": 56273.5} {"step": 12101, "train_loss": 3.3836913108825684, "lr": 0.00028831401394486834, "tps": 14092, "wall": 56278.5} {"step": 12102, "train_loss": 3.4311609268188477, "lr": 0.0002882962889101803, "tps": 14092, "wall": 56283.5} {"step": 12103, "train_loss": 3.5093650817871094, "lr": 0.0002882785631018282, "tps": 14092, "wall": 56288.4} {"step": 12104, "train_loss": 3.585048198699951, "lr": 0.00028826083652001285, "tps": 14092, "wall": 56293.4} {"step": 12105, "train_loss": 3.396137237548828, "lr": 0.0002882431091649351, "tps": 14092, "wall": 56298.3} {"step": 12106, "train_loss": 3.339467763900757, "lr": 0.00028822538103679573, "tps": 14092, "wall": 56303.3} {"step": 12107, "train_loss": 3.5452592372894287, "lr": 0.0002882076521357955, "tps": 14092, "wall": 56308.3} {"step": 12108, "train_loss": 3.5126583576202393, "lr": 0.0002881899224621353, "tps": 14092, "wall": 56313.2} {"step": 12109, "train_loss": 3.3796143531799316, "lr": 0.000288172192016016, "tps": 14092, "wall": 56318.2} {"step": 12110, "train_loss": 3.408722400665283, "lr": 0.0002881544607976384, "tps": 14092, "wall": 56323.1} {"step": 12111, "train_loss": 3.47625732421875, "lr": 0.00028813672880720337, "tps": 14091, "wall": 56328.1} {"step": 12112, "train_loss": 3.5897817611694336, "lr": 0.00028811899604491183, "tps": 14091, "wall": 56333.1} {"step": 12113, "train_loss": 3.4805660247802734, "lr": 0.0002881012625109646, "tps": 14091, "wall": 56338.1} {"step": 12114, "train_loss": 3.5956225395202637, "lr": 0.0002880835282055625, "tps": 14091, "wall": 56343.0} {"step": 12115, "train_loss": 3.52801513671875, "lr": 0.0002880657931289067, "tps": 14091, "wall": 56348.0} {"step": 12116, "train_loss": 3.472989082336426, "lr": 0.00028804805728119775, "tps": 14091, "wall": 56353.0} {"step": 12117, "train_loss": 3.507535219192505, "lr": 0.0002880303206626368, "tps": 14091, "wall": 56357.9} {"step": 12118, "train_loss": 3.5139222145080566, "lr": 0.00028801258327342466, "tps": 14091, "wall": 56362.9} {"step": 12119, "train_loss": 3.4115891456604004, "lr": 0.0002879948451137623, "tps": 14091, "wall": 56367.9} {"step": 12120, "train_loss": 3.483485460281372, "lr": 0.00028797710618385064, "tps": 14091, "wall": 56372.9} {"step": 12121, "train_loss": 3.452227830886841, "lr": 0.0002879593664838907, "tps": 14091, "wall": 56377.8} {"step": 12122, "train_loss": 3.4524145126342773, "lr": 0.00028794162601408334, "tps": 14091, "wall": 56382.8} {"step": 12123, "train_loss": 3.4598100185394287, "lr": 0.0002879238847746295, "tps": 14090, "wall": 56387.7} {"step": 12124, "train_loss": 3.438938856124878, "lr": 0.0002879061427657304, "tps": 14090, "wall": 56392.7} {"step": 12125, "train_loss": 3.4436097145080566, "lr": 0.00028788839998758665, "tps": 14090, "wall": 56397.7} {"step": 12126, "train_loss": 3.4420671463012695, "lr": 0.00028787065644039956, "tps": 14090, "wall": 56402.7} {"step": 12127, "train_loss": 3.3995323181152344, "lr": 0.00028785291212436997, "tps": 14090, "wall": 56407.6} {"step": 12128, "train_loss": 3.491152286529541, "lr": 0.0002878351670396989, "tps": 14090, "wall": 56412.6} {"step": 12129, "train_loss": 3.4795656204223633, "lr": 0.0002878174211865874, "tps": 14090, "wall": 56417.5} {"step": 12130, "train_loss": 3.4132113456726074, "lr": 0.00028779967456523645, "tps": 14090, "wall": 56422.5} {"step": 12131, "train_loss": 3.476696729660034, "lr": 0.0002877819271758472, "tps": 14090, "wall": 56427.4} {"step": 12132, "train_loss": 3.452812910079956, "lr": 0.00028776417901862054, "tps": 14090, "wall": 56432.5} {"step": 12133, "train_loss": 3.4233779907226562, "lr": 0.0002877464300937576, "tps": 14090, "wall": 56437.4} {"step": 12134, "train_loss": 3.427499771118164, "lr": 0.00028772868040145947, "tps": 14090, "wall": 56442.3} {"step": 12135, "train_loss": 3.450054407119751, "lr": 0.00028771092994192717, "tps": 14090, "wall": 56447.3} {"step": 12136, "train_loss": 3.445375919342041, "lr": 0.0002876931787153618, "tps": 14089, "wall": 56452.3} {"step": 12137, "train_loss": 3.4578418731689453, "lr": 0.00028767542672196434, "tps": 14089, "wall": 56457.3} {"step": 12138, "train_loss": 3.433764934539795, "lr": 0.00028765767396193615, "tps": 14089, "wall": 56462.2} {"step": 12139, "train_loss": 3.4872398376464844, "lr": 0.00028763992043547807, "tps": 14089, "wall": 56467.2} {"step": 12140, "train_loss": 3.451467514038086, "lr": 0.00028762216614279133, "tps": 14089, "wall": 56472.2} {"step": 12141, "train_loss": 3.5672495365142822, "lr": 0.00028760441108407705, "tps": 14089, "wall": 56477.1} {"step": 12142, "train_loss": 3.4012484550476074, "lr": 0.0002875866552595363, "tps": 14089, "wall": 56482.1} {"step": 12143, "train_loss": 3.440563201904297, "lr": 0.0002875688986693703, "tps": 14089, "wall": 56487.0} {"step": 12144, "train_loss": 3.413334846496582, "lr": 0.00028755114131378016, "tps": 14089, "wall": 56492.0} {"step": 12145, "train_loss": 3.53120756149292, "lr": 0.000287533383192967, "tps": 14089, "wall": 56497.0} {"step": 12146, "train_loss": 3.4745125770568848, "lr": 0.00028751562430713205, "tps": 14089, "wall": 56502.0} {"step": 12147, "train_loss": 3.428896903991699, "lr": 0.0002874978646564765, "tps": 14089, "wall": 56506.9} {"step": 12148, "train_loss": 3.3820836544036865, "lr": 0.0002874801042412014, "tps": 14089, "wall": 56511.9} {"step": 12149, "train_loss": 3.4594593048095703, "lr": 0.00028746234306150807, "tps": 14088, "wall": 56516.9} {"step": 12150, "train_loss": 3.479895830154419, "lr": 0.0002874445811175977, "tps": 14088, "wall": 56521.8} {"step": 12151, "train_loss": 3.451331377029419, "lr": 0.0002874268184096715, "tps": 14088, "wall": 56526.8} {"step": 12152, "train_loss": 3.4315476417541504, "lr": 0.00028740905493793053, "tps": 14088, "wall": 56531.8} {"step": 12153, "train_loss": 3.4962761402130127, "lr": 0.0002873912907025762, "tps": 14088, "wall": 56536.7} {"step": 12154, "train_loss": 3.4891557693481445, "lr": 0.00028737352570380964, "tps": 14088, "wall": 56541.7} {"step": 12155, "train_loss": 3.386875629425049, "lr": 0.00028735575994183227, "tps": 14088, "wall": 56546.6} {"step": 12156, "train_loss": 3.424628973007202, "lr": 0.0002873379934168451, "tps": 14088, "wall": 56551.6} {"step": 12157, "train_loss": 3.5168533325195312, "lr": 0.0002873202261290495, "tps": 14088, "wall": 56556.5} {"step": 12158, "train_loss": 3.5034022331237793, "lr": 0.00028730245807864676, "tps": 14088, "wall": 56561.5} {"step": 12159, "train_loss": 3.453707456588745, "lr": 0.0002872846892658381, "tps": 14088, "wall": 56566.4} {"step": 12160, "train_loss": 3.401841163635254, "lr": 0.00028726691969082485, "tps": 14088, "wall": 56571.4} {"step": 12161, "train_loss": 3.4337120056152344, "lr": 0.0002872491493538083, "tps": 14088, "wall": 56576.4} {"step": 12162, "train_loss": 3.3975486755371094, "lr": 0.00028723137825498976, "tps": 14087, "wall": 56581.3} {"step": 12163, "train_loss": 3.3986682891845703, "lr": 0.0002872136063945705, "tps": 14087, "wall": 56586.3} {"step": 12164, "train_loss": 3.3398711681365967, "lr": 0.0002871958337727519, "tps": 14087, "wall": 56591.2} {"step": 12165, "train_loss": 3.43898344039917, "lr": 0.0002871780603897353, "tps": 14087, "wall": 56596.2} {"step": 12166, "train_loss": 3.482271194458008, "lr": 0.00028716028624572196, "tps": 14087, "wall": 56601.2} {"step": 12167, "train_loss": 3.404193162918091, "lr": 0.00028714251134091324, "tps": 14087, "wall": 56606.1} {"step": 12168, "train_loss": 3.511305809020996, "lr": 0.00028712473567551057, "tps": 14087, "wall": 56611.1} {"step": 12169, "train_loss": 3.3769965171813965, "lr": 0.0002871069592497152, "tps": 14087, "wall": 56616.0} {"step": 12170, "train_loss": 3.5342774391174316, "lr": 0.0002870891820637286, "tps": 14087, "wall": 56621.0} {"step": 12171, "train_loss": 3.56058669090271, "lr": 0.0002870714041177521, "tps": 14087, "wall": 56626.0} {"step": 12172, "train_loss": 3.4693400859832764, "lr": 0.0002870536254119871, "tps": 14087, "wall": 56630.9} {"step": 12173, "train_loss": 3.4592456817626953, "lr": 0.0002870358459466351, "tps": 14087, "wall": 56635.9} {"step": 12174, "train_loss": 3.49429988861084, "lr": 0.00028701806572189727, "tps": 14087, "wall": 56640.9} {"step": 12175, "train_loss": 3.4945740699768066, "lr": 0.00028700028473797526, "tps": 14086, "wall": 56645.9} {"step": 12176, "train_loss": 3.453134298324585, "lr": 0.00028698250299507037, "tps": 14086, "wall": 56650.8} {"step": 12177, "train_loss": 3.3696372509002686, "lr": 0.0002869647204933841, "tps": 14086, "wall": 56655.8} {"step": 12178, "train_loss": 3.5032427310943604, "lr": 0.0002869469372331178, "tps": 14086, "wall": 56660.8} {"step": 12179, "train_loss": 3.480398654937744, "lr": 0.00028692915321447296, "tps": 14086, "wall": 56665.7} {"step": 12180, "train_loss": 3.355253219604492, "lr": 0.0002869113684376511, "tps": 14086, "wall": 56670.6} {"step": 12181, "train_loss": 3.3870697021484375, "lr": 0.0002868935829028536, "tps": 14086, "wall": 56675.6} {"step": 12182, "train_loss": 3.3583245277404785, "lr": 0.000286875796610282, "tps": 14086, "wall": 56680.6} {"step": 12183, "train_loss": 3.52162504196167, "lr": 0.00028685800956013775, "tps": 14086, "wall": 56685.5} {"step": 12184, "train_loss": 3.4145121574401855, "lr": 0.00028684022175262235, "tps": 14086, "wall": 56690.5} {"step": 12185, "train_loss": 3.402007818222046, "lr": 0.0002868224331879373, "tps": 14086, "wall": 56695.4} {"step": 12186, "train_loss": 3.4146230220794678, "lr": 0.0002868046438662841, "tps": 14086, "wall": 56700.4} {"step": 12187, "train_loss": 3.4977030754089355, "lr": 0.00028678685378786433, "tps": 14086, "wall": 56705.4} {"step": 12188, "train_loss": 3.4513566493988037, "lr": 0.00028676906295287943, "tps": 14085, "wall": 56710.4} {"step": 12189, "train_loss": 3.497535228729248, "lr": 0.000286751271361531, "tps": 14085, "wall": 56715.3} {"step": 12190, "train_loss": 3.370863199234009, "lr": 0.00028673347901402046, "tps": 14085, "wall": 56720.3} {"step": 12191, "train_loss": 3.4199490547180176, "lr": 0.00028671568591054954, "tps": 14085, "wall": 56725.2} {"step": 12192, "train_loss": 3.472910165786743, "lr": 0.00028669789205131973, "tps": 14085, "wall": 56730.2} {"step": 12193, "train_loss": 3.315605401992798, "lr": 0.00028668009743653257, "tps": 14085, "wall": 56735.2} {"step": 12194, "train_loss": 3.3572332859039307, "lr": 0.00028666230206638967, "tps": 14085, "wall": 56740.1} {"step": 12195, "train_loss": 3.4801220893859863, "lr": 0.0002866445059410926, "tps": 14085, "wall": 56745.1} {"step": 12196, "train_loss": 3.3454272747039795, "lr": 0.0002866267090608429, "tps": 14085, "wall": 56750.0} {"step": 12197, "train_loss": 3.5269808769226074, "lr": 0.00028660891142584234, "tps": 14085, "wall": 56755.0} {"step": 12198, "train_loss": 3.376349449157715, "lr": 0.0002865911130362924, "tps": 14085, "wall": 56760.0} {"step": 12199, "train_loss": 3.356541156768799, "lr": 0.0002865733138923947, "tps": 14085, "wall": 56764.9} {"step": 12200, "train_loss": 3.427248954772949, "lr": 0.0002865555139943509, "tps": 14085, "wall": 56769.9} {"step": 12201, "train_loss": 3.3826470375061035, "lr": 0.0002865377133423627, "tps": 14084, "wall": 56774.8} {"step": 12202, "train_loss": 3.4538331031799316, "lr": 0.00028651991193663157, "tps": 14084, "wall": 56779.8} {"step": 12203, "train_loss": 3.452953815460205, "lr": 0.00028650210977735935, "tps": 14084, "wall": 56784.7} {"step": 12204, "train_loss": 3.4271352291107178, "lr": 0.0002864843068647476, "tps": 14084, "wall": 56789.7} {"step": 12205, "train_loss": 3.502216100692749, "lr": 0.000286466503198998, "tps": 14084, "wall": 56794.6} {"step": 12206, "train_loss": 3.445801258087158, "lr": 0.0002864486987803124, "tps": 14084, "wall": 56799.6} {"step": 12207, "train_loss": 3.3879973888397217, "lr": 0.0002864308936088922, "tps": 14084, "wall": 56804.5} {"step": 12208, "train_loss": 3.4082460403442383, "lr": 0.0002864130876849393, "tps": 14084, "wall": 56809.4} {"step": 12209, "train_loss": 3.504897356033325, "lr": 0.00028639528100865536, "tps": 14084, "wall": 56814.4} {"step": 12210, "train_loss": 3.3932955265045166, "lr": 0.000286377473580242, "tps": 14084, "wall": 56819.3} {"step": 12211, "train_loss": 3.470485210418701, "lr": 0.0002863596653999011, "tps": 14084, "wall": 56824.3} {"step": 12212, "train_loss": 3.361257791519165, "lr": 0.00028634185646783433, "tps": 14084, "wall": 56829.2} {"step": 12213, "train_loss": 3.475586414337158, "lr": 0.0002863240467842434, "tps": 14084, "wall": 56834.2} {"step": 12214, "train_loss": 3.530945301055908, "lr": 0.0002863062363493301, "tps": 14084, "wall": 56839.1} {"step": 12215, "train_loss": 3.4208731651306152, "lr": 0.00028628842516329616, "tps": 14083, "wall": 56844.0} {"step": 12216, "train_loss": 3.425790786743164, "lr": 0.0002862706132263434, "tps": 14083, "wall": 56849.0} {"step": 12217, "train_loss": 3.432006359100342, "lr": 0.0002862528005386734, "tps": 14083, "wall": 56853.9} {"step": 12218, "train_loss": 3.4087700843811035, "lr": 0.0002862349871004882, "tps": 14083, "wall": 56858.8} {"step": 12219, "train_loss": 3.4056615829467773, "lr": 0.00028621717291198943, "tps": 14083, "wall": 56863.7} {"step": 12220, "train_loss": 3.4422266483306885, "lr": 0.000286199357973379, "tps": 14083, "wall": 56868.6} {"step": 12221, "train_loss": 3.4986135959625244, "lr": 0.0002861815422848587, "tps": 14083, "wall": 56873.6} {"step": 12222, "train_loss": 3.470322370529175, "lr": 0.00028616372584663023, "tps": 14083, "wall": 56878.5} {"step": 12223, "train_loss": 3.4821176528930664, "lr": 0.00028614590865889554, "tps": 14083, "wall": 56883.5} {"step": 12224, "train_loss": 3.4566752910614014, "lr": 0.0002861280907218564, "tps": 14083, "wall": 56888.4} {"step": 12225, "train_loss": 3.4818482398986816, "lr": 0.00028611027203571466, "tps": 14083, "wall": 56893.3} {"step": 12226, "train_loss": 3.4436941146850586, "lr": 0.0002860924526006722, "tps": 14083, "wall": 56898.3} {"step": 12227, "train_loss": 3.425060749053955, "lr": 0.0002860746324169308, "tps": 14083, "wall": 56903.2} {"step": 12228, "train_loss": 3.4486398696899414, "lr": 0.00028605681148469246, "tps": 14083, "wall": 56908.2} {"step": 12229, "train_loss": 3.4361743927001953, "lr": 0.00028603898980415895, "tps": 14082, "wall": 56913.1} {"step": 12230, "train_loss": 3.493335247039795, "lr": 0.00028602116737553223, "tps": 14082, "wall": 56918.0} {"step": 12231, "train_loss": 3.436180591583252, "lr": 0.00028600334419901413, "tps": 14082, "wall": 56922.9} {"step": 12232, "train_loss": 3.4560747146606445, "lr": 0.0002859855202748065, "tps": 14082, "wall": 56927.8} {"step": 12233, "train_loss": 3.5641980171203613, "lr": 0.0002859676956031115, "tps": 14082, "wall": 56932.7} {"step": 12234, "train_loss": 3.44441556930542, "lr": 0.0002859498701841308, "tps": 14082, "wall": 56937.7} {"step": 12235, "train_loss": 3.434380054473877, "lr": 0.0002859320440180663, "tps": 14082, "wall": 56942.6} {"step": 12236, "train_loss": 3.398711681365967, "lr": 0.00028591421710512014, "tps": 14082, "wall": 56947.5} {"step": 12237, "train_loss": 3.4118616580963135, "lr": 0.00028589638944549414, "tps": 14082, "wall": 56952.5} {"step": 12238, "train_loss": 3.3933746814727783, "lr": 0.00028587856103939023, "tps": 14082, "wall": 56957.4} {"step": 12239, "train_loss": 3.470001220703125, "lr": 0.0002858607318870105, "tps": 14082, "wall": 56962.3} {"step": 12240, "train_loss": 3.570192337036133, "lr": 0.00028584290198855683, "tps": 14082, "wall": 56967.2} {"step": 12241, "train_loss": 3.468003511428833, "lr": 0.00028582507134423116, "tps": 14082, "wall": 56972.1} {"step": 12242, "train_loss": 3.360170364379883, "lr": 0.0002858072399542355, "tps": 14082, "wall": 56977.0} {"step": 12243, "train_loss": 3.450709581375122, "lr": 0.00028578940781877197, "tps": 14082, "wall": 56981.9} {"step": 12244, "train_loss": 3.579348087310791, "lr": 0.00028577157493804236, "tps": 14082, "wall": 56986.8} {"step": 12245, "train_loss": 3.439730644226074, "lr": 0.00028575374131224876, "tps": 14081, "wall": 56991.7} {"step": 12246, "train_loss": 3.4594168663024902, "lr": 0.0002857359069415933, "tps": 14081, "wall": 56996.7} {"step": 12247, "train_loss": 3.550034999847412, "lr": 0.00028571807182627796, "tps": 14081, "wall": 57001.6} {"step": 12248, "train_loss": 3.4883852005004883, "lr": 0.00028570023596650475, "tps": 14081, "wall": 57006.6} {"step": 12249, "train_loss": 3.492976188659668, "lr": 0.00028568239936247565, "tps": 14081, "wall": 57011.5} {"step": 12250, "train_loss": 3.2837963104248047, "lr": 0.0002856645620143928, "tps": 14081, "wall": 57016.4} {"step": 12251, "train_loss": 3.347872018814087, "lr": 0.0002856467239224582, "tps": 14081, "wall": 57021.3} {"step": 12252, "train_loss": 3.519073247909546, "lr": 0.00028562888508687403, "tps": 14081, "wall": 57026.2} {"step": 12253, "train_loss": 3.5091605186462402, "lr": 0.00028561104550784225, "tps": 14081, "wall": 57031.2} {"step": 12254, "train_loss": 3.5021963119506836, "lr": 0.00028559320518556505, "tps": 14081, "wall": 57036.1} {"step": 12255, "train_loss": 3.546816825866699, "lr": 0.00028557536412024436, "tps": 14081, "wall": 57041.0} {"step": 12256, "train_loss": 3.439115047454834, "lr": 0.0002855575223120825, "tps": 14081, "wall": 57045.9} {"step": 12257, "train_loss": 3.468503952026367, "lr": 0.00028553967976128146, "tps": 14081, "wall": 57050.8} {"step": 12258, "train_loss": 3.4200074672698975, "lr": 0.0002855218364680434, "tps": 14081, "wall": 57055.7} {"step": 12259, "train_loss": 3.4685721397399902, "lr": 0.0002855039924325704, "tps": 14080, "wall": 57060.7} {"step": 12260, "train_loss": 3.343139410018921, "lr": 0.0002854861476550646, "tps": 14080, "wall": 57065.6} {"step": 12261, "train_loss": 3.4192161560058594, "lr": 0.00028546830213572826, "tps": 14080, "wall": 57070.6} {"step": 12262, "train_loss": 3.4612762928009033, "lr": 0.0002854504558747634, "tps": 14080, "wall": 57075.5} {"step": 12263, "train_loss": 3.4290528297424316, "lr": 0.00028543260887237224, "tps": 14080, "wall": 57080.4} {"step": 12264, "train_loss": 3.4489543437957764, "lr": 0.0002854147611287569, "tps": 14080, "wall": 57085.3} {"step": 12265, "train_loss": 3.446597099304199, "lr": 0.0002853969126441197, "tps": 14080, "wall": 57090.3} {"step": 12266, "train_loss": 3.378514528274536, "lr": 0.0002853790634186627, "tps": 14080, "wall": 57095.2} {"step": 12267, "train_loss": 3.387873649597168, "lr": 0.00028536121345258816, "tps": 14080, "wall": 57100.1} {"step": 12268, "train_loss": 3.5107059478759766, "lr": 0.0002853433627460982, "tps": 14080, "wall": 57105.0} {"step": 12269, "train_loss": 3.467165946960449, "lr": 0.0002853255112993951, "tps": 14080, "wall": 57109.9} {"step": 12270, "train_loss": 3.4122118949890137, "lr": 0.00028530765911268104, "tps": 14080, "wall": 57114.9} {"step": 12271, "train_loss": 3.437222480773926, "lr": 0.00028528980618615834, "tps": 14080, "wall": 57119.8} {"step": 12272, "train_loss": 3.5150129795074463, "lr": 0.00028527195252002924, "tps": 14080, "wall": 57124.8} {"step": 12273, "train_loss": 3.4484853744506836, "lr": 0.00028525409811449583, "tps": 14080, "wall": 57129.7} {"step": 12274, "train_loss": 3.447598457336426, "lr": 0.0002852362429697605, "tps": 14079, "wall": 57134.6} {"step": 12275, "train_loss": 3.410963296890259, "lr": 0.0002852183870860255, "tps": 14079, "wall": 57139.5} {"step": 12276, "train_loss": 3.4335639476776123, "lr": 0.00028520053046349306, "tps": 14079, "wall": 57144.4} {"step": 12277, "train_loss": 3.4343249797821045, "lr": 0.00028518267310236544, "tps": 14079, "wall": 57149.4} {"step": 12278, "train_loss": 3.4041876792907715, "lr": 0.0002851648150028451, "tps": 14079, "wall": 57154.3} {"step": 12279, "train_loss": 3.4578027725219727, "lr": 0.0002851469561651341, "tps": 14079, "wall": 57159.2} {"step": 12280, "train_loss": 3.3992297649383545, "lr": 0.00028512909658943487, "tps": 14079, "wall": 57164.1} {"step": 12281, "train_loss": 3.424820899963379, "lr": 0.0002851112362759497, "tps": 14079, "wall": 57169.0} {"step": 12282, "train_loss": 3.406405210494995, "lr": 0.000285093375224881, "tps": 14079, "wall": 57173.9} {"step": 12283, "train_loss": 3.4915099143981934, "lr": 0.00028507551343643093, "tps": 14079, "wall": 57178.9} {"step": 12284, "train_loss": 3.45776629447937, "lr": 0.000285057650910802, "tps": 14079, "wall": 57183.8} {"step": 12285, "train_loss": 3.4700965881347656, "lr": 0.00028503978764819645, "tps": 14079, "wall": 57188.8} {"step": 12286, "train_loss": 3.369229555130005, "lr": 0.00028502192364881666, "tps": 14079, "wall": 57193.7} {"step": 12287, "train_loss": 3.513084650039673, "lr": 0.000285004058912865, "tps": 14079, "wall": 57198.7} {"step": 12288, "train_loss": 3.3303637504577637, "lr": 0.0002849861934405439, "tps": 14079, "wall": 57203.6} {"step": 12289, "train_loss": 3.463176727294922, "lr": 0.00028496832723205555, "tps": 14078, "wall": 57208.5} {"step": 12290, "train_loss": 3.5410969257354736, "lr": 0.0002849504602876026, "tps": 14078, "wall": 57213.5} {"step": 12291, "train_loss": 3.431457996368408, "lr": 0.0002849325926073873, "tps": 14078, "wall": 57218.4} {"step": 12292, "train_loss": 3.4424667358398438, "lr": 0.00028491472419161205, "tps": 14078, "wall": 57223.3} {"step": 12293, "train_loss": 3.5164597034454346, "lr": 0.0002848968550404793, "tps": 14078, "wall": 57228.2} {"step": 12294, "train_loss": 3.42826509475708, "lr": 0.00028487898515419153, "tps": 14078, "wall": 57233.1} {"step": 12295, "train_loss": 3.456416130065918, "lr": 0.000284861114532951, "tps": 14078, "wall": 57238.1} {"step": 12296, "train_loss": 3.3545336723327637, "lr": 0.0002848432431769603, "tps": 14078, "wall": 57243.0} {"step": 12297, "train_loss": 3.3994219303131104, "lr": 0.00028482537108642184, "tps": 14078, "wall": 57248.0} {"step": 12298, "train_loss": 3.449627637863159, "lr": 0.0002848074982615381, "tps": 14078, "wall": 57252.9} {"step": 12299, "train_loss": 3.361035108566284, "lr": 0.00028478962470251143, "tps": 14078, "wall": 57257.8} {"step": 12300, "train_loss": 3.4753336906433105, "lr": 0.0002847717504095444, "tps": 14078, "wall": 57262.7} {"step": 12301, "train_loss": 3.3849282264709473, "lr": 0.0002847538753828396, "tps": 14078, "wall": 57267.6} {"step": 12302, "train_loss": 3.4288265705108643, "lr": 0.00028473599962259926, "tps": 14078, "wall": 57272.6} {"step": 12303, "train_loss": 3.3883538246154785, "lr": 0.00028471812312902607, "tps": 14078, "wall": 57277.5} {"step": 12304, "train_loss": 3.4168152809143066, "lr": 0.0002847002459023224, "tps": 14077, "wall": 57282.4} {"step": 12305, "train_loss": 3.5236964225769043, "lr": 0.000284682367942691, "tps": 14077, "wall": 57287.3} {"step": 12306, "train_loss": 3.5195491313934326, "lr": 0.00028466448925033416, "tps": 14077, "wall": 57292.3} {"step": 12307, "train_loss": 3.45703125, "lr": 0.0002846466098254544, "tps": 14077, "wall": 57297.3} {"step": 12308, "train_loss": 3.4488940238952637, "lr": 0.00028462872966825446, "tps": 14077, "wall": 57302.2} {"step": 12309, "train_loss": 3.4509429931640625, "lr": 0.00028461084877893676, "tps": 14077, "wall": 57307.1} {"step": 12310, "train_loss": 3.5312678813934326, "lr": 0.0002845929671577039, "tps": 14077, "wall": 57312.0} {"step": 12311, "train_loss": 3.3610048294067383, "lr": 0.00028457508480475834, "tps": 14077, "wall": 57316.9} {"step": 12312, "train_loss": 3.495537757873535, "lr": 0.00028455720172030274, "tps": 14077, "wall": 57321.9} {"step": 12313, "train_loss": 3.3734922409057617, "lr": 0.00028453931790453966, "tps": 14077, "wall": 57326.8} {"step": 12314, "train_loss": 3.50246000289917, "lr": 0.00028452143335767167, "tps": 14077, "wall": 57331.7} {"step": 12315, "train_loss": 3.4810705184936523, "lr": 0.00028450354807990153, "tps": 14077, "wall": 57336.6} {"step": 12316, "train_loss": 3.412716865539551, "lr": 0.00028448566207143154, "tps": 14077, "wall": 57341.6} {"step": 12317, "train_loss": 3.4040918350219727, "lr": 0.0002844677753324645, "tps": 14077, "wall": 57346.5} {"step": 12318, "train_loss": 3.5170297622680664, "lr": 0.00028444988786320314, "tps": 14077, "wall": 57351.4} {"step": 12319, "train_loss": 3.4044711589813232, "lr": 0.0002844319996638499, "tps": 14076, "wall": 57356.4} {"step": 12320, "train_loss": 3.3210525512695312, "lr": 0.00028441411073460744, "tps": 14076, "wall": 57361.3} {"step": 12321, "train_loss": 3.3533806800842285, "lr": 0.0002843962210756785, "tps": 14076, "wall": 57366.2} {"step": 12322, "train_loss": 3.353969097137451, "lr": 0.0002843783306872657, "tps": 14076, "wall": 57371.2} {"step": 12323, "train_loss": 3.5054402351379395, "lr": 0.0002843604395695716, "tps": 14076, "wall": 57376.1} {"step": 12324, "train_loss": 3.3722963333129883, "lr": 0.000284342547722799, "tps": 14076, "wall": 57381.0} {"step": 12325, "train_loss": 3.3707590103149414, "lr": 0.0002843246551471506, "tps": 14076, "wall": 57385.9} {"step": 12326, "train_loss": 3.4677481651306152, "lr": 0.0002843067618428289, "tps": 14076, "wall": 57390.8} {"step": 12327, "train_loss": 3.3411431312561035, "lr": 0.00028428886781003683, "tps": 14076, "wall": 57395.8} {"step": 12328, "train_loss": 3.3725697994232178, "lr": 0.000284270973048977, "tps": 14076, "wall": 57400.7} {"step": 12329, "train_loss": 3.3680613040924072, "lr": 0.0002842530775598521, "tps": 14076, "wall": 57405.6} {"step": 12330, "train_loss": 3.5220844745635986, "lr": 0.00028423518134286475, "tps": 14076, "wall": 57410.5} {"step": 12331, "train_loss": 3.40371036529541, "lr": 0.0002842172843982179, "tps": 14076, "wall": 57415.4} {"step": 12332, "train_loss": 3.404597759246826, "lr": 0.00028419938672611414, "tps": 14076, "wall": 57420.4} {"step": 12333, "train_loss": 3.4589667320251465, "lr": 0.00028418148832675625, "tps": 14076, "wall": 57425.3} {"step": 12334, "train_loss": 3.4687414169311523, "lr": 0.00028416358920034697, "tps": 14075, "wall": 57430.3} {"step": 12335, "train_loss": 3.4945907592773438, "lr": 0.00028414568934708915, "tps": 14075, "wall": 57435.2} {"step": 12336, "train_loss": 3.491983652114868, "lr": 0.0002841277887671855, "tps": 14075, "wall": 57440.1} {"step": 12337, "train_loss": 3.4127416610717773, "lr": 0.0002841098874608387, "tps": 14075, "wall": 57445.0} {"step": 12338, "train_loss": 3.5360162258148193, "lr": 0.00028409198542825163, "tps": 14075, "wall": 57450.0} {"step": 12339, "train_loss": 3.413613796234131, "lr": 0.00028407408266962716, "tps": 14075, "wall": 57454.9} {"step": 12340, "train_loss": 3.457756757736206, "lr": 0.00028405617918516793, "tps": 14075, "wall": 57459.8} {"step": 12341, "train_loss": 3.4222655296325684, "lr": 0.0002840382749750769, "tps": 14075, "wall": 57464.8} {"step": 12342, "train_loss": 3.5865516662597656, "lr": 0.00028402037003955684, "tps": 14075, "wall": 57469.7} {"step": 12343, "train_loss": 3.4289019107818604, "lr": 0.0002840024643788105, "tps": 14075, "wall": 57474.6} {"step": 12344, "train_loss": 3.3850111961364746, "lr": 0.0002839845579930408, "tps": 14075, "wall": 57479.6} {"step": 12345, "train_loss": 3.4583752155303955, "lr": 0.0002839666508824506, "tps": 14075, "wall": 57484.5} {"step": 12346, "train_loss": 3.4387450218200684, "lr": 0.0002839487430472427, "tps": 14075, "wall": 57489.4} {"step": 12347, "train_loss": 3.502127170562744, "lr": 0.00028393083448762, "tps": 14075, "wall": 57494.3} {"step": 12348, "train_loss": 3.278172492980957, "lr": 0.0002839129252037853, "tps": 14075, "wall": 57499.3} {"step": 12349, "train_loss": 3.463348865509033, "lr": 0.0002838950151959416, "tps": 14074, "wall": 57504.2} {"step": 12350, "train_loss": 3.5563414096832275, "lr": 0.00028387710446429163, "tps": 14074, "wall": 57509.1} {"step": 12351, "train_loss": 3.4307005405426025, "lr": 0.00028385919300903835, "tps": 14074, "wall": 57514.0} {"step": 12352, "train_loss": 3.435410261154175, "lr": 0.0002838412808303847, "tps": 14074, "wall": 57519.0} {"step": 12353, "train_loss": 3.400240659713745, "lr": 0.00028382336792853366, "tps": 14074, "wall": 57523.9} {"step": 12354, "train_loss": 3.5070064067840576, "lr": 0.00028380545430368797, "tps": 14074, "wall": 57528.8} {"step": 12355, "train_loss": 3.4735281467437744, "lr": 0.00028378753995605065, "tps": 14074, "wall": 57533.7} {"step": 12356, "train_loss": 3.4528415203094482, "lr": 0.00028376962488582463, "tps": 14074, "wall": 57538.7} {"step": 12357, "train_loss": 3.3956072330474854, "lr": 0.00028375170909321286, "tps": 14074, "wall": 57543.6} {"step": 12358, "train_loss": 3.3845791816711426, "lr": 0.0002837337925784183, "tps": 14074, "wall": 57548.5} {"step": 12359, "train_loss": 3.444674491882324, "lr": 0.00028371587534164387, "tps": 14074, "wall": 57553.5} {"step": 12360, "train_loss": 3.3894166946411133, "lr": 0.0002836979573830925, "tps": 14074, "wall": 57558.4} {"step": 12361, "train_loss": 3.475811004638672, "lr": 0.0002836800387029673, "tps": 14074, "wall": 57563.3} {"step": 12362, "train_loss": 3.517662286758423, "lr": 0.00028366211930147116, "tps": 14074, "wall": 57568.2} {"step": 12363, "train_loss": 3.4951682090759277, "lr": 0.00028364419917880707, "tps": 14074, "wall": 57573.1} {"step": 12364, "train_loss": 3.593536138534546, "lr": 0.0002836262783351781, "tps": 14073, "wall": 57578.1} {"step": 12365, "train_loss": 3.418972969055176, "lr": 0.0002836083567707871, "tps": 14073, "wall": 57583.0} {"step": 12366, "train_loss": 3.473829507827759, "lr": 0.0002835904344858373, "tps": 14073, "wall": 57587.9} {"step": 12367, "train_loss": 3.514085292816162, "lr": 0.00028357251148053154, "tps": 14073, "wall": 57592.8} {"step": 12368, "train_loss": 3.413581132888794, "lr": 0.00028355458775507295, "tps": 14073, "wall": 57597.8} {"step": 12369, "train_loss": 3.5068464279174805, "lr": 0.0002835366633096646, "tps": 14073, "wall": 57602.7} {"step": 12370, "train_loss": 3.410404682159424, "lr": 0.00028351873814450946, "tps": 14073, "wall": 57607.6} {"step": 12371, "train_loss": 3.4308831691741943, "lr": 0.0002835008122598106, "tps": 14073, "wall": 57612.6} {"step": 12372, "train_loss": 3.421114206314087, "lr": 0.0002834828856557711, "tps": 14073, "wall": 57617.5} {"step": 12373, "train_loss": 3.469241142272949, "lr": 0.0002834649583325941, "tps": 14073, "wall": 57622.4} {"step": 12374, "train_loss": 3.39687442779541, "lr": 0.00028344703029048256, "tps": 14073, "wall": 57627.3} {"step": 12375, "train_loss": 3.492321491241455, "lr": 0.0002834291015296396, "tps": 14073, "wall": 57632.3} {"step": 12376, "train_loss": 3.404924154281616, "lr": 0.0002834111720502684, "tps": 14073, "wall": 57637.2} {"step": 12377, "train_loss": 3.4090988636016846, "lr": 0.00028339324185257204, "tps": 14073, "wall": 57642.1} {"step": 12378, "train_loss": 3.5251975059509277, "lr": 0.00028337531093675355, "tps": 14073, "wall": 57647.0} {"step": 12379, "train_loss": 3.3883864879608154, "lr": 0.0002833573793030161, "tps": 14072, "wall": 57651.9} {"step": 12380, "train_loss": 3.4929964542388916, "lr": 0.0002833394469515629, "tps": 14072, "wall": 57657.0} {"step": 12381, "train_loss": 3.420734405517578, "lr": 0.00028332151388259696, "tps": 14072, "wall": 57661.8} {"step": 12382, "train_loss": 3.401759147644043, "lr": 0.00028330358009632145, "tps": 14072, "wall": 57666.8} {"step": 12383, "train_loss": 3.4707367420196533, "lr": 0.00028328564559293966, "tps": 14072, "wall": 57671.7} {"step": 12384, "train_loss": 3.4293463230133057, "lr": 0.0002832677103726546, "tps": 14072, "wall": 57676.6} {"step": 12385, "train_loss": 3.3900938034057617, "lr": 0.0002832497744356695, "tps": 14072, "wall": 57681.6} {"step": 12386, "train_loss": 3.4334511756896973, "lr": 0.00028323183778218754, "tps": 14072, "wall": 57686.5} {"step": 12387, "train_loss": 3.4695072174072266, "lr": 0.00028321390041241194, "tps": 14072, "wall": 57691.4} {"step": 12388, "train_loss": 3.4257404804229736, "lr": 0.00028319596232654574, "tps": 14072, "wall": 57696.3} {"step": 12389, "train_loss": 3.3645448684692383, "lr": 0.0002831780235247924, "tps": 14072, "wall": 57701.2} {"step": 12390, "train_loss": 3.432969093322754, "lr": 0.00028316008400735486, "tps": 14072, "wall": 57706.2} {"step": 12391, "train_loss": 3.4474616050720215, "lr": 0.00028314214377443654, "tps": 14072, "wall": 57711.1} {"step": 12392, "train_loss": 3.411327362060547, "lr": 0.00028312420282624055, "tps": 14072, "wall": 57716.0} {"step": 12393, "train_loss": 3.3751981258392334, "lr": 0.0002831062611629703, "tps": 14072, "wall": 57721.0} {"step": 12394, "train_loss": 3.3427369594573975, "lr": 0.0002830883187848288, "tps": 14071, "wall": 57725.9} {"step": 12395, "train_loss": 3.4988815784454346, "lr": 0.00028307037569201944, "tps": 14071, "wall": 57730.8} {"step": 12396, "train_loss": 3.445066213607788, "lr": 0.0002830524318847454, "tps": 14071, "wall": 57735.7} {"step": 12397, "train_loss": 3.6074399948120117, "lr": 0.00028303448736321005, "tps": 14071, "wall": 57740.6} {"step": 12398, "train_loss": 3.4101428985595703, "lr": 0.00028301654212761664, "tps": 14071, "wall": 57745.6} {"step": 12399, "train_loss": 3.5771145820617676, "lr": 0.0002829985961781684, "tps": 14071, "wall": 57750.5} {"step": 12400, "train_loss": 3.376558780670166, "lr": 0.0002829806495150687, "tps": 14071, "wall": 57755.4} {"step": 12401, "train_loss": 3.4667184352874756, "lr": 0.00028296270213852077, "tps": 14071, "wall": 57760.3} {"step": 12402, "train_loss": 3.4544825553894043, "lr": 0.0002829447540487279, "tps": 14071, "wall": 57765.2} {"step": 12403, "train_loss": 3.460458993911743, "lr": 0.0002829268052458935, "tps": 14071, "wall": 57770.2} {"step": 12404, "train_loss": 3.488593578338623, "lr": 0.0002829088557302208, "tps": 14071, "wall": 57775.1} {"step": 12405, "train_loss": 3.390542507171631, "lr": 0.00028289090550191325, "tps": 14071, "wall": 57780.1} {"step": 12406, "train_loss": 3.5671281814575195, "lr": 0.00028287295456117407, "tps": 14071, "wall": 57785.0} {"step": 12407, "train_loss": 3.5459675788879395, "lr": 0.00028285500290820665, "tps": 14071, "wall": 57789.9} {"step": 12408, "train_loss": 3.5017638206481934, "lr": 0.0002828370505432144, "tps": 14071, "wall": 57794.9} {"step": 12409, "train_loss": 3.492604970932007, "lr": 0.0002828190974664006, "tps": 14071, "wall": 57799.9} {"step": 12410, "train_loss": 3.421382427215576, "lr": 0.00028280114367796867, "tps": 14070, "wall": 57804.8} {"step": 12411, "train_loss": 3.523200511932373, "lr": 0.00028278318917812205, "tps": 14070, "wall": 57809.7} {"step": 12412, "train_loss": 3.494810104370117, "lr": 0.00028276523396706396, "tps": 14070, "wall": 57814.6} {"step": 12413, "train_loss": 3.453976631164551, "lr": 0.000282747278044998, "tps": 14070, "wall": 57819.5} {"step": 12414, "train_loss": 3.3614237308502197, "lr": 0.00028272932141212745, "tps": 14070, "wall": 57824.4} {"step": 12415, "train_loss": 3.4611587524414062, "lr": 0.0002827113640686557, "tps": 14070, "wall": 57829.4} {"step": 12416, "train_loss": 3.4415628910064697, "lr": 0.00028269340601478623, "tps": 14070, "wall": 57834.3} {"step": 12417, "train_loss": 3.471989870071411, "lr": 0.0002826754472507226, "tps": 14070, "wall": 57839.3} {"step": 12418, "train_loss": 3.4206783771514893, "lr": 0.0002826574877766679, "tps": 14070, "wall": 57844.2} {"step": 12419, "train_loss": 3.4302773475646973, "lr": 0.000282639527592826, "tps": 14070, "wall": 57849.1} {"step": 12420, "train_loss": 3.5066676139831543, "lr": 0.0002826215666994, "tps": 14070, "wall": 57854.0} {"step": 12421, "train_loss": 3.5261924266815186, "lr": 0.0002826036050965936, "tps": 14070, "wall": 57859.0} {"step": 12422, "train_loss": 3.4989209175109863, "lr": 0.00028258564278461006, "tps": 14070, "wall": 57863.9} {"step": 12423, "train_loss": 3.4384751319885254, "lr": 0.00028256767976365314, "tps": 14070, "wall": 57868.8} {"step": 12424, "train_loss": 3.5242979526519775, "lr": 0.000282549716033926, "tps": 14070, "wall": 57873.7} {"step": 12425, "train_loss": 3.310875415802002, "lr": 0.00028253175159563234, "tps": 14069, "wall": 57878.6} {"step": 12426, "train_loss": 3.362636089324951, "lr": 0.00028251378644897563, "tps": 14069, "wall": 57883.6} {"step": 12427, "train_loss": 3.376405954360962, "lr": 0.00028249582059415937, "tps": 14069, "wall": 57888.5} {"step": 12428, "train_loss": 3.4147684574127197, "lr": 0.0002824778540313871, "tps": 14069, "wall": 57893.4} {"step": 12429, "train_loss": 3.5201048851013184, "lr": 0.00028245988676086226, "tps": 14069, "wall": 57898.4} {"step": 12430, "train_loss": 3.4227235317230225, "lr": 0.0002824419187827885, "tps": 14069, "wall": 57903.3} {"step": 12431, "train_loss": 3.3873186111450195, "lr": 0.0002824239500973693, "tps": 14069, "wall": 57908.2} {"step": 12432, "train_loss": 3.4567365646362305, "lr": 0.00028240598070480816, "tps": 14069, "wall": 57913.2} {"step": 12433, "train_loss": 3.4198670387268066, "lr": 0.0002823880106053087, "tps": 14069, "wall": 57918.1} {"step": 12434, "train_loss": 3.412726402282715, "lr": 0.00028237003979907457, "tps": 14069, "wall": 57923.0} {"step": 12435, "train_loss": 3.410881519317627, "lr": 0.00028235206828630915, "tps": 14069, "wall": 57928.0} {"step": 12436, "train_loss": 3.4318976402282715, "lr": 0.00028233409606721616, "tps": 14069, "wall": 57932.9} {"step": 12437, "train_loss": 3.4493627548217773, "lr": 0.00028231612314199916, "tps": 14069, "wall": 57937.9} {"step": 12438, "train_loss": 3.3558053970336914, "lr": 0.00028229814951086175, "tps": 14069, "wall": 57942.8} {"step": 12439, "train_loss": 3.3564887046813965, "lr": 0.00028228017517400756, "tps": 14069, "wall": 57947.7} {"step": 12440, "train_loss": 3.4493584632873535, "lr": 0.00028226220013164013, "tps": 14068, "wall": 57952.6} {"step": 12441, "train_loss": 3.3314695358276367, "lr": 0.00028224422438396314, "tps": 14068, "wall": 57957.6} {"step": 12442, "train_loss": 3.423062324523926, "lr": 0.0002822262479311802, "tps": 14068, "wall": 57962.5} {"step": 12443, "train_loss": 3.4935615062713623, "lr": 0.000282208270773495, "tps": 14068, "wall": 57967.4} {"step": 12444, "train_loss": 3.432904005050659, "lr": 0.00028219029291111114, "tps": 14068, "wall": 57972.3} {"step": 12445, "train_loss": 3.421353816986084, "lr": 0.0002821723143442322, "tps": 14068, "wall": 57977.3} {"step": 12446, "train_loss": 3.448448657989502, "lr": 0.00028215433507306197, "tps": 14068, "wall": 57982.2} {"step": 12447, "train_loss": 3.347104787826538, "lr": 0.0002821363550978041, "tps": 14068, "wall": 57987.1} {"step": 12448, "train_loss": 3.501457691192627, "lr": 0.00028211837441866224, "tps": 14068, "wall": 57992.1} {"step": 12449, "train_loss": 3.4656176567077637, "lr": 0.00028210039303584, "tps": 14068, "wall": 57997.0} {"step": 12450, "train_loss": 3.3485488891601562, "lr": 0.0002820824109495412, "tps": 14068, "wall": 58001.9} {"step": 12451, "train_loss": 3.4555139541625977, "lr": 0.00028206442815996956, "tps": 14068, "wall": 58006.8} {"step": 12452, "train_loss": 3.446028232574463, "lr": 0.0002820464446673286, "tps": 14068, "wall": 58011.7} {"step": 12453, "train_loss": 3.424781322479248, "lr": 0.00028202846047182216, "tps": 14068, "wall": 58016.7} {"step": 12454, "train_loss": 3.335151195526123, "lr": 0.000282010475573654, "tps": 14068, "wall": 58021.7} {"step": 12455, "train_loss": 3.4144349098205566, "lr": 0.0002819924899730278, "tps": 14067, "wall": 58026.6} {"step": 12456, "train_loss": 3.4254822731018066, "lr": 0.00028197450367014736, "tps": 14067, "wall": 58031.5} {"step": 12457, "train_loss": 3.570040702819824, "lr": 0.0002819565166652164, "tps": 14067, "wall": 58036.4} {"step": 12458, "train_loss": 3.4175801277160645, "lr": 0.0002819385289584387, "tps": 14067, "wall": 58041.3} {"step": 12459, "train_loss": 3.5293071269989014, "lr": 0.0002819205405500179, "tps": 14067, "wall": 58046.3} {"step": 12460, "train_loss": 3.3309102058410645, "lr": 0.00028190255144015786, "tps": 14067, "wall": 58051.3} {"step": 12461, "train_loss": 3.3834102153778076, "lr": 0.00028188456162906247, "tps": 14067, "wall": 58056.2} {"step": 12462, "train_loss": 3.4863932132720947, "lr": 0.00028186657111693535, "tps": 14067, "wall": 58061.1} {"step": 12463, "train_loss": 3.3528270721435547, "lr": 0.0002818485799039804, "tps": 14067, "wall": 58066.0} {"step": 12464, "train_loss": 3.526411533355713, "lr": 0.00028183058799040127, "tps": 14067, "wall": 58071.0} {"step": 12465, "train_loss": 3.4616074562072754, "lr": 0.00028181259537640203, "tps": 14067, "wall": 58075.9} {"step": 12466, "train_loss": 3.408578872680664, "lr": 0.0002817946020621863, "tps": 14067, "wall": 58080.9} {"step": 12467, "train_loss": 3.425365924835205, "lr": 0.000281776608047958, "tps": 14067, "wall": 58085.8} {"step": 12468, "train_loss": 3.375486373901367, "lr": 0.000281758613333921, "tps": 14067, "wall": 58090.7} {"step": 12469, "train_loss": 3.4978151321411133, "lr": 0.00028174061792027896, "tps": 14067, "wall": 58095.7} {"step": 12470, "train_loss": 3.4090070724487305, "lr": 0.00028172262180723595, "tps": 14066, "wall": 58100.6} {"step": 12471, "train_loss": 3.37261700630188, "lr": 0.0002817046249949958, "tps": 14066, "wall": 58105.5} {"step": 12472, "train_loss": 3.3712878227233887, "lr": 0.0002816866274837622, "tps": 14066, "wall": 58110.4} {"step": 12473, "train_loss": 3.471466541290283, "lr": 0.00028166862927373913, "tps": 14066, "wall": 58115.3} {"step": 12474, "train_loss": 3.479398250579834, "lr": 0.0002816506303651306, "tps": 14066, "wall": 58120.3} {"step": 12475, "train_loss": 3.424614906311035, "lr": 0.0002816326307581403, "tps": 14066, "wall": 58125.2} {"step": 12476, "train_loss": 3.349594831466675, "lr": 0.0002816146304529723, "tps": 14066, "wall": 58130.1} {"step": 12477, "train_loss": 3.365098237991333, "lr": 0.00028159662944983037, "tps": 14066, "wall": 58135.0} {"step": 12478, "train_loss": 3.3956432342529297, "lr": 0.00028157862774891854, "tps": 14066, "wall": 58140.0} {"step": 12479, "train_loss": 3.4791650772094727, "lr": 0.0002815606253504407, "tps": 14066, "wall": 58145.0} {"step": 12480, "train_loss": 3.488255023956299, "lr": 0.0002815426222546007, "tps": 14066, "wall": 58149.9} {"step": 12481, "train_loss": 3.4926841259002686, "lr": 0.0002815246184616025, "tps": 14066, "wall": 58154.8} {"step": 12482, "train_loss": 3.484860897064209, "lr": 0.0002815066139716502, "tps": 14066, "wall": 58159.7} {"step": 12483, "train_loss": 3.486170768737793, "lr": 0.0002814886087849476, "tps": 14066, "wall": 58164.7} {"step": 12484, "train_loss": 3.5396101474761963, "lr": 0.00028147060290169875, "tps": 14066, "wall": 58169.6} {"step": 12485, "train_loss": 3.4448158740997314, "lr": 0.00028145259632210754, "tps": 14065, "wall": 58174.5} {"step": 12486, "train_loss": 3.3553240299224854, "lr": 0.00028143458904637803, "tps": 14065, "wall": 58179.4} {"step": 12487, "train_loss": 3.413433074951172, "lr": 0.00028141658107471416, "tps": 14065, "wall": 58184.3} {"step": 12488, "train_loss": 3.37684965133667, "lr": 0.0002813985724073199, "tps": 14065, "wall": 58189.3} {"step": 12489, "train_loss": 3.456831455230713, "lr": 0.00028138056304439937, "tps": 14065, "wall": 58194.2} {"step": 12490, "train_loss": 3.3526248931884766, "lr": 0.00028136255298615644, "tps": 14065, "wall": 58199.2} {"step": 12491, "train_loss": 3.4627268314361572, "lr": 0.0002813445422327952, "tps": 14065, "wall": 58204.1} {"step": 12492, "train_loss": 3.478485584259033, "lr": 0.00028132653078451967, "tps": 14065, "wall": 58209.0} {"step": 12493, "train_loss": 3.395541191101074, "lr": 0.00028130851864153393, "tps": 14065, "wall": 58213.9} {"step": 12494, "train_loss": 3.443929672241211, "lr": 0.0002812905058040419, "tps": 14065, "wall": 58218.9} {"step": 12495, "train_loss": 3.4312100410461426, "lr": 0.0002812724922722478, "tps": 14065, "wall": 58223.8} {"step": 12496, "train_loss": 3.477538824081421, "lr": 0.00028125447804635547, "tps": 14065, "wall": 58228.7} {"step": 12497, "train_loss": 3.3247220516204834, "lr": 0.00028123646312656913, "tps": 14065, "wall": 58233.6} {"step": 12498, "train_loss": 3.444756031036377, "lr": 0.0002812184475130929, "tps": 14065, "wall": 58238.6} {"step": 12499, "train_loss": 3.4171290397644043, "lr": 0.00028120043120613076, "tps": 14065, "wall": 58243.5} {"step": 12500, "train_loss": 3.4856245517730713, "lr": 0.00028118241420588676, "tps": 14065, "wall": 58248.4} {"step": 12501, "train_loss": 3.463104724884033, "lr": 0.00028116439651256506, "tps": 14064, "wall": 58253.5} {"step": 12502, "train_loss": 3.4816060066223145, "lr": 0.0002811463781263699, "tps": 14064, "wall": 58258.5} {"step": 12503, "train_loss": 3.450477361679077, "lr": 0.0002811283590475051, "tps": 14064, "wall": 58263.5} {"step": 12504, "train_loss": 3.5425472259521484, "lr": 0.0002811103392761751, "tps": 14064, "wall": 58268.4} {"step": 12505, "train_loss": 3.4358913898468018, "lr": 0.0002810923188125837, "tps": 14064, "wall": 58273.3} {"step": 12506, "train_loss": 3.3281803131103516, "lr": 0.0002810742976569353, "tps": 14064, "wall": 58278.3} {"step": 12507, "train_loss": 3.430691719055176, "lr": 0.00028105627580943395, "tps": 14064, "wall": 58283.2} {"step": 12508, "train_loss": 3.4266886711120605, "lr": 0.0002810382532702838, "tps": 14064, "wall": 58288.1} {"step": 12509, "train_loss": 3.4900431632995605, "lr": 0.000281020230039689, "tps": 14064, "wall": 58293.1} {"step": 12510, "train_loss": 3.330566883087158, "lr": 0.0002810022061178538, "tps": 14064, "wall": 58298.0} {"step": 12511, "train_loss": 3.3412587642669678, "lr": 0.0002809841815049822, "tps": 14064, "wall": 58302.9} {"step": 12512, "train_loss": 3.428374767303467, "lr": 0.00028096615620127853, "tps": 14064, "wall": 58307.8} {"step": 12513, "train_loss": 3.391277313232422, "lr": 0.000280948130206947, "tps": 14064, "wall": 58312.8} {"step": 12514, "train_loss": 3.4703116416931152, "lr": 0.0002809301035221917, "tps": 14064, "wall": 58317.8} {"step": 12515, "train_loss": 3.417323112487793, "lr": 0.0002809120761472169, "tps": 14063, "wall": 58322.7} {"step": 12516, "train_loss": 3.562875270843506, "lr": 0.00028089404808222685, "tps": 14063, "wall": 58327.6} {"step": 12517, "train_loss": 3.425269603729248, "lr": 0.00028087601932742567, "tps": 14063, "wall": 58332.5} {"step": 12518, "train_loss": 3.5299899578094482, "lr": 0.00028085798988301765, "tps": 14063, "wall": 58337.5} {"step": 12519, "train_loss": 3.363306760787964, "lr": 0.0002808399597492071, "tps": 14063, "wall": 58342.4} {"step": 12520, "train_loss": 3.4276185035705566, "lr": 0.0002808219289261981, "tps": 14063, "wall": 58347.3} {"step": 12521, "train_loss": 3.49748158454895, "lr": 0.0002808038974141951, "tps": 14063, "wall": 58352.2} {"step": 12522, "train_loss": 3.481783866882324, "lr": 0.00028078586521340215, "tps": 14063, "wall": 58357.1} {"step": 12523, "train_loss": 3.426576614379883, "lr": 0.0002807678323240237, "tps": 14063, "wall": 58362.1} {"step": 12524, "train_loss": 3.459713935852051, "lr": 0.0002807497987462639, "tps": 14063, "wall": 58367.0} {"step": 12525, "train_loss": 3.3816537857055664, "lr": 0.0002807317644803272, "tps": 14063, "wall": 58371.9} {"step": 12526, "train_loss": 3.4376518726348877, "lr": 0.00028071372952641766, "tps": 14063, "wall": 58376.9} {"step": 12527, "train_loss": 3.3813841342926025, "lr": 0.0002806956938847398, "tps": 14063, "wall": 58381.8} {"step": 12528, "train_loss": 3.4167163372039795, "lr": 0.0002806776575554978, "tps": 14063, "wall": 58386.7} {"step": 12529, "train_loss": 3.290663480758667, "lr": 0.000280659620538896, "tps": 14063, "wall": 58391.7} {"step": 12530, "train_loss": 3.466108798980713, "lr": 0.00028064158283513875, "tps": 14063, "wall": 58396.6} {"step": 12531, "train_loss": 3.4643266201019287, "lr": 0.0002806235444444304, "tps": 14062, "wall": 58401.5} {"step": 12532, "train_loss": 3.408186435699463, "lr": 0.0002806055053669752, "tps": 14062, "wall": 58406.4} {"step": 12533, "train_loss": 3.454688787460327, "lr": 0.00028058746560297756, "tps": 14062, "wall": 58411.4} {"step": 12534, "train_loss": 3.460442543029785, "lr": 0.00028056942515264187, "tps": 14062, "wall": 58416.3} {"step": 12535, "train_loss": 3.3689026832580566, "lr": 0.0002805513840161724, "tps": 14062, "wall": 58421.2} {"step": 12536, "train_loss": 3.4421424865722656, "lr": 0.0002805333421937737, "tps": 14062, "wall": 58426.1} {"step": 12537, "train_loss": 3.44097638130188, "lr": 0.00028051529968564995, "tps": 14062, "wall": 58431.1} {"step": 12538, "train_loss": 3.375094413757324, "lr": 0.0002804972564920056, "tps": 14062, "wall": 58436.0} {"step": 12539, "train_loss": 3.4677255153656006, "lr": 0.000280479212613045, "tps": 14062, "wall": 58441.0} {"step": 12540, "train_loss": 3.471649646759033, "lr": 0.0002804611680489727, "tps": 14062, "wall": 58445.9} {"step": 12541, "train_loss": 3.3604238033294678, "lr": 0.000280443122799993, "tps": 14062, "wall": 58450.8} {"step": 12542, "train_loss": 3.432084560394287, "lr": 0.0002804250768663103, "tps": 14062, "wall": 58455.8} {"step": 12543, "train_loss": 3.4682421684265137, "lr": 0.00028040703024812913, "tps": 14062, "wall": 58460.7} {"step": 12544, "train_loss": 3.421578884124756, "lr": 0.00028038898294565376, "tps": 14062, "wall": 58465.6} {"step": 12545, "train_loss": 3.373652458190918, "lr": 0.0002803709349590888, "tps": 14062, "wall": 58470.5} {"step": 12546, "train_loss": 3.481966733932495, "lr": 0.0002803528862886386, "tps": 14061, "wall": 58475.4} {"step": 12547, "train_loss": 3.4401330947875977, "lr": 0.0002803348369345076, "tps": 14061, "wall": 58480.4} {"step": 12548, "train_loss": 3.4631361961364746, "lr": 0.0002803167868969003, "tps": 14061, "wall": 58485.3} {"step": 12549, "train_loss": 3.405669689178467, "lr": 0.00028029873617602124, "tps": 14061, "wall": 58490.2} {"step": 12550, "train_loss": 3.4713926315307617, "lr": 0.0002802806847720748, "tps": 14061, "wall": 58495.1} {"step": 12551, "train_loss": 3.342489004135132, "lr": 0.00028026263268526554, "tps": 14061, "wall": 58500.1} {"step": 12552, "train_loss": 3.4934844970703125, "lr": 0.00028024457991579786, "tps": 14061, "wall": 58505.0} {"step": 12553, "train_loss": 3.5434317588806152, "lr": 0.00028022652646387636, "tps": 14061, "wall": 58509.9} {"step": 12554, "train_loss": 3.484525680541992, "lr": 0.00028020847232970546, "tps": 14061, "wall": 58514.9} {"step": 12555, "train_loss": 3.4816625118255615, "lr": 0.0002801904175134898, "tps": 14061, "wall": 58519.8} {"step": 12556, "train_loss": 3.4415745735168457, "lr": 0.00028017236201543377, "tps": 14061, "wall": 58524.8} {"step": 12557, "train_loss": 3.38315486907959, "lr": 0.000280154305835742, "tps": 14061, "wall": 58529.7} {"step": 12558, "train_loss": 3.377018690109253, "lr": 0.000280136248974619, "tps": 14061, "wall": 58534.6} {"step": 12559, "train_loss": 3.5765597820281982, "lr": 0.0002801181914322693, "tps": 14061, "wall": 58539.5} {"step": 12560, "train_loss": 3.39207124710083, "lr": 0.0002801001332088975, "tps": 14061, "wall": 58544.5} {"step": 12561, "train_loss": 3.476327657699585, "lr": 0.00028008207430470813, "tps": 14061, "wall": 58549.4} {"step": 12562, "train_loss": 3.4460020065307617, "lr": 0.00028006401471990575, "tps": 14060, "wall": 58554.3} {"step": 12563, "train_loss": 3.4366354942321777, "lr": 0.000280045954454695, "tps": 14060, "wall": 58559.3} {"step": 12564, "train_loss": 3.407593011856079, "lr": 0.00028002789350928037, "tps": 14060, "wall": 58564.2} {"step": 12565, "train_loss": 3.534864902496338, "lr": 0.00028000983188386654, "tps": 14060, "wall": 58569.1} {"step": 12566, "train_loss": 3.457285165786743, "lr": 0.0002799917695786581, "tps": 14060, "wall": 58574.1} {"step": 12567, "train_loss": 3.3974173069000244, "lr": 0.0002799737065938597, "tps": 14060, "wall": 58579.0} {"step": 12568, "train_loss": 3.3462672233581543, "lr": 0.00027995564292967583, "tps": 14060, "wall": 58583.9} {"step": 12569, "train_loss": 3.3613319396972656, "lr": 0.0002799375785863112, "tps": 14060, "wall": 58588.9} {"step": 12570, "train_loss": 3.5779976844787598, "lr": 0.0002799195135639705, "tps": 14060, "wall": 58593.8} {"step": 12571, "train_loss": 3.5467944145202637, "lr": 0.0002799014478628583, "tps": 14060, "wall": 58598.7} {"step": 12572, "train_loss": 3.4901297092437744, "lr": 0.00027988338148317917, "tps": 14060, "wall": 58603.7} {"step": 12573, "train_loss": 3.3005313873291016, "lr": 0.0002798653144251379, "tps": 14060, "wall": 58608.6} {"step": 12574, "train_loss": 3.478327751159668, "lr": 0.00027984724668893914, "tps": 14060, "wall": 58613.5} {"step": 12575, "train_loss": 3.420395612716675, "lr": 0.0002798291782747875, "tps": 14060, "wall": 58618.5} {"step": 12576, "train_loss": 3.385573387145996, "lr": 0.0002798111091828877, "tps": 14060, "wall": 58623.4} {"step": 12577, "train_loss": 3.480851173400879, "lr": 0.00027979303941344443, "tps": 14059, "wall": 58628.4} {"step": 12578, "train_loss": 3.410353422164917, "lr": 0.00027977496896666233, "tps": 14059, "wall": 58633.3} {"step": 12579, "train_loss": 3.422628879547119, "lr": 0.0002797568978427462, "tps": 14059, "wall": 58638.2} {"step": 12580, "train_loss": 3.4067025184631348, "lr": 0.0002797388260419007, "tps": 14059, "wall": 58643.1} {"step": 12581, "train_loss": 3.5636885166168213, "lr": 0.0002797207535643305, "tps": 14059, "wall": 58648.1} {"step": 12582, "train_loss": 3.4188859462738037, "lr": 0.0002797026804102404, "tps": 14059, "wall": 58653.0} {"step": 12583, "train_loss": 3.494213342666626, "lr": 0.0002796846065798351, "tps": 14059, "wall": 58657.9} {"step": 12584, "train_loss": 3.4265456199645996, "lr": 0.0002796665320733194, "tps": 14059, "wall": 58662.9} {"step": 12585, "train_loss": 3.445922613143921, "lr": 0.0002796484568908979, "tps": 14059, "wall": 58667.8} {"step": 12586, "train_loss": 3.4598591327667236, "lr": 0.00027963038103277554, "tps": 14059, "wall": 58672.7} {"step": 12587, "train_loss": 3.469740629196167, "lr": 0.000279612304499157, "tps": 14059, "wall": 58677.7} {"step": 12588, "train_loss": 3.452859401702881, "lr": 0.000279594227290247, "tps": 14059, "wall": 58682.6} {"step": 12589, "train_loss": 3.5074565410614014, "lr": 0.00027957614940625036, "tps": 14059, "wall": 58687.5} {"step": 12590, "train_loss": 3.4910812377929688, "lr": 0.0002795580708473719, "tps": 14059, "wall": 58692.4} {"step": 12591, "train_loss": 3.3848814964294434, "lr": 0.0002795399916138164, "tps": 14059, "wall": 58697.4} {"step": 12592, "train_loss": 3.4201080799102783, "lr": 0.00027952191170578863, "tps": 14058, "wall": 58702.3} {"step": 12593, "train_loss": 3.440197229385376, "lr": 0.00027950383112349344, "tps": 14058, "wall": 58707.3} {"step": 12594, "train_loss": 3.4201865196228027, "lr": 0.0002794857498671356, "tps": 14058, "wall": 58712.2} {"step": 12595, "train_loss": 3.526193857192993, "lr": 0.00027946766793692006, "tps": 14058, "wall": 58717.1} {"step": 12596, "train_loss": 3.51809024810791, "lr": 0.0002794495853330515, "tps": 14058, "wall": 58722.0} {"step": 12597, "train_loss": 3.436958074569702, "lr": 0.0002794315020557348, "tps": 14058, "wall": 58726.9} {"step": 12598, "train_loss": 3.426487445831299, "lr": 0.00027941341810517483, "tps": 14058, "wall": 58731.9} {"step": 12599, "train_loss": 3.4666051864624023, "lr": 0.0002793953334815765, "tps": 14058, "wall": 58736.9} {"step": 12600, "train_loss": 3.423870801925659, "lr": 0.00027937724818514456, "tps": 14058, "wall": 58741.8} {"step": 12601, "train_loss": 3.322425603866577, "lr": 0.000279359162216084, "tps": 14058, "wall": 58746.7} {"step": 12602, "train_loss": 3.4291300773620605, "lr": 0.00027934107557459965, "tps": 14058, "wall": 58751.6} {"step": 12603, "train_loss": 3.4374897480010986, "lr": 0.0002793229882608963, "tps": 14058, "wall": 58756.5} {"step": 12604, "train_loss": 3.5022597312927246, "lr": 0.00027930490027517897, "tps": 14058, "wall": 58761.5} {"step": 12605, "train_loss": 3.433785915374756, "lr": 0.00027928681161765254, "tps": 14058, "wall": 58766.4} {"step": 12606, "train_loss": 3.458127021789551, "lr": 0.00027926872228852185, "tps": 14058, "wall": 58771.3} {"step": 12607, "train_loss": 3.37165904045105, "lr": 0.0002792506322879919, "tps": 14058, "wall": 58776.2} {"step": 12608, "train_loss": 3.4574809074401855, "lr": 0.0002792325416162676, "tps": 14057, "wall": 58781.2} {"step": 12609, "train_loss": 3.5067343711853027, "lr": 0.0002792144502735538, "tps": 14057, "wall": 58786.1} {"step": 12610, "train_loss": 3.3584511280059814, "lr": 0.0002791963582600555, "tps": 14057, "wall": 58791.0} {"step": 12611, "train_loss": 3.450683116912842, "lr": 0.00027917826557597776, "tps": 14057, "wall": 58796.0} {"step": 12612, "train_loss": 3.5623972415924072, "lr": 0.0002791601722215254, "tps": 14057, "wall": 58800.9} {"step": 12613, "train_loss": 3.364269256591797, "lr": 0.00027914207819690334, "tps": 14057, "wall": 58805.9} {"step": 12614, "train_loss": 3.476975917816162, "lr": 0.00027912398350231663, "tps": 14057, "wall": 58810.8} {"step": 12615, "train_loss": 3.43170428276062, "lr": 0.0002791058881379703, "tps": 14057, "wall": 58815.7} {"step": 12616, "train_loss": 3.3755221366882324, "lr": 0.00027908779210406926, "tps": 14057, "wall": 58820.6} {"step": 12617, "train_loss": 3.438030958175659, "lr": 0.0002790696954008184, "tps": 14057, "wall": 58825.5} {"step": 12618, "train_loss": 3.3734962940216064, "lr": 0.000279051598028423, "tps": 14057, "wall": 58830.4} {"step": 12619, "train_loss": 3.4662575721740723, "lr": 0.0002790334999870878, "tps": 14057, "wall": 58835.3} {"step": 12620, "train_loss": 3.3341357707977295, "lr": 0.00027901540127701793, "tps": 14057, "wall": 58840.3} {"step": 12621, "train_loss": 3.436948776245117, "lr": 0.00027899730189841844, "tps": 14057, "wall": 58845.2} {"step": 12622, "train_loss": 3.415459156036377, "lr": 0.00027897920185149423, "tps": 14057, "wall": 58850.1} {"step": 12623, "train_loss": 3.437556743621826, "lr": 0.00027896110113645055, "tps": 14057, "wall": 58855.0} {"step": 12624, "train_loss": 3.5333151817321777, "lr": 0.00027894299975349225, "tps": 14056, "wall": 58860.0} {"step": 12625, "train_loss": 3.4134416580200195, "lr": 0.00027892489770282446, "tps": 14056, "wall": 58864.9} {"step": 12626, "train_loss": 3.402794361114502, "lr": 0.0002789067949846523, "tps": 14056, "wall": 58869.8} {"step": 12627, "train_loss": 3.360996961593628, "lr": 0.0002788886915991808, "tps": 14056, "wall": 58874.7} {"step": 12628, "train_loss": 3.4297938346862793, "lr": 0.00027887058754661495, "tps": 14056, "wall": 58879.6} {"step": 12629, "train_loss": 3.5466065406799316, "lr": 0.0002788524828271599, "tps": 14056, "wall": 58884.6} {"step": 12630, "train_loss": 3.286054849624634, "lr": 0.0002788343774410207, "tps": 14056, "wall": 58889.5} {"step": 12631, "train_loss": 3.453713893890381, "lr": 0.0002788162713884026, "tps": 14056, "wall": 58894.4} {"step": 12632, "train_loss": 3.5095131397247314, "lr": 0.00027879816466951047, "tps": 14056, "wall": 58899.3} {"step": 12633, "train_loss": 3.454491376876831, "lr": 0.0002787800572845496, "tps": 14056, "wall": 58904.3} {"step": 12634, "train_loss": 3.4190680980682373, "lr": 0.0002787619492337251, "tps": 14056, "wall": 58909.2} {"step": 12635, "train_loss": 3.40499210357666, "lr": 0.00027874384051724204, "tps": 14056, "wall": 58914.1} {"step": 12636, "train_loss": 3.375452995300293, "lr": 0.0002787257311353056, "tps": 14056, "wall": 58919.1} {"step": 12637, "train_loss": 3.5888655185699463, "lr": 0.0002787076210881208, "tps": 14056, "wall": 58924.0} {"step": 12638, "train_loss": 3.4799904823303223, "lr": 0.000278689510375893, "tps": 14056, "wall": 58928.9} {"step": 12639, "train_loss": 3.379493474960327, "lr": 0.0002786713989988272, "tps": 14056, "wall": 58933.8} {"step": 12640, "train_loss": 3.483156442642212, "lr": 0.00027865328695712865, "tps": 14055, "wall": 58938.8} {"step": 12641, "train_loss": 3.489671230316162, "lr": 0.0002786351742510025, "tps": 14055, "wall": 58943.7} {"step": 12642, "train_loss": 3.506134271621704, "lr": 0.0002786170608806539, "tps": 14055, "wall": 58948.6} {"step": 12643, "train_loss": 3.380873203277588, "lr": 0.000278598946846288, "tps": 14055, "wall": 58953.5} {"step": 12644, "train_loss": 3.5223441123962402, "lr": 0.00027858083214811014, "tps": 14055, "wall": 58958.4} {"step": 12645, "train_loss": 3.4334754943847656, "lr": 0.0002785627167863255, "tps": 14055, "wall": 58963.4} {"step": 12646, "train_loss": 3.5268378257751465, "lr": 0.0002785446007611391, "tps": 14055, "wall": 58968.3} {"step": 12647, "train_loss": 3.4398488998413086, "lr": 0.0002785264840727564, "tps": 14055, "wall": 58973.2} {"step": 12648, "train_loss": 3.428285598754883, "lr": 0.0002785083667213825, "tps": 14055, "wall": 58978.2} {"step": 12649, "train_loss": 3.403216600418091, "lr": 0.0002784902487072226, "tps": 14055, "wall": 58983.1} {"step": 12650, "train_loss": 3.362351417541504, "lr": 0.00027847213003048203, "tps": 14055, "wall": 58988.0} {"step": 12651, "train_loss": 3.479071617126465, "lr": 0.000278454010691366, "tps": 14055, "wall": 58993.0} {"step": 12652, "train_loss": 3.400876998901367, "lr": 0.00027843589069007985, "tps": 14055, "wall": 58997.9} {"step": 12653, "train_loss": 3.396275520324707, "lr": 0.0002784177700268287, "tps": 14055, "wall": 59002.8} {"step": 12654, "train_loss": 3.429500102996826, "lr": 0.0002783996487018179, "tps": 14055, "wall": 59007.8} {"step": 12655, "train_loss": 3.450638771057129, "lr": 0.0002783815267152527, "tps": 14054, "wall": 59012.7} {"step": 12656, "train_loss": 3.401993989944458, "lr": 0.0002783634040673384, "tps": 14054, "wall": 59017.6} {"step": 12657, "train_loss": 3.3485989570617676, "lr": 0.00027834528075828033, "tps": 14054, "wall": 59022.5} {"step": 12658, "train_loss": 3.406634569168091, "lr": 0.0002783271567882838, "tps": 14054, "wall": 59027.4} {"step": 12659, "train_loss": 3.4403507709503174, "lr": 0.00027830903215755404, "tps": 14054, "wall": 59032.4} {"step": 12660, "train_loss": 3.4066379070281982, "lr": 0.0002782909068662964, "tps": 14054, "wall": 59037.4} {"step": 12661, "train_loss": 3.389069080352783, "lr": 0.0002782727809147162, "tps": 14054, "wall": 59042.3} {"step": 12662, "train_loss": 3.415729284286499, "lr": 0.00027825465430301885, "tps": 14054, "wall": 59047.2} {"step": 12663, "train_loss": 3.502054452896118, "lr": 0.00027823652703140957, "tps": 14054, "wall": 59052.1} {"step": 12664, "train_loss": 3.511044979095459, "lr": 0.0002782183991000938, "tps": 14054, "wall": 59057.0} {"step": 12665, "train_loss": 3.4882593154907227, "lr": 0.0002782002705092768, "tps": 14054, "wall": 59062.0} {"step": 12666, "train_loss": 3.408771514892578, "lr": 0.000278182141259164, "tps": 14054, "wall": 59066.9} {"step": 12667, "train_loss": 3.47638201713562, "lr": 0.0002781640113499608, "tps": 14054, "wall": 59071.8} {"step": 12668, "train_loss": 3.418755054473877, "lr": 0.00027814588078187245, "tps": 14054, "wall": 59076.7} {"step": 12669, "train_loss": 3.4459125995635986, "lr": 0.00027812774955510454, "tps": 14054, "wall": 59081.7} {"step": 12670, "train_loss": 3.4364490509033203, "lr": 0.00027810961766986227, "tps": 14054, "wall": 59086.6} {"step": 12671, "train_loss": 3.4708051681518555, "lr": 0.0002780914851263511, "tps": 14054, "wall": 59091.5} {"step": 12672, "train_loss": 3.3555197715759277, "lr": 0.00027807335192477653, "tps": 14053, "wall": 59096.4} {"step": 12673, "train_loss": 3.365694522857666, "lr": 0.00027805521806534376, "tps": 14053, "wall": 59101.4} {"step": 12674, "train_loss": 3.448113441467285, "lr": 0.0002780370835482584, "tps": 14053, "wall": 59106.3} {"step": 12675, "train_loss": 3.476647138595581, "lr": 0.0002780189483737258, "tps": 14053, "wall": 59111.2} {"step": 12676, "train_loss": 3.549514055252075, "lr": 0.0002780008125419514, "tps": 14053, "wall": 59116.2} {"step": 12677, "train_loss": 3.433809280395508, "lr": 0.0002779826760531407, "tps": 14053, "wall": 59121.1} {"step": 12678, "train_loss": 3.3565673828125, "lr": 0.0002779645389074991, "tps": 14053, "wall": 59126.0} {"step": 12679, "train_loss": 3.4248361587524414, "lr": 0.00027794640110523203, "tps": 14053, "wall": 59130.9} {"step": 12680, "train_loss": 3.381740093231201, "lr": 0.00027792826264654507, "tps": 14053, "wall": 59135.8} {"step": 12681, "train_loss": 3.4538021087646484, "lr": 0.00027791012353164355, "tps": 14053, "wall": 59140.8} {"step": 12682, "train_loss": 3.469618558883667, "lr": 0.000277891983760733, "tps": 14053, "wall": 59145.7} {"step": 12683, "train_loss": 3.3695287704467773, "lr": 0.00027787384333401903, "tps": 14053, "wall": 59150.6} {"step": 12684, "train_loss": 3.3911423683166504, "lr": 0.00027785570225170696, "tps": 14053, "wall": 59155.5} {"step": 12685, "train_loss": 3.347080945968628, "lr": 0.00027783756051400236, "tps": 14053, "wall": 59160.5} {"step": 12686, "train_loss": 3.352252721786499, "lr": 0.00027781941812111076, "tps": 14053, "wall": 59165.4} {"step": 12687, "train_loss": 3.3251566886901855, "lr": 0.0002778012750732376, "tps": 14052, "wall": 59170.3} {"step": 12688, "train_loss": 3.479219436645508, "lr": 0.00027778313137058854, "tps": 14052, "wall": 59175.3} {"step": 12689, "train_loss": 3.4010210037231445, "lr": 0.00027776498701336905, "tps": 14052, "wall": 59180.2} {"step": 12690, "train_loss": 3.4644956588745117, "lr": 0.00027774684200178464, "tps": 14052, "wall": 59185.1} {"step": 12691, "train_loss": 3.4152607917785645, "lr": 0.00027772869633604084, "tps": 14052, "wall": 59190.0} {"step": 12692, "train_loss": 3.4333133697509766, "lr": 0.00027771055001634326, "tps": 14052, "wall": 59195.0} {"step": 12693, "train_loss": 3.390371799468994, "lr": 0.00027769240304289757, "tps": 14052, "wall": 59199.9} {"step": 12694, "train_loss": 3.46207857131958, "lr": 0.00027767425541590907, "tps": 14052, "wall": 59204.8} {"step": 12695, "train_loss": 3.4736404418945312, "lr": 0.00027765610713558354, "tps": 14052, "wall": 59209.7} {"step": 12696, "train_loss": 3.5705199241638184, "lr": 0.0002776379582021265, "tps": 14052, "wall": 59214.6} {"step": 12697, "train_loss": 3.462425947189331, "lr": 0.0002776198086157436, "tps": 14052, "wall": 59219.6} {"step": 12698, "train_loss": 3.466637134552002, "lr": 0.0002776016583766403, "tps": 14052, "wall": 59224.5} {"step": 12699, "train_loss": 3.4395172595977783, "lr": 0.00027758350748502235, "tps": 14052, "wall": 59229.4} {"step": 12700, "train_loss": 3.448396682739258, "lr": 0.0002775653559410953, "tps": 14052, "wall": 59234.4} {"step": 12701, "train_loss": 3.4118542671203613, "lr": 0.00027754720374506477, "tps": 14052, "wall": 59239.3} {"step": 12702, "train_loss": 3.4483180046081543, "lr": 0.00027752905089713643, "tps": 14052, "wall": 59244.2} {"step": 12703, "train_loss": 3.346313238143921, "lr": 0.0002775108973975159, "tps": 14052, "wall": 59249.1} {"step": 12704, "train_loss": 3.3520359992980957, "lr": 0.0002774927432464088, "tps": 14051, "wall": 59254.0} {"step": 12705, "train_loss": 3.540142059326172, "lr": 0.00027747458844402077, "tps": 14051, "wall": 59258.9} {"step": 12706, "train_loss": 3.3672585487365723, "lr": 0.0002774564329905575, "tps": 14051, "wall": 59263.9} {"step": 12707, "train_loss": 3.492892265319824, "lr": 0.00027743827688622464, "tps": 14051, "wall": 59268.8} {"step": 12708, "train_loss": 3.5105438232421875, "lr": 0.0002774201201312279, "tps": 14051, "wall": 59273.7} {"step": 12709, "train_loss": 3.3499326705932617, "lr": 0.00027740196272577294, "tps": 14051, "wall": 59278.7} {"step": 12710, "train_loss": 3.4266443252563477, "lr": 0.00027738380467006547, "tps": 14051, "wall": 59283.6} {"step": 12711, "train_loss": 3.453864812850952, "lr": 0.0002773656459643111, "tps": 14051, "wall": 59288.6} {"step": 12712, "train_loss": 3.4623165130615234, "lr": 0.00027734748660871556, "tps": 14051, "wall": 59293.5} {"step": 12713, "train_loss": 3.575333595275879, "lr": 0.00027732932660348464, "tps": 14051, "wall": 59298.4} {"step": 12714, "train_loss": 3.3430275917053223, "lr": 0.00027731116594882405, "tps": 14051, "wall": 59303.3} {"step": 12715, "train_loss": 3.3420815467834473, "lr": 0.00027729300464493934, "tps": 14051, "wall": 59308.2} {"step": 12716, "train_loss": 3.386415958404541, "lr": 0.0002772748426920365, "tps": 14051, "wall": 59313.2} {"step": 12717, "train_loss": 3.37068247795105, "lr": 0.0002772566800903211, "tps": 14051, "wall": 59318.1} {"step": 12718, "train_loss": 3.461052894592285, "lr": 0.00027723851683999893, "tps": 14051, "wall": 59323.0} {"step": 12719, "train_loss": 3.4123780727386475, "lr": 0.0002772203529412757, "tps": 14051, "wall": 59327.9} {"step": 12720, "train_loss": 3.347743272781372, "lr": 0.0002772021883943573, "tps": 14050, "wall": 59332.8} {"step": 12721, "train_loss": 3.3601274490356445, "lr": 0.00027718402319944934, "tps": 14050, "wall": 59337.8} {"step": 12722, "train_loss": 3.4957261085510254, "lr": 0.00027716585735675764, "tps": 14050, "wall": 59342.7} {"step": 12723, "train_loss": 3.5121498107910156, "lr": 0.00027714769086648814, "tps": 14050, "wall": 59347.6} {"step": 12724, "train_loss": 3.377415180206299, "lr": 0.00027712952372884646, "tps": 14050, "wall": 59352.5} {"step": 12725, "train_loss": 3.3488612174987793, "lr": 0.00027711135594403843, "tps": 14050, "wall": 59357.4} {"step": 12726, "train_loss": 3.508897542953491, "lr": 0.00027709318751226983, "tps": 14050, "wall": 59362.4} {"step": 12727, "train_loss": 3.4169774055480957, "lr": 0.0002770750184337466, "tps": 14050, "wall": 59367.3} {"step": 12728, "train_loss": 3.4539573192596436, "lr": 0.0002770568487086744, "tps": 14050, "wall": 59372.2} {"step": 12729, "train_loss": 3.4023256301879883, "lr": 0.00027703867833725915, "tps": 14050, "wall": 59377.1} {"step": 12730, "train_loss": 3.4220030307769775, "lr": 0.0002770205073197067, "tps": 14050, "wall": 59382.1} {"step": 12731, "train_loss": 3.5354831218719482, "lr": 0.00027700233565622286, "tps": 14050, "wall": 59387.0} {"step": 12732, "train_loss": 3.471099853515625, "lr": 0.00027698416334701335, "tps": 14050, "wall": 59391.9} {"step": 12733, "train_loss": 3.4897267818450928, "lr": 0.0002769659903922843, "tps": 14050, "wall": 59396.9} {"step": 12734, "train_loss": 3.420283079147339, "lr": 0.00027694781679224136, "tps": 14050, "wall": 59401.8} {"step": 12735, "train_loss": 3.4024903774261475, "lr": 0.0002769296425470905, "tps": 14050, "wall": 59406.7} {"step": 12736, "train_loss": 3.4571871757507324, "lr": 0.00027691146765703757, "tps": 14049, "wall": 59411.6} {"step": 12737, "train_loss": 3.3610048294067383, "lr": 0.0002768932921222885, "tps": 14049, "wall": 59416.5} {"step": 12738, "train_loss": 3.4942564964294434, "lr": 0.00027687511594304905, "tps": 14049, "wall": 59421.5} {"step": 12739, "train_loss": 3.337057113647461, "lr": 0.0002768569391195253, "tps": 14049, "wall": 59426.4} {"step": 12740, "train_loss": 3.4154815673828125, "lr": 0.000276838761651923, "tps": 14049, "wall": 59431.3} {"step": 12741, "train_loss": 3.5863265991210938, "lr": 0.0002768205835404481, "tps": 14049, "wall": 59436.2} {"step": 12742, "train_loss": 3.3643155097961426, "lr": 0.0002768024047853066, "tps": 14049, "wall": 59441.1} {"step": 12743, "train_loss": 3.505636215209961, "lr": 0.00027678422538670444, "tps": 14049, "wall": 59446.1} {"step": 12744, "train_loss": 3.322111129760742, "lr": 0.0002767660453448474, "tps": 14049, "wall": 59451.0} {"step": 12745, "train_loss": 3.3918914794921875, "lr": 0.00027674786465994167, "tps": 14049, "wall": 59455.9} {"step": 12746, "train_loss": 3.42433500289917, "lr": 0.0002767296833321929, "tps": 14049, "wall": 59460.9} {"step": 12747, "train_loss": 3.5702364444732666, "lr": 0.0002767115013618073, "tps": 14049, "wall": 59465.8} {"step": 12748, "train_loss": 3.3829376697540283, "lr": 0.0002766933187489907, "tps": 14049, "wall": 59470.7} {"step": 12749, "train_loss": 3.3233389854431152, "lr": 0.00027667513549394917, "tps": 14049, "wall": 59475.6} {"step": 12750, "train_loss": 3.4160592555999756, "lr": 0.0002766569515968886, "tps": 14049, "wall": 59480.6} {"step": 12751, "train_loss": 3.436077117919922, "lr": 0.00027663876705801504, "tps": 14049, "wall": 59485.5} {"step": 12752, "train_loss": 3.3940186500549316, "lr": 0.00027662058187753443, "tps": 14048, "wall": 59490.4} {"step": 12753, "train_loss": 3.364983558654785, "lr": 0.00027660239605565277, "tps": 14048, "wall": 59495.3} {"step": 12754, "train_loss": 3.4291181564331055, "lr": 0.0002765842095925762, "tps": 14048, "wall": 59500.3} {"step": 12755, "train_loss": 3.4316697120666504, "lr": 0.00027656602248851063, "tps": 14048, "wall": 59505.2} {"step": 12756, "train_loss": 3.4997498989105225, "lr": 0.00027654783474366203, "tps": 14048, "wall": 59510.1} {"step": 12757, "train_loss": 3.3705317974090576, "lr": 0.0002765296463582366, "tps": 14048, "wall": 59515.0} {"step": 12758, "train_loss": 3.4259133338928223, "lr": 0.0002765114573324402, "tps": 14048, "wall": 59520.0} {"step": 12759, "train_loss": 3.4853787422180176, "lr": 0.000276493267666479, "tps": 14048, "wall": 59524.9} {"step": 12760, "train_loss": 3.4278459548950195, "lr": 0.00027647507736055897, "tps": 14048, "wall": 59529.8} {"step": 12761, "train_loss": 3.550940990447998, "lr": 0.00027645688641488616, "tps": 14048, "wall": 59534.8} {"step": 12762, "train_loss": 3.51489520072937, "lr": 0.00027643869482966673, "tps": 14048, "wall": 59539.7} {"step": 12763, "train_loss": 3.3805971145629883, "lr": 0.0002764205026051067, "tps": 14048, "wall": 59544.6} {"step": 12764, "train_loss": 3.3787999153137207, "lr": 0.00027640230974141223, "tps": 14048, "wall": 59549.5} {"step": 12765, "train_loss": 3.520401954650879, "lr": 0.0002763841162387894, "tps": 14048, "wall": 59554.5} {"step": 12766, "train_loss": 3.4511871337890625, "lr": 0.00027636592209744407, "tps": 14048, "wall": 59559.4} {"step": 12767, "train_loss": 3.3870716094970703, "lr": 0.0002763477273175826, "tps": 14048, "wall": 59564.3} {"step": 12768, "train_loss": 3.498034715652466, "lr": 0.0002763295318994111, "tps": 14048, "wall": 59569.2} {"step": 12769, "train_loss": 3.3316991329193115, "lr": 0.00027631133584313553, "tps": 14047, "wall": 59574.1} {"step": 12770, "train_loss": 3.4388532638549805, "lr": 0.0002762931391489621, "tps": 14047, "wall": 59579.1} {"step": 12771, "train_loss": 3.419344425201416, "lr": 0.000276274941817097, "tps": 14047, "wall": 59584.1} {"step": 12772, "train_loss": 3.4605541229248047, "lr": 0.00027625674384774626, "tps": 14047, "wall": 59589.0} {"step": 12773, "train_loss": 3.413757801055908, "lr": 0.00027623854524111614, "tps": 14047, "wall": 59593.9} {"step": 12774, "train_loss": 3.452918529510498, "lr": 0.00027622034599741267, "tps": 14047, "wall": 59598.9} {"step": 12775, "train_loss": 3.4963202476501465, "lr": 0.0002762021461168421, "tps": 14047, "wall": 59603.8} {"step": 12776, "train_loss": 3.4832372665405273, "lr": 0.0002761839455996106, "tps": 14047, "wall": 59608.7} {"step": 12777, "train_loss": 3.521695613861084, "lr": 0.00027616574444592427, "tps": 14047, "wall": 59613.7} {"step": 12778, "train_loss": 3.3487532138824463, "lr": 0.00027614754265598945, "tps": 14047, "wall": 59618.6} {"step": 12779, "train_loss": 3.43424391746521, "lr": 0.00027612934023001214, "tps": 14047, "wall": 59623.5} {"step": 12780, "train_loss": 3.4866883754730225, "lr": 0.0002761111371681987, "tps": 14047, "wall": 59628.5} {"step": 12781, "train_loss": 3.556830406188965, "lr": 0.0002760929334707552, "tps": 14047, "wall": 59633.4} {"step": 12782, "train_loss": 3.3992667198181152, "lr": 0.00027607472913788794, "tps": 14047, "wall": 59638.4} {"step": 12783, "train_loss": 3.5643584728240967, "lr": 0.0002760565241698031, "tps": 14047, "wall": 59643.3} {"step": 12784, "train_loss": 3.4265456199645996, "lr": 0.0002760383185667069, "tps": 14046, "wall": 59648.2} {"step": 12785, "train_loss": 3.4714338779449463, "lr": 0.00027602011232880563, "tps": 14046, "wall": 59653.2} {"step": 12786, "train_loss": 3.4911086559295654, "lr": 0.00027600190545630553, "tps": 14046, "wall": 59658.1} {"step": 12787, "train_loss": 3.2960243225097656, "lr": 0.00027598369794941277, "tps": 14046, "wall": 59663.0} {"step": 12788, "train_loss": 3.442349672317505, "lr": 0.0002759654898083337, "tps": 14046, "wall": 59667.9} {"step": 12789, "train_loss": 3.4761152267456055, "lr": 0.0002759472810332744, "tps": 14046, "wall": 59672.8} {"step": 12790, "train_loss": 3.445513963699341, "lr": 0.0002759290716244414, "tps": 14046, "wall": 59677.8} {"step": 12791, "train_loss": 3.3450613021850586, "lr": 0.0002759108615820408, "tps": 14046, "wall": 59682.7} {"step": 12792, "train_loss": 3.4701361656188965, "lr": 0.000275892650906279, "tps": 14046, "wall": 59687.6} {"step": 12793, "train_loss": 3.4348437786102295, "lr": 0.0002758744395973621, "tps": 14046, "wall": 59692.5} {"step": 12794, "train_loss": 3.4230189323425293, "lr": 0.00027585622765549666, "tps": 14046, "wall": 59697.5} {"step": 12795, "train_loss": 3.4339754581451416, "lr": 0.0002758380150808888, "tps": 14046, "wall": 59702.4} {"step": 12796, "train_loss": 3.5002951622009277, "lr": 0.0002758198018737449, "tps": 14046, "wall": 59707.3} {"step": 12797, "train_loss": 3.374460220336914, "lr": 0.00027580158803427123, "tps": 14046, "wall": 59712.2} {"step": 12798, "train_loss": 3.406240701675415, "lr": 0.00027578337356267416, "tps": 14046, "wall": 59717.2} {"step": 12799, "train_loss": 3.483710289001465, "lr": 0.00027576515845916005, "tps": 14046, "wall": 59722.1} {"step": 12800, "train_loss": 3.433037757873535, "lr": 0.00027574694272393516, "tps": 14046, "wall": 59727.0} {"step": 12801, "train_loss": 3.4286625385284424, "lr": 0.00027572872635720587, "tps": 14045, "wall": 59731.9} {"step": 12802, "train_loss": 3.3923768997192383, "lr": 0.00027571050935917867, "tps": 14045, "wall": 59736.8} {"step": 12803, "train_loss": 3.459730863571167, "lr": 0.00027569229173005967, "tps": 14045, "wall": 59741.8} {"step": 12804, "train_loss": 3.4916815757751465, "lr": 0.00027567407347005546, "tps": 14045, "wall": 59746.7} {"step": 12805, "train_loss": 3.508652687072754, "lr": 0.0002756558545793723, "tps": 14045, "wall": 59751.6} {"step": 12806, "train_loss": 3.424903631210327, "lr": 0.00027563763505821664, "tps": 14045, "wall": 59756.6} {"step": 12807, "train_loss": 3.486988067626953, "lr": 0.0002756194149067948, "tps": 14045, "wall": 59761.5} {"step": 12808, "train_loss": 3.4605984687805176, "lr": 0.00027560119412531326, "tps": 14045, "wall": 59766.4} {"step": 12809, "train_loss": 3.4346392154693604, "lr": 0.00027558297271397834, "tps": 14045, "wall": 59771.3} {"step": 12810, "train_loss": 3.4760653972625732, "lr": 0.0002755647506729965, "tps": 14045, "wall": 59776.3} {"step": 12811, "train_loss": 3.389108180999756, "lr": 0.00027554652800257417, "tps": 14045, "wall": 59781.2} {"step": 12812, "train_loss": 3.4547529220581055, "lr": 0.00027552830470291777, "tps": 14045, "wall": 59786.1} {"step": 12813, "train_loss": 3.5143911838531494, "lr": 0.0002755100807742338, "tps": 14045, "wall": 59791.0} {"step": 12814, "train_loss": 3.4441146850585938, "lr": 0.00027549185621672854, "tps": 14045, "wall": 59795.9} {"step": 12815, "train_loss": 3.338968276977539, "lr": 0.00027547363103060855, "tps": 14045, "wall": 59800.9} {"step": 12816, "train_loss": 3.434176206588745, "lr": 0.00027545540521608033, "tps": 14045, "wall": 59805.8} {"step": 12817, "train_loss": 3.442866325378418, "lr": 0.00027543717877335014, "tps": 14044, "wall": 59810.7} {"step": 12818, "train_loss": 3.422959566116333, "lr": 0.00027541895170262473, "tps": 14044, "wall": 59815.6} {"step": 12819, "train_loss": 3.4367775917053223, "lr": 0.0002754007240041104, "tps": 14044, "wall": 59820.6} {"step": 12820, "train_loss": 3.4087696075439453, "lr": 0.0002753824956780136, "tps": 14044, "wall": 59825.5} {"step": 12821, "train_loss": 3.369767665863037, "lr": 0.00027536426672454095, "tps": 14044, "wall": 59830.5} {"step": 12822, "train_loss": 3.4964187145233154, "lr": 0.00027534603714389884, "tps": 14044, "wall": 59835.4} {"step": 12823, "train_loss": 3.3715436458587646, "lr": 0.0002753278069362939, "tps": 14044, "wall": 59840.3} {"step": 12824, "train_loss": 3.3921332359313965, "lr": 0.00027530957610193255, "tps": 14044, "wall": 59845.2} {"step": 12825, "train_loss": 3.488544225692749, "lr": 0.0002752913446410214, "tps": 14044, "wall": 59850.2} {"step": 12826, "train_loss": 3.5539445877075195, "lr": 0.00027527311255376674, "tps": 14044, "wall": 59855.1} {"step": 12827, "train_loss": 3.4008588790893555, "lr": 0.00027525487984037537, "tps": 14044, "wall": 59860.0} {"step": 12828, "train_loss": 3.4175989627838135, "lr": 0.0002752366465010537, "tps": 14044, "wall": 59865.0} {"step": 12829, "train_loss": 3.3724634647369385, "lr": 0.00027521841253600837, "tps": 14044, "wall": 59869.9} {"step": 12830, "train_loss": 3.5048828125, "lr": 0.00027520017794544583, "tps": 14044, "wall": 59874.8} {"step": 12831, "train_loss": 3.3839943408966064, "lr": 0.0002751819427295727, "tps": 14044, "wall": 59879.8} {"step": 12832, "train_loss": 3.3486504554748535, "lr": 0.00027516370688859555, "tps": 14044, "wall": 59884.7} {"step": 12833, "train_loss": 3.4947140216827393, "lr": 0.0002751454704227209, "tps": 14043, "wall": 59889.7} {"step": 12834, "train_loss": 3.6317081451416016, "lr": 0.0002751272333321554, "tps": 14043, "wall": 59894.6} {"step": 12835, "train_loss": 3.4540536403656006, "lr": 0.00027510899561710567, "tps": 14043, "wall": 59899.5} {"step": 12836, "train_loss": 3.323972463607788, "lr": 0.00027509075727777816, "tps": 14043, "wall": 59904.5} {"step": 12837, "train_loss": 3.553007125854492, "lr": 0.00027507251831437965, "tps": 14043, "wall": 59909.4} {"step": 12838, "train_loss": 3.4893405437469482, "lr": 0.0002750542787271166, "tps": 14043, "wall": 59914.3} {"step": 12839, "train_loss": 3.417330026626587, "lr": 0.00027503603851619575, "tps": 14043, "wall": 59919.2} {"step": 12840, "train_loss": 3.4183695316314697, "lr": 0.0002750177976818237, "tps": 14043, "wall": 59924.1} {"step": 12841, "train_loss": 3.4784345626831055, "lr": 0.000274999556224207, "tps": 14043, "wall": 59929.1} {"step": 12842, "train_loss": 3.401031494140625, "lr": 0.0002749813141435524, "tps": 14043, "wall": 59934.0} {"step": 12843, "train_loss": 3.4470772743225098, "lr": 0.0002749630714400665, "tps": 14043, "wall": 59939.0} {"step": 12844, "train_loss": 3.421703815460205, "lr": 0.00027494482811395594, "tps": 14043, "wall": 59943.9} {"step": 12845, "train_loss": 3.4825401306152344, "lr": 0.0002749265841654274, "tps": 14043, "wall": 59948.8} {"step": 12846, "train_loss": 3.3442463874816895, "lr": 0.0002749083395946876, "tps": 14043, "wall": 59953.7} {"step": 12847, "train_loss": 3.427105665206909, "lr": 0.00027489009440194304, "tps": 14043, "wall": 59958.7} {"step": 12848, "train_loss": 3.4362716674804688, "lr": 0.00027487184858740053, "tps": 14043, "wall": 59963.6} {"step": 12849, "train_loss": 3.385864734649658, "lr": 0.0002748536021512668, "tps": 14043, "wall": 59968.5} {"step": 12850, "train_loss": 3.3850746154785156, "lr": 0.0002748353550937486, "tps": 14042, "wall": 59973.4} {"step": 12851, "train_loss": 3.3651862144470215, "lr": 0.0002748171074150524, "tps": 14042, "wall": 59978.4} {"step": 12852, "train_loss": 3.5160465240478516, "lr": 0.00027479885911538504, "tps": 14042, "wall": 59983.3} {"step": 12853, "train_loss": 3.5148136615753174, "lr": 0.0002747806101949533, "tps": 14042, "wall": 59988.2} {"step": 12854, "train_loss": 3.4347565174102783, "lr": 0.0002747623606539638, "tps": 14042, "wall": 59993.1} {"step": 12855, "train_loss": 3.425062894821167, "lr": 0.0002747441104926233, "tps": 14042, "wall": 59998.1} {"step": 12856, "train_loss": 3.4861230850219727, "lr": 0.0002747258597111386, "tps": 14042, "wall": 60003.0} {"step": 12857, "train_loss": 3.5395450592041016, "lr": 0.00027470760830971636, "tps": 14042, "wall": 60007.9} {"step": 12858, "train_loss": 3.411935806274414, "lr": 0.0002746893562885634, "tps": 14042, "wall": 60012.9} {"step": 12859, "train_loss": 3.452498197555542, "lr": 0.00027467110364788643, "tps": 14042, "wall": 60017.8} {"step": 12860, "train_loss": 3.4286985397338867, "lr": 0.0002746528503878923, "tps": 14042, "wall": 60022.7} {"step": 12861, "train_loss": 3.3341383934020996, "lr": 0.0002746345965087877, "tps": 14042, "wall": 60027.6} {"step": 12862, "train_loss": 3.630190372467041, "lr": 0.00027461634201077944, "tps": 14042, "wall": 60032.5} {"step": 12863, "train_loss": 3.414320230484009, "lr": 0.00027459808689407427, "tps": 14042, "wall": 60037.5} {"step": 12864, "train_loss": 3.3256845474243164, "lr": 0.00027457983115887903, "tps": 14042, "wall": 60042.4} {"step": 12865, "train_loss": 3.4377458095550537, "lr": 0.0002745615748054005, "tps": 14042, "wall": 60047.3} {"step": 12866, "train_loss": 3.366386651992798, "lr": 0.0002745433178338455, "tps": 14041, "wall": 60052.2} {"step": 12867, "train_loss": 3.4011714458465576, "lr": 0.00027452506024442085, "tps": 14041, "wall": 60057.2} {"step": 12868, "train_loss": 3.3274450302124023, "lr": 0.00027450680203733335, "tps": 14041, "wall": 60062.1} {"step": 12869, "train_loss": 3.526052951812744, "lr": 0.00027448854321278983, "tps": 14041, "wall": 60067.1} {"step": 12870, "train_loss": 3.428244113922119, "lr": 0.0002744702837709972, "tps": 14041, "wall": 60072.0} {"step": 12871, "train_loss": 3.4066407680511475, "lr": 0.00027445202371216223, "tps": 14041, "wall": 60076.9} {"step": 12872, "train_loss": 3.4577417373657227, "lr": 0.00027443376303649177, "tps": 14041, "wall": 60081.8} {"step": 12873, "train_loss": 3.4170002937316895, "lr": 0.00027441550174419276, "tps": 14041, "wall": 60086.8} {"step": 12874, "train_loss": 3.450515031814575, "lr": 0.00027439723983547197, "tps": 14041, "wall": 60091.7} {"step": 12875, "train_loss": 3.3949098587036133, "lr": 0.00027437897731053624, "tps": 14041, "wall": 60096.6} {"step": 12876, "train_loss": 3.367629289627075, "lr": 0.00027436071416959263, "tps": 14041, "wall": 60101.5} {"step": 12877, "train_loss": 3.4385738372802734, "lr": 0.0002743424504128478, "tps": 14041, "wall": 60106.4} {"step": 12878, "train_loss": 3.397921562194824, "lr": 0.0002743241860405088, "tps": 14041, "wall": 60111.4} {"step": 12879, "train_loss": 3.44113826751709, "lr": 0.0002743059210527825, "tps": 14041, "wall": 60116.3} {"step": 12880, "train_loss": 3.5037081241607666, "lr": 0.0002742876554498758, "tps": 14041, "wall": 60121.2} {"step": 12881, "train_loss": 3.3215346336364746, "lr": 0.0002742693892319956, "tps": 14041, "wall": 60126.2} {"step": 12882, "train_loss": 3.4140536785125732, "lr": 0.0002742511223993488, "tps": 14040, "wall": 60131.1} {"step": 12883, "train_loss": 3.577103614807129, "lr": 0.0002742328549521423, "tps": 14040, "wall": 60136.0} {"step": 12884, "train_loss": 3.458404541015625, "lr": 0.0002742145868905831, "tps": 14040, "wall": 60140.9} {"step": 12885, "train_loss": 3.4736733436584473, "lr": 0.0002741963182148782, "tps": 14040, "wall": 60145.9} {"step": 12886, "train_loss": 3.441002368927002, "lr": 0.0002741780489252344, "tps": 14040, "wall": 60150.8} {"step": 12887, "train_loss": 3.432445526123047, "lr": 0.0002741597790218588, "tps": 14040, "wall": 60155.7} {"step": 12888, "train_loss": 3.4406466484069824, "lr": 0.00027414150850495824, "tps": 14040, "wall": 60160.6} {"step": 12889, "train_loss": 3.364226818084717, "lr": 0.0002741232373747398, "tps": 14040, "wall": 60165.5} {"step": 12890, "train_loss": 3.414867877960205, "lr": 0.00027410496563141034, "tps": 14040, "wall": 60170.4} {"step": 12891, "train_loss": 3.472160816192627, "lr": 0.0002740866932751769, "tps": 14040, "wall": 60175.4} {"step": 12892, "train_loss": 3.378838062286377, "lr": 0.0002740684203062465, "tps": 14040, "wall": 60180.3} {"step": 12893, "train_loss": 3.412539482116699, "lr": 0.0002740501467248261, "tps": 14040, "wall": 60185.3} {"step": 12894, "train_loss": 3.3540916442871094, "lr": 0.00027403187253112276, "tps": 14040, "wall": 60190.2} {"step": 12895, "train_loss": 3.4538087844848633, "lr": 0.0002740135977253434, "tps": 14040, "wall": 60195.1} {"step": 12896, "train_loss": 3.4994914531707764, "lr": 0.00027399532230769504, "tps": 14040, "wall": 60200.0} {"step": 12897, "train_loss": 3.3780951499938965, "lr": 0.0002739770462783848, "tps": 14040, "wall": 60205.0} {"step": 12898, "train_loss": 3.425663471221924, "lr": 0.0002739587696376197, "tps": 14040, "wall": 60209.9} {"step": 12899, "train_loss": 3.3973352909088135, "lr": 0.0002739404923856066, "tps": 14039, "wall": 60214.9} {"step": 12900, "train_loss": 3.417593002319336, "lr": 0.00027392221452255284, "tps": 14039, "wall": 60219.8} {"step": 12901, "train_loss": 3.422356128692627, "lr": 0.0002739039360486652, "tps": 14039, "wall": 60224.7} {"step": 12902, "train_loss": 3.4874329566955566, "lr": 0.0002738856569641509, "tps": 14039, "wall": 60229.6} {"step": 12903, "train_loss": 3.5851552486419678, "lr": 0.00027386737726921696, "tps": 14039, "wall": 60234.5} {"step": 12904, "train_loss": 3.4262962341308594, "lr": 0.0002738490969640705, "tps": 14039, "wall": 60239.5} {"step": 12905, "train_loss": 3.433011293411255, "lr": 0.0002738308160489185, "tps": 14039, "wall": 60244.4} {"step": 12906, "train_loss": 3.3972206115722656, "lr": 0.0002738125345239682, "tps": 14039, "wall": 60249.3} {"step": 12907, "train_loss": 3.4653964042663574, "lr": 0.00027379425238942647, "tps": 14039, "wall": 60254.3} {"step": 12908, "train_loss": 3.344581365585327, "lr": 0.0002737759696455006, "tps": 14039, "wall": 60259.2} {"step": 12909, "train_loss": 3.430922031402588, "lr": 0.0002737576862923976, "tps": 14039, "wall": 60264.1} {"step": 12910, "train_loss": 3.452113151550293, "lr": 0.00027373940233032466, "tps": 14039, "wall": 60269.0} {"step": 12911, "train_loss": 3.409270763397217, "lr": 0.00027372111775948884, "tps": 14039, "wall": 60273.9} {"step": 12912, "train_loss": 3.3435890674591064, "lr": 0.00027370283258009733, "tps": 14039, "wall": 60278.9} {"step": 12913, "train_loss": 3.3530702590942383, "lr": 0.00027368454679235716, "tps": 14039, "wall": 60283.8} {"step": 12914, "train_loss": 3.423508644104004, "lr": 0.0002736662603964756, "tps": 14039, "wall": 60288.7} {"step": 12915, "train_loss": 3.4967727661132812, "lr": 0.00027364797339265973, "tps": 14039, "wall": 60293.6} {"step": 12916, "train_loss": 3.446465492248535, "lr": 0.00027362968578111674, "tps": 14038, "wall": 60298.6} {"step": 12917, "train_loss": 3.4752752780914307, "lr": 0.00027361139756205375, "tps": 14038, "wall": 60303.5} {"step": 12918, "train_loss": 3.3951985836029053, "lr": 0.0002735931087356779, "tps": 14038, "wall": 60308.4} {"step": 12919, "train_loss": 3.3789258003234863, "lr": 0.00027357481930219646, "tps": 14038, "wall": 60313.4} {"step": 12920, "train_loss": 3.3552892208099365, "lr": 0.00027355652926181655, "tps": 14038, "wall": 60318.3} {"step": 12921, "train_loss": 3.41312313079834, "lr": 0.0002735382386147454, "tps": 14038, "wall": 60323.2} {"step": 12922, "train_loss": 3.392190456390381, "lr": 0.00027351994736119015, "tps": 14038, "wall": 60328.1} {"step": 12923, "train_loss": 3.363387107849121, "lr": 0.00027350165550135805, "tps": 14038, "wall": 60333.0} {"step": 12924, "train_loss": 3.429673910140991, "lr": 0.0002734833630354564, "tps": 14038, "wall": 60338.0} {"step": 12925, "train_loss": 3.364825487136841, "lr": 0.0002734650699636922, "tps": 14038, "wall": 60342.9} {"step": 12926, "train_loss": 3.414473533630371, "lr": 0.00027344677628627284, "tps": 14038, "wall": 60347.8} {"step": 12927, "train_loss": 3.4867103099823, "lr": 0.0002734284820034055, "tps": 14038, "wall": 60352.7} {"step": 12928, "train_loss": 3.450103282928467, "lr": 0.0002734101871152974, "tps": 14038, "wall": 60357.7} {"step": 12929, "train_loss": 3.4137065410614014, "lr": 0.00027339189162215577, "tps": 14038, "wall": 60362.6} {"step": 12930, "train_loss": 3.5200514793395996, "lr": 0.000273373595524188, "tps": 14038, "wall": 60367.5} {"step": 12931, "train_loss": 3.4590888023376465, "lr": 0.0002733552988216012, "tps": 14038, "wall": 60372.4} {"step": 12932, "train_loss": 3.390934467315674, "lr": 0.0002733370015146027, "tps": 14038, "wall": 60377.3} {"step": 12933, "train_loss": 3.4906816482543945, "lr": 0.00027331870360339976, "tps": 14037, "wall": 60382.2} {"step": 12934, "train_loss": 3.4913668632507324, "lr": 0.0002733004050881997, "tps": 14037, "wall": 60387.2} {"step": 12935, "train_loss": 3.2950613498687744, "lr": 0.0002732821059692098, "tps": 14037, "wall": 60392.1} {"step": 12936, "train_loss": 3.411780834197998, "lr": 0.00027326380624663726, "tps": 14037, "wall": 60397.0} {"step": 12937, "train_loss": 3.425895929336548, "lr": 0.0002732455059206894, "tps": 14037, "wall": 60401.9} {"step": 12938, "train_loss": 3.4011943340301514, "lr": 0.0002732272049915736, "tps": 14037, "wall": 60406.9} {"step": 12939, "train_loss": 3.3892698287963867, "lr": 0.0002732089034594972, "tps": 14037, "wall": 60411.8} {"step": 12940, "train_loss": 3.566909074783325, "lr": 0.00027319060132466734, "tps": 14037, "wall": 60416.7} {"step": 12941, "train_loss": 3.4439008235931396, "lr": 0.0002731722985872916, "tps": 14037, "wall": 60421.7} {"step": 12942, "train_loss": 3.423623561859131, "lr": 0.00027315399524757716, "tps": 14037, "wall": 60426.6} {"step": 12943, "train_loss": 3.3426120281219482, "lr": 0.00027313569130573133, "tps": 14037, "wall": 60431.5} {"step": 12944, "train_loss": 3.420668125152588, "lr": 0.00027311738676196156, "tps": 14037, "wall": 60436.4} {"step": 12945, "train_loss": 3.472766160964966, "lr": 0.00027309908161647514, "tps": 14037, "wall": 60441.3} {"step": 12946, "train_loss": 3.335115432739258, "lr": 0.00027308077586947943, "tps": 14037, "wall": 60446.3} {"step": 12947, "train_loss": 3.341761589050293, "lr": 0.00027306246952118183, "tps": 14037, "wall": 60451.2} {"step": 12948, "train_loss": 3.46812105178833, "lr": 0.00027304416257178975, "tps": 14037, "wall": 60456.1} {"step": 12949, "train_loss": 3.4067087173461914, "lr": 0.0002730258550215105, "tps": 14036, "wall": 60461.0} {"step": 12950, "train_loss": 3.4477007389068604, "lr": 0.0002730075468705514, "tps": 14036, "wall": 60466.0} {"step": 12951, "train_loss": 3.3919577598571777, "lr": 0.0002729892381191201, "tps": 14036, "wall": 60470.9} {"step": 12952, "train_loss": 3.413670063018799, "lr": 0.00027297092876742374, "tps": 14036, "wall": 60475.8} {"step": 12953, "train_loss": 3.4547324180603027, "lr": 0.00027295261881566985, "tps": 14036, "wall": 60480.8} {"step": 12954, "train_loss": 3.4402458667755127, "lr": 0.0002729343082640658, "tps": 14036, "wall": 60485.7} {"step": 12955, "train_loss": 3.491389274597168, "lr": 0.00027291599711281916, "tps": 14036, "wall": 60490.6} {"step": 12956, "train_loss": 3.461717128753662, "lr": 0.00027289768536213713, "tps": 14036, "wall": 60495.6} {"step": 12957, "train_loss": 3.3745853900909424, "lr": 0.00027287937301222735, "tps": 14036, "wall": 60500.5} {"step": 12958, "train_loss": 3.4563167095184326, "lr": 0.00027286106006329706, "tps": 14036, "wall": 60505.4} {"step": 12959, "train_loss": 3.4734535217285156, "lr": 0.0002728427465155539, "tps": 14036, "wall": 60510.4} {"step": 12960, "train_loss": 3.4666500091552734, "lr": 0.00027282443236920523, "tps": 14036, "wall": 60515.3} {"step": 12961, "train_loss": 3.466923236846924, "lr": 0.0002728061176244585, "tps": 14036, "wall": 60520.2} {"step": 12962, "train_loss": 3.3568429946899414, "lr": 0.0002727878022815213, "tps": 14036, "wall": 60525.1} {"step": 12963, "train_loss": 3.4762930870056152, "lr": 0.00027276948634060095, "tps": 14036, "wall": 60530.1} {"step": 12964, "train_loss": 3.4545421600341797, "lr": 0.000272751169801905, "tps": 14036, "wall": 60535.0} {"step": 12965, "train_loss": 3.4199769496917725, "lr": 0.00027273285266564103, "tps": 14036, "wall": 60539.9} {"step": 12966, "train_loss": 3.529452323913574, "lr": 0.00027271453493201634, "tps": 14035, "wall": 60544.9} {"step": 12967, "train_loss": 3.443203926086426, "lr": 0.0002726962166012386, "tps": 14035, "wall": 60549.8} {"step": 12968, "train_loss": 3.4301319122314453, "lr": 0.0002726778976735153, "tps": 14035, "wall": 60554.7} {"step": 12969, "train_loss": 3.4653074741363525, "lr": 0.0002726595781490538, "tps": 14035, "wall": 60559.6} {"step": 12970, "train_loss": 3.408914566040039, "lr": 0.00027264125802806187, "tps": 14035, "wall": 60564.5} {"step": 12971, "train_loss": 3.332188129425049, "lr": 0.00027262293731074685, "tps": 14035, "wall": 60569.5} {"step": 12972, "train_loss": 3.3915624618530273, "lr": 0.00027260461599731644, "tps": 14035, "wall": 60574.4} {"step": 12973, "train_loss": 3.4268791675567627, "lr": 0.00027258629408797805, "tps": 14035, "wall": 60579.3} {"step": 12974, "train_loss": 3.4481773376464844, "lr": 0.00027256797158293925, "tps": 14035, "wall": 60584.2} {"step": 12975, "train_loss": 3.368853807449341, "lr": 0.0002725496484824076, "tps": 14035, "wall": 60589.1} {"step": 12976, "train_loss": 3.4380860328674316, "lr": 0.0002725313247865908, "tps": 14035, "wall": 60594.0} {"step": 12977, "train_loss": 3.4363913536071777, "lr": 0.0002725130004956962, "tps": 14035, "wall": 60599.0} {"step": 12978, "train_loss": 3.3774445056915283, "lr": 0.0002724946756099315, "tps": 14035, "wall": 60603.9} {"step": 12979, "train_loss": 3.5790696144104004, "lr": 0.00027247635012950434, "tps": 14035, "wall": 60608.9} {"step": 12980, "train_loss": 3.4078729152679443, "lr": 0.0002724580240546222, "tps": 14035, "wall": 60613.8} {"step": 12981, "train_loss": 3.4306752681732178, "lr": 0.0002724396973854927, "tps": 14035, "wall": 60618.7} {"step": 12982, "train_loss": 3.402945041656494, "lr": 0.00027242137012232354, "tps": 14035, "wall": 60623.7} {"step": 12983, "train_loss": 3.4163923263549805, "lr": 0.0002724030422653222, "tps": 14034, "wall": 60628.6} {"step": 12984, "train_loss": 3.4580020904541016, "lr": 0.00027238471381469645, "tps": 14034, "wall": 60633.5} {"step": 12985, "train_loss": 3.4029407501220703, "lr": 0.0002723663847706538, "tps": 14034, "wall": 60638.4} {"step": 12986, "train_loss": 3.3414368629455566, "lr": 0.00027234805513340186, "tps": 14034, "wall": 60643.4} {"step": 12987, "train_loss": 3.4158432483673096, "lr": 0.0002723297249031483, "tps": 14034, "wall": 60648.3} {"step": 12988, "train_loss": 3.4156479835510254, "lr": 0.0002723113940801008, "tps": 14034, "wall": 60653.2} {"step": 12989, "train_loss": 3.548638105392456, "lr": 0.00027229306266446704, "tps": 14034, "wall": 60658.2} {"step": 12990, "train_loss": 3.3130722045898438, "lr": 0.00027227473065645464, "tps": 14034, "wall": 60663.1} {"step": 12991, "train_loss": 3.4708268642425537, "lr": 0.00027225639805627123, "tps": 14034, "wall": 60668.0} {"step": 12992, "train_loss": 3.4444355964660645, "lr": 0.00027223806486412455, "tps": 14034, "wall": 60672.9} {"step": 12993, "train_loss": 3.4728384017944336, "lr": 0.0002722197310802222, "tps": 14034, "wall": 60677.9} {"step": 12994, "train_loss": 3.4425039291381836, "lr": 0.0002722013967047719, "tps": 14034, "wall": 60682.8} {"step": 12995, "train_loss": 3.517503261566162, "lr": 0.00027218306173798143, "tps": 14034, "wall": 60687.7} {"step": 12996, "train_loss": 3.493809223175049, "lr": 0.0002721647261800584, "tps": 14034, "wall": 60692.6} {"step": 12997, "train_loss": 3.3368406295776367, "lr": 0.0002721463900312105, "tps": 14034, "wall": 60697.6} {"step": 12998, "train_loss": 3.4149928092956543, "lr": 0.0002721280532916454, "tps": 14034, "wall": 60702.5} {"step": 12999, "train_loss": 3.3628032207489014, "lr": 0.00027210971596157104, "tps": 14034, "wall": 60707.4} {"step": 13000, "train_loss": 3.491302013397217, "lr": 0.00027209137804119494, "tps": 14033, "wall": 60712.3, "val_loss_monitor": 3.4635174247601137} {"step": 13001, "train_loss": 3.4565417766571045, "lr": 0.00027207303953072484, "tps": 14022, "wall": 60765.4} {"step": 13002, "train_loss": 3.4013490676879883, "lr": 0.00027205470043036863, "tps": 14022, "wall": 60770.4} {"step": 13003, "train_loss": 3.4030489921569824, "lr": 0.00027203636074033384, "tps": 14022, "wall": 60775.3} {"step": 13004, "train_loss": 3.4155564308166504, "lr": 0.0002720180204608284, "tps": 14022, "wall": 60780.3} {"step": 13005, "train_loss": 3.393908977508545, "lr": 0.00027199967959206, "tps": 14022, "wall": 60785.2} {"step": 13006, "train_loss": 3.41365647315979, "lr": 0.00027198133813423645, "tps": 14022, "wall": 60790.1} {"step": 13007, "train_loss": 3.467794895172119, "lr": 0.00027196299608756545, "tps": 14022, "wall": 60795.1} {"step": 13008, "train_loss": 3.429621696472168, "lr": 0.0002719446534522548, "tps": 14022, "wall": 60800.0} {"step": 13009, "train_loss": 3.4434738159179688, "lr": 0.0002719263102285124, "tps": 14022, "wall": 60804.9} {"step": 13010, "train_loss": 3.401536226272583, "lr": 0.00027190796641654585, "tps": 14022, "wall": 60809.9} {"step": 13011, "train_loss": 3.278881072998047, "lr": 0.0002718896220165631, "tps": 14022, "wall": 60814.8} {"step": 13012, "train_loss": 3.3915536403656006, "lr": 0.0002718712770287719, "tps": 14022, "wall": 60819.7} {"step": 13013, "train_loss": 3.427912712097168, "lr": 0.00027185293145338003, "tps": 14022, "wall": 60824.6} {"step": 13014, "train_loss": 3.4053165912628174, "lr": 0.0002718345852905954, "tps": 14021, "wall": 60829.6} {"step": 13015, "train_loss": 3.3811144828796387, "lr": 0.0002718162385406257, "tps": 14021, "wall": 60834.5} {"step": 13016, "train_loss": 3.3622257709503174, "lr": 0.00027179789120367894, "tps": 14021, "wall": 60839.5} {"step": 13017, "train_loss": 3.451411247253418, "lr": 0.00027177954327996283, "tps": 14021, "wall": 60844.4} {"step": 13018, "train_loss": 3.432002067565918, "lr": 0.00027176119476968527, "tps": 14021, "wall": 60849.3} {"step": 13019, "train_loss": 3.4855668544769287, "lr": 0.00027174284567305405, "tps": 14021, "wall": 60854.2} {"step": 13020, "train_loss": 3.501988172531128, "lr": 0.00027172449599027716, "tps": 14021, "wall": 60859.2} {"step": 13021, "train_loss": 3.398249626159668, "lr": 0.0002717061457215623, "tps": 14021, "wall": 60864.1} {"step": 13022, "train_loss": 3.4115219116210938, "lr": 0.00027168779486711744, "tps": 14021, "wall": 60869.0} {"step": 13023, "train_loss": 3.475785493850708, "lr": 0.0002716694434271505, "tps": 14021, "wall": 60873.9} {"step": 13024, "train_loss": 3.508089542388916, "lr": 0.00027165109140186923, "tps": 14021, "wall": 60878.8} {"step": 13025, "train_loss": 3.449190855026245, "lr": 0.00027163273879148166, "tps": 14021, "wall": 60883.8} {"step": 13026, "train_loss": 3.444120407104492, "lr": 0.00027161438559619564, "tps": 14021, "wall": 60888.7} {"step": 13027, "train_loss": 3.4869801998138428, "lr": 0.000271596031816219, "tps": 14021, "wall": 60893.6} {"step": 13028, "train_loss": 3.3975179195404053, "lr": 0.00027157767745175973, "tps": 14021, "wall": 60898.6} {"step": 13029, "train_loss": 3.3770534992218018, "lr": 0.00027155932250302574, "tps": 14021, "wall": 60903.5} {"step": 13030, "train_loss": 3.4006266593933105, "lr": 0.00027154096697022505, "tps": 14021, "wall": 60908.4} {"step": 13031, "train_loss": 3.4814116954803467, "lr": 0.0002715226108535654, "tps": 14020, "wall": 60913.4} {"step": 13032, "train_loss": 3.479018211364746, "lr": 0.0002715042541532548, "tps": 14020, "wall": 60918.3} {"step": 13033, "train_loss": 3.433886766433716, "lr": 0.0002714858968695013, "tps": 14020, "wall": 60923.2} {"step": 13034, "train_loss": 3.491398572921753, "lr": 0.00027146753900251277, "tps": 14020, "wall": 60928.1} {"step": 13035, "train_loss": 3.3748831748962402, "lr": 0.0002714491805524971, "tps": 14020, "wall": 60933.1} {"step": 13036, "train_loss": 3.3350682258605957, "lr": 0.00027143082151966243, "tps": 14020, "wall": 60938.0} {"step": 13037, "train_loss": 3.4508440494537354, "lr": 0.0002714124619042166, "tps": 14020, "wall": 60942.9} {"step": 13038, "train_loss": 3.3576321601867676, "lr": 0.00027139410170636755, "tps": 14020, "wall": 60947.8} {"step": 13039, "train_loss": 3.530529022216797, "lr": 0.0002713757409263234, "tps": 14020, "wall": 60952.7} {"step": 13040, "train_loss": 3.417093276977539, "lr": 0.0002713573795642921, "tps": 14020, "wall": 60957.7} {"step": 13041, "train_loss": 3.4036998748779297, "lr": 0.0002713390176204816, "tps": 14020, "wall": 60962.6} {"step": 13042, "train_loss": 3.39142107963562, "lr": 0.00027132065509509994, "tps": 14020, "wall": 60967.5} {"step": 13043, "train_loss": 3.330087184906006, "lr": 0.0002713022919883551, "tps": 14020, "wall": 60972.5} {"step": 13044, "train_loss": 3.393371343612671, "lr": 0.00027128392830045515, "tps": 14020, "wall": 60977.4} {"step": 13045, "train_loss": 3.452418327331543, "lr": 0.000271265564031608, "tps": 14020, "wall": 60982.3} {"step": 13046, "train_loss": 3.5949318408966064, "lr": 0.00027124719918202186, "tps": 14020, "wall": 60987.2} {"step": 13047, "train_loss": 3.423001289367676, "lr": 0.0002712288337519047, "tps": 14020, "wall": 60992.1} {"step": 13048, "train_loss": 3.43990159034729, "lr": 0.00027121046774146446, "tps": 14020, "wall": 60997.1} {"step": 13049, "train_loss": 3.4235146045684814, "lr": 0.0002711921011509093, "tps": 14019, "wall": 61002.0} {"step": 13050, "train_loss": 3.4450981616973877, "lr": 0.0002711737339804472, "tps": 14019, "wall": 61006.9} {"step": 13051, "train_loss": 3.4370007514953613, "lr": 0.0002711553662302863, "tps": 14019, "wall": 61011.8} {"step": 13052, "train_loss": 3.5676496028900146, "lr": 0.0002711369979006347, "tps": 14019, "wall": 61016.8} {"step": 13053, "train_loss": 3.3421339988708496, "lr": 0.0002711186289917004, "tps": 14019, "wall": 61021.7} {"step": 13054, "train_loss": 3.384902238845825, "lr": 0.0002711002595036915, "tps": 14019, "wall": 61026.6} {"step": 13055, "train_loss": 3.3854286670684814, "lr": 0.0002710818894368161, "tps": 14019, "wall": 61031.5} {"step": 13056, "train_loss": 3.363950729370117, "lr": 0.0002710635187912823, "tps": 14019, "wall": 61036.5} {"step": 13057, "train_loss": 3.4213547706604004, "lr": 0.00027104514756729815, "tps": 14019, "wall": 61041.4} {"step": 13058, "train_loss": 3.541499137878418, "lr": 0.0002710267757650718, "tps": 14019, "wall": 61046.3} {"step": 13059, "train_loss": 3.3773744106292725, "lr": 0.0002710084033848114, "tps": 14019, "wall": 61051.2} {"step": 13060, "train_loss": 3.354112148284912, "lr": 0.0002709900304267251, "tps": 14019, "wall": 61056.2} {"step": 13061, "train_loss": 3.395185947418213, "lr": 0.0002709716568910209, "tps": 14019, "wall": 61061.1} {"step": 13062, "train_loss": 3.3812990188598633, "lr": 0.00027095328277790704, "tps": 14019, "wall": 61066.0} {"step": 13063, "train_loss": 3.4829745292663574, "lr": 0.00027093490808759163, "tps": 14019, "wall": 61071.0} {"step": 13064, "train_loss": 3.4801430702209473, "lr": 0.00027091653282028286, "tps": 14019, "wall": 61075.9} {"step": 13065, "train_loss": 3.4176931381225586, "lr": 0.0002708981569761888, "tps": 14019, "wall": 61080.8} {"step": 13066, "train_loss": 3.4075098037719727, "lr": 0.0002708797805555177, "tps": 14018, "wall": 61085.8} {"step": 13067, "train_loss": 3.3392293453216553, "lr": 0.0002708614035584777, "tps": 14018, "wall": 61090.7} {"step": 13068, "train_loss": 3.376734495162964, "lr": 0.00027084302598527697, "tps": 14018, "wall": 61095.6} {"step": 13069, "train_loss": 3.412442207336426, "lr": 0.00027082464783612363, "tps": 14018, "wall": 61100.5} {"step": 13070, "train_loss": 3.3792479038238525, "lr": 0.00027080626911122604, "tps": 14018, "wall": 61105.4} {"step": 13071, "train_loss": 3.27394437789917, "lr": 0.0002707878898107922, "tps": 14018, "wall": 61110.4} {"step": 13072, "train_loss": 3.4213707447052, "lr": 0.00027076950993503037, "tps": 14018, "wall": 61115.3} {"step": 13073, "train_loss": 3.478832483291626, "lr": 0.00027075112948414884, "tps": 14018, "wall": 61120.2} {"step": 13074, "train_loss": 3.472750663757324, "lr": 0.00027073274845835577, "tps": 14018, "wall": 61125.2} {"step": 13075, "train_loss": 3.371326446533203, "lr": 0.0002707143668578594, "tps": 14018, "wall": 61130.1} {"step": 13076, "train_loss": 3.4932103157043457, "lr": 0.0002706959846828679, "tps": 14018, "wall": 61135.0} {"step": 13077, "train_loss": 3.49006986618042, "lr": 0.0002706776019335896, "tps": 14018, "wall": 61140.0} {"step": 13078, "train_loss": 3.440788745880127, "lr": 0.0002706592186102326, "tps": 14018, "wall": 61144.9} {"step": 13079, "train_loss": 3.3629684448242188, "lr": 0.0002706408347130052, "tps": 14018, "wall": 61149.9} {"step": 13080, "train_loss": 3.3737988471984863, "lr": 0.0002706224502421158, "tps": 14018, "wall": 61154.8} {"step": 13081, "train_loss": 3.564655303955078, "lr": 0.0002706040651977725, "tps": 14018, "wall": 61159.7} {"step": 13082, "train_loss": 3.4182658195495605, "lr": 0.0002705856795801836, "tps": 14018, "wall": 61164.6} {"step": 13083, "train_loss": 3.3072495460510254, "lr": 0.0002705672933895574, "tps": 14017, "wall": 61169.6} {"step": 13084, "train_loss": 3.4390411376953125, "lr": 0.00027054890662610217, "tps": 14017, "wall": 61174.5} {"step": 13085, "train_loss": 3.488450527191162, "lr": 0.0002705305192900262, "tps": 14017, "wall": 61179.4} {"step": 13086, "train_loss": 3.435572385787964, "lr": 0.0002705121313815377, "tps": 14017, "wall": 61184.3} {"step": 13087, "train_loss": 3.4221510887145996, "lr": 0.00027049374290084513, "tps": 14017, "wall": 61189.3} {"step": 13088, "train_loss": 3.531904697418213, "lr": 0.00027047535384815667, "tps": 14017, "wall": 61194.2} {"step": 13089, "train_loss": 3.361650228500366, "lr": 0.0002704569642236807, "tps": 14017, "wall": 61199.1} {"step": 13090, "train_loss": 3.3916351795196533, "lr": 0.0002704385740276254, "tps": 14017, "wall": 61204.1} {"step": 13091, "train_loss": 3.3782920837402344, "lr": 0.00027042018326019934, "tps": 14017, "wall": 61209.0} {"step": 13092, "train_loss": 3.345659017562866, "lr": 0.0002704017919216107, "tps": 14017, "wall": 61213.9} {"step": 13093, "train_loss": 3.6060736179351807, "lr": 0.0002703834000120678, "tps": 14017, "wall": 61218.8} {"step": 13094, "train_loss": 3.3866238594055176, "lr": 0.000270365007531779, "tps": 14017, "wall": 61223.7} {"step": 13095, "train_loss": 3.548299551010132, "lr": 0.0002703466144809527, "tps": 14017, "wall": 61228.7} {"step": 13096, "train_loss": 3.49025297164917, "lr": 0.0002703282208597972, "tps": 14017, "wall": 61233.6} {"step": 13097, "train_loss": 3.3794984817504883, "lr": 0.00027030982666852095, "tps": 14017, "wall": 61238.5} {"step": 13098, "train_loss": 3.395231246948242, "lr": 0.0002702914319073322, "tps": 14017, "wall": 61243.4} {"step": 13099, "train_loss": 3.4098782539367676, "lr": 0.0002702730365764394, "tps": 14017, "wall": 61248.4} {"step": 13100, "train_loss": 3.349681854248047, "lr": 0.00027025464067605094, "tps": 14016, "wall": 61253.3} {"step": 13101, "train_loss": 3.511050224304199, "lr": 0.0002702362442063752, "tps": 14016, "wall": 61258.3} {"step": 13102, "train_loss": 3.3498587608337402, "lr": 0.0002702178471676205, "tps": 14016, "wall": 61263.2} {"step": 13103, "train_loss": 3.3557019233703613, "lr": 0.0002701994495599954, "tps": 14016, "wall": 61268.1} {"step": 13104, "train_loss": 3.3805360794067383, "lr": 0.0002701810513837082, "tps": 14016, "wall": 61273.0} {"step": 13105, "train_loss": 3.5058813095092773, "lr": 0.00027016265263896734, "tps": 14016, "wall": 61278.0} {"step": 13106, "train_loss": 3.3447482585906982, "lr": 0.0002701442533259812, "tps": 14016, "wall": 61282.9} {"step": 13107, "train_loss": 3.4166884422302246, "lr": 0.0002701258534449582, "tps": 14016, "wall": 61287.8} {"step": 13108, "train_loss": 3.4396417140960693, "lr": 0.0002701074529961069, "tps": 14016, "wall": 61292.7} {"step": 13109, "train_loss": 3.33610463142395, "lr": 0.00027008905197963565, "tps": 14016, "wall": 61297.7} {"step": 13110, "train_loss": 3.5095713138580322, "lr": 0.0002700706503957529, "tps": 14016, "wall": 61302.6} {"step": 13111, "train_loss": 3.415358781814575, "lr": 0.00027005224824466713, "tps": 14016, "wall": 61307.5} {"step": 13112, "train_loss": 3.4484643936157227, "lr": 0.0002700338455265868, "tps": 14016, "wall": 61312.4} {"step": 13113, "train_loss": 3.433542251586914, "lr": 0.0002700154422417203, "tps": 14016, "wall": 61317.5} {"step": 13114, "train_loss": 3.495767116546631, "lr": 0.00026999703839027616, "tps": 14016, "wall": 61322.3} {"step": 13115, "train_loss": 3.4574227333068848, "lr": 0.00026997863397246294, "tps": 14016, "wall": 61327.3} {"step": 13116, "train_loss": 3.416146993637085, "lr": 0.000269960228988489, "tps": 14016, "wall": 61332.2} {"step": 13117, "train_loss": 3.3472559452056885, "lr": 0.0002699418234385629, "tps": 14016, "wall": 61337.1} {"step": 13118, "train_loss": 3.386697769165039, "lr": 0.00026992341732289313, "tps": 14015, "wall": 61342.0} {"step": 13119, "train_loss": 3.485812187194824, "lr": 0.0002699050106416882, "tps": 14015, "wall": 61347.0} {"step": 13120, "train_loss": 3.431717872619629, "lr": 0.00026988660339515654, "tps": 14015, "wall": 61351.9} {"step": 13121, "train_loss": 3.3946919441223145, "lr": 0.0002698681955835068, "tps": 14015, "wall": 61356.8} {"step": 13122, "train_loss": 3.465427875518799, "lr": 0.0002698497872069474, "tps": 14015, "wall": 61361.7} {"step": 13123, "train_loss": 3.3471879959106445, "lr": 0.00026983137826568695, "tps": 14015, "wall": 61366.6} {"step": 13124, "train_loss": 3.382862091064453, "lr": 0.0002698129687599339, "tps": 14015, "wall": 61371.6} {"step": 13125, "train_loss": 3.4765281677246094, "lr": 0.0002697945586898969, "tps": 14015, "wall": 61376.5} {"step": 13126, "train_loss": 3.446145534515381, "lr": 0.00026977614805578443, "tps": 14015, "wall": 61381.5} {"step": 13127, "train_loss": 3.442786455154419, "lr": 0.00026975773685780505, "tps": 14015, "wall": 61386.4} {"step": 13128, "train_loss": 3.3932032585144043, "lr": 0.0002697393250961674, "tps": 14015, "wall": 61391.3} {"step": 13129, "train_loss": 3.412759780883789, "lr": 0.00026972091277107995, "tps": 14015, "wall": 61396.2} {"step": 13130, "train_loss": 3.447803020477295, "lr": 0.0002697024998827512, "tps": 14015, "wall": 61401.1} {"step": 13131, "train_loss": 3.4258790016174316, "lr": 0.00026968408643138995, "tps": 14015, "wall": 61406.1} {"step": 13132, "train_loss": 3.387924909591675, "lr": 0.0002696656724172047, "tps": 14015, "wall": 61411.0} {"step": 13133, "train_loss": 3.4818668365478516, "lr": 0.000269647257840404, "tps": 14015, "wall": 61416.0} {"step": 13134, "train_loss": 3.323519706726074, "lr": 0.0002696288427011964, "tps": 14015, "wall": 61420.9} {"step": 13135, "train_loss": 3.5355823040008545, "lr": 0.0002696104269997907, "tps": 14014, "wall": 61425.8} {"step": 13136, "train_loss": 3.419496536254883, "lr": 0.00026959201073639536, "tps": 14014, "wall": 61430.7} {"step": 13137, "train_loss": 3.3287081718444824, "lr": 0.000269573593911219, "tps": 14014, "wall": 61435.7} {"step": 13138, "train_loss": 3.3884730339050293, "lr": 0.0002695551765244704, "tps": 14014, "wall": 61440.6} {"step": 13139, "train_loss": 3.465036392211914, "lr": 0.00026953675857635794, "tps": 14014, "wall": 61445.6} {"step": 13140, "train_loss": 3.3332223892211914, "lr": 0.00026951834006709043, "tps": 14014, "wall": 61450.5} {"step": 13141, "train_loss": 3.353781223297119, "lr": 0.00026949992099687656, "tps": 14014, "wall": 61455.5} {"step": 13142, "train_loss": 3.376681327819824, "lr": 0.0002694815013659248, "tps": 14014, "wall": 61460.4} {"step": 13143, "train_loss": 3.4083590507507324, "lr": 0.00026946308117444396, "tps": 14014, "wall": 61465.3} {"step": 13144, "train_loss": 3.5003182888031006, "lr": 0.0002694446604226427, "tps": 14014, "wall": 61470.2} {"step": 13145, "train_loss": 3.426966667175293, "lr": 0.00026942623911072966, "tps": 14014, "wall": 61475.1} {"step": 13146, "train_loss": 3.3080828189849854, "lr": 0.0002694078172389134, "tps": 14014, "wall": 61480.1} {"step": 13147, "train_loss": 3.432560920715332, "lr": 0.0002693893948074028, "tps": 14014, "wall": 61485.0} {"step": 13148, "train_loss": 3.484220504760742, "lr": 0.00026937097181640643, "tps": 14014, "wall": 61489.9} {"step": 13149, "train_loss": 3.3908467292785645, "lr": 0.00026935254826613306, "tps": 14014, "wall": 61494.8} {"step": 13150, "train_loss": 3.475634813308716, "lr": 0.0002693341241567914, "tps": 14014, "wall": 61499.8} {"step": 13151, "train_loss": 3.329141139984131, "lr": 0.00026931569948859, "tps": 14014, "wall": 61504.7} {"step": 13152, "train_loss": 3.5166029930114746, "lr": 0.00026929727426173777, "tps": 14013, "wall": 61509.6} {"step": 13153, "train_loss": 3.5275051593780518, "lr": 0.0002692788484764433, "tps": 14013, "wall": 61514.6} {"step": 13154, "train_loss": 3.3998639583587646, "lr": 0.0002692604221329154, "tps": 14013, "wall": 61519.5} {"step": 13155, "train_loss": 3.3631606101989746, "lr": 0.00026924199523136274, "tps": 14013, "wall": 61524.4} {"step": 13156, "train_loss": 3.4779391288757324, "lr": 0.00026922356777199415, "tps": 14013, "wall": 61529.4} {"step": 13157, "train_loss": 3.4045369625091553, "lr": 0.0002692051397550182, "tps": 14013, "wall": 61534.3} {"step": 13158, "train_loss": 3.415390729904175, "lr": 0.00026918671118064387, "tps": 14013, "wall": 61539.2} {"step": 13159, "train_loss": 3.4953274726867676, "lr": 0.0002691682820490798, "tps": 14013, "wall": 61544.1} {"step": 13160, "train_loss": 3.474102020263672, "lr": 0.0002691498523605348, "tps": 14013, "wall": 61549.1} {"step": 13161, "train_loss": 3.4504027366638184, "lr": 0.00026913142211521754, "tps": 14013, "wall": 61554.0} {"step": 13162, "train_loss": 3.451265335083008, "lr": 0.000269112991313337, "tps": 14013, "wall": 61558.9} {"step": 13163, "train_loss": 3.4572486877441406, "lr": 0.00026909455995510165, "tps": 14013, "wall": 61563.9} {"step": 13164, "train_loss": 3.4752442836761475, "lr": 0.0002690761280407206, "tps": 14013, "wall": 61568.8} {"step": 13165, "train_loss": 3.441002130508423, "lr": 0.0002690576955704025, "tps": 14013, "wall": 61573.7} {"step": 13166, "train_loss": 3.3627541065216064, "lr": 0.0002690392625443561, "tps": 14013, "wall": 61578.6} {"step": 13167, "train_loss": 3.388974189758301, "lr": 0.0002690208289627903, "tps": 14013, "wall": 61583.5} {"step": 13168, "train_loss": 3.460747480392456, "lr": 0.000269002394825914, "tps": 14013, "wall": 61588.4} {"step": 13169, "train_loss": 3.4420595169067383, "lr": 0.0002689839601339358, "tps": 14013, "wall": 61593.4} {"step": 13170, "train_loss": 3.484767436981201, "lr": 0.00026896552488706477, "tps": 14012, "wall": 61598.3} {"step": 13171, "train_loss": 3.4658617973327637, "lr": 0.00026894708908550954, "tps": 14012, "wall": 61603.2} {"step": 13172, "train_loss": 3.4103593826293945, "lr": 0.000268928652729479, "tps": 14012, "wall": 61608.2} {"step": 13173, "train_loss": 3.4109625816345215, "lr": 0.0002689102158191821, "tps": 14012, "wall": 61613.1} {"step": 13174, "train_loss": 3.4245052337646484, "lr": 0.00026889177835482764, "tps": 14012, "wall": 61618.1} {"step": 13175, "train_loss": 3.5457377433776855, "lr": 0.0002688733403366245, "tps": 14012, "wall": 61623.0} {"step": 13176, "train_loss": 3.4866864681243896, "lr": 0.0002688549017647814, "tps": 14012, "wall": 61627.9} {"step": 13177, "train_loss": 3.42897367477417, "lr": 0.0002688364626395074, "tps": 14012, "wall": 61632.8} {"step": 13178, "train_loss": 3.405594825744629, "lr": 0.0002688180229610113, "tps": 14012, "wall": 61637.7} {"step": 13179, "train_loss": 3.3666181564331055, "lr": 0.00026879958272950203, "tps": 14012, "wall": 61642.7} {"step": 13180, "train_loss": 3.424903392791748, "lr": 0.0002687811419451884, "tps": 14012, "wall": 61647.6} {"step": 13181, "train_loss": 3.2689595222473145, "lr": 0.00026876270060827937, "tps": 14012, "wall": 61652.5} {"step": 13182, "train_loss": 3.5261926651000977, "lr": 0.00026874425871898386, "tps": 14012, "wall": 61657.5} {"step": 13183, "train_loss": 3.302725315093994, "lr": 0.0002687258162775107, "tps": 14012, "wall": 61662.4} {"step": 13184, "train_loss": 3.3865504264831543, "lr": 0.00026870737328406883, "tps": 14012, "wall": 61667.3} {"step": 13185, "train_loss": 3.368067741394043, "lr": 0.0002686889297388672, "tps": 14012, "wall": 61672.2} {"step": 13186, "train_loss": 3.48113751411438, "lr": 0.00026867048564211483, "tps": 14012, "wall": 61677.2} {"step": 13187, "train_loss": 3.283801794052124, "lr": 0.00026865204099402054, "tps": 14011, "wall": 61682.1} {"step": 13188, "train_loss": 3.404625654220581, "lr": 0.00026863359579479333, "tps": 14011, "wall": 61687.0} {"step": 13189, "train_loss": 3.404855489730835, "lr": 0.000268615150044642, "tps": 14011, "wall": 61691.9} {"step": 13190, "train_loss": 3.4123504161834717, "lr": 0.0002685967037437758, "tps": 14011, "wall": 61696.8} {"step": 13191, "train_loss": 3.395556926727295, "lr": 0.00026857825689240335, "tps": 14011, "wall": 61701.8} {"step": 13192, "train_loss": 3.4097843170166016, "lr": 0.0002685598094907338, "tps": 14011, "wall": 61706.7} {"step": 13193, "train_loss": 3.3567395210266113, "lr": 0.0002685413615389762, "tps": 14011, "wall": 61711.6} {"step": 13194, "train_loss": 3.4274253845214844, "lr": 0.0002685229130373393, "tps": 14011, "wall": 61716.5} {"step": 13195, "train_loss": 3.516861915588379, "lr": 0.00026850446398603224, "tps": 14011, "wall": 61721.5} {"step": 13196, "train_loss": 3.3620071411132812, "lr": 0.000268486014385264, "tps": 14011, "wall": 61726.4} {"step": 13197, "train_loss": 3.4469425678253174, "lr": 0.00026846756423524364, "tps": 14011, "wall": 61731.3} {"step": 13198, "train_loss": 3.327268600463867, "lr": 0.00026844911353618005, "tps": 14011, "wall": 61736.2} {"step": 13199, "train_loss": 3.379981756210327, "lr": 0.0002684306622882822, "tps": 14011, "wall": 61741.2} {"step": 13200, "train_loss": 3.378046751022339, "lr": 0.0002684122104917593, "tps": 14011, "wall": 61746.1} {"step": 13201, "train_loss": 3.385430335998535, "lr": 0.00026839375814682024, "tps": 14011, "wall": 61751.1} {"step": 13202, "train_loss": 3.4282805919647217, "lr": 0.00026837530525367396, "tps": 14011, "wall": 61756.0} {"step": 13203, "train_loss": 3.362393856048584, "lr": 0.0002683568518125298, "tps": 14011, "wall": 61760.9} {"step": 13204, "train_loss": 3.563363790512085, "lr": 0.00026833839782359646, "tps": 14011, "wall": 61765.8} {"step": 13205, "train_loss": 3.4385337829589844, "lr": 0.0002683199432870832, "tps": 14010, "wall": 61770.8} {"step": 13206, "train_loss": 3.4988186359405518, "lr": 0.00026830148820319893, "tps": 14010, "wall": 61775.7} {"step": 13207, "train_loss": 3.4421629905700684, "lr": 0.00026828303257215284, "tps": 14010, "wall": 61780.6} {"step": 13208, "train_loss": 3.406607151031494, "lr": 0.00026826457639415397, "tps": 14010, "wall": 61785.6} {"step": 13209, "train_loss": 3.5065417289733887, "lr": 0.0002682461196694113, "tps": 14010, "wall": 61790.5} {"step": 13210, "train_loss": 3.485809803009033, "lr": 0.00026822766239813407, "tps": 14010, "wall": 61795.4} {"step": 13211, "train_loss": 3.3887362480163574, "lr": 0.0002682092045805312, "tps": 14010, "wall": 61800.4} {"step": 13212, "train_loss": 3.3599960803985596, "lr": 0.0002681907462168119, "tps": 14010, "wall": 61805.3} {"step": 13213, "train_loss": 3.3709397315979004, "lr": 0.00026817228730718516, "tps": 14010, "wall": 61810.2} {"step": 13214, "train_loss": 3.422488212585449, "lr": 0.0002681538278518602, "tps": 14010, "wall": 61815.2} {"step": 13215, "train_loss": 3.3700950145721436, "lr": 0.00026813536785104603, "tps": 14010, "wall": 61820.1} {"step": 13216, "train_loss": 3.3474278450012207, "lr": 0.00026811690730495176, "tps": 14010, "wall": 61825.0} {"step": 13217, "train_loss": 3.4394588470458984, "lr": 0.00026809844621378666, "tps": 14010, "wall": 61830.0} {"step": 13218, "train_loss": 3.4357829093933105, "lr": 0.00026807998457775977, "tps": 14010, "wall": 61834.9} {"step": 13219, "train_loss": 3.4603161811828613, "lr": 0.0002680615223970802, "tps": 14010, "wall": 61839.8} {"step": 13220, "train_loss": 3.333479404449463, "lr": 0.000268043059671957, "tps": 14010, "wall": 61844.7} {"step": 13221, "train_loss": 3.364119291305542, "lr": 0.0002680245964025995, "tps": 14010, "wall": 61849.7} {"step": 13222, "train_loss": 3.462954044342041, "lr": 0.0002680061325892168, "tps": 14009, "wall": 61854.6} {"step": 13223, "train_loss": 3.388195037841797, "lr": 0.00026798766823201797, "tps": 14009, "wall": 61859.6} {"step": 13224, "train_loss": 3.4073376655578613, "lr": 0.00026796920333121234, "tps": 14009, "wall": 61864.5} {"step": 13225, "train_loss": 3.4055418968200684, "lr": 0.00026795073788700885, "tps": 14009, "wall": 61869.4} {"step": 13226, "train_loss": 3.410456895828247, "lr": 0.00026793227189961683, "tps": 14009, "wall": 61874.3} {"step": 13227, "train_loss": 3.518824815750122, "lr": 0.0002679138053692455, "tps": 14009, "wall": 61879.2} {"step": 13228, "train_loss": 3.5237321853637695, "lr": 0.000267895338296104, "tps": 14009, "wall": 61884.1} {"step": 13229, "train_loss": 3.5041933059692383, "lr": 0.00026787687068040143, "tps": 14009, "wall": 61889.1} {"step": 13230, "train_loss": 3.3908004760742188, "lr": 0.00026785840252234716, "tps": 14009, "wall": 61894.0} {"step": 13231, "train_loss": 3.4857263565063477, "lr": 0.0002678399338221503, "tps": 14009, "wall": 61898.9} {"step": 13232, "train_loss": 3.5492687225341797, "lr": 0.0002678214645800201, "tps": 14009, "wall": 61903.8} {"step": 13233, "train_loss": 3.4862327575683594, "lr": 0.00026780299479616567, "tps": 14009, "wall": 61908.7} {"step": 13234, "train_loss": 3.4940171241760254, "lr": 0.0002677845244707964, "tps": 14009, "wall": 61913.7} {"step": 13235, "train_loss": 3.3296332359313965, "lr": 0.0002677660536041215, "tps": 14009, "wall": 61918.6} {"step": 13236, "train_loss": 3.3858346939086914, "lr": 0.0002677475821963501, "tps": 14009, "wall": 61923.6} {"step": 13237, "train_loss": 3.3721282482147217, "lr": 0.00026772911024769153, "tps": 14009, "wall": 61928.5} {"step": 13238, "train_loss": 3.399484872817993, "lr": 0.00026771063775835497, "tps": 14009, "wall": 61933.4} {"step": 13239, "train_loss": 3.3865554332733154, "lr": 0.00026769216472854974, "tps": 14009, "wall": 61938.3} {"step": 13240, "train_loss": 3.402238130569458, "lr": 0.0002676736911584851, "tps": 14008, "wall": 61943.2} {"step": 13241, "train_loss": 3.4835591316223145, "lr": 0.0002676552170483703, "tps": 14008, "wall": 61948.2} {"step": 13242, "train_loss": 3.4348442554473877, "lr": 0.00026763674239841463, "tps": 14008, "wall": 61953.1} {"step": 13243, "train_loss": 3.4243829250335693, "lr": 0.00026761826720882734, "tps": 14008, "wall": 61958.0} {"step": 13244, "train_loss": 3.362264633178711, "lr": 0.0002675997914798178, "tps": 14008, "wall": 61962.9} {"step": 13245, "train_loss": 3.511929512023926, "lr": 0.00026758131521159524, "tps": 14008, "wall": 61967.9} {"step": 13246, "train_loss": 3.3484396934509277, "lr": 0.00026756283840436893, "tps": 14008, "wall": 61972.8} {"step": 13247, "train_loss": 3.5234487056732178, "lr": 0.0002675443610583482, "tps": 14008, "wall": 61977.8} {"step": 13248, "train_loss": 3.5017924308776855, "lr": 0.00026752588317374243, "tps": 14008, "wall": 61982.7} {"step": 13249, "train_loss": 3.4646148681640625, "lr": 0.0002675074047507608, "tps": 14008, "wall": 61987.6} {"step": 13250, "train_loss": 3.4892966747283936, "lr": 0.0002674889257896128, "tps": 14008, "wall": 61992.6} {"step": 13251, "train_loss": 3.3458175659179688, "lr": 0.0002674704462905077, "tps": 14008, "wall": 61997.5} {"step": 13252, "train_loss": 3.432044744491577, "lr": 0.00026745196625365476, "tps": 14008, "wall": 62002.4} {"step": 13253, "train_loss": 3.470557928085327, "lr": 0.0002674334856792634, "tps": 14008, "wall": 62007.3} {"step": 13254, "train_loss": 3.3736538887023926, "lr": 0.0002674150045675429, "tps": 14008, "wall": 62012.3} {"step": 13255, "train_loss": 3.3174259662628174, "lr": 0.00026739652291870274, "tps": 14008, "wall": 62017.2} {"step": 13256, "train_loss": 3.4822030067443848, "lr": 0.00026737804073295214, "tps": 14008, "wall": 62022.1} {"step": 13257, "train_loss": 3.359997510910034, "lr": 0.0002673595580105006, "tps": 14008, "wall": 62027.0} {"step": 13258, "train_loss": 3.3818602561950684, "lr": 0.00026734107475155736, "tps": 14007, "wall": 62032.0} {"step": 13259, "train_loss": 3.4030165672302246, "lr": 0.00026732259095633184, "tps": 14007, "wall": 62036.9} {"step": 13260, "train_loss": 3.423459768295288, "lr": 0.0002673041066250335, "tps": 14007, "wall": 62041.8} {"step": 13261, "train_loss": 3.4319777488708496, "lr": 0.0002672856217578717, "tps": 14007, "wall": 62046.8} {"step": 13262, "train_loss": 3.3637125492095947, "lr": 0.0002672671363550558, "tps": 14007, "wall": 62051.7} {"step": 13263, "train_loss": 3.508805990219116, "lr": 0.0002672486504167952, "tps": 14007, "wall": 62056.6} {"step": 13264, "train_loss": 3.410224676132202, "lr": 0.00026723016394329945, "tps": 14007, "wall": 62061.5} {"step": 13265, "train_loss": 3.3041446208953857, "lr": 0.0002672116769347777, "tps": 14007, "wall": 62066.5} {"step": 13266, "train_loss": 3.3439648151397705, "lr": 0.0002671931893914396, "tps": 14007, "wall": 62071.4} {"step": 13267, "train_loss": 3.3051087856292725, "lr": 0.00026717470131349443, "tps": 14007, "wall": 62076.3} {"step": 13268, "train_loss": 3.500352382659912, "lr": 0.0002671562127011517, "tps": 14007, "wall": 62081.2} {"step": 13269, "train_loss": 3.4404971599578857, "lr": 0.0002671377235546209, "tps": 14007, "wall": 62086.1} {"step": 13270, "train_loss": 3.389517307281494, "lr": 0.00026711923387411134, "tps": 14007, "wall": 62091.1} {"step": 13271, "train_loss": 3.3974506855010986, "lr": 0.0002671007436598326, "tps": 14007, "wall": 62096.0} {"step": 13272, "train_loss": 3.4159348011016846, "lr": 0.0002670822529119941, "tps": 14007, "wall": 62101.0} {"step": 13273, "train_loss": 3.348937511444092, "lr": 0.00026706376163080535, "tps": 14007, "wall": 62105.9} {"step": 13274, "train_loss": 3.3795433044433594, "lr": 0.00026704526981647563, "tps": 14007, "wall": 62110.8} {"step": 13275, "train_loss": 3.381282091140747, "lr": 0.0002670267774692146, "tps": 14007, "wall": 62115.7} {"step": 13276, "train_loss": 3.4869580268859863, "lr": 0.0002670082845892317, "tps": 14006, "wall": 62120.7} {"step": 13277, "train_loss": 3.4415125846862793, "lr": 0.0002669897911767364, "tps": 14006, "wall": 62125.6} {"step": 13278, "train_loss": 3.3767333030700684, "lr": 0.00026697129723193824, "tps": 14006, "wall": 62130.5} {"step": 13279, "train_loss": 3.327399492263794, "lr": 0.00026695280275504667, "tps": 14006, "wall": 62135.4} {"step": 13280, "train_loss": 3.3969407081604004, "lr": 0.00026693430774627115, "tps": 14006, "wall": 62140.3} {"step": 13281, "train_loss": 3.368720054626465, "lr": 0.0002669158122058213, "tps": 14006, "wall": 62145.3} {"step": 13282, "train_loss": 3.3665218353271484, "lr": 0.0002668973161339066, "tps": 14006, "wall": 62150.2} {"step": 13283, "train_loss": 3.3046247959136963, "lr": 0.0002668788195307366, "tps": 14006, "wall": 62155.1} {"step": 13284, "train_loss": 3.557464361190796, "lr": 0.0002668603223965207, "tps": 14006, "wall": 62160.1} {"step": 13285, "train_loss": 3.5381152629852295, "lr": 0.00026684182473146864, "tps": 14006, "wall": 62165.0} {"step": 13286, "train_loss": 3.349015235900879, "lr": 0.00026682332653578974, "tps": 14006, "wall": 62169.9} {"step": 13287, "train_loss": 3.4313783645629883, "lr": 0.00026680482780969367, "tps": 14006, "wall": 62174.9} {"step": 13288, "train_loss": 3.248269557952881, "lr": 0.0002667863285533901, "tps": 14006, "wall": 62179.8} {"step": 13289, "train_loss": 3.4831628799438477, "lr": 0.00026676782876708843, "tps": 14006, "wall": 62184.7} {"step": 13290, "train_loss": 3.42594051361084, "lr": 0.00026674932845099816, "tps": 14006, "wall": 62189.6} {"step": 13291, "train_loss": 3.321658134460449, "lr": 0.00026673082760532906, "tps": 14006, "wall": 62194.5} {"step": 13292, "train_loss": 3.4539356231689453, "lr": 0.0002667123262302906, "tps": 14006, "wall": 62199.5} {"step": 13293, "train_loss": 3.4272947311401367, "lr": 0.00026669382432609233, "tps": 14006, "wall": 62204.4} {"step": 13294, "train_loss": 3.3043243885040283, "lr": 0.00026667532189294396, "tps": 14005, "wall": 62209.3} {"step": 13295, "train_loss": 3.4421236515045166, "lr": 0.000266656818931055, "tps": 14005, "wall": 62214.2} {"step": 13296, "train_loss": 3.490683078765869, "lr": 0.00026663831544063507, "tps": 14005, "wall": 62219.2} {"step": 13297, "train_loss": 3.436521053314209, "lr": 0.0002666198114218938, "tps": 14005, "wall": 62224.1} {"step": 13298, "train_loss": 3.409463405609131, "lr": 0.0002666013068750408, "tps": 14005, "wall": 62229.0} {"step": 13299, "train_loss": 3.4245736598968506, "lr": 0.00026658280180028563, "tps": 14005, "wall": 62233.9} {"step": 13300, "train_loss": 3.3882651329040527, "lr": 0.00026656429619783796, "tps": 14005, "wall": 62238.9} {"step": 13301, "train_loss": 3.3326072692871094, "lr": 0.0002665457900679074, "tps": 14005, "wall": 62243.8} {"step": 13302, "train_loss": 3.37249493598938, "lr": 0.00026652728341070367, "tps": 14005, "wall": 62248.7} {"step": 13303, "train_loss": 3.449673652648926, "lr": 0.00026650877622643636, "tps": 14005, "wall": 62253.6} {"step": 13304, "train_loss": 3.3555197715759277, "lr": 0.00026649026851531505, "tps": 14005, "wall": 62258.6} {"step": 13305, "train_loss": 3.481166362762451, "lr": 0.0002664717602775495, "tps": 14005, "wall": 62263.5} {"step": 13306, "train_loss": 3.453150510787964, "lr": 0.00026645325151334936, "tps": 14005, "wall": 62268.4} {"step": 13307, "train_loss": 3.417724609375, "lr": 0.00026643474222292425, "tps": 14005, "wall": 62273.3} {"step": 13308, "train_loss": 3.3116114139556885, "lr": 0.0002664162324064838, "tps": 14005, "wall": 62278.3} {"step": 13309, "train_loss": 3.486208200454712, "lr": 0.00026639772206423786, "tps": 14005, "wall": 62283.2} {"step": 13310, "train_loss": 3.3572001457214355, "lr": 0.00026637921119639606, "tps": 14005, "wall": 62288.2} {"step": 13311, "train_loss": 3.2866506576538086, "lr": 0.00026636069980316793, "tps": 14005, "wall": 62293.1} {"step": 13312, "train_loss": 3.5300192832946777, "lr": 0.00026634218788476334, "tps": 14004, "wall": 62298.0} {"step": 13313, "train_loss": 3.409496307373047, "lr": 0.0002663236754413919, "tps": 14004, "wall": 62303.0} {"step": 13314, "train_loss": 3.479668140411377, "lr": 0.00026630516247326335, "tps": 14004, "wall": 62307.9} {"step": 13315, "train_loss": 3.4113330841064453, "lr": 0.00026628664898058755, "tps": 14004, "wall": 62312.8} {"step": 13316, "train_loss": 3.500948667526245, "lr": 0.0002662681349635739, "tps": 14004, "wall": 62317.7} {"step": 13317, "train_loss": 3.4015722274780273, "lr": 0.00026624962042243243, "tps": 14004, "wall": 62322.7} {"step": 13318, "train_loss": 3.5584468841552734, "lr": 0.0002662311053573727, "tps": 14004, "wall": 62327.6} {"step": 13319, "train_loss": 3.4791626930236816, "lr": 0.00026621258976860455, "tps": 14004, "wall": 62332.5} {"step": 13320, "train_loss": 3.4467453956604004, "lr": 0.0002661940736563377, "tps": 14004, "wall": 62337.5} {"step": 13321, "train_loss": 3.427027702331543, "lr": 0.00026617555702078177, "tps": 14004, "wall": 62342.4} {"step": 13322, "train_loss": 3.4486706256866455, "lr": 0.0002661570398621468, "tps": 14004, "wall": 62347.4} {"step": 13323, "train_loss": 3.3300559520721436, "lr": 0.0002661385221806422, "tps": 14004, "wall": 62352.3} {"step": 13324, "train_loss": 3.4381954669952393, "lr": 0.00026612000397647806, "tps": 14004, "wall": 62357.2} {"step": 13325, "train_loss": 3.4245667457580566, "lr": 0.000266101485249864, "tps": 14004, "wall": 62362.1} {"step": 13326, "train_loss": 3.432102680206299, "lr": 0.00026608296600100977, "tps": 14004, "wall": 62367.0} {"step": 13327, "train_loss": 3.5301525592803955, "lr": 0.00026606444623012527, "tps": 14004, "wall": 62371.9} {"step": 13328, "train_loss": 3.5245361328125, "lr": 0.0002660459259374202, "tps": 14004, "wall": 62376.9} {"step": 13329, "train_loss": 3.4047226905822754, "lr": 0.0002660274051231044, "tps": 14004, "wall": 62381.8} {"step": 13330, "train_loss": 3.413588762283325, "lr": 0.00026600888378738765, "tps": 14003, "wall": 62386.7} {"step": 13331, "train_loss": 3.4223830699920654, "lr": 0.00026599036193047975, "tps": 14003, "wall": 62391.6} {"step": 13332, "train_loss": 3.4625134468078613, "lr": 0.0002659718395525906, "tps": 14003, "wall": 62396.5} {"step": 13333, "train_loss": 3.468515396118164, "lr": 0.00026595331665392994, "tps": 14003, "wall": 62401.5} {"step": 13334, "train_loss": 3.560304641723633, "lr": 0.0002659347932347076, "tps": 14003, "wall": 62406.4} {"step": 13335, "train_loss": 3.51882266998291, "lr": 0.00026591626929513344, "tps": 14003, "wall": 62411.3} {"step": 13336, "train_loss": 3.5104329586029053, "lr": 0.0002658977448354174, "tps": 14003, "wall": 62416.3} {"step": 13337, "train_loss": 3.3725390434265137, "lr": 0.00026587921985576907, "tps": 14003, "wall": 62421.2} {"step": 13338, "train_loss": 3.3856091499328613, "lr": 0.00026586069435639853, "tps": 14003, "wall": 62426.2} {"step": 13339, "train_loss": 3.29746675491333, "lr": 0.0002658421683375156, "tps": 14003, "wall": 62431.1} {"step": 13340, "train_loss": 3.4234395027160645, "lr": 0.00026582364179933004, "tps": 14003, "wall": 62436.0} {"step": 13341, "train_loss": 3.4310855865478516, "lr": 0.00026580511474205183, "tps": 14003, "wall": 62441.0} {"step": 13342, "train_loss": 3.4815540313720703, "lr": 0.00026578658716589073, "tps": 14003, "wall": 62445.9} {"step": 13343, "train_loss": 3.4227242469787598, "lr": 0.0002657680590710568, "tps": 14003, "wall": 62450.8} {"step": 13344, "train_loss": 3.443309783935547, "lr": 0.0002657495304577597, "tps": 14003, "wall": 62455.7} {"step": 13345, "train_loss": 3.396358013153076, "lr": 0.0002657310013262095, "tps": 14003, "wall": 62460.7} {"step": 13346, "train_loss": 3.3842785358428955, "lr": 0.00026571247167661615, "tps": 14003, "wall": 62465.6} {"step": 13347, "train_loss": 3.462080717086792, "lr": 0.0002656939415091893, "tps": 14002, "wall": 62470.5} {"step": 13348, "train_loss": 3.3566644191741943, "lr": 0.000265675410824139, "tps": 14002, "wall": 62475.4} {"step": 13349, "train_loss": 3.4018592834472656, "lr": 0.0002656568796216753, "tps": 14002, "wall": 62480.4} {"step": 13350, "train_loss": 3.4274942874908447, "lr": 0.00026563834790200794, "tps": 14002, "wall": 62485.3} {"step": 13351, "train_loss": 3.427147388458252, "lr": 0.0002656198156653468, "tps": 14002, "wall": 62490.2} {"step": 13352, "train_loss": 3.3957302570343018, "lr": 0.0002656012829119021, "tps": 14002, "wall": 62495.1} {"step": 13353, "train_loss": 3.456862211227417, "lr": 0.0002655827496418835, "tps": 14002, "wall": 62500.0} {"step": 13354, "train_loss": 3.4237074851989746, "lr": 0.0002655642158555011, "tps": 14002, "wall": 62505.0} {"step": 13355, "train_loss": 3.504648208618164, "lr": 0.00026554568155296473, "tps": 14002, "wall": 62509.9} {"step": 13356, "train_loss": 3.4219915866851807, "lr": 0.00026552714673448453, "tps": 14002, "wall": 62514.8} {"step": 13357, "train_loss": 3.3483145236968994, "lr": 0.0002655086114002702, "tps": 14002, "wall": 62519.8} {"step": 13358, "train_loss": 3.4790549278259277, "lr": 0.000265490075550532, "tps": 14002, "wall": 62524.7} {"step": 13359, "train_loss": 3.434915542602539, "lr": 0.0002654715391854796, "tps": 14002, "wall": 62529.6} {"step": 13360, "train_loss": 3.4274215698242188, "lr": 0.0002654530023053233, "tps": 14002, "wall": 62534.5} {"step": 13361, "train_loss": 3.330212116241455, "lr": 0.00026543446491027287, "tps": 14002, "wall": 62539.4} {"step": 13362, "train_loss": 3.3887903690338135, "lr": 0.00026541592700053836, "tps": 14002, "wall": 62544.4} {"step": 13363, "train_loss": 3.3197999000549316, "lr": 0.00026539738857632976, "tps": 14002, "wall": 62549.3} {"step": 13364, "train_loss": 3.3790931701660156, "lr": 0.0002653788496378571, "tps": 14002, "wall": 62554.2} {"step": 13365, "train_loss": 3.456540107727051, "lr": 0.00026536031018533035, "tps": 14002, "wall": 62559.1} {"step": 13366, "train_loss": 3.354053020477295, "lr": 0.00026534177021895957, "tps": 14001, "wall": 62564.1} {"step": 13367, "train_loss": 3.283663749694824, "lr": 0.0002653232297389548, "tps": 14001, "wall": 62569.0} {"step": 13368, "train_loss": 3.374325752258301, "lr": 0.000265304688745526, "tps": 14001, "wall": 62573.9} {"step": 13369, "train_loss": 3.466978073120117, "lr": 0.00026528614723888324, "tps": 14001, "wall": 62578.9} {"step": 13370, "train_loss": 3.4000089168548584, "lr": 0.00026526760521923656, "tps": 14001, "wall": 62583.8} {"step": 13371, "train_loss": 3.3632731437683105, "lr": 0.000265249062686796, "tps": 14001, "wall": 62588.7} {"step": 13372, "train_loss": 3.3887829780578613, "lr": 0.00026523051964177154, "tps": 14001, "wall": 62593.7} {"step": 13373, "train_loss": 3.47092342376709, "lr": 0.0002652119760843734, "tps": 14001, "wall": 62598.6} {"step": 13374, "train_loss": 3.4467108249664307, "lr": 0.0002651934320148115, "tps": 14001, "wall": 62603.5} {"step": 13375, "train_loss": 3.4534544944763184, "lr": 0.0002651748874332959, "tps": 14001, "wall": 62608.4} {"step": 13376, "train_loss": 3.4147331714630127, "lr": 0.00026515634234003686, "tps": 14001, "wall": 62613.3} {"step": 13377, "train_loss": 3.3562047481536865, "lr": 0.0002651377967352443, "tps": 14001, "wall": 62618.3} {"step": 13378, "train_loss": 3.40329909324646, "lr": 0.00026511925061912834, "tps": 14001, "wall": 62623.2} {"step": 13379, "train_loss": 3.4872958660125732, "lr": 0.000265100703991899, "tps": 14001, "wall": 62628.2} {"step": 13380, "train_loss": 3.4098851680755615, "lr": 0.0002650821568537665, "tps": 14001, "wall": 62633.1} {"step": 13381, "train_loss": 3.3619165420532227, "lr": 0.00026506360920494084, "tps": 14001, "wall": 62638.1} {"step": 13382, "train_loss": 3.445647954940796, "lr": 0.00026504506104563225, "tps": 14001, "wall": 62643.1} {"step": 13383, "train_loss": 3.4146862030029297, "lr": 0.0002650265123760507, "tps": 14000, "wall": 62648.0} {"step": 13384, "train_loss": 3.371882915496826, "lr": 0.00026500796319640647, "tps": 14000, "wall": 62652.9} {"step": 13385, "train_loss": 3.4465725421905518, "lr": 0.00026498941350690947, "tps": 14000, "wall": 62657.9} {"step": 13386, "train_loss": 3.3221893310546875, "lr": 0.00026497086330777006, "tps": 14000, "wall": 62662.8} {"step": 13387, "train_loss": 3.368319511413574, "lr": 0.00026495231259919826, "tps": 14000, "wall": 62667.8} {"step": 13388, "train_loss": 3.306797504425049, "lr": 0.0002649337613814042, "tps": 14000, "wall": 62672.7} {"step": 13389, "train_loss": 3.4063262939453125, "lr": 0.00026491520965459805, "tps": 14000, "wall": 62677.6} {"step": 13390, "train_loss": 3.435746669769287, "lr": 0.00026489665741899005, "tps": 14000, "wall": 62682.6} {"step": 13391, "train_loss": 3.3396658897399902, "lr": 0.00026487810467479023, "tps": 14000, "wall": 62687.5} {"step": 13392, "train_loss": 3.4892828464508057, "lr": 0.00026485955142220883, "tps": 14000, "wall": 62692.5} {"step": 13393, "train_loss": 3.3784561157226562, "lr": 0.00026484099766145596, "tps": 14000, "wall": 62697.5} {"step": 13394, "train_loss": 3.4738073348999023, "lr": 0.00026482244339274196, "tps": 14000, "wall": 62702.5} {"step": 13395, "train_loss": 3.435518264770508, "lr": 0.00026480388861627673, "tps": 14000, "wall": 62707.4} {"step": 13396, "train_loss": 3.4303336143493652, "lr": 0.0002647853333322707, "tps": 14000, "wall": 62712.3} {"step": 13397, "train_loss": 3.4123642444610596, "lr": 0.00026476677754093403, "tps": 14000, "wall": 62717.3} {"step": 13398, "train_loss": 3.281588315963745, "lr": 0.00026474822124247685, "tps": 14000, "wall": 62722.3} {"step": 13399, "train_loss": 3.4864981174468994, "lr": 0.00026472966443710945, "tps": 14000, "wall": 62727.2} {"step": 13400, "train_loss": 3.369932174682617, "lr": 0.00026471110712504196, "tps": 13999, "wall": 62732.2} {"step": 13401, "train_loss": 3.527987480163574, "lr": 0.00026469254930648454, "tps": 13999, "wall": 62737.1} {"step": 13402, "train_loss": 3.3519034385681152, "lr": 0.00026467399098164764, "tps": 13999, "wall": 62742.1} {"step": 13403, "train_loss": 3.4910829067230225, "lr": 0.0002646554321507412, "tps": 13999, "wall": 62747.0} {"step": 13404, "train_loss": 3.476494312286377, "lr": 0.0002646368728139758, "tps": 13999, "wall": 62752.0} {"step": 13405, "train_loss": 3.4653728008270264, "lr": 0.00026461831297156137, "tps": 13999, "wall": 62756.9} {"step": 13406, "train_loss": 3.4336464405059814, "lr": 0.0002645997526237082, "tps": 13999, "wall": 62761.9} {"step": 13407, "train_loss": 3.348961353302002, "lr": 0.00026458119177062684, "tps": 13999, "wall": 62766.9} {"step": 13408, "train_loss": 3.379356861114502, "lr": 0.00026456263041252717, "tps": 13999, "wall": 62771.8} {"step": 13409, "train_loss": 3.3476781845092773, "lr": 0.00026454406854961967, "tps": 13999, "wall": 62776.7} {"step": 13410, "train_loss": 3.275981903076172, "lr": 0.0002645255061821145, "tps": 13999, "wall": 62781.7} {"step": 13411, "train_loss": 3.432523727416992, "lr": 0.00026450694331022205, "tps": 13999, "wall": 62786.6} {"step": 13412, "train_loss": 3.4090771675109863, "lr": 0.00026448837993415245, "tps": 13999, "wall": 62791.6} {"step": 13413, "train_loss": 3.426992416381836, "lr": 0.00026446981605411613, "tps": 13999, "wall": 62796.5} {"step": 13414, "train_loss": 3.4617998600006104, "lr": 0.00026445125167032333, "tps": 13999, "wall": 62801.4} {"step": 13415, "train_loss": 3.374586582183838, "lr": 0.00026443268678298437, "tps": 13999, "wall": 62806.4} {"step": 13416, "train_loss": 3.3939027786254883, "lr": 0.0002644141213923095, "tps": 13999, "wall": 62811.3} {"step": 13417, "train_loss": 3.423858404159546, "lr": 0.0002643955554985091, "tps": 13998, "wall": 62816.3} {"step": 13418, "train_loss": 3.2693593502044678, "lr": 0.0002643769891017934, "tps": 13998, "wall": 62821.3} {"step": 13419, "train_loss": 3.36616849899292, "lr": 0.00026435842220237275, "tps": 13998, "wall": 62826.2} {"step": 13420, "train_loss": 3.4272656440734863, "lr": 0.0002643398548004575, "tps": 13998, "wall": 62831.1} {"step": 13421, "train_loss": 3.3470072746276855, "lr": 0.00026432128689625803, "tps": 13998, "wall": 62836.1} {"step": 13422, "train_loss": 3.4646167755126953, "lr": 0.0002643027184899846, "tps": 13998, "wall": 62841.0} {"step": 13423, "train_loss": 3.4404454231262207, "lr": 0.00026428414958184755, "tps": 13998, "wall": 62846.0} {"step": 13424, "train_loss": 3.456057071685791, "lr": 0.00026426558017205733, "tps": 13998, "wall": 62850.9} {"step": 13425, "train_loss": 3.3531720638275146, "lr": 0.00026424701026082415, "tps": 13998, "wall": 62855.8} {"step": 13426, "train_loss": 3.3590621948242188, "lr": 0.00026422843984835845, "tps": 13998, "wall": 62860.8} {"step": 13427, "train_loss": 3.500429630279541, "lr": 0.0002642098689348706, "tps": 13998, "wall": 62865.7} {"step": 13428, "train_loss": 3.4750254154205322, "lr": 0.00026419129752057094, "tps": 13998, "wall": 62870.7} {"step": 13429, "train_loss": 3.442603588104248, "lr": 0.0002641727256056699, "tps": 13998, "wall": 62875.6} {"step": 13430, "train_loss": 3.3889501094818115, "lr": 0.00026415415319037787, "tps": 13998, "wall": 62880.6} {"step": 13431, "train_loss": 3.4261302947998047, "lr": 0.00026413558027490514, "tps": 13998, "wall": 62885.6} {"step": 13432, "train_loss": 3.44537091255188, "lr": 0.00026411700685946224, "tps": 13998, "wall": 62890.5} {"step": 13433, "train_loss": 3.3820583820343018, "lr": 0.00026409843294425943, "tps": 13998, "wall": 62895.4} {"step": 13434, "train_loss": 3.277831554412842, "lr": 0.0002640798585295072, "tps": 13997, "wall": 62900.4} {"step": 13435, "train_loss": 3.455474853515625, "lr": 0.000264061283615416, "tps": 13997, "wall": 62905.3} {"step": 13436, "train_loss": 3.312328815460205, "lr": 0.0002640427082021961, "tps": 13997, "wall": 62910.2} {"step": 13437, "train_loss": 3.451737880706787, "lr": 0.00026402413229005805, "tps": 13997, "wall": 62915.2} {"step": 13438, "train_loss": 3.3020901679992676, "lr": 0.00026400555587921233, "tps": 13997, "wall": 62920.1} {"step": 13439, "train_loss": 3.409689426422119, "lr": 0.0002639869789698692, "tps": 13997, "wall": 62925.1} {"step": 13440, "train_loss": 3.4274959564208984, "lr": 0.0002639684015622393, "tps": 13997, "wall": 62930.0} {"step": 13441, "train_loss": 3.354569435119629, "lr": 0.0002639498236565328, "tps": 13997, "wall": 62934.9} {"step": 13442, "train_loss": 3.449765682220459, "lr": 0.0002639312452529605, "tps": 13997, "wall": 62939.9} {"step": 13443, "train_loss": 3.367952823638916, "lr": 0.00026391266635173257, "tps": 13997, "wall": 62944.9} {"step": 13444, "train_loss": 3.4156534671783447, "lr": 0.0002638940869530596, "tps": 13997, "wall": 62949.8} {"step": 13445, "train_loss": 3.363891124725342, "lr": 0.0002638755070571521, "tps": 13997, "wall": 62954.7} {"step": 13446, "train_loss": 3.2869715690612793, "lr": 0.0002638569266642204, "tps": 13997, "wall": 62959.6} {"step": 13447, "train_loss": 3.419656276702881, "lr": 0.00026383834577447504, "tps": 13997, "wall": 62964.6} {"step": 13448, "train_loss": 3.420623779296875, "lr": 0.0002638197643881266, "tps": 13997, "wall": 62969.5} {"step": 13449, "train_loss": 3.4292969703674316, "lr": 0.00026380118250538546, "tps": 13997, "wall": 62974.5} {"step": 13450, "train_loss": 3.439230442047119, "lr": 0.00026378260012646215, "tps": 13997, "wall": 62979.4} {"step": 13451, "train_loss": 3.4012279510498047, "lr": 0.0002637640172515672, "tps": 13996, "wall": 62984.3} {"step": 13452, "train_loss": 3.4260270595550537, "lr": 0.0002637454338809111, "tps": 13996, "wall": 62989.3} {"step": 13453, "train_loss": 3.4319422245025635, "lr": 0.00026372685001470434, "tps": 13996, "wall": 62994.2} {"step": 13454, "train_loss": 3.4186511039733887, "lr": 0.00026370826565315743, "tps": 13996, "wall": 62999.2} {"step": 13455, "train_loss": 3.444002628326416, "lr": 0.000263689680796481, "tps": 13996, "wall": 63004.1} {"step": 13456, "train_loss": 3.305385112762451, "lr": 0.00026367109544488544, "tps": 13996, "wall": 63009.1} {"step": 13457, "train_loss": 3.4227850437164307, "lr": 0.0002636525095985814, "tps": 13996, "wall": 63014.0} {"step": 13458, "train_loss": 3.348757028579712, "lr": 0.00026363392325777924, "tps": 13996, "wall": 63019.0} {"step": 13459, "train_loss": 3.4116415977478027, "lr": 0.0002636153364226898, "tps": 13996, "wall": 63023.9} {"step": 13460, "train_loss": 3.3747828006744385, "lr": 0.00026359674909352343, "tps": 13996, "wall": 63028.9} {"step": 13461, "train_loss": 3.4153027534484863, "lr": 0.00026357816127049066, "tps": 13996, "wall": 63033.8} {"step": 13462, "train_loss": 3.405536413192749, "lr": 0.0002635595729538022, "tps": 13996, "wall": 63038.7} {"step": 13463, "train_loss": 3.4228029251098633, "lr": 0.00026354098414366846, "tps": 13996, "wall": 63043.7} {"step": 13464, "train_loss": 3.4088187217712402, "lr": 0.00026352239484030013, "tps": 13996, "wall": 63048.6} {"step": 13465, "train_loss": 3.4716334342956543, "lr": 0.00026350380504390784, "tps": 13996, "wall": 63053.5} {"step": 13466, "train_loss": 3.454976797103882, "lr": 0.00026348521475470197, "tps": 13996, "wall": 63058.6} {"step": 13467, "train_loss": 3.3891139030456543, "lr": 0.0002634666239728933, "tps": 13996, "wall": 63063.5} {"step": 13468, "train_loss": 3.4462954998016357, "lr": 0.0002634480326986923, "tps": 13995, "wall": 63068.4} {"step": 13469, "train_loss": 3.436142921447754, "lr": 0.00026342944093230974, "tps": 13995, "wall": 63073.4} {"step": 13470, "train_loss": 3.499056816101074, "lr": 0.0002634108486739561, "tps": 13995, "wall": 63078.3} {"step": 13471, "train_loss": 3.3129940032958984, "lr": 0.0002633922559238419, "tps": 13995, "wall": 63083.3} {"step": 13472, "train_loss": 3.3381261825561523, "lr": 0.00026337366268217797, "tps": 13995, "wall": 63088.2} {"step": 13473, "train_loss": 3.4089138507843018, "lr": 0.0002633550689491748, "tps": 13995, "wall": 63093.2} {"step": 13474, "train_loss": 3.434691905975342, "lr": 0.0002633364747250431, "tps": 13995, "wall": 63098.1} {"step": 13475, "train_loss": 3.3098952770233154, "lr": 0.00026331788000999353, "tps": 13995, "wall": 63103.0} {"step": 13476, "train_loss": 3.43989896774292, "lr": 0.00026329928480423655, "tps": 13995, "wall": 63108.0} {"step": 13477, "train_loss": 3.4568371772766113, "lr": 0.000263280689107983, "tps": 13995, "wall": 63112.9} {"step": 13478, "train_loss": 3.3191800117492676, "lr": 0.00026326209292144344, "tps": 13995, "wall": 63118.0} {"step": 13479, "train_loss": 3.4374237060546875, "lr": 0.0002632434962448286, "tps": 13995, "wall": 63122.9} {"step": 13480, "train_loss": 3.391009569168091, "lr": 0.00026322489907834904, "tps": 13995, "wall": 63127.9} {"step": 13481, "train_loss": 3.5353269577026367, "lr": 0.0002632063014222155, "tps": 13995, "wall": 63132.8} {"step": 13482, "train_loss": 3.506465435028076, "lr": 0.00026318770327663865, "tps": 13995, "wall": 63137.7} {"step": 13483, "train_loss": 3.4910855293273926, "lr": 0.00026316910464182916, "tps": 13995, "wall": 63142.7} {"step": 13484, "train_loss": 3.452777862548828, "lr": 0.0002631505055179977, "tps": 13995, "wall": 63147.6} {"step": 13485, "train_loss": 3.432734251022339, "lr": 0.00026313190590535496, "tps": 13994, "wall": 63152.6} {"step": 13486, "train_loss": 3.3352577686309814, "lr": 0.00026311330580411173, "tps": 13994, "wall": 63157.5} {"step": 13487, "train_loss": 3.469715118408203, "lr": 0.00026309470521447857, "tps": 13994, "wall": 63162.5} {"step": 13488, "train_loss": 3.5809507369995117, "lr": 0.0002630761041366663, "tps": 13994, "wall": 63167.4} {"step": 13489, "train_loss": 3.437307357788086, "lr": 0.0002630575025708856, "tps": 13994, "wall": 63172.4} {"step": 13490, "train_loss": 3.3691353797912598, "lr": 0.0002630389005173471, "tps": 13994, "wall": 63177.4} {"step": 13491, "train_loss": 3.46665620803833, "lr": 0.00026302029797626165, "tps": 13994, "wall": 63182.3} {"step": 13492, "train_loss": 3.3070497512817383, "lr": 0.00026300169494784, "tps": 13994, "wall": 63187.2} {"step": 13493, "train_loss": 3.4391579627990723, "lr": 0.0002629830914322928, "tps": 13994, "wall": 63192.2} {"step": 13494, "train_loss": 3.4516353607177734, "lr": 0.0002629644874298307, "tps": 13994, "wall": 63197.1} {"step": 13495, "train_loss": 3.4781241416931152, "lr": 0.00026294588294066464, "tps": 13994, "wall": 63202.1} {"step": 13496, "train_loss": 3.4736416339874268, "lr": 0.00026292727796500533, "tps": 13994, "wall": 63207.0} {"step": 13497, "train_loss": 3.3784987926483154, "lr": 0.00026290867250306345, "tps": 13994, "wall": 63212.0} {"step": 13498, "train_loss": 3.468139171600342, "lr": 0.00026289006655504983, "tps": 13994, "wall": 63216.9} {"step": 13499, "train_loss": 3.5431113243103027, "lr": 0.0002628714601211752, "tps": 13994, "wall": 63221.8} {"step": 13500, "train_loss": 3.3699400424957275, "lr": 0.0002628528532016504, "tps": 13994, "wall": 63226.8} {"step": 13501, "train_loss": 3.475586414337158, "lr": 0.0002628342457966861, "tps": 13994, "wall": 63231.9} {"step": 13502, "train_loss": 3.4268710613250732, "lr": 0.00026281563790649316, "tps": 13993, "wall": 63236.9} {"step": 13503, "train_loss": 3.370553493499756, "lr": 0.0002627970295312824, "tps": 13993, "wall": 63241.9} {"step": 13504, "train_loss": 3.363956928253174, "lr": 0.0002627784206712645, "tps": 13993, "wall": 63246.8} {"step": 13505, "train_loss": 3.246717691421509, "lr": 0.0002627598113266504, "tps": 13993, "wall": 63251.8} {"step": 13506, "train_loss": 3.442704200744629, "lr": 0.00026274120149765085, "tps": 13993, "wall": 63256.7} {"step": 13507, "train_loss": 3.3354361057281494, "lr": 0.0002627225911844766, "tps": 13993, "wall": 63261.6} {"step": 13508, "train_loss": 3.378847599029541, "lr": 0.0002627039803873385, "tps": 13993, "wall": 63266.6} {"step": 13509, "train_loss": 3.345463275909424, "lr": 0.00026268536910644747, "tps": 13993, "wall": 63271.5} {"step": 13510, "train_loss": 3.4436144828796387, "lr": 0.00026266675734201424, "tps": 13993, "wall": 63276.4} {"step": 13511, "train_loss": 3.3766984939575195, "lr": 0.0002626481450942497, "tps": 13993, "wall": 63281.4} {"step": 13512, "train_loss": 3.390681266784668, "lr": 0.0002626295323633646, "tps": 13993, "wall": 63286.3} {"step": 13513, "train_loss": 3.3792009353637695, "lr": 0.00026261091914956997, "tps": 13993, "wall": 63291.3} {"step": 13514, "train_loss": 3.267099380493164, "lr": 0.0002625923054530765, "tps": 13993, "wall": 63296.2} {"step": 13515, "train_loss": 3.382582187652588, "lr": 0.00026257369127409504, "tps": 13993, "wall": 63301.2} {"step": 13516, "train_loss": 3.254855155944824, "lr": 0.00026255507661283655, "tps": 13993, "wall": 63306.2} {"step": 13517, "train_loss": 3.486830711364746, "lr": 0.0002625364614695118, "tps": 13993, "wall": 63311.1} {"step": 13518, "train_loss": 3.5447161197662354, "lr": 0.00026251784584433173, "tps": 13992, "wall": 63316.1} {"step": 13519, "train_loss": 3.466524362564087, "lr": 0.00026249922973750725, "tps": 13992, "wall": 63321.0} {"step": 13520, "train_loss": 3.455552101135254, "lr": 0.00026248061314924914, "tps": 13992, "wall": 63325.9} {"step": 13521, "train_loss": 3.3765146732330322, "lr": 0.0002624619960797683, "tps": 13992, "wall": 63330.9} {"step": 13522, "train_loss": 3.566826820373535, "lr": 0.00026244337852927575, "tps": 13992, "wall": 63335.8} {"step": 13523, "train_loss": 3.3676137924194336, "lr": 0.00026242476049798233, "tps": 13992, "wall": 63340.7} {"step": 13524, "train_loss": 3.396712303161621, "lr": 0.00026240614198609895, "tps": 13992, "wall": 63345.7} {"step": 13525, "train_loss": 3.4526052474975586, "lr": 0.0002623875229938364, "tps": 13992, "wall": 63350.6} {"step": 13526, "train_loss": 3.37577223777771, "lr": 0.0002623689035214057, "tps": 13992, "wall": 63355.6} {"step": 13527, "train_loss": 3.5739712715148926, "lr": 0.0002623502835690179, "tps": 13992, "wall": 63360.6} {"step": 13528, "train_loss": 3.460489273071289, "lr": 0.00026233166313688365, "tps": 13992, "wall": 63365.5} {"step": 13529, "train_loss": 3.4223151206970215, "lr": 0.00026231304222521407, "tps": 13992, "wall": 63370.4} {"step": 13530, "train_loss": 3.3665966987609863, "lr": 0.0002622944208342201, "tps": 13992, "wall": 63375.4} {"step": 13531, "train_loss": 3.473799705505371, "lr": 0.0002622757989641126, "tps": 13992, "wall": 63380.3} {"step": 13532, "train_loss": 3.311349630355835, "lr": 0.00026225717661510254, "tps": 13992, "wall": 63385.3} {"step": 13533, "train_loss": 3.426952838897705, "lr": 0.00026223855378740095, "tps": 13992, "wall": 63390.2} {"step": 13534, "train_loss": 3.405247688293457, "lr": 0.00026221993048121877, "tps": 13992, "wall": 63395.2} {"step": 13535, "train_loss": 3.4876108169555664, "lr": 0.0002622013066967669, "tps": 13992, "wall": 63400.1} {"step": 13536, "train_loss": 3.5368828773498535, "lr": 0.00026218268243425626, "tps": 13991, "wall": 63405.1} {"step": 13537, "train_loss": 3.463428020477295, "lr": 0.00026216405769389806, "tps": 13991, "wall": 63410.0} {"step": 13538, "train_loss": 3.3092637062072754, "lr": 0.00026214543247590305, "tps": 13991, "wall": 63414.9} {"step": 13539, "train_loss": 3.424743175506592, "lr": 0.00026212680678048227, "tps": 13991, "wall": 63419.9} {"step": 13540, "train_loss": 3.3990445137023926, "lr": 0.0002621081806078468, "tps": 13991, "wall": 63424.9} {"step": 13541, "train_loss": 3.375577926635742, "lr": 0.00026208955395820756, "tps": 13991, "wall": 63429.8} {"step": 13542, "train_loss": 3.365205764770508, "lr": 0.0002620709268317756, "tps": 13991, "wall": 63434.8} {"step": 13543, "train_loss": 3.431906223297119, "lr": 0.00026205229922876186, "tps": 13991, "wall": 63439.7} {"step": 13544, "train_loss": 3.336902618408203, "lr": 0.00026203367114937745, "tps": 13991, "wall": 63444.6} {"step": 13545, "train_loss": 3.3703362941741943, "lr": 0.0002620150425938333, "tps": 13991, "wall": 63449.6} {"step": 13546, "train_loss": 3.486168622970581, "lr": 0.0002619964135623405, "tps": 13991, "wall": 63454.5} {"step": 13547, "train_loss": 3.448472023010254, "lr": 0.00026197778405511005, "tps": 13991, "wall": 63459.4} {"step": 13548, "train_loss": 3.3688879013061523, "lr": 0.00026195915407235294, "tps": 13991, "wall": 63464.4} {"step": 13549, "train_loss": 3.53617000579834, "lr": 0.0002619405236142803, "tps": 13991, "wall": 63469.3} {"step": 13550, "train_loss": 3.3318538665771484, "lr": 0.00026192189268110317, "tps": 13991, "wall": 63474.3} {"step": 13551, "train_loss": 3.416604995727539, "lr": 0.0002619032612730326, "tps": 13991, "wall": 63479.3} {"step": 13552, "train_loss": 3.303999423980713, "lr": 0.0002618846293902795, "tps": 13991, "wall": 63484.2} {"step": 13553, "train_loss": 3.4876961708068848, "lr": 0.0002618659970330551, "tps": 13990, "wall": 63489.2} {"step": 13554, "train_loss": 3.4848780632019043, "lr": 0.0002618473642015705, "tps": 13990, "wall": 63494.2} {"step": 13555, "train_loss": 3.293639898300171, "lr": 0.0002618287308960366, "tps": 13990, "wall": 63499.1} {"step": 13556, "train_loss": 3.390561580657959, "lr": 0.0002618100971166646, "tps": 13990, "wall": 63504.0} {"step": 13557, "train_loss": 3.398763656616211, "lr": 0.0002617914628636656, "tps": 13990, "wall": 63509.0} {"step": 13558, "train_loss": 3.4569602012634277, "lr": 0.0002617728281372506, "tps": 13990, "wall": 63513.9} {"step": 13559, "train_loss": 3.413264751434326, "lr": 0.00026175419293763077, "tps": 13990, "wall": 63518.9} {"step": 13560, "train_loss": 3.5076935291290283, "lr": 0.00026173555726501715, "tps": 13990, "wall": 63523.8} {"step": 13561, "train_loss": 3.363158941268921, "lr": 0.0002617169211196209, "tps": 13990, "wall": 63528.8} {"step": 13562, "train_loss": 3.57269549369812, "lr": 0.0002616982845016531, "tps": 13990, "wall": 63533.7} {"step": 13563, "train_loss": 3.362461566925049, "lr": 0.00026167964741132487, "tps": 13990, "wall": 63538.7} {"step": 13564, "train_loss": 3.3907551765441895, "lr": 0.0002616610098488474, "tps": 13990, "wall": 63543.6} {"step": 13565, "train_loss": 3.361565113067627, "lr": 0.0002616423718144317, "tps": 13990, "wall": 63548.6} {"step": 13566, "train_loss": 3.394287586212158, "lr": 0.000261623733308289, "tps": 13990, "wall": 63553.5} {"step": 13567, "train_loss": 3.467036247253418, "lr": 0.0002616050943306303, "tps": 13990, "wall": 63558.4} {"step": 13568, "train_loss": 3.399202346801758, "lr": 0.00026158645488166696, "tps": 13990, "wall": 63563.4} {"step": 13569, "train_loss": 3.3831801414489746, "lr": 0.00026156781496160995, "tps": 13990, "wall": 63568.3} {"step": 13570, "train_loss": 3.397353172302246, "lr": 0.00026154917457067045, "tps": 13989, "wall": 63573.3} {"step": 13571, "train_loss": 3.549882411956787, "lr": 0.00026153053370905975, "tps": 13989, "wall": 63578.2} {"step": 13572, "train_loss": 3.4259915351867676, "lr": 0.00026151189237698884, "tps": 13989, "wall": 63583.2} {"step": 13573, "train_loss": 3.467745304107666, "lr": 0.000261493250574669, "tps": 13989, "wall": 63588.1} {"step": 13574, "train_loss": 3.3841824531555176, "lr": 0.00026147460830231134, "tps": 13989, "wall": 63593.0} {"step": 13575, "train_loss": 3.2715320587158203, "lr": 0.00026145596556012714, "tps": 13989, "wall": 63598.0} {"step": 13576, "train_loss": 3.357647180557251, "lr": 0.00026143732234832744, "tps": 13989, "wall": 63602.9} {"step": 13577, "train_loss": 3.494732618331909, "lr": 0.0002614186786671236, "tps": 13989, "wall": 63607.9} {"step": 13578, "train_loss": 3.3771708011627197, "lr": 0.0002614000345167266, "tps": 13989, "wall": 63612.8} {"step": 13579, "train_loss": 3.461574077606201, "lr": 0.0002613813898973479, "tps": 13989, "wall": 63617.8} {"step": 13580, "train_loss": 3.3534164428710938, "lr": 0.0002613627448091985, "tps": 13989, "wall": 63622.7} {"step": 13581, "train_loss": 3.4541561603546143, "lr": 0.00026134409925248974, "tps": 13989, "wall": 63627.6} {"step": 13582, "train_loss": 3.434638738632202, "lr": 0.0002613254532274327, "tps": 13989, "wall": 63632.5} {"step": 13583, "train_loss": 3.422149419784546, "lr": 0.00026130680673423876, "tps": 13989, "wall": 63637.5} {"step": 13584, "train_loss": 3.3285980224609375, "lr": 0.0002612881597731191, "tps": 13989, "wall": 63642.4} {"step": 13585, "train_loss": 3.4899702072143555, "lr": 0.0002612695123442849, "tps": 13989, "wall": 63647.4} {"step": 13586, "train_loss": 3.4455440044403076, "lr": 0.0002612508644479474, "tps": 13989, "wall": 63652.3} {"step": 13587, "train_loss": 3.3469550609588623, "lr": 0.00026123221608431794, "tps": 13989, "wall": 63657.3} {"step": 13588, "train_loss": 3.3076515197753906, "lr": 0.0002612135672536077, "tps": 13988, "wall": 63662.2} {"step": 13589, "train_loss": 3.421438217163086, "lr": 0.00026119491795602783, "tps": 13988, "wall": 63667.2} {"step": 13590, "train_loss": 3.285874366760254, "lr": 0.0002611762681917898, "tps": 13988, "wall": 63672.1} {"step": 13591, "train_loss": 3.4488158226013184, "lr": 0.0002611576179611048, "tps": 13988, "wall": 63677.0} {"step": 13592, "train_loss": 3.33675479888916, "lr": 0.000261138967264184, "tps": 13988, "wall": 63682.0} {"step": 13593, "train_loss": 3.4824862480163574, "lr": 0.0002611203161012388, "tps": 13988, "wall": 63686.9} {"step": 13594, "train_loss": 3.400468587875366, "lr": 0.0002611016644724805, "tps": 13988, "wall": 63691.9} {"step": 13595, "train_loss": 3.3276138305664062, "lr": 0.0002610830123781202, "tps": 13988, "wall": 63696.8} {"step": 13596, "train_loss": 3.3405022621154785, "lr": 0.0002610643598183693, "tps": 13988, "wall": 63701.8} {"step": 13597, "train_loss": 3.4189398288726807, "lr": 0.00026104570679343916, "tps": 13988, "wall": 63706.7} {"step": 13598, "train_loss": 3.394401788711548, "lr": 0.0002610270533035411, "tps": 13988, "wall": 63711.6} {"step": 13599, "train_loss": 3.3268001079559326, "lr": 0.0002610083993488863, "tps": 13988, "wall": 63716.6} {"step": 13600, "train_loss": 3.4479589462280273, "lr": 0.00026098974492968607, "tps": 13988, "wall": 63721.6} {"step": 13601, "train_loss": 3.4597721099853516, "lr": 0.00026097109004615194, "tps": 13988, "wall": 63726.5} {"step": 13602, "train_loss": 3.480407953262329, "lr": 0.000260952434698495, "tps": 13988, "wall": 63731.4} {"step": 13603, "train_loss": 3.367661952972412, "lr": 0.0002609337788869266, "tps": 13988, "wall": 63736.4} {"step": 13604, "train_loss": 3.4689910411834717, "lr": 0.00026091512261165826, "tps": 13988, "wall": 63741.3} {"step": 13605, "train_loss": 3.3265559673309326, "lr": 0.0002608964658729011, "tps": 13988, "wall": 63746.2} {"step": 13606, "train_loss": 3.392110824584961, "lr": 0.0002608778086708666, "tps": 13987, "wall": 63751.2} {"step": 13607, "train_loss": 3.373011589050293, "lr": 0.00026085915100576606, "tps": 13987, "wall": 63756.1} {"step": 13608, "train_loss": 3.4111955165863037, "lr": 0.00026084049287781097, "tps": 13987, "wall": 63761.1} {"step": 13609, "train_loss": 3.348599910736084, "lr": 0.00026082183428721245, "tps": 13987, "wall": 63766.0} {"step": 13610, "train_loss": 3.449129819869995, "lr": 0.00026080317523418197, "tps": 13987, "wall": 63771.0} {"step": 13611, "train_loss": 3.41264009475708, "lr": 0.00026078451571893095, "tps": 13987, "wall": 63775.9} {"step": 13612, "train_loss": 3.416588306427002, "lr": 0.00026076585574167076, "tps": 13987, "wall": 63780.9} {"step": 13613, "train_loss": 3.331575393676758, "lr": 0.00026074719530261265, "tps": 13987, "wall": 63785.8} {"step": 13614, "train_loss": 3.5296790599823, "lr": 0.00026072853440196815, "tps": 13987, "wall": 63790.8} {"step": 13615, "train_loss": 3.34607195854187, "lr": 0.00026070987303994863, "tps": 13987, "wall": 63795.7} {"step": 13616, "train_loss": 3.4694695472717285, "lr": 0.00026069121121676545, "tps": 13987, "wall": 63800.7} {"step": 13617, "train_loss": 3.439220666885376, "lr": 0.00026067254893263, "tps": 13987, "wall": 63805.6} {"step": 13618, "train_loss": 3.4296488761901855, "lr": 0.0002606538861877538, "tps": 13987, "wall": 63810.6} {"step": 13619, "train_loss": 3.436608076095581, "lr": 0.0002606352229823482, "tps": 13987, "wall": 63815.6} {"step": 13620, "train_loss": 3.405862808227539, "lr": 0.0002606165593166245, "tps": 13987, "wall": 63820.5} {"step": 13621, "train_loss": 3.35914945602417, "lr": 0.00026059789519079416, "tps": 13987, "wall": 63825.5} {"step": 13622, "train_loss": 3.4582228660583496, "lr": 0.0002605792306050688, "tps": 13987, "wall": 63830.4} {"step": 13623, "train_loss": 3.492255210876465, "lr": 0.00026056056555965966, "tps": 13986, "wall": 63835.3} {"step": 13624, "train_loss": 3.3604512214660645, "lr": 0.00026054190005477825, "tps": 13986, "wall": 63840.3} {"step": 13625, "train_loss": 3.5067543983459473, "lr": 0.00026052323409063606, "tps": 13986, "wall": 63845.3} {"step": 13626, "train_loss": 3.4649200439453125, "lr": 0.0002605045676674444, "tps": 13986, "wall": 63850.2} {"step": 13627, "train_loss": 3.4818291664123535, "lr": 0.0002604859007854148, "tps": 13986, "wall": 63855.2} {"step": 13628, "train_loss": 3.387110710144043, "lr": 0.00026046723344475876, "tps": 13986, "wall": 63860.1} {"step": 13629, "train_loss": 3.436103105545044, "lr": 0.00026044856564568777, "tps": 13986, "wall": 63865.1} {"step": 13630, "train_loss": 3.4815402030944824, "lr": 0.0002604298973884131, "tps": 13986, "wall": 63870.0} {"step": 13631, "train_loss": 3.3439841270446777, "lr": 0.0002604112286731465, "tps": 13986, "wall": 63875.0} {"step": 13632, "train_loss": 3.39174747467041, "lr": 0.00026039255950009927, "tps": 13986, "wall": 63879.9} {"step": 13633, "train_loss": 3.363312244415283, "lr": 0.00026037388986948295, "tps": 13986, "wall": 63884.8} {"step": 13634, "train_loss": 3.411426305770874, "lr": 0.00026035521978150895, "tps": 13986, "wall": 63889.8} {"step": 13635, "train_loss": 3.4071130752563477, "lr": 0.0002603365492363889, "tps": 13986, "wall": 63894.7} {"step": 13636, "train_loss": 3.438492774963379, "lr": 0.00026031787823433425, "tps": 13986, "wall": 63899.7} {"step": 13637, "train_loss": 3.5204520225524902, "lr": 0.0002602992067755565, "tps": 13986, "wall": 63904.7} {"step": 13638, "train_loss": 3.395157814025879, "lr": 0.000260280534860267, "tps": 13986, "wall": 63909.7} {"step": 13639, "train_loss": 3.4130754470825195, "lr": 0.00026026186248867767, "tps": 13986, "wall": 63914.6} {"step": 13640, "train_loss": 3.3497514724731445, "lr": 0.00026024318966099964, "tps": 13985, "wall": 63919.6} {"step": 13641, "train_loss": 3.4108996391296387, "lr": 0.0002602245163774446, "tps": 13985, "wall": 63924.5} {"step": 13642, "train_loss": 3.420574903488159, "lr": 0.00026020584263822407, "tps": 13985, "wall": 63929.4} {"step": 13643, "train_loss": 3.4212355613708496, "lr": 0.0002601871684435496, "tps": 13985, "wall": 63934.4} {"step": 13644, "train_loss": 3.3581109046936035, "lr": 0.00026016849379363263, "tps": 13985, "wall": 63939.3} {"step": 13645, "train_loss": 3.438542366027832, "lr": 0.00026014981868868487, "tps": 13985, "wall": 63944.3} {"step": 13646, "train_loss": 3.3891079425811768, "lr": 0.00026013114312891777, "tps": 13985, "wall": 63949.2} {"step": 13647, "train_loss": 3.3474106788635254, "lr": 0.00026011246711454285, "tps": 13985, "wall": 63954.1} {"step": 13648, "train_loss": 3.3351171016693115, "lr": 0.0002600937906457718, "tps": 13985, "wall": 63959.1} {"step": 13649, "train_loss": 3.319941997528076, "lr": 0.0002600751137228162, "tps": 13985, "wall": 63964.1} {"step": 13650, "train_loss": 3.432326078414917, "lr": 0.0002600564363458874, "tps": 13985, "wall": 63969.0} {"step": 13651, "train_loss": 3.382559299468994, "lr": 0.0002600377585151972, "tps": 13985, "wall": 63974.0} {"step": 13652, "train_loss": 3.424989700317383, "lr": 0.0002600190802309571, "tps": 13985, "wall": 63978.9} {"step": 13653, "train_loss": 3.4069368839263916, "lr": 0.00026000040149337867, "tps": 13985, "wall": 63983.8} {"step": 13654, "train_loss": 3.350754737854004, "lr": 0.00025998172230267346, "tps": 13985, "wall": 63988.8} {"step": 13655, "train_loss": 3.431323289871216, "lr": 0.0002599630426590532, "tps": 13985, "wall": 63993.7} {"step": 13656, "train_loss": 3.4036340713500977, "lr": 0.0002599443625627295, "tps": 13985, "wall": 63998.6} {"step": 13657, "train_loss": 3.3279943466186523, "lr": 0.00025992568201391387, "tps": 13985, "wall": 64003.6} {"step": 13658, "train_loss": 3.373886823654175, "lr": 0.0002599070010128179, "tps": 13984, "wall": 64008.5} {"step": 13659, "train_loss": 3.3513741493225098, "lr": 0.0002598883195596533, "tps": 13984, "wall": 64013.5} {"step": 13660, "train_loss": 3.4548585414886475, "lr": 0.00025986963765463165, "tps": 13984, "wall": 64018.5} {"step": 13661, "train_loss": 3.488943338394165, "lr": 0.00025985095529796454, "tps": 13984, "wall": 64023.4} {"step": 13662, "train_loss": 3.476851463317871, "lr": 0.0002598322724898638, "tps": 13984, "wall": 64028.4} {"step": 13663, "train_loss": 3.400897979736328, "lr": 0.00025981358923054073, "tps": 13984, "wall": 64033.3} {"step": 13664, "train_loss": 3.5106594562530518, "lr": 0.00025979490552020725, "tps": 13984, "wall": 64038.3} {"step": 13665, "train_loss": 3.3187448978424072, "lr": 0.000259776221359075, "tps": 13984, "wall": 64043.2} {"step": 13666, "train_loss": 3.4104666709899902, "lr": 0.0002597575367473555, "tps": 13984, "wall": 64048.1} {"step": 13667, "train_loss": 3.5211191177368164, "lr": 0.00025973885168526043, "tps": 13984, "wall": 64053.0} {"step": 13668, "train_loss": 3.3525710105895996, "lr": 0.0002597201661730015, "tps": 13984, "wall": 64058.0} {"step": 13669, "train_loss": 3.3933191299438477, "lr": 0.0002597014802107905, "tps": 13984, "wall": 64062.9} {"step": 13670, "train_loss": 3.4304065704345703, "lr": 0.00025968279379883885, "tps": 13984, "wall": 64067.9} {"step": 13671, "train_loss": 3.401512622833252, "lr": 0.0002596641069373584, "tps": 13984, "wall": 64072.8} {"step": 13672, "train_loss": 3.4313416481018066, "lr": 0.0002596454196265608, "tps": 13984, "wall": 64077.8} {"step": 13673, "train_loss": 3.427237033843994, "lr": 0.0002596267318666578, "tps": 13984, "wall": 64082.8} {"step": 13674, "train_loss": 3.4275431632995605, "lr": 0.000259608043657861, "tps": 13984, "wall": 64087.7} {"step": 13675, "train_loss": 3.427314281463623, "lr": 0.00025958935500038213, "tps": 13983, "wall": 64092.6} {"step": 13676, "train_loss": 3.349780559539795, "lr": 0.00025957066589443295, "tps": 13983, "wall": 64097.6} {"step": 13677, "train_loss": 3.3097314834594727, "lr": 0.00025955197634022504, "tps": 13983, "wall": 64102.5} {"step": 13678, "train_loss": 3.517922878265381, "lr": 0.0002595332863379702, "tps": 13983, "wall": 64107.5} {"step": 13679, "train_loss": 3.3091351985931396, "lr": 0.0002595145958878803, "tps": 13983, "wall": 64112.4} {"step": 13680, "train_loss": 3.4196510314941406, "lr": 0.0002594959049901668, "tps": 13983, "wall": 64117.3} {"step": 13681, "train_loss": 3.4852731227874756, "lr": 0.00025947721364504153, "tps": 13983, "wall": 64122.3} {"step": 13682, "train_loss": 3.392530679702759, "lr": 0.00025945852185271627, "tps": 13983, "wall": 64127.2} {"step": 13683, "train_loss": 3.5254225730895996, "lr": 0.0002594398296134028, "tps": 13983, "wall": 64132.2} {"step": 13684, "train_loss": 3.388511896133423, "lr": 0.00025942113692731277, "tps": 13983, "wall": 64137.1} {"step": 13685, "train_loss": 3.3780057430267334, "lr": 0.0002594024437946579, "tps": 13983, "wall": 64142.1} {"step": 13686, "train_loss": 3.508549451828003, "lr": 0.00025938375021565015, "tps": 13983, "wall": 64147.1} {"step": 13687, "train_loss": 3.4315176010131836, "lr": 0.0002593650561905011, "tps": 13983, "wall": 64152.0} {"step": 13688, "train_loss": 3.472775936126709, "lr": 0.0002593463617194225, "tps": 13983, "wall": 64157.0} {"step": 13689, "train_loss": 3.462278127670288, "lr": 0.00025932766680262625, "tps": 13983, "wall": 64161.9} {"step": 13690, "train_loss": 3.4110329151153564, "lr": 0.00025930897144032405, "tps": 13983, "wall": 64166.8} {"step": 13691, "train_loss": 3.4126768112182617, "lr": 0.00025929027563272765, "tps": 13983, "wall": 64171.8} {"step": 13692, "train_loss": 3.422092914581299, "lr": 0.0002592715793800489, "tps": 13983, "wall": 64176.7} {"step": 13693, "train_loss": 3.424323558807373, "lr": 0.0002592528826824997, "tps": 13982, "wall": 64181.7} {"step": 13694, "train_loss": 3.367300510406494, "lr": 0.0002592341855402916, "tps": 13982, "wall": 64186.6} {"step": 13695, "train_loss": 3.509188413619995, "lr": 0.0002592154879536365, "tps": 13982, "wall": 64191.5} {"step": 13696, "train_loss": 3.406240940093994, "lr": 0.00025919678992274625, "tps": 13982, "wall": 64196.5} {"step": 13697, "train_loss": 3.42818546295166, "lr": 0.0002591780914478327, "tps": 13982, "wall": 64201.5} {"step": 13698, "train_loss": 3.364877700805664, "lr": 0.0002591593925291076, "tps": 13982, "wall": 64206.4} {"step": 13699, "train_loss": 3.4144582748413086, "lr": 0.00025914069316678264, "tps": 13982, "wall": 64211.4} {"step": 13700, "train_loss": 3.4212582111358643, "lr": 0.00025912199336106996, "tps": 13982, "wall": 64216.3} {"step": 13701, "train_loss": 3.364757537841797, "lr": 0.0002591032931121812, "tps": 13982, "wall": 64221.2} {"step": 13702, "train_loss": 3.4848246574401855, "lr": 0.0002590845924203282, "tps": 13982, "wall": 64226.2} {"step": 13703, "train_loss": 3.4031734466552734, "lr": 0.00025906589128572274, "tps": 13982, "wall": 64231.1} {"step": 13704, "train_loss": 3.438599109649658, "lr": 0.0002590471897085769, "tps": 13982, "wall": 64236.1} {"step": 13705, "train_loss": 3.417640209197998, "lr": 0.0002590284876891023, "tps": 13982, "wall": 64241.0} {"step": 13706, "train_loss": 3.5240635871887207, "lr": 0.0002590097852275108, "tps": 13982, "wall": 64245.9} {"step": 13707, "train_loss": 3.394864559173584, "lr": 0.0002589910823240145, "tps": 13982, "wall": 64250.9} {"step": 13708, "train_loss": 3.2981483936309814, "lr": 0.00025897237897882505, "tps": 13982, "wall": 64255.8} {"step": 13709, "train_loss": 3.3456578254699707, "lr": 0.00025895367519215433, "tps": 13982, "wall": 64260.8} {"step": 13710, "train_loss": 3.4177708625793457, "lr": 0.00025893497096421436, "tps": 13982, "wall": 64265.7} {"step": 13711, "train_loss": 3.3709895610809326, "lr": 0.0002589162662952168, "tps": 13981, "wall": 64270.7} {"step": 13712, "train_loss": 3.471982955932617, "lr": 0.00025889756118537374, "tps": 13981, "wall": 64275.6} {"step": 13713, "train_loss": 3.379368782043457, "lr": 0.00025887885563489707, "tps": 13981, "wall": 64280.5} {"step": 13714, "train_loss": 3.466381072998047, "lr": 0.00025886014964399855, "tps": 13981, "wall": 64285.5} {"step": 13715, "train_loss": 3.5079381465911865, "lr": 0.0002588414432128902, "tps": 13981, "wall": 64290.4} {"step": 13716, "train_loss": 3.417466640472412, "lr": 0.0002588227363417838, "tps": 13981, "wall": 64295.4} {"step": 13717, "train_loss": 3.408912181854248, "lr": 0.00025880402903089136, "tps": 13981, "wall": 64300.3} {"step": 13718, "train_loss": 3.422677993774414, "lr": 0.00025878532128042483, "tps": 13981, "wall": 64305.2} {"step": 13719, "train_loss": 3.415030002593994, "lr": 0.0002587666130905961, "tps": 13981, "wall": 64310.2} {"step": 13720, "train_loss": 3.3312478065490723, "lr": 0.000258747904461617, "tps": 13981, "wall": 64315.1} {"step": 13721, "train_loss": 3.3997654914855957, "lr": 0.0002587291953936996, "tps": 13981, "wall": 64320.1} {"step": 13722, "train_loss": 3.3567352294921875, "lr": 0.00025871048588705574, "tps": 13981, "wall": 64325.1} {"step": 13723, "train_loss": 3.3866684436798096, "lr": 0.0002586917759418974, "tps": 13981, "wall": 64330.0} {"step": 13724, "train_loss": 3.4033234119415283, "lr": 0.0002586730655584366, "tps": 13981, "wall": 64335.0} {"step": 13725, "train_loss": 3.4361846446990967, "lr": 0.0002586543547368852, "tps": 13981, "wall": 64339.9} {"step": 13726, "train_loss": 3.3776135444641113, "lr": 0.0002586356434774551, "tps": 13981, "wall": 64344.9} {"step": 13727, "train_loss": 3.434352397918701, "lr": 0.0002586169317803584, "tps": 13981, "wall": 64349.8} {"step": 13728, "train_loss": 3.3599891662597656, "lr": 0.00025859821964580704, "tps": 13980, "wall": 64354.8} {"step": 13729, "train_loss": 3.414119243621826, "lr": 0.0002585795070740129, "tps": 13980, "wall": 64359.7} {"step": 13730, "train_loss": 3.408566951751709, "lr": 0.000258560794065188, "tps": 13980, "wall": 64364.6} {"step": 13731, "train_loss": 3.3347561359405518, "lr": 0.0002585420806195444, "tps": 13980, "wall": 64369.6} {"step": 13732, "train_loss": 3.4264473915100098, "lr": 0.000258523366737294, "tps": 13980, "wall": 64374.6} {"step": 13733, "train_loss": 3.470813274383545, "lr": 0.00025850465241864884, "tps": 13980, "wall": 64379.6} {"step": 13734, "train_loss": 3.4135148525238037, "lr": 0.0002584859376638209, "tps": 13980, "wall": 64384.5} {"step": 13735, "train_loss": 3.3902575969696045, "lr": 0.00025846722247302217, "tps": 13980, "wall": 64389.5} {"step": 13736, "train_loss": 3.3188517093658447, "lr": 0.0002584485068464646, "tps": 13980, "wall": 64394.4} {"step": 13737, "train_loss": 3.382154941558838, "lr": 0.0002584297907843603, "tps": 13980, "wall": 64399.4} {"step": 13738, "train_loss": 3.455944061279297, "lr": 0.0002584110742869213, "tps": 13980, "wall": 64404.3} {"step": 13739, "train_loss": 3.3660387992858887, "lr": 0.00025839235735435946, "tps": 13980, "wall": 64409.3} {"step": 13740, "train_loss": 3.4434683322906494, "lr": 0.000258373639986887, "tps": 13980, "wall": 64414.2} {"step": 13741, "train_loss": 3.3792502880096436, "lr": 0.00025835492218471593, "tps": 13980, "wall": 64419.1} {"step": 13742, "train_loss": 3.4013612270355225, "lr": 0.0002583362039480581, "tps": 13980, "wall": 64424.1} {"step": 13743, "train_loss": 3.365654945373535, "lr": 0.00025831748527712576, "tps": 13980, "wall": 64429.0} {"step": 13744, "train_loss": 3.45121431350708, "lr": 0.00025829876617213085, "tps": 13980, "wall": 64434.0} {"step": 13745, "train_loss": 3.3636555671691895, "lr": 0.00025828004663328545, "tps": 13980, "wall": 64439.0} {"step": 13746, "train_loss": 3.3863654136657715, "lr": 0.00025826132666080157, "tps": 13979, "wall": 64443.9} {"step": 13747, "train_loss": 3.333564043045044, "lr": 0.00025824260625489134, "tps": 13979, "wall": 64448.9} {"step": 13748, "train_loss": 3.4412009716033936, "lr": 0.0002582238854157668, "tps": 13979, "wall": 64453.8} {"step": 13749, "train_loss": 3.350564956665039, "lr": 0.00025820516414364, "tps": 13979, "wall": 64458.7} {"step": 13750, "train_loss": 3.3980069160461426, "lr": 0.00025818644243872307, "tps": 13979, "wall": 64463.7} {"step": 13751, "train_loss": 3.4675803184509277, "lr": 0.00025816772030122807, "tps": 13979, "wall": 64468.6} {"step": 13752, "train_loss": 3.438171148300171, "lr": 0.000258148997731367, "tps": 13979, "wall": 64473.5} {"step": 13753, "train_loss": 3.3831582069396973, "lr": 0.0002581302747293521, "tps": 13979, "wall": 64478.5} {"step": 13754, "train_loss": 3.4739696979522705, "lr": 0.00025811155129539534, "tps": 13979, "wall": 64483.4} {"step": 13755, "train_loss": 3.2980082035064697, "lr": 0.00025809282742970886, "tps": 13979, "wall": 64488.3} {"step": 13756, "train_loss": 3.4428493976593018, "lr": 0.0002580741031325047, "tps": 13979, "wall": 64493.3} {"step": 13757, "train_loss": 3.3653883934020996, "lr": 0.0002580553784039952, "tps": 13979, "wall": 64498.3} {"step": 13758, "train_loss": 3.4028007984161377, "lr": 0.00025803665324439223, "tps": 13979, "wall": 64503.2} {"step": 13759, "train_loss": 3.3505632877349854, "lr": 0.00025801792765390793, "tps": 13979, "wall": 64508.2} {"step": 13760, "train_loss": 3.388456344604492, "lr": 0.00025799920163275457, "tps": 13979, "wall": 64513.1} {"step": 13761, "train_loss": 3.445676803588867, "lr": 0.0002579804751811442, "tps": 13979, "wall": 64518.1} {"step": 13762, "train_loss": 3.5272438526153564, "lr": 0.000257961748299289, "tps": 13979, "wall": 64523.0} {"step": 13763, "train_loss": 3.488450527191162, "lr": 0.00025794302098740095, "tps": 13979, "wall": 64528.0} {"step": 13764, "train_loss": 3.401796340942383, "lr": 0.0002579242932456924, "tps": 13978, "wall": 64532.9} {"step": 13765, "train_loss": 3.3005661964416504, "lr": 0.0002579055650743753, "tps": 13978, "wall": 64537.8} {"step": 13766, "train_loss": 3.3356082439422607, "lr": 0.00025788683647366196, "tps": 13978, "wall": 64542.8} {"step": 13767, "train_loss": 3.4383106231689453, "lr": 0.0002578681074437645, "tps": 13978, "wall": 64547.7} {"step": 13768, "train_loss": 3.4139232635498047, "lr": 0.00025784937798489506, "tps": 13978, "wall": 64552.7} {"step": 13769, "train_loss": 3.4411911964416504, "lr": 0.0002578306480972658, "tps": 13978, "wall": 64557.7} {"step": 13770, "train_loss": 3.4053008556365967, "lr": 0.00025781191778108896, "tps": 13978, "wall": 64562.6} {"step": 13771, "train_loss": 3.325974225997925, "lr": 0.0002577931870365767, "tps": 13978, "wall": 64567.6} {"step": 13772, "train_loss": 3.5081169605255127, "lr": 0.0002577744558639411, "tps": 13978, "wall": 64572.5} {"step": 13773, "train_loss": 3.404165267944336, "lr": 0.0002577557242633944, "tps": 13978, "wall": 64577.4} {"step": 13774, "train_loss": 3.411214828491211, "lr": 0.0002577369922351488, "tps": 13978, "wall": 64582.4} {"step": 13775, "train_loss": 3.414029359817505, "lr": 0.0002577182597794166, "tps": 13978, "wall": 64587.3} {"step": 13776, "train_loss": 3.405433177947998, "lr": 0.00025769952689640987, "tps": 13978, "wall": 64592.3} {"step": 13777, "train_loss": 3.2846460342407227, "lr": 0.00025768079358634094, "tps": 13978, "wall": 64597.2} {"step": 13778, "train_loss": 3.433563709259033, "lr": 0.0002576620598494218, "tps": 13978, "wall": 64602.2} {"step": 13779, "train_loss": 3.4484190940856934, "lr": 0.00025764332568586494, "tps": 13978, "wall": 64607.1} {"step": 13780, "train_loss": 3.485110282897949, "lr": 0.00025762459109588234, "tps": 13978, "wall": 64612.0} {"step": 13781, "train_loss": 3.4435224533081055, "lr": 0.0002576058560796864, "tps": 13978, "wall": 64617.0} {"step": 13782, "train_loss": 3.460904121398926, "lr": 0.00025758712063748924, "tps": 13977, "wall": 64621.9} {"step": 13783, "train_loss": 3.369626522064209, "lr": 0.00025756838476950316, "tps": 13977, "wall": 64626.9} {"step": 13784, "train_loss": 3.490863800048828, "lr": 0.0002575496484759404, "tps": 13977, "wall": 64631.8} {"step": 13785, "train_loss": 3.455319881439209, "lr": 0.0002575309117570132, "tps": 13977, "wall": 64636.8} {"step": 13786, "train_loss": 3.4233741760253906, "lr": 0.00025751217461293376, "tps": 13977, "wall": 64641.7} {"step": 13787, "train_loss": 3.505113124847412, "lr": 0.00025749343704391443, "tps": 13977, "wall": 64646.6} {"step": 13788, "train_loss": 3.3563599586486816, "lr": 0.0002574746990501674, "tps": 13977, "wall": 64651.6} {"step": 13789, "train_loss": 3.4014227390289307, "lr": 0.00025745596063190494, "tps": 13977, "wall": 64656.6} {"step": 13790, "train_loss": 3.4077932834625244, "lr": 0.0002574372217893393, "tps": 13977, "wall": 64661.5} {"step": 13791, "train_loss": 3.391866445541382, "lr": 0.0002574184825226828, "tps": 13977, "wall": 64666.4} {"step": 13792, "train_loss": 3.370974540710449, "lr": 0.00025739974283214785, "tps": 13977, "wall": 64671.3} {"step": 13793, "train_loss": 3.3748059272766113, "lr": 0.0002573810027179464, "tps": 13977, "wall": 64676.3} {"step": 13794, "train_loss": 3.4780454635620117, "lr": 0.00025736226218029095, "tps": 13977, "wall": 64681.3} {"step": 13795, "train_loss": 3.575155258178711, "lr": 0.00025734352121939386, "tps": 13977, "wall": 64686.2} {"step": 13796, "train_loss": 3.4093992710113525, "lr": 0.0002573247798354673, "tps": 13977, "wall": 64691.2} {"step": 13797, "train_loss": 3.4394495487213135, "lr": 0.00025730603802872357, "tps": 13977, "wall": 64696.1} {"step": 13798, "train_loss": 3.441446542739868, "lr": 0.0002572872957993751, "tps": 13977, "wall": 64701.0} {"step": 13799, "train_loss": 3.4498956203460693, "lr": 0.0002572685531476341, "tps": 13977, "wall": 64706.0} {"step": 13800, "train_loss": 3.3748362064361572, "lr": 0.0002572498100737129, "tps": 13976, "wall": 64710.9} {"step": 13801, "train_loss": 3.403076648712158, "lr": 0.00025723106657782384, "tps": 13976, "wall": 64715.9} {"step": 13802, "train_loss": 3.355621337890625, "lr": 0.00025721232266017927, "tps": 13976, "wall": 64720.8} {"step": 13803, "train_loss": 3.392963171005249, "lr": 0.0002571935783209915, "tps": 13976, "wall": 64725.8} {"step": 13804, "train_loss": 3.5507121086120605, "lr": 0.0002571748335604728, "tps": 13976, "wall": 64730.7} {"step": 13805, "train_loss": 3.359358072280884, "lr": 0.0002571560883788356, "tps": 13976, "wall": 64735.6} {"step": 13806, "train_loss": 3.3421645164489746, "lr": 0.00025713734277629227, "tps": 13976, "wall": 64740.6} {"step": 13807, "train_loss": 3.419409990310669, "lr": 0.0002571185967530551, "tps": 13976, "wall": 64745.6} {"step": 13808, "train_loss": 3.471235513687134, "lr": 0.00025709985030933634, "tps": 13976, "wall": 64750.5} {"step": 13809, "train_loss": 3.4053759574890137, "lr": 0.00025708110344534863, "tps": 13976, "wall": 64755.5} {"step": 13810, "train_loss": 3.5129079818725586, "lr": 0.0002570623561613041, "tps": 13976, "wall": 64760.4} {"step": 13811, "train_loss": 3.3355793952941895, "lr": 0.0002570436084574152, "tps": 13976, "wall": 64765.3} {"step": 13812, "train_loss": 3.3663368225097656, "lr": 0.0002570248603338943, "tps": 13976, "wall": 64770.3} {"step": 13813, "train_loss": 3.422757625579834, "lr": 0.0002570061117909537, "tps": 13976, "wall": 64775.2} {"step": 13814, "train_loss": 3.4330854415893555, "lr": 0.000256987362828806, "tps": 13976, "wall": 64780.2} {"step": 13815, "train_loss": 3.455864667892456, "lr": 0.0002569686134476634, "tps": 13976, "wall": 64785.1} {"step": 13816, "train_loss": 3.39625883102417, "lr": 0.0002569498636477383, "tps": 13976, "wall": 64790.1} {"step": 13817, "train_loss": 3.424549102783203, "lr": 0.00025693111342924317, "tps": 13976, "wall": 64795.0} {"step": 13818, "train_loss": 3.4777374267578125, "lr": 0.00025691236279239046, "tps": 13975, "wall": 64800.0} {"step": 13819, "train_loss": 3.3706915378570557, "lr": 0.0002568936117373924, "tps": 13975, "wall": 64804.9} {"step": 13820, "train_loss": 3.3749518394470215, "lr": 0.0002568748602644616, "tps": 13975, "wall": 64809.9} {"step": 13821, "train_loss": 3.647693157196045, "lr": 0.0002568561083738104, "tps": 13975, "wall": 64814.8} {"step": 13822, "train_loss": 3.2839865684509277, "lr": 0.00025683735606565113, "tps": 13975, "wall": 64819.8} {"step": 13823, "train_loss": 3.3584752082824707, "lr": 0.0002568186033401963, "tps": 13975, "wall": 64824.7} {"step": 13824, "train_loss": 3.3892626762390137, "lr": 0.00025679985019765836, "tps": 13975, "wall": 64829.6} {"step": 13825, "train_loss": 3.356161594390869, "lr": 0.00025678109663824974, "tps": 13975, "wall": 64834.6} {"step": 13826, "train_loss": 3.5336716175079346, "lr": 0.00025676234266218287, "tps": 13975, "wall": 64839.5} {"step": 13827, "train_loss": 3.4583373069763184, "lr": 0.00025674358826967015, "tps": 13975, "wall": 64844.5} {"step": 13828, "train_loss": 3.358613967895508, "lr": 0.0002567248334609241, "tps": 13975, "wall": 64849.4} {"step": 13829, "train_loss": 3.408487319946289, "lr": 0.0002567060782361572, "tps": 13975, "wall": 64854.4} {"step": 13830, "train_loss": 3.3413124084472656, "lr": 0.0002566873225955818, "tps": 13975, "wall": 64859.4} {"step": 13831, "train_loss": 3.419529438018799, "lr": 0.0002566685665394104, "tps": 13975, "wall": 64864.4} {"step": 13832, "train_loss": 3.457005500793457, "lr": 0.00025664981006785553, "tps": 13975, "wall": 64869.3} {"step": 13833, "train_loss": 3.4645605087280273, "lr": 0.0002566310531811297, "tps": 13975, "wall": 64874.2} {"step": 13834, "train_loss": 3.4224610328674316, "lr": 0.0002566122958794452, "tps": 13975, "wall": 64879.2} {"step": 13835, "train_loss": 3.4950432777404785, "lr": 0.00025659353816301475, "tps": 13975, "wall": 64884.1} {"step": 13836, "train_loss": 3.320042133331299, "lr": 0.00025657478003205064, "tps": 13974, "wall": 64889.1} {"step": 13837, "train_loss": 3.4920482635498047, "lr": 0.00025655602148676545, "tps": 13974, "wall": 64894.1} {"step": 13838, "train_loss": 3.4498684406280518, "lr": 0.0002565372625273717, "tps": 13974, "wall": 64899.0} {"step": 13839, "train_loss": 3.4854636192321777, "lr": 0.00025651850315408183, "tps": 13974, "wall": 64904.0} {"step": 13840, "train_loss": 3.415247678756714, "lr": 0.0002564997433671084, "tps": 13974, "wall": 64909.0} {"step": 13841, "train_loss": 3.365715980529785, "lr": 0.0002564809831666639, "tps": 13974, "wall": 64913.9} {"step": 13842, "train_loss": 3.477355480194092, "lr": 0.0002564622225529608, "tps": 13974, "wall": 64919.0} {"step": 13843, "train_loss": 3.447460174560547, "lr": 0.00025644346152621175, "tps": 13974, "wall": 64923.9} {"step": 13844, "train_loss": 3.324981451034546, "lr": 0.0002564247000866292, "tps": 13974, "wall": 64928.9} {"step": 13845, "train_loss": 3.4252002239227295, "lr": 0.0002564059382344256, "tps": 13974, "wall": 64933.8} {"step": 13846, "train_loss": 3.4392545223236084, "lr": 0.00025638717596981365, "tps": 13974, "wall": 64938.8} {"step": 13847, "train_loss": 3.463468313217163, "lr": 0.0002563684132930057, "tps": 13974, "wall": 64943.7} {"step": 13848, "train_loss": 3.4625983238220215, "lr": 0.0002563496502042145, "tps": 13974, "wall": 64948.7} {"step": 13849, "train_loss": 3.3562655448913574, "lr": 0.00025633088670365243, "tps": 13974, "wall": 64953.7} {"step": 13850, "train_loss": 3.298464775085449, "lr": 0.0002563121227915321, "tps": 13974, "wall": 64958.6} {"step": 13851, "train_loss": 3.452754259109497, "lr": 0.0002562933584680661, "tps": 13974, "wall": 64963.6} {"step": 13852, "train_loss": 3.3112919330596924, "lr": 0.000256274593733467, "tps": 13974, "wall": 64968.5} {"step": 13853, "train_loss": 3.3463807106018066, "lr": 0.0002562558285879473, "tps": 13973, "wall": 64973.5} {"step": 13854, "train_loss": 3.3612723350524902, "lr": 0.00025623706303171963, "tps": 13973, "wall": 64978.5} {"step": 13855, "train_loss": 3.325094699859619, "lr": 0.0002562182970649965, "tps": 13973, "wall": 64983.4} {"step": 13856, "train_loss": 3.4245381355285645, "lr": 0.00025619953068799065, "tps": 13973, "wall": 64988.4} {"step": 13857, "train_loss": 3.3790817260742188, "lr": 0.00025618076390091453, "tps": 13973, "wall": 64993.3} {"step": 13858, "train_loss": 3.5006468296051025, "lr": 0.00025616199670398066, "tps": 13973, "wall": 64998.3} {"step": 13859, "train_loss": 3.396235466003418, "lr": 0.0002561432290974018, "tps": 13973, "wall": 65003.3} {"step": 13860, "train_loss": 3.395355224609375, "lr": 0.0002561244610813905, "tps": 13973, "wall": 65008.2} {"step": 13861, "train_loss": 3.4326131343841553, "lr": 0.0002561056926561594, "tps": 13973, "wall": 65013.2} {"step": 13862, "train_loss": 3.4082093238830566, "lr": 0.00025608692382192097, "tps": 13973, "wall": 65018.1} {"step": 13863, "train_loss": 3.379373073577881, "lr": 0.0002560681545788879, "tps": 13973, "wall": 65023.1} {"step": 13864, "train_loss": 3.365466833114624, "lr": 0.00025604938492727295, "tps": 13973, "wall": 65028.0} {"step": 13865, "train_loss": 3.4500341415405273, "lr": 0.00025603061486728857, "tps": 13973, "wall": 65033.0} {"step": 13866, "train_loss": 3.386533737182617, "lr": 0.00025601184439914734, "tps": 13973, "wall": 65038.0} {"step": 13867, "train_loss": 3.4672112464904785, "lr": 0.00025599307352306203, "tps": 13973, "wall": 65043.0} {"step": 13868, "train_loss": 3.4658737182617188, "lr": 0.00025597430223924525, "tps": 13973, "wall": 65047.9} {"step": 13869, "train_loss": 3.372255325317383, "lr": 0.0002559555305479097, "tps": 13973, "wall": 65052.9} {"step": 13870, "train_loss": 3.4099478721618652, "lr": 0.0002559367584492678, "tps": 13972, "wall": 65057.8} {"step": 13871, "train_loss": 3.4753236770629883, "lr": 0.00025591798594353253, "tps": 13972, "wall": 65062.8} {"step": 13872, "train_loss": 3.4641199111938477, "lr": 0.0002558992130309163, "tps": 13972, "wall": 65067.7} {"step": 13873, "train_loss": 3.4418606758117676, "lr": 0.00025588043971163174, "tps": 13972, "wall": 65072.7} {"step": 13874, "train_loss": 3.4175922870635986, "lr": 0.0002558616659858918, "tps": 13972, "wall": 65077.7} {"step": 13875, "train_loss": 3.373589038848877, "lr": 0.0002558428918539088, "tps": 13972, "wall": 65082.6} {"step": 13876, "train_loss": 3.292862892150879, "lr": 0.00025582411731589564, "tps": 13972, "wall": 65087.6} {"step": 13877, "train_loss": 3.3548312187194824, "lr": 0.000255805342372065, "tps": 13972, "wall": 65092.5} {"step": 13878, "train_loss": 3.502046823501587, "lr": 0.00025578656702262946, "tps": 13972, "wall": 65097.6} {"step": 13879, "train_loss": 3.4242348670959473, "lr": 0.0002557677912678017, "tps": 13972, "wall": 65102.5} {"step": 13880, "train_loss": 3.393336296081543, "lr": 0.00025574901510779457, "tps": 13972, "wall": 65107.5} {"step": 13881, "train_loss": 3.307981014251709, "lr": 0.0002557302385428206, "tps": 13972, "wall": 65112.4} {"step": 13882, "train_loss": 3.3757424354553223, "lr": 0.00025571146157309256, "tps": 13972, "wall": 65117.4} {"step": 13883, "train_loss": 3.467569351196289, "lr": 0.00025569268419882316, "tps": 13972, "wall": 65122.3} {"step": 13884, "train_loss": 3.4234962463378906, "lr": 0.00025567390642022516, "tps": 13972, "wall": 65127.3} {"step": 13885, "train_loss": 3.3489582538604736, "lr": 0.00025565512823751114, "tps": 13972, "wall": 65132.2} {"step": 13886, "train_loss": 3.4256739616394043, "lr": 0.0002556363496508939, "tps": 13972, "wall": 65137.2} {"step": 13887, "train_loss": 3.330040454864502, "lr": 0.0002556175706605862, "tps": 13971, "wall": 65142.2} {"step": 13888, "train_loss": 3.5380051136016846, "lr": 0.0002555987912668007, "tps": 13971, "wall": 65147.1} {"step": 13889, "train_loss": 3.4820923805236816, "lr": 0.00025558001146975016, "tps": 13971, "wall": 65152.1} {"step": 13890, "train_loss": 3.4669899940490723, "lr": 0.00025556123126964733, "tps": 13971, "wall": 65157.1} {"step": 13891, "train_loss": 3.3637237548828125, "lr": 0.000255542450666705, "tps": 13971, "wall": 65162.1} {"step": 13892, "train_loss": 3.4078752994537354, "lr": 0.00025552366966113586, "tps": 13971, "wall": 65167.0} {"step": 13893, "train_loss": 3.510222911834717, "lr": 0.0002555048882531526, "tps": 13971, "wall": 65172.0} {"step": 13894, "train_loss": 3.3702523708343506, "lr": 0.0002554861064429681, "tps": 13971, "wall": 65176.9} {"step": 13895, "train_loss": 3.3367652893066406, "lr": 0.000255467324230795, "tps": 13971, "wall": 65181.9} {"step": 13896, "train_loss": 3.376523733139038, "lr": 0.00025544854161684623, "tps": 13971, "wall": 65186.9} {"step": 13897, "train_loss": 3.3883895874023438, "lr": 0.0002554297586013344, "tps": 13971, "wall": 65191.9} {"step": 13898, "train_loss": 3.446664333343506, "lr": 0.00025541097518447237, "tps": 13971, "wall": 65196.8} {"step": 13899, "train_loss": 3.4703598022460938, "lr": 0.00025539219136647286, "tps": 13971, "wall": 65201.8} {"step": 13900, "train_loss": 3.455951452255249, "lr": 0.00025537340714754873, "tps": 13971, "wall": 65206.8} {"step": 13901, "train_loss": 3.3964004516601562, "lr": 0.00025535462252791275, "tps": 13971, "wall": 65211.7} {"step": 13902, "train_loss": 3.402644157409668, "lr": 0.00025533583750777763, "tps": 13971, "wall": 65216.7} {"step": 13903, "train_loss": 3.350785732269287, "lr": 0.00025531705208735626, "tps": 13971, "wall": 65221.7} {"step": 13904, "train_loss": 3.3880209922790527, "lr": 0.0002552982662668614, "tps": 13970, "wall": 65226.7} {"step": 13905, "train_loss": 3.3488173484802246, "lr": 0.00025527948004650593, "tps": 13970, "wall": 65231.7} {"step": 13906, "train_loss": 3.4684066772460938, "lr": 0.0002552606934265025, "tps": 13970, "wall": 65236.7} {"step": 13907, "train_loss": 3.45454478263855, "lr": 0.0002552419064070641, "tps": 13970, "wall": 65241.6} {"step": 13908, "train_loss": 3.473054885864258, "lr": 0.0002552231189884035, "tps": 13970, "wall": 65246.6} {"step": 13909, "train_loss": 3.49399471282959, "lr": 0.00025520433117073345, "tps": 13970, "wall": 65251.6} {"step": 13910, "train_loss": 3.390188694000244, "lr": 0.00025518554295426684, "tps": 13970, "wall": 65256.5} {"step": 13911, "train_loss": 3.389197826385498, "lr": 0.00025516675433921655, "tps": 13970, "wall": 65261.5} {"step": 13912, "train_loss": 3.458832263946533, "lr": 0.0002551479653257953, "tps": 13970, "wall": 65266.4} {"step": 13913, "train_loss": 3.4384138584136963, "lr": 0.00025512917591421596, "tps": 13970, "wall": 65271.4} {"step": 13914, "train_loss": 3.43731689453125, "lr": 0.0002551103861046916, "tps": 13970, "wall": 65276.4} {"step": 13915, "train_loss": 3.40238094329834, "lr": 0.0002550915958974347, "tps": 13970, "wall": 65281.4} {"step": 13916, "train_loss": 3.3737902641296387, "lr": 0.00025507280529265836, "tps": 13970, "wall": 65286.3} {"step": 13917, "train_loss": 3.4240944385528564, "lr": 0.0002550540142905754, "tps": 13970, "wall": 65291.3} {"step": 13918, "train_loss": 3.4149413108825684, "lr": 0.00025503522289139867, "tps": 13970, "wall": 65296.3} {"step": 13919, "train_loss": 3.466426372528076, "lr": 0.000255016431095341, "tps": 13970, "wall": 65301.2} {"step": 13920, "train_loss": 3.504472017288208, "lr": 0.0002549976389026153, "tps": 13969, "wall": 65306.2} {"step": 13921, "train_loss": 3.4109649658203125, "lr": 0.00025497884631343453, "tps": 13969, "wall": 65311.2} {"step": 13922, "train_loss": 3.4320626258850098, "lr": 0.0002549600533280114, "tps": 13969, "wall": 65316.2} {"step": 13923, "train_loss": 3.352769374847412, "lr": 0.00025494125994655897, "tps": 13969, "wall": 65321.1} {"step": 13924, "train_loss": 3.3836967945098877, "lr": 0.00025492246616929006, "tps": 13969, "wall": 65326.1} {"step": 13925, "train_loss": 3.3432140350341797, "lr": 0.0002549036719964175, "tps": 13969, "wall": 65331.0} {"step": 13926, "train_loss": 3.5343427658081055, "lr": 0.0002548848774281543, "tps": 13969, "wall": 65336.0} {"step": 13927, "train_loss": 3.4053900241851807, "lr": 0.0002548660824647133, "tps": 13969, "wall": 65341.1} {"step": 13928, "train_loss": 3.4279098510742188, "lr": 0.00025484728710630747, "tps": 13969, "wall": 65346.1} {"step": 13929, "train_loss": 3.4989840984344482, "lr": 0.00025482849135314965, "tps": 13969, "wall": 65351.1} {"step": 13930, "train_loss": 3.385411024093628, "lr": 0.00025480969520545277, "tps": 13969, "wall": 65356.0} {"step": 13931, "train_loss": 3.2748072147369385, "lr": 0.0002547908986634299, "tps": 13969, "wall": 65361.0} {"step": 13932, "train_loss": 3.461613655090332, "lr": 0.00025477210172729375, "tps": 13969, "wall": 65366.0} {"step": 13933, "train_loss": 3.4756577014923096, "lr": 0.0002547533043972573, "tps": 13969, "wall": 65371.0} {"step": 13934, "train_loss": 3.4182145595550537, "lr": 0.00025473450667353365, "tps": 13969, "wall": 65376.0} {"step": 13935, "train_loss": 3.3861196041107178, "lr": 0.0002547157085563356, "tps": 13969, "wall": 65381.0} {"step": 13936, "train_loss": 3.392767906188965, "lr": 0.00025469691004587606, "tps": 13968, "wall": 65385.9} {"step": 13937, "train_loss": 3.4961085319519043, "lr": 0.00025467811114236814, "tps": 13968, "wall": 65390.9} {"step": 13938, "train_loss": 3.460145950317383, "lr": 0.00025465931184602466, "tps": 13968, "wall": 65395.9} {"step": 13939, "train_loss": 3.3332390785217285, "lr": 0.0002546405121570586, "tps": 13968, "wall": 65400.9} {"step": 13940, "train_loss": 3.4851953983306885, "lr": 0.00025462171207568294, "tps": 13968, "wall": 65405.9} {"step": 13941, "train_loss": 3.2755773067474365, "lr": 0.0002546029116021107, "tps": 13968, "wall": 65410.8} {"step": 13942, "train_loss": 3.3939735889434814, "lr": 0.0002545841107365548, "tps": 13968, "wall": 65415.8} {"step": 13943, "train_loss": 3.4286980628967285, "lr": 0.00025456530947922816, "tps": 13968, "wall": 65420.7} {"step": 13944, "train_loss": 3.431723117828369, "lr": 0.0002545465078303439, "tps": 13968, "wall": 65425.7} {"step": 13945, "train_loss": 3.4491658210754395, "lr": 0.0002545277057901148, "tps": 13968, "wall": 65430.6} {"step": 13946, "train_loss": 3.413681983947754, "lr": 0.00025450890335875414, "tps": 13968, "wall": 65435.6} {"step": 13947, "train_loss": 3.2730045318603516, "lr": 0.00025449010053647466, "tps": 13968, "wall": 65440.6} {"step": 13948, "train_loss": 3.4042584896087646, "lr": 0.0002544712973234895, "tps": 13968, "wall": 65445.6} {"step": 13949, "train_loss": 3.349031925201416, "lr": 0.0002544524937200116, "tps": 13968, "wall": 65450.5} {"step": 13950, "train_loss": 3.3628945350646973, "lr": 0.000254433689726254, "tps": 13968, "wall": 65455.5} {"step": 13951, "train_loss": 3.4085583686828613, "lr": 0.0002544148853424297, "tps": 13968, "wall": 65460.6} {"step": 13952, "train_loss": 3.4877207279205322, "lr": 0.00025439608056875175, "tps": 13968, "wall": 65465.6} {"step": 13953, "train_loss": 3.35945725440979, "lr": 0.00025437727540543307, "tps": 13967, "wall": 65470.5} {"step": 13954, "train_loss": 3.3780219554901123, "lr": 0.00025435846985268675, "tps": 13967, "wall": 65475.5} {"step": 13955, "train_loss": 3.3621253967285156, "lr": 0.0002543396639107259, "tps": 13967, "wall": 65480.5} {"step": 13956, "train_loss": 3.4206223487854004, "lr": 0.00025432085757976343, "tps": 13967, "wall": 65485.4} {"step": 13957, "train_loss": 3.4146523475646973, "lr": 0.0002543020508600124, "tps": 13967, "wall": 65490.4} {"step": 13958, "train_loss": 3.3548474311828613, "lr": 0.00025428324375168594, "tps": 13967, "wall": 65495.4} {"step": 13959, "train_loss": 3.57173490524292, "lr": 0.00025426443625499706, "tps": 13967, "wall": 65500.3} {"step": 13960, "train_loss": 3.4516148567199707, "lr": 0.00025424562837015875, "tps": 13967, "wall": 65505.3} {"step": 13961, "train_loss": 3.4507131576538086, "lr": 0.000254226820097384, "tps": 13967, "wall": 65510.3} {"step": 13962, "train_loss": 3.405458927154541, "lr": 0.0002542080114368862, "tps": 13967, "wall": 65515.2} {"step": 13963, "train_loss": 3.3844358921051025, "lr": 0.00025418920238887805, "tps": 13967, "wall": 65520.3} {"step": 13964, "train_loss": 3.383596420288086, "lr": 0.0002541703929535728, "tps": 13967, "wall": 65525.2} {"step": 13965, "train_loss": 3.413325309753418, "lr": 0.00025415158313118346, "tps": 13967, "wall": 65530.2} {"step": 13966, "train_loss": 3.363119602203369, "lr": 0.0002541327729219232, "tps": 13967, "wall": 65535.1} {"step": 13967, "train_loss": 3.4835057258605957, "lr": 0.00025411396232600495, "tps": 13967, "wall": 65540.1} {"step": 13968, "train_loss": 3.4136972427368164, "lr": 0.000254095151343642, "tps": 13967, "wall": 65545.1} {"step": 13969, "train_loss": 3.333134412765503, "lr": 0.0002540763399750473, "tps": 13967, "wall": 65550.1} {"step": 13970, "train_loss": 3.355532169342041, "lr": 0.00025405752822043394, "tps": 13966, "wall": 65555.0} {"step": 13971, "train_loss": 3.398942470550537, "lr": 0.00025403871608001505, "tps": 13966, "wall": 65560.0} {"step": 13972, "train_loss": 3.343202590942383, "lr": 0.00025401990355400383, "tps": 13966, "wall": 65565.0} {"step": 13973, "train_loss": 3.4683375358581543, "lr": 0.0002540010906426132, "tps": 13966, "wall": 65570.0} {"step": 13974, "train_loss": 3.377486228942871, "lr": 0.0002539822773460564, "tps": 13966, "wall": 65574.9} {"step": 13975, "train_loss": 3.439462423324585, "lr": 0.0002539634636645466, "tps": 13966, "wall": 65580.0} {"step": 13976, "train_loss": 3.464982748031616, "lr": 0.00025394464959829674, "tps": 13966, "wall": 65585.0} {"step": 13977, "train_loss": 3.5234336853027344, "lr": 0.00025392583514752016, "tps": 13966, "wall": 65589.9} {"step": 13978, "train_loss": 3.23281192779541, "lr": 0.0002539070203124298, "tps": 13966, "wall": 65594.9} {"step": 13979, "train_loss": 3.4791650772094727, "lr": 0.0002538882050932389, "tps": 13966, "wall": 65599.9} {"step": 13980, "train_loss": 3.5384955406188965, "lr": 0.00025386938949016055, "tps": 13966, "wall": 65604.8} {"step": 13981, "train_loss": 3.3967809677124023, "lr": 0.0002538505735034079, "tps": 13966, "wall": 65609.8} {"step": 13982, "train_loss": 3.4829816818237305, "lr": 0.00025383175713319424, "tps": 13966, "wall": 65614.8} {"step": 13983, "train_loss": 3.43337345123291, "lr": 0.0002538129403797326, "tps": 13966, "wall": 65619.8} {"step": 13984, "train_loss": 3.3907527923583984, "lr": 0.00025379412324323604, "tps": 13966, "wall": 65624.8} {"step": 13985, "train_loss": 3.389716863632202, "lr": 0.0002537753057239179, "tps": 13966, "wall": 65629.7} {"step": 13986, "train_loss": 3.31522798538208, "lr": 0.00025375648782199124, "tps": 13965, "wall": 65634.7} {"step": 13987, "train_loss": 3.4595251083374023, "lr": 0.00025373766953766926, "tps": 13965, "wall": 65639.7} {"step": 13988, "train_loss": 3.48362135887146, "lr": 0.0002537188508711651, "tps": 13965, "wall": 65644.7} {"step": 13989, "train_loss": 3.3769490718841553, "lr": 0.000253700031822692, "tps": 13965, "wall": 65649.6} {"step": 13990, "train_loss": 3.447835922241211, "lr": 0.00025368121239246317, "tps": 13965, "wall": 65654.6} {"step": 13991, "train_loss": 3.3193869590759277, "lr": 0.0002536623925806916, "tps": 13965, "wall": 65659.6} {"step": 13992, "train_loss": 3.3709731101989746, "lr": 0.00025364357238759073, "tps": 13965, "wall": 65664.6} {"step": 13993, "train_loss": 3.351088047027588, "lr": 0.0002536247518133737, "tps": 13965, "wall": 65669.5} {"step": 13994, "train_loss": 3.347970724105835, "lr": 0.00025360593085825366, "tps": 13965, "wall": 65674.5} {"step": 13995, "train_loss": 3.4154052734375, "lr": 0.00025358710952244374, "tps": 13965, "wall": 65679.4} {"step": 13996, "train_loss": 3.4162893295288086, "lr": 0.00025356828780615724, "tps": 13965, "wall": 65684.4} {"step": 13997, "train_loss": 3.3841891288757324, "lr": 0.0002535494657096073, "tps": 13965, "wall": 65689.4} {"step": 13998, "train_loss": 3.4393162727355957, "lr": 0.0002535306432330073, "tps": 13965, "wall": 65694.3} {"step": 13999, "train_loss": 3.3772096633911133, "lr": 0.0002535118203765704, "tps": 13965, "wall": 65699.4} {"step": 14000, "train_loss": 3.308689594268799, "lr": 0.00025349299714050967, "tps": 13965, "wall": 65704.4, "val_loss_monitor": 3.4438035607704} {"step": 14001, "train_loss": 3.470637798309326, "lr": 0.0002534741735250385, "tps": 13954, "wall": 65758.0} {"step": 14002, "train_loss": 3.4232840538024902, "lr": 0.00025345534953037, "tps": 13954, "wall": 65763.0} {"step": 14003, "train_loss": 3.410712718963623, "lr": 0.00025343652515671765, "tps": 13954, "wall": 65768.0} {"step": 14004, "train_loss": 3.368408203125, "lr": 0.00025341770040429443, "tps": 13954, "wall": 65773.0} {"step": 14005, "train_loss": 3.329796314239502, "lr": 0.0002533988752733137, "tps": 13954, "wall": 65778.0} {"step": 14006, "train_loss": 3.4237160682678223, "lr": 0.00025338004976398876, "tps": 13954, "wall": 65782.9} {"step": 14007, "train_loss": 3.3386688232421875, "lr": 0.0002533612238765328, "tps": 13954, "wall": 65787.9} {"step": 14008, "train_loss": 3.3814191818237305, "lr": 0.00025334239761115905, "tps": 13954, "wall": 65792.9} {"step": 14009, "train_loss": 3.2957892417907715, "lr": 0.00025332357096808077, "tps": 13954, "wall": 65797.9} {"step": 14010, "train_loss": 3.411607503890991, "lr": 0.0002533047439475114, "tps": 13954, "wall": 65802.8} {"step": 14011, "train_loss": 3.420741558074951, "lr": 0.000253285916549664, "tps": 13954, "wall": 65807.8} {"step": 14012, "train_loss": 3.3935563564300537, "lr": 0.0002532670887747519, "tps": 13954, "wall": 65812.8} {"step": 14013, "train_loss": 3.3831803798675537, "lr": 0.00025324826062298855, "tps": 13953, "wall": 65817.8} {"step": 14014, "train_loss": 3.474799633026123, "lr": 0.000253229432094587, "tps": 13953, "wall": 65822.8} {"step": 14015, "train_loss": 3.38464617729187, "lr": 0.00025321060318976064, "tps": 13953, "wall": 65827.7} {"step": 14016, "train_loss": 3.4628047943115234, "lr": 0.00025319177390872285, "tps": 13953, "wall": 65832.7} {"step": 14017, "train_loss": 3.386552572250366, "lr": 0.0002531729442516868, "tps": 13953, "wall": 65837.7} {"step": 14018, "train_loss": 3.3108444213867188, "lr": 0.0002531541142188658, "tps": 13953, "wall": 65842.6} {"step": 14019, "train_loss": 3.3486618995666504, "lr": 0.0002531352838104733, "tps": 13953, "wall": 65847.6} {"step": 14020, "train_loss": 3.350985288619995, "lr": 0.0002531164530267225, "tps": 13953, "wall": 65852.6} {"step": 14021, "train_loss": 3.3686370849609375, "lr": 0.00025309762186782664, "tps": 13953, "wall": 65857.6} {"step": 14022, "train_loss": 3.519737958908081, "lr": 0.0002530787903339992, "tps": 13953, "wall": 65862.6} {"step": 14023, "train_loss": 3.3902297019958496, "lr": 0.0002530599584254534, "tps": 13953, "wall": 65867.5} {"step": 14024, "train_loss": 3.4730026721954346, "lr": 0.00025304112614240264, "tps": 13953, "wall": 65872.5} {"step": 14025, "train_loss": 3.510312557220459, "lr": 0.0002530222934850602, "tps": 13953, "wall": 65877.5} {"step": 14026, "train_loss": 3.3180789947509766, "lr": 0.0002530034604536394, "tps": 13953, "wall": 65882.5} {"step": 14027, "train_loss": 3.4168734550476074, "lr": 0.00025298462704835366, "tps": 13953, "wall": 65887.4} {"step": 14028, "train_loss": 3.3561809062957764, "lr": 0.00025296579326941626, "tps": 13953, "wall": 65892.4} {"step": 14029, "train_loss": 3.467012405395508, "lr": 0.0002529469591170406, "tps": 13953, "wall": 65897.4} {"step": 14030, "train_loss": 3.434810161590576, "lr": 0.00025292812459143995, "tps": 13952, "wall": 65902.4} {"step": 14031, "train_loss": 3.2705917358398438, "lr": 0.0002529092896928278, "tps": 13952, "wall": 65907.3} {"step": 14032, "train_loss": 3.3375802040100098, "lr": 0.00025289045442141735, "tps": 13952, "wall": 65912.3} {"step": 14033, "train_loss": 3.476468086242676, "lr": 0.00025287161877742204, "tps": 13952, "wall": 65917.3} {"step": 14034, "train_loss": 3.365067720413208, "lr": 0.0002528527827610554, "tps": 13952, "wall": 65922.2} {"step": 14035, "train_loss": 3.53336238861084, "lr": 0.0002528339463725305, "tps": 13952, "wall": 65927.2} {"step": 14036, "train_loss": 3.4297409057617188, "lr": 0.00025281510961206095, "tps": 13952, "wall": 65932.1} {"step": 14037, "train_loss": 3.371208667755127, "lr": 0.0002527962724798601, "tps": 13952, "wall": 65937.2} {"step": 14038, "train_loss": 3.3921871185302734, "lr": 0.00025277743497614124, "tps": 13952, "wall": 65942.1} {"step": 14039, "train_loss": 3.5102343559265137, "lr": 0.0002527585971011178, "tps": 13952, "wall": 65947.1} {"step": 14040, "train_loss": 3.4467368125915527, "lr": 0.00025273975885500323, "tps": 13952, "wall": 65952.1} {"step": 14041, "train_loss": 3.47804594039917, "lr": 0.00025272092023801096, "tps": 13952, "wall": 65957.1} {"step": 14042, "train_loss": 3.395352840423584, "lr": 0.00025270208125035426, "tps": 13952, "wall": 65962.0} {"step": 14043, "train_loss": 3.4888463020324707, "lr": 0.00025268324189224665, "tps": 13952, "wall": 65967.0} {"step": 14044, "train_loss": 3.4170074462890625, "lr": 0.0002526644021639015, "tps": 13952, "wall": 65972.0} {"step": 14045, "train_loss": 3.3242783546447754, "lr": 0.0002526455620655322, "tps": 13952, "wall": 65977.0} {"step": 14046, "train_loss": 3.486375331878662, "lr": 0.0002526267215973523, "tps": 13952, "wall": 65981.9} {"step": 14047, "train_loss": 3.317931652069092, "lr": 0.0002526078807595751, "tps": 13952, "wall": 65986.9} {"step": 14048, "train_loss": 3.3989524841308594, "lr": 0.000252589039552414, "tps": 13951, "wall": 65991.9} {"step": 14049, "train_loss": 3.442455768585205, "lr": 0.0002525701979760825, "tps": 13951, "wall": 65996.8} {"step": 14050, "train_loss": 3.4727783203125, "lr": 0.00025255135603079404, "tps": 13951, "wall": 66001.9} {"step": 14051, "train_loss": 3.464566230773926, "lr": 0.0002525325137167621, "tps": 13951, "wall": 66006.8} {"step": 14052, "train_loss": 3.4459190368652344, "lr": 0.00025251367103420005, "tps": 13951, "wall": 66011.8} {"step": 14053, "train_loss": 3.304286479949951, "lr": 0.00025249482798332136, "tps": 13951, "wall": 66016.7} {"step": 14054, "train_loss": 3.432220458984375, "lr": 0.0002524759845643396, "tps": 13951, "wall": 66021.7} {"step": 14055, "train_loss": 3.382150650024414, "lr": 0.00025245714077746806, "tps": 13951, "wall": 66026.6} {"step": 14056, "train_loss": 3.4867873191833496, "lr": 0.00025243829662292025, "tps": 13951, "wall": 66031.6} {"step": 14057, "train_loss": 3.4283626079559326, "lr": 0.00025241945210090975, "tps": 13951, "wall": 66036.6} {"step": 14058, "train_loss": 3.3763842582702637, "lr": 0.00025240060721164984, "tps": 13951, "wall": 66041.6} {"step": 14059, "train_loss": 3.3632702827453613, "lr": 0.00025238176195535415, "tps": 13951, "wall": 66046.5} {"step": 14060, "train_loss": 3.4399447441101074, "lr": 0.00025236291633223606, "tps": 13951, "wall": 66051.5} {"step": 14061, "train_loss": 3.3663833141326904, "lr": 0.0002523440703425092, "tps": 13951, "wall": 66056.4} {"step": 14062, "train_loss": 3.3848962783813477, "lr": 0.0002523252239863869, "tps": 13951, "wall": 66061.5} {"step": 14063, "train_loss": 3.3166303634643555, "lr": 0.00025230637726408265, "tps": 13951, "wall": 66066.5} {"step": 14064, "train_loss": 3.40004301071167, "lr": 0.0002522875301758102, "tps": 13951, "wall": 66071.4} {"step": 14065, "train_loss": 3.3715319633483887, "lr": 0.0002522686827217827, "tps": 13950, "wall": 66076.4} {"step": 14066, "train_loss": 3.4455435276031494, "lr": 0.0002522498349022138, "tps": 13950, "wall": 66081.4} {"step": 14067, "train_loss": 3.5181899070739746, "lr": 0.0002522309867173171, "tps": 13950, "wall": 66086.3} {"step": 14068, "train_loss": 3.4561638832092285, "lr": 0.000252212138167306, "tps": 13950, "wall": 66091.3} {"step": 14069, "train_loss": 3.3772788047790527, "lr": 0.0002521932892523941, "tps": 13950, "wall": 66096.2} {"step": 14070, "train_loss": 3.386326313018799, "lr": 0.0002521744399727948, "tps": 13950, "wall": 66101.2} {"step": 14071, "train_loss": 3.3339807987213135, "lr": 0.0002521555903287219, "tps": 13950, "wall": 66106.1} {"step": 14072, "train_loss": 3.426578998565674, "lr": 0.0002521367403203885, "tps": 13950, "wall": 66111.1} {"step": 14073, "train_loss": 3.369779109954834, "lr": 0.00025211788994800846, "tps": 13950, "wall": 66116.1} {"step": 14074, "train_loss": 3.392739772796631, "lr": 0.00025209903921179526, "tps": 13950, "wall": 66121.1} {"step": 14075, "train_loss": 3.3529162406921387, "lr": 0.0002520801881119624, "tps": 13950, "wall": 66126.0} {"step": 14076, "train_loss": 3.3439528942108154, "lr": 0.00025206133664872337, "tps": 13950, "wall": 66131.0} {"step": 14077, "train_loss": 3.373751163482666, "lr": 0.00025204248482229175, "tps": 13950, "wall": 66135.9} {"step": 14078, "train_loss": 3.471412181854248, "lr": 0.0002520236326328813, "tps": 13950, "wall": 66140.9} {"step": 14079, "train_loss": 3.36096453666687, "lr": 0.0002520047800807052, "tps": 13950, "wall": 66145.9} {"step": 14080, "train_loss": 3.3455424308776855, "lr": 0.00025198592716597733, "tps": 13950, "wall": 66150.8} {"step": 14081, "train_loss": 3.4567816257476807, "lr": 0.0002519670738889112, "tps": 13950, "wall": 66155.8} {"step": 14082, "train_loss": 3.445280075073242, "lr": 0.00025194822024972026, "tps": 13950, "wall": 66160.7} {"step": 14083, "train_loss": 3.4006924629211426, "lr": 0.00025192936624861815, "tps": 13949, "wall": 66165.7} {"step": 14084, "train_loss": 3.477365732192993, "lr": 0.0002519105118858185, "tps": 13949, "wall": 66170.6} {"step": 14085, "train_loss": 3.2519283294677734, "lr": 0.00025189165716153473, "tps": 13949, "wall": 66175.6} {"step": 14086, "train_loss": 3.3708109855651855, "lr": 0.00025187280207598066, "tps": 13949, "wall": 66180.6} {"step": 14087, "train_loss": 3.3705334663391113, "lr": 0.00025185394662936974, "tps": 13949, "wall": 66185.6} {"step": 14088, "train_loss": 3.5195703506469727, "lr": 0.00025183509082191553, "tps": 13949, "wall": 66190.5} {"step": 14089, "train_loss": 3.316650867462158, "lr": 0.00025181623465383177, "tps": 13949, "wall": 66195.5} {"step": 14090, "train_loss": 3.384992837905884, "lr": 0.00025179737812533194, "tps": 13949, "wall": 66200.4} {"step": 14091, "train_loss": 3.3745672702789307, "lr": 0.00025177852123662973, "tps": 13949, "wall": 66205.4} {"step": 14092, "train_loss": 3.3770084381103516, "lr": 0.00025175966398793863, "tps": 13949, "wall": 66210.3} {"step": 14093, "train_loss": 3.332365036010742, "lr": 0.0002517408063794724, "tps": 13949, "wall": 66215.3} {"step": 14094, "train_loss": 3.4592208862304688, "lr": 0.0002517219484114446, "tps": 13949, "wall": 66220.2} {"step": 14095, "train_loss": 3.4192986488342285, "lr": 0.0002517030900840688, "tps": 13949, "wall": 66225.2} {"step": 14096, "train_loss": 3.3992738723754883, "lr": 0.0002516842313975587, "tps": 13949, "wall": 66230.1} {"step": 14097, "train_loss": 3.4224624633789062, "lr": 0.00025166537235212796, "tps": 13949, "wall": 66235.1} {"step": 14098, "train_loss": 3.478297233581543, "lr": 0.00025164651294799014, "tps": 13949, "wall": 66240.1} {"step": 14099, "train_loss": 3.364717721939087, "lr": 0.00025162765318535886, "tps": 13949, "wall": 66245.1} {"step": 14100, "train_loss": 3.389733076095581, "lr": 0.0002516087930644479, "tps": 13949, "wall": 66250.1} {"step": 14101, "train_loss": 3.5293192863464355, "lr": 0.0002515899325854708, "tps": 13948, "wall": 66255.1} {"step": 14102, "train_loss": 3.4857380390167236, "lr": 0.00025157107174864123, "tps": 13948, "wall": 66260.0} {"step": 14103, "train_loss": 3.4793577194213867, "lr": 0.00025155221055417283, "tps": 13948, "wall": 66265.0} {"step": 14104, "train_loss": 3.398747682571411, "lr": 0.00025153334900227924, "tps": 13948, "wall": 66270.0} {"step": 14105, "train_loss": 3.3657379150390625, "lr": 0.00025151448709317427, "tps": 13948, "wall": 66274.9} {"step": 14106, "train_loss": 3.3701353073120117, "lr": 0.0002514956248270714, "tps": 13948, "wall": 66279.9} {"step": 14107, "train_loss": 3.444340705871582, "lr": 0.0002514767622041844, "tps": 13948, "wall": 66284.9} {"step": 14108, "train_loss": 3.4525647163391113, "lr": 0.000251457899224727, "tps": 13948, "wall": 66289.8} {"step": 14109, "train_loss": 3.4341471195220947, "lr": 0.0002514390358889128, "tps": 13948, "wall": 66294.8} {"step": 14110, "train_loss": 3.3672752380371094, "lr": 0.00025142017219695545, "tps": 13948, "wall": 66299.8} {"step": 14111, "train_loss": 3.4224915504455566, "lr": 0.0002514013081490687, "tps": 13948, "wall": 66304.8} {"step": 14112, "train_loss": 3.443763494491577, "lr": 0.0002513824437454662, "tps": 13948, "wall": 66309.8} {"step": 14113, "train_loss": 3.3774325847625732, "lr": 0.00025136357898636173, "tps": 13948, "wall": 66314.7} {"step": 14114, "train_loss": 3.3756041526794434, "lr": 0.000251344713871969, "tps": 13948, "wall": 66319.7} {"step": 14115, "train_loss": 3.533236026763916, "lr": 0.00025132584840250157, "tps": 13948, "wall": 66324.6} {"step": 14116, "train_loss": 3.4260315895080566, "lr": 0.00025130698257817325, "tps": 13948, "wall": 66329.6} {"step": 14117, "train_loss": 3.3980817794799805, "lr": 0.00025128811639919775, "tps": 13948, "wall": 66334.5} {"step": 14118, "train_loss": 3.3684263229370117, "lr": 0.00025126924986578874, "tps": 13947, "wall": 66339.5} {"step": 14119, "train_loss": 3.35404109954834, "lr": 0.00025125038297816004, "tps": 13947, "wall": 66344.5} {"step": 14120, "train_loss": 3.56318998336792, "lr": 0.00025123151573652524, "tps": 13947, "wall": 66349.4} {"step": 14121, "train_loss": 3.364097833633423, "lr": 0.0002512126481410982, "tps": 13947, "wall": 66354.4} {"step": 14122, "train_loss": 3.4001731872558594, "lr": 0.0002511937801920926, "tps": 13947, "wall": 66359.4} {"step": 14123, "train_loss": 3.467686176300049, "lr": 0.0002511749118897221, "tps": 13947, "wall": 66364.3} {"step": 14124, "train_loss": 3.467358112335205, "lr": 0.0002511560432342005, "tps": 13947, "wall": 66369.3} {"step": 14125, "train_loss": 3.359252452850342, "lr": 0.0002511371742257416, "tps": 13947, "wall": 66374.3} {"step": 14126, "train_loss": 3.3667263984680176, "lr": 0.00025111830486455915, "tps": 13947, "wall": 66379.3} {"step": 14127, "train_loss": 3.4220573902130127, "lr": 0.00025109943515086685, "tps": 13947, "wall": 66384.3} {"step": 14128, "train_loss": 3.363015651702881, "lr": 0.0002510805650848784, "tps": 13947, "wall": 66389.2} {"step": 14129, "train_loss": 3.2739624977111816, "lr": 0.0002510616946668077, "tps": 13947, "wall": 66394.2} {"step": 14130, "train_loss": 3.4732840061187744, "lr": 0.00025104282389686836, "tps": 13947, "wall": 66399.1} {"step": 14131, "train_loss": 3.3637278079986572, "lr": 0.00025102395277527427, "tps": 13947, "wall": 66404.1} {"step": 14132, "train_loss": 3.3676042556762695, "lr": 0.00025100508130223925, "tps": 13947, "wall": 66409.1} {"step": 14133, "train_loss": 3.3420872688293457, "lr": 0.00025098620947797693, "tps": 13947, "wall": 66414.0} {"step": 14134, "train_loss": 3.4904768466949463, "lr": 0.00025096733730270107, "tps": 13947, "wall": 66419.1} {"step": 14135, "train_loss": 3.576692819595337, "lr": 0.0002509484647766256, "tps": 13947, "wall": 66424.0} {"step": 14136, "train_loss": 3.395979881286621, "lr": 0.00025092959189996426, "tps": 13946, "wall": 66429.0} {"step": 14137, "train_loss": 3.3724727630615234, "lr": 0.0002509107186729308, "tps": 13946, "wall": 66433.9} {"step": 14138, "train_loss": 3.2731049060821533, "lr": 0.0002508918450957391, "tps": 13946, "wall": 66438.9} {"step": 14139, "train_loss": 3.4781100749969482, "lr": 0.00025087297116860286, "tps": 13946, "wall": 66443.8} {"step": 14140, "train_loss": 3.4297943115234375, "lr": 0.00025085409689173596, "tps": 13946, "wall": 66448.8} {"step": 14141, "train_loss": 3.3510987758636475, "lr": 0.00025083522226535215, "tps": 13946, "wall": 66453.8} {"step": 14142, "train_loss": 3.47647762298584, "lr": 0.0002508163472896653, "tps": 13946, "wall": 66458.7} {"step": 14143, "train_loss": 3.3602232933044434, "lr": 0.0002507974719648892, "tps": 13946, "wall": 66463.7} {"step": 14144, "train_loss": 3.4505786895751953, "lr": 0.0002507785962912377, "tps": 13946, "wall": 66468.7} {"step": 14145, "train_loss": 3.385145664215088, "lr": 0.0002507597202689245, "tps": 13946, "wall": 66473.6} {"step": 14146, "train_loss": 3.3508853912353516, "lr": 0.00025074084389816364, "tps": 13946, "wall": 66478.7} {"step": 14147, "train_loss": 3.4556210041046143, "lr": 0.00025072196717916876, "tps": 13946, "wall": 66483.6} {"step": 14148, "train_loss": 3.4792888164520264, "lr": 0.00025070309011215376, "tps": 13946, "wall": 66488.6} {"step": 14149, "train_loss": 3.3653717041015625, "lr": 0.00025068421269733255, "tps": 13946, "wall": 66493.5} {"step": 14150, "train_loss": 3.468667984008789, "lr": 0.0002506653349349189, "tps": 13946, "wall": 66498.5} {"step": 14151, "train_loss": 3.4175751209259033, "lr": 0.0002506464568251267, "tps": 13946, "wall": 66503.5} {"step": 14152, "train_loss": 3.3487372398376465, "lr": 0.0002506275783681697, "tps": 13946, "wall": 66508.4} {"step": 14153, "train_loss": 3.3774163722991943, "lr": 0.0002506086995642619, "tps": 13946, "wall": 66513.4} {"step": 14154, "train_loss": 3.436814785003662, "lr": 0.00025058982041361715, "tps": 13945, "wall": 66518.4} {"step": 14155, "train_loss": 3.3925538063049316, "lr": 0.0002505709409164492, "tps": 13945, "wall": 66523.4} {"step": 14156, "train_loss": 3.358299732208252, "lr": 0.00025055206107297195, "tps": 13945, "wall": 66528.4} {"step": 14157, "train_loss": 3.4243907928466797, "lr": 0.0002505331808833993, "tps": 13945, "wall": 66533.3} {"step": 14158, "train_loss": 3.424996852874756, "lr": 0.00025051430034794516, "tps": 13945, "wall": 66538.4} {"step": 14159, "train_loss": 3.3556108474731445, "lr": 0.00025049541946682336, "tps": 13945, "wall": 66543.3} {"step": 14160, "train_loss": 3.339280128479004, "lr": 0.0002504765382402478, "tps": 13945, "wall": 66548.3} {"step": 14161, "train_loss": 3.3451225757598877, "lr": 0.00025045765666843235, "tps": 13945, "wall": 66553.3} {"step": 14162, "train_loss": 3.3175179958343506, "lr": 0.0002504387747515909, "tps": 13945, "wall": 66558.2} {"step": 14163, "train_loss": 3.485398530960083, "lr": 0.0002504198924899374, "tps": 13945, "wall": 66563.2} {"step": 14164, "train_loss": 3.293922185897827, "lr": 0.00025040100988368575, "tps": 13945, "wall": 66568.2} {"step": 14165, "train_loss": 3.387904405593872, "lr": 0.00025038212693304974, "tps": 13945, "wall": 66573.1} {"step": 14166, "train_loss": 3.4356577396392822, "lr": 0.0002503632436382435, "tps": 13945, "wall": 66578.1} {"step": 14167, "train_loss": 3.3162009716033936, "lr": 0.00025034435999948064, "tps": 13945, "wall": 66583.1} {"step": 14168, "train_loss": 3.3208398818969727, "lr": 0.0002503254760169752, "tps": 13945, "wall": 66588.1} {"step": 14169, "train_loss": 3.40419340133667, "lr": 0.00025030659169094125, "tps": 13945, "wall": 66593.0} {"step": 14170, "train_loss": 3.4436330795288086, "lr": 0.00025028770702159256, "tps": 13945, "wall": 66598.1} {"step": 14171, "train_loss": 3.484541416168213, "lr": 0.000250268822009143, "tps": 13944, "wall": 66603.0} {"step": 14172, "train_loss": 3.4607315063476562, "lr": 0.0002502499366538067, "tps": 13944, "wall": 66608.0} {"step": 14173, "train_loss": 3.5070440769195557, "lr": 0.0002502310509557974, "tps": 13944, "wall": 66612.9} {"step": 14174, "train_loss": 3.338846206665039, "lr": 0.00025021216491532915, "tps": 13944, "wall": 66617.9} {"step": 14175, "train_loss": 3.4401538372039795, "lr": 0.00025019327853261587, "tps": 13944, "wall": 66622.9} {"step": 14176, "train_loss": 3.364874839782715, "lr": 0.0002501743918078715, "tps": 13944, "wall": 66627.8} {"step": 14177, "train_loss": 3.5681381225585938, "lr": 0.00025015550474130995, "tps": 13944, "wall": 66632.8} {"step": 14178, "train_loss": 3.2873635292053223, "lr": 0.00025013661733314525, "tps": 13944, "wall": 66637.7} {"step": 14179, "train_loss": 3.2970328330993652, "lr": 0.0002501177295835913, "tps": 13944, "wall": 66642.7} {"step": 14180, "train_loss": 3.3635711669921875, "lr": 0.0002500988414928621, "tps": 13944, "wall": 66647.7} {"step": 14181, "train_loss": 3.2807278633117676, "lr": 0.0002500799530611716, "tps": 13944, "wall": 66652.6} {"step": 14182, "train_loss": 3.2922143936157227, "lr": 0.00025006106428873367, "tps": 13944, "wall": 66657.7} {"step": 14183, "train_loss": 3.4656355381011963, "lr": 0.0002500421751757625, "tps": 13944, "wall": 66662.6} {"step": 14184, "train_loss": 3.408450126647949, "lr": 0.0002500232857224719, "tps": 13944, "wall": 66667.6} {"step": 14185, "train_loss": 3.287278652191162, "lr": 0.0002500043959290759, "tps": 13944, "wall": 66672.6} {"step": 14186, "train_loss": 3.435422897338867, "lr": 0.00024998550579578843, "tps": 13944, "wall": 66677.5} {"step": 14187, "train_loss": 3.320584297180176, "lr": 0.0002499666153228236, "tps": 13944, "wall": 66682.5} {"step": 14188, "train_loss": 3.3229358196258545, "lr": 0.00024994772451039524, "tps": 13944, "wall": 66687.4} {"step": 14189, "train_loss": 3.3274402618408203, "lr": 0.00024992883335871755, "tps": 13943, "wall": 66692.4} {"step": 14190, "train_loss": 3.432033061981201, "lr": 0.00024990994186800436, "tps": 13943, "wall": 66697.3} {"step": 14191, "train_loss": 3.4727931022644043, "lr": 0.00024989105003846976, "tps": 13943, "wall": 66702.3} {"step": 14192, "train_loss": 3.3982815742492676, "lr": 0.00024987215787032765, "tps": 13943, "wall": 66707.3} {"step": 14193, "train_loss": 3.350827693939209, "lr": 0.0002498532653637922, "tps": 13943, "wall": 66712.2} {"step": 14194, "train_loss": 3.4990789890289307, "lr": 0.0002498343725190773, "tps": 13943, "wall": 66717.2} {"step": 14195, "train_loss": 3.353386402130127, "lr": 0.00024981547933639704, "tps": 13943, "wall": 66722.2} {"step": 14196, "train_loss": 3.424960136413574, "lr": 0.0002497965858159654, "tps": 13943, "wall": 66727.2} {"step": 14197, "train_loss": 3.4608092308044434, "lr": 0.00024977769195799645, "tps": 13943, "wall": 66732.1} {"step": 14198, "train_loss": 3.3576903343200684, "lr": 0.0002497587977627042, "tps": 13943, "wall": 66737.1} {"step": 14199, "train_loss": 3.5331342220306396, "lr": 0.0002497399032303027, "tps": 13943, "wall": 66742.0} {"step": 14200, "train_loss": 3.373720645904541, "lr": 0.00024972100836100585, "tps": 13943, "wall": 66747.0} {"step": 14201, "train_loss": 3.406287670135498, "lr": 0.0002497021131550279, "tps": 13943, "wall": 66751.9} {"step": 14202, "train_loss": 3.373352527618408, "lr": 0.0002496832176125828, "tps": 13943, "wall": 66756.9} {"step": 14203, "train_loss": 3.4369988441467285, "lr": 0.00024966432173388457, "tps": 13943, "wall": 66761.9} {"step": 14204, "train_loss": 3.426757574081421, "lr": 0.0002496454255191473, "tps": 13943, "wall": 66766.8} {"step": 14205, "train_loss": 3.3421576023101807, "lr": 0.0002496265289685851, "tps": 13943, "wall": 66771.8} {"step": 14206, "train_loss": 3.3840038776397705, "lr": 0.00024960763208241196, "tps": 13943, "wall": 66776.8} {"step": 14207, "train_loss": 3.311330556869507, "lr": 0.0002495887348608419, "tps": 13942, "wall": 66781.8} {"step": 14208, "train_loss": 3.3436079025268555, "lr": 0.0002495698373040892, "tps": 13942, "wall": 66786.7} {"step": 14209, "train_loss": 3.4099292755126953, "lr": 0.00024955093941236763, "tps": 13942, "wall": 66791.7} {"step": 14210, "train_loss": 3.2877371311187744, "lr": 0.0002495320411858914, "tps": 13942, "wall": 66796.6} {"step": 14211, "train_loss": 3.3465325832366943, "lr": 0.00024951314262487473, "tps": 13942, "wall": 66801.7} {"step": 14212, "train_loss": 3.454145908355713, "lr": 0.00024949424372953157, "tps": 13942, "wall": 66806.6} {"step": 14213, "train_loss": 3.38957142829895, "lr": 0.0002494753445000759, "tps": 13942, "wall": 66811.6} {"step": 14214, "train_loss": 3.3784894943237305, "lr": 0.0002494564449367221, "tps": 13942, "wall": 66816.6} {"step": 14215, "train_loss": 3.412564277648926, "lr": 0.000249437545039684, "tps": 13942, "wall": 66821.5} {"step": 14216, "train_loss": 3.4647092819213867, "lr": 0.0002494186448091758, "tps": 13942, "wall": 66826.5} {"step": 14217, "train_loss": 3.4030919075012207, "lr": 0.00024939974424541164, "tps": 13942, "wall": 66831.5} {"step": 14218, "train_loss": 3.3922119140625, "lr": 0.0002493808433486055, "tps": 13942, "wall": 66836.4} {"step": 14219, "train_loss": 3.4208788871765137, "lr": 0.0002493619421189716, "tps": 13942, "wall": 66841.5} {"step": 14220, "train_loss": 3.366018772125244, "lr": 0.00024934304055672406, "tps": 13942, "wall": 66846.4} {"step": 14221, "train_loss": 3.336510181427002, "lr": 0.00024932413866207703, "tps": 13942, "wall": 66851.4} {"step": 14222, "train_loss": 3.3676352500915527, "lr": 0.00024930523643524455, "tps": 13942, "wall": 66856.3} {"step": 14223, "train_loss": 3.3560259342193604, "lr": 0.0002492863338764407, "tps": 13942, "wall": 66861.3} {"step": 14224, "train_loss": 3.412196159362793, "lr": 0.0002492674309858797, "tps": 13941, "wall": 66866.3} {"step": 14225, "train_loss": 3.402548313140869, "lr": 0.0002492485277637757, "tps": 13941, "wall": 66871.2} {"step": 14226, "train_loss": 3.3453447818756104, "lr": 0.0002492296242103427, "tps": 13941, "wall": 66876.2} {"step": 14227, "train_loss": 3.370063304901123, "lr": 0.000249210720325795, "tps": 13941, "wall": 66881.2} {"step": 14228, "train_loss": 3.443635940551758, "lr": 0.00024919181611034673, "tps": 13941, "wall": 66886.1} {"step": 14229, "train_loss": 3.498805046081543, "lr": 0.0002491729115642119, "tps": 13941, "wall": 66891.1} {"step": 14230, "train_loss": 3.4169516563415527, "lr": 0.0002491540066876048, "tps": 13941, "wall": 66896.1} {"step": 14231, "train_loss": 3.424731492996216, "lr": 0.00024913510148073955, "tps": 13941, "wall": 66901.1} {"step": 14232, "train_loss": 3.352047920227051, "lr": 0.00024911619594383024, "tps": 13941, "wall": 66906.0} {"step": 14233, "train_loss": 3.3958444595336914, "lr": 0.00024909729007709114, "tps": 13941, "wall": 66911.0} {"step": 14234, "train_loss": 3.3031277656555176, "lr": 0.0002490783838807363, "tps": 13941, "wall": 66916.0} {"step": 14235, "train_loss": 3.4314045906066895, "lr": 0.00024905947735498, "tps": 13941, "wall": 66921.0} {"step": 14236, "train_loss": 3.4576497077941895, "lr": 0.00024904057050003633, "tps": 13941, "wall": 66925.9} {"step": 14237, "train_loss": 3.454880475997925, "lr": 0.0002490216633161195, "tps": 13941, "wall": 66930.9} {"step": 14238, "train_loss": 3.4553794860839844, "lr": 0.0002490027558034438, "tps": 13941, "wall": 66935.9} {"step": 14239, "train_loss": 3.487710475921631, "lr": 0.00024898384796222326, "tps": 13941, "wall": 66940.8} {"step": 14240, "train_loss": 3.366645574569702, "lr": 0.0002489649397926721, "tps": 13941, "wall": 66945.8} {"step": 14241, "train_loss": 3.3900787830352783, "lr": 0.0002489460312950045, "tps": 13941, "wall": 66950.8} {"step": 14242, "train_loss": 3.5656206607818604, "lr": 0.0002489271224694348, "tps": 13940, "wall": 66955.7} {"step": 14243, "train_loss": 3.3850035667419434, "lr": 0.000248908213316177, "tps": 13940, "wall": 66960.7} {"step": 14244, "train_loss": 3.4803872108459473, "lr": 0.00024888930383544543, "tps": 13940, "wall": 66965.7} {"step": 14245, "train_loss": 3.409334659576416, "lr": 0.00024887039402745427, "tps": 13940, "wall": 66970.7} {"step": 14246, "train_loss": 3.4485743045806885, "lr": 0.00024885148389241775, "tps": 13940, "wall": 66975.6} {"step": 14247, "train_loss": 3.3470141887664795, "lr": 0.00024883257343054994, "tps": 13940, "wall": 66980.6} {"step": 14248, "train_loss": 3.3410251140594482, "lr": 0.0002488136626420653, "tps": 13940, "wall": 66985.5} {"step": 14249, "train_loss": 3.482219934463501, "lr": 0.0002487947515271779, "tps": 13940, "wall": 66990.5} {"step": 14250, "train_loss": 3.352940082550049, "lr": 0.00024877584008610194, "tps": 13940, "wall": 66995.4} {"step": 14251, "train_loss": 3.424994707107544, "lr": 0.00024875692831905177, "tps": 13940, "wall": 67000.4} {"step": 14252, "train_loss": 3.385315418243408, "lr": 0.00024873801622624157, "tps": 13940, "wall": 67005.3} {"step": 14253, "train_loss": 3.411858558654785, "lr": 0.0002487191038078855, "tps": 13940, "wall": 67010.3} {"step": 14254, "train_loss": 3.4074904918670654, "lr": 0.0002487001910641979, "tps": 13940, "wall": 67015.3} {"step": 14255, "train_loss": 3.397667646408081, "lr": 0.000248681277995393, "tps": 13940, "wall": 67020.3} {"step": 14256, "train_loss": 3.3723702430725098, "lr": 0.000248662364601685, "tps": 13940, "wall": 67025.2} {"step": 14257, "train_loss": 3.37766432762146, "lr": 0.0002486434508832882, "tps": 13940, "wall": 67030.2} {"step": 14258, "train_loss": 3.4138662815093994, "lr": 0.0002486245368404169, "tps": 13940, "wall": 67035.2} {"step": 14259, "train_loss": 3.317196846008301, "lr": 0.00024860562247328526, "tps": 13940, "wall": 67040.1} {"step": 14260, "train_loss": 3.381840229034424, "lr": 0.0002485867077821075, "tps": 13940, "wall": 67045.1} {"step": 14261, "train_loss": 3.402359962463379, "lr": 0.0002485677927670981, "tps": 13939, "wall": 67050.0} {"step": 14262, "train_loss": 3.2925846576690674, "lr": 0.0002485488774284711, "tps": 13939, "wall": 67055.0} {"step": 14263, "train_loss": 3.3667454719543457, "lr": 0.0002485299617664409, "tps": 13939, "wall": 67060.0} {"step": 14264, "train_loss": 3.3944129943847656, "lr": 0.0002485110457812218, "tps": 13939, "wall": 67064.9} {"step": 14265, "train_loss": 3.305185079574585, "lr": 0.00024849212947302795, "tps": 13939, "wall": 67069.9} {"step": 14266, "train_loss": 3.388306140899658, "lr": 0.00024847321284207375, "tps": 13939, "wall": 67074.9} {"step": 14267, "train_loss": 3.458766460418701, "lr": 0.0002484542958885734, "tps": 13939, "wall": 67079.9} {"step": 14268, "train_loss": 3.355297088623047, "lr": 0.00024843537861274134, "tps": 13939, "wall": 67084.8} {"step": 14269, "train_loss": 3.283602237701416, "lr": 0.00024841646101479177, "tps": 13939, "wall": 67089.8} {"step": 14270, "train_loss": 3.5457119941711426, "lr": 0.0002483975430949389, "tps": 13939, "wall": 67094.8} {"step": 14271, "train_loss": 3.3366448879241943, "lr": 0.0002483786248533972, "tps": 13939, "wall": 67099.7} {"step": 14272, "train_loss": 3.4117300510406494, "lr": 0.0002483597062903809, "tps": 13939, "wall": 67104.7} {"step": 14273, "train_loss": 3.3595566749572754, "lr": 0.00024834078740610424, "tps": 13939, "wall": 67109.7} {"step": 14274, "train_loss": 3.4073359966278076, "lr": 0.0002483218682007817, "tps": 13939, "wall": 67114.7} {"step": 14275, "train_loss": 3.321117639541626, "lr": 0.00024830294867462746, "tps": 13939, "wall": 67119.6} {"step": 14276, "train_loss": 3.3530771732330322, "lr": 0.00024828402882785594, "tps": 13939, "wall": 67124.6} {"step": 14277, "train_loss": 3.3781116008758545, "lr": 0.0002482651086606813, "tps": 13939, "wall": 67129.6} {"step": 14278, "train_loss": 3.3278675079345703, "lr": 0.0002482461881733181, "tps": 13938, "wall": 67134.6} {"step": 14279, "train_loss": 3.3512356281280518, "lr": 0.00024822726736598044, "tps": 13938, "wall": 67139.6} {"step": 14280, "train_loss": 3.4114139080047607, "lr": 0.00024820834623888287, "tps": 13938, "wall": 67144.6} {"step": 14281, "train_loss": 3.399311065673828, "lr": 0.00024818942479223953, "tps": 13938, "wall": 67149.6} {"step": 14282, "train_loss": 3.345921516418457, "lr": 0.000248170503026265, "tps": 13938, "wall": 67154.5} {"step": 14283, "train_loss": 3.319014549255371, "lr": 0.00024815158094117337, "tps": 13938, "wall": 67159.5} {"step": 14284, "train_loss": 3.3905014991760254, "lr": 0.0002481326585371792, "tps": 13938, "wall": 67164.5} {"step": 14285, "train_loss": 3.4649410247802734, "lr": 0.00024811373581449663, "tps": 13938, "wall": 67169.5} {"step": 14286, "train_loss": 3.3865323066711426, "lr": 0.00024809481277334025, "tps": 13938, "wall": 67174.4} {"step": 14287, "train_loss": 3.41054105758667, "lr": 0.00024807588941392424, "tps": 13938, "wall": 67179.4} {"step": 14288, "train_loss": 3.4135282039642334, "lr": 0.00024805696573646305, "tps": 13938, "wall": 67184.3} {"step": 14289, "train_loss": 3.4497649669647217, "lr": 0.0002480380417411711, "tps": 13938, "wall": 67189.3} {"step": 14290, "train_loss": 3.4274117946624756, "lr": 0.0002480191174282626, "tps": 13938, "wall": 67194.3} {"step": 14291, "train_loss": 3.375701427459717, "lr": 0.00024800019279795204, "tps": 13938, "wall": 67199.3} {"step": 14292, "train_loss": 3.4057905673980713, "lr": 0.0002479812678504538, "tps": 13938, "wall": 67204.3} {"step": 14293, "train_loss": 3.409241199493408, "lr": 0.00024796234258598227, "tps": 13938, "wall": 67209.2} {"step": 14294, "train_loss": 3.2670297622680664, "lr": 0.0002479434170047518, "tps": 13938, "wall": 67214.2} {"step": 14295, "train_loss": 3.3877367973327637, "lr": 0.0002479244911069767, "tps": 13938, "wall": 67219.1} {"step": 14296, "train_loss": 3.3726632595062256, "lr": 0.0002479055648928716, "tps": 13937, "wall": 67224.1} {"step": 14297, "train_loss": 3.4516148567199707, "lr": 0.00024788663836265067, "tps": 13937, "wall": 67229.1} {"step": 14298, "train_loss": 3.393432855606079, "lr": 0.00024786771151652845, "tps": 13937, "wall": 67234.0} {"step": 14299, "train_loss": 3.484264373779297, "lr": 0.0002478487843547192, "tps": 13937, "wall": 67239.0} {"step": 14300, "train_loss": 3.335942268371582, "lr": 0.00024782985687743747, "tps": 13937, "wall": 67243.9} {"step": 14301, "train_loss": 3.4533169269561768, "lr": 0.00024781092908489756, "tps": 13937, "wall": 67248.9} {"step": 14302, "train_loss": 3.432560920715332, "lr": 0.000247792000977314, "tps": 13937, "wall": 67253.9} {"step": 14303, "train_loss": 3.476228713989258, "lr": 0.0002477730725549011, "tps": 13937, "wall": 67258.9} {"step": 14304, "train_loss": 3.3561155796051025, "lr": 0.0002477541438178734, "tps": 13937, "wall": 67263.9} {"step": 14305, "train_loss": 3.4754700660705566, "lr": 0.0002477352147664452, "tps": 13937, "wall": 67268.9} {"step": 14306, "train_loss": 3.4344170093536377, "lr": 0.00024771628540083105, "tps": 13937, "wall": 67273.8} {"step": 14307, "train_loss": 3.4523508548736572, "lr": 0.0002476973557212453, "tps": 13937, "wall": 67278.8} {"step": 14308, "train_loss": 3.3883886337280273, "lr": 0.00024767842572790235, "tps": 13937, "wall": 67283.8} {"step": 14309, "train_loss": 3.38855242729187, "lr": 0.0002476594954210167, "tps": 13937, "wall": 67288.8} {"step": 14310, "train_loss": 3.452212333679199, "lr": 0.00024764056480080284, "tps": 13937, "wall": 67293.7} {"step": 14311, "train_loss": 3.2561488151550293, "lr": 0.00024762163386747517, "tps": 13937, "wall": 67298.7} {"step": 14312, "train_loss": 3.3675289154052734, "lr": 0.0002476027026212481, "tps": 13937, "wall": 67303.6} {"step": 14313, "train_loss": 3.3841488361358643, "lr": 0.0002475837710623361, "tps": 13937, "wall": 67308.6} {"step": 14314, "train_loss": 3.3175277709960938, "lr": 0.0002475648391909537, "tps": 13936, "wall": 67313.6} {"step": 14315, "train_loss": 3.491611957550049, "lr": 0.0002475459070073153, "tps": 13936, "wall": 67318.6} {"step": 14316, "train_loss": 3.458408832550049, "lr": 0.0002475269745116354, "tps": 13936, "wall": 67323.6} {"step": 14317, "train_loss": 3.463397264480591, "lr": 0.00024750804170412834, "tps": 13936, "wall": 67328.5} {"step": 14318, "train_loss": 3.477881908416748, "lr": 0.0002474891085850088, "tps": 13936, "wall": 67333.5} {"step": 14319, "train_loss": 3.390655755996704, "lr": 0.00024747017515449113, "tps": 13936, "wall": 67338.4} {"step": 14320, "train_loss": 3.436161518096924, "lr": 0.0002474512414127898, "tps": 13936, "wall": 67343.4} {"step": 14321, "train_loss": 3.4267663955688477, "lr": 0.00024743230736011936, "tps": 13936, "wall": 67348.4} {"step": 14322, "train_loss": 3.3672666549682617, "lr": 0.0002474133729966942, "tps": 13936, "wall": 67353.3} {"step": 14323, "train_loss": 3.559825897216797, "lr": 0.0002473944383227289, "tps": 13936, "wall": 67358.3} {"step": 14324, "train_loss": 3.389730930328369, "lr": 0.00024737550333843797, "tps": 13936, "wall": 67363.3} {"step": 14325, "train_loss": 3.4109878540039062, "lr": 0.00024735656804403575, "tps": 13936, "wall": 67368.3} {"step": 14326, "train_loss": 3.3907289505004883, "lr": 0.000247337632439737, "tps": 13936, "wall": 67373.2} {"step": 14327, "train_loss": 3.4227993488311768, "lr": 0.00024731869652575597, "tps": 13936, "wall": 67378.3} {"step": 14328, "train_loss": 3.447511911392212, "lr": 0.00024729976030230726, "tps": 13936, "wall": 67383.2} {"step": 14329, "train_loss": 3.4299983978271484, "lr": 0.00024728082376960543, "tps": 13936, "wall": 67388.2} {"step": 14330, "train_loss": 3.3080101013183594, "lr": 0.0002472618869278649, "tps": 13936, "wall": 67393.1} {"step": 14331, "train_loss": 3.4514732360839844, "lr": 0.00024724294977730027, "tps": 13936, "wall": 67398.1} {"step": 14332, "train_loss": 3.3712267875671387, "lr": 0.000247224012318126, "tps": 13935, "wall": 67403.0} {"step": 14333, "train_loss": 3.4122726917266846, "lr": 0.00024720507455055677, "tps": 13935, "wall": 67408.0} {"step": 14334, "train_loss": 3.2145493030548096, "lr": 0.00024718613647480687, "tps": 13935, "wall": 67413.0} {"step": 14335, "train_loss": 3.5324864387512207, "lr": 0.0002471671980910909, "tps": 13935, "wall": 67417.9} {"step": 14336, "train_loss": 3.406123161315918, "lr": 0.0002471482593996235, "tps": 13935, "wall": 67422.9} {"step": 14337, "train_loss": 3.336446762084961, "lr": 0.0002471293204006192, "tps": 13935, "wall": 67427.8} {"step": 14338, "train_loss": 3.42167329788208, "lr": 0.00024711038109429245, "tps": 13935, "wall": 67432.8} {"step": 14339, "train_loss": 3.4632606506347656, "lr": 0.00024709144148085785, "tps": 13935, "wall": 67437.8} {"step": 14340, "train_loss": 3.480654239654541, "lr": 0.00024707250156052985, "tps": 13935, "wall": 67442.8} {"step": 14341, "train_loss": 3.409489631652832, "lr": 0.0002470535613335232, "tps": 13935, "wall": 67447.7} {"step": 14342, "train_loss": 3.3845341205596924, "lr": 0.0002470346208000523, "tps": 13935, "wall": 67452.7} {"step": 14343, "train_loss": 3.4158482551574707, "lr": 0.00024701567996033175, "tps": 13935, "wall": 67457.7} {"step": 14344, "train_loss": 3.470994472503662, "lr": 0.0002469967388145761, "tps": 13935, "wall": 67462.6} {"step": 14345, "train_loss": 3.3509461879730225, "lr": 0.00024697779736299996, "tps": 13935, "wall": 67467.7} {"step": 14346, "train_loss": 3.357924461364746, "lr": 0.0002469588556058179, "tps": 13935, "wall": 67472.6} {"step": 14347, "train_loss": 3.4532008171081543, "lr": 0.0002469399135432444, "tps": 13935, "wall": 67477.6} {"step": 14348, "train_loss": 3.466089963912964, "lr": 0.00024692097117549416, "tps": 13935, "wall": 67482.6} {"step": 14349, "train_loss": 3.3130667209625244, "lr": 0.00024690202850278164, "tps": 13935, "wall": 67487.5} {"step": 14350, "train_loss": 3.408067464828491, "lr": 0.0002468830855253215, "tps": 13934, "wall": 67492.5} {"step": 14351, "train_loss": 3.3640177249908447, "lr": 0.00024686414224332835, "tps": 13934, "wall": 67497.5} {"step": 14352, "train_loss": 3.4999423027038574, "lr": 0.0002468451986570167, "tps": 13934, "wall": 67502.5} {"step": 14353, "train_loss": 3.416121006011963, "lr": 0.0002468262547666012, "tps": 13934, "wall": 67507.5} {"step": 14354, "train_loss": 3.3410820960998535, "lr": 0.0002468073105722965, "tps": 13934, "wall": 67512.4} {"step": 14355, "train_loss": 3.3632309436798096, "lr": 0.0002467883660743171, "tps": 13934, "wall": 67517.3} {"step": 14356, "train_loss": 3.423365831375122, "lr": 0.00024676942127287757, "tps": 13934, "wall": 67522.3} {"step": 14357, "train_loss": 3.390998363494873, "lr": 0.00024675047616819267, "tps": 13934, "wall": 67527.3} {"step": 14358, "train_loss": 3.4858431816101074, "lr": 0.00024673153076047684, "tps": 13934, "wall": 67532.2} {"step": 14359, "train_loss": 3.438399314880371, "lr": 0.00024671258504994486, "tps": 13934, "wall": 67537.2} {"step": 14360, "train_loss": 3.370640993118286, "lr": 0.0002466936390368113, "tps": 13934, "wall": 67542.2} {"step": 14361, "train_loss": 3.3540072441101074, "lr": 0.00024667469272129065, "tps": 13934, "wall": 67547.2} {"step": 14362, "train_loss": 3.514540433883667, "lr": 0.0002466557461035977, "tps": 13934, "wall": 67552.1} {"step": 14363, "train_loss": 3.281620502471924, "lr": 0.000246636799183947, "tps": 13934, "wall": 67557.1} {"step": 14364, "train_loss": 3.3895273208618164, "lr": 0.0002466178519625532, "tps": 13934, "wall": 67562.1} {"step": 14365, "train_loss": 3.3797011375427246, "lr": 0.00024659890443963094, "tps": 13934, "wall": 67567.0} {"step": 14366, "train_loss": 3.438399076461792, "lr": 0.00024657995661539483, "tps": 13934, "wall": 67572.0} {"step": 14367, "train_loss": 3.370708465576172, "lr": 0.00024656100849005963, "tps": 13934, "wall": 67576.9} {"step": 14368, "train_loss": 3.3042335510253906, "lr": 0.00024654206006383985, "tps": 13934, "wall": 67581.9} {"step": 14369, "train_loss": 3.38067889213562, "lr": 0.00024652311133695014, "tps": 13933, "wall": 67586.8} {"step": 14370, "train_loss": 3.3824594020843506, "lr": 0.00024650416230960514, "tps": 13933, "wall": 67591.8} {"step": 14371, "train_loss": 3.3264384269714355, "lr": 0.00024648521298201967, "tps": 13933, "wall": 67596.8} {"step": 14372, "train_loss": 3.3955626487731934, "lr": 0.0002464662633544082, "tps": 13933, "wall": 67601.7} {"step": 14373, "train_loss": 3.3795793056488037, "lr": 0.00024644731342698544, "tps": 13933, "wall": 67606.7} {"step": 14374, "train_loss": 3.3924639225006104, "lr": 0.0002464283631999662, "tps": 13933, "wall": 67611.7} {"step": 14375, "train_loss": 3.3696341514587402, "lr": 0.0002464094126735649, "tps": 13933, "wall": 67616.6} {"step": 14376, "train_loss": 3.3793468475341797, "lr": 0.00024639046184799635, "tps": 13933, "wall": 67621.6} {"step": 14377, "train_loss": 3.4268534183502197, "lr": 0.0002463715107234753, "tps": 13933, "wall": 67626.6} {"step": 14378, "train_loss": 3.529017210006714, "lr": 0.0002463525593002163, "tps": 13933, "wall": 67631.6} {"step": 14379, "train_loss": 3.285247564315796, "lr": 0.0002463336075784341, "tps": 13933, "wall": 67636.5} {"step": 14380, "train_loss": 3.417588233947754, "lr": 0.00024631465555834337, "tps": 13933, "wall": 67641.5} {"step": 14381, "train_loss": 3.400722026824951, "lr": 0.00024629570324015887, "tps": 13933, "wall": 67646.5} {"step": 14382, "train_loss": 3.435485601425171, "lr": 0.0002462767506240951, "tps": 13933, "wall": 67651.4} {"step": 14383, "train_loss": 3.3631820678710938, "lr": 0.00024625779771036694, "tps": 13933, "wall": 67656.4} {"step": 14384, "train_loss": 3.300142765045166, "lr": 0.000246238844499189, "tps": 13933, "wall": 67661.4} {"step": 14385, "train_loss": 3.42040753364563, "lr": 0.000246219890990776, "tps": 13933, "wall": 67666.3} {"step": 14386, "train_loss": 3.4025204181671143, "lr": 0.0002462009371853427, "tps": 13933, "wall": 67671.3} {"step": 14387, "train_loss": 3.441944122314453, "lr": 0.00024618198308310374, "tps": 13932, "wall": 67676.3} {"step": 14388, "train_loss": 3.3369367122650146, "lr": 0.00024616302868427385, "tps": 13932, "wall": 67681.3} {"step": 14389, "train_loss": 3.4427075386047363, "lr": 0.00024614407398906775, "tps": 13932, "wall": 67686.2} {"step": 14390, "train_loss": 3.5237526893615723, "lr": 0.00024612511899770024, "tps": 13932, "wall": 67691.2} {"step": 14391, "train_loss": 3.38541316986084, "lr": 0.0002461061637103859, "tps": 13932, "wall": 67696.1} {"step": 14392, "train_loss": 3.463481903076172, "lr": 0.00024608720812733956, "tps": 13932, "wall": 67701.1} {"step": 14393, "train_loss": 3.4431004524230957, "lr": 0.00024606825224877585, "tps": 13932, "wall": 67706.1} {"step": 14394, "train_loss": 3.439380407333374, "lr": 0.0002460492960749097, "tps": 13932, "wall": 67711.1} {"step": 14395, "train_loss": 3.353923797607422, "lr": 0.00024603033960595555, "tps": 13932, "wall": 67716.0} {"step": 14396, "train_loss": 3.3523473739624023, "lr": 0.0002460113828421284, "tps": 13932, "wall": 67721.0} {"step": 14397, "train_loss": 3.419870376586914, "lr": 0.0002459924257836428, "tps": 13932, "wall": 67725.9} {"step": 14398, "train_loss": 3.297389507293701, "lr": 0.00024597346843071373, "tps": 13932, "wall": 67730.9} {"step": 14399, "train_loss": 3.462186813354492, "lr": 0.0002459545107835558, "tps": 13932, "wall": 67735.9} {"step": 14400, "train_loss": 3.44865345954895, "lr": 0.00024593555284238366, "tps": 13932, "wall": 67740.9} {"step": 14401, "train_loss": 3.4697976112365723, "lr": 0.0002459165946074123, "tps": 13932, "wall": 67745.9} {"step": 14402, "train_loss": 3.3750946521759033, "lr": 0.0002458976360788563, "tps": 13932, "wall": 67750.8} {"step": 14403, "train_loss": 3.397531747817993, "lr": 0.00024587867725693043, "tps": 13932, "wall": 67755.8} {"step": 14404, "train_loss": 3.3127963542938232, "lr": 0.0002458597181418495, "tps": 13932, "wall": 67760.7} {"step": 14405, "train_loss": 3.373720169067383, "lr": 0.00024584075873382836, "tps": 13932, "wall": 67765.7} {"step": 14406, "train_loss": 3.3659486770629883, "lr": 0.00024582179903308163, "tps": 13931, "wall": 67770.7} {"step": 14407, "train_loss": 3.4015090465545654, "lr": 0.0002458028390398242, "tps": 13931, "wall": 67775.7} {"step": 14408, "train_loss": 3.377078056335449, "lr": 0.0002457838787542708, "tps": 13931, "wall": 67780.6} {"step": 14409, "train_loss": 3.3166706562042236, "lr": 0.00024576491817663627, "tps": 13931, "wall": 67785.6} {"step": 14410, "train_loss": 3.413357734680176, "lr": 0.0002457459573071353, "tps": 13931, "wall": 67790.6} {"step": 14411, "train_loss": 3.439387083053589, "lr": 0.0002457269961459828, "tps": 13931, "wall": 67795.5} {"step": 14412, "train_loss": 3.480846643447876, "lr": 0.0002457080346933935, "tps": 13931, "wall": 67800.5} {"step": 14413, "train_loss": 3.4020814895629883, "lr": 0.0002456890729495821, "tps": 13931, "wall": 67805.5} {"step": 14414, "train_loss": 3.2949752807617188, "lr": 0.0002456701109147635, "tps": 13931, "wall": 67810.5} {"step": 14415, "train_loss": 3.3703815937042236, "lr": 0.0002456511485891526, "tps": 13931, "wall": 67815.4} {"step": 14416, "train_loss": 3.286808490753174, "lr": 0.00024563218597296394, "tps": 13931, "wall": 67820.3} {"step": 14417, "train_loss": 3.309607744216919, "lr": 0.0002456132230664126, "tps": 13931, "wall": 67825.3} {"step": 14418, "train_loss": 3.4584736824035645, "lr": 0.00024559425986971333, "tps": 13931, "wall": 67830.3} {"step": 14419, "train_loss": 3.335530996322632, "lr": 0.00024557529638308083, "tps": 13931, "wall": 67835.2} {"step": 14420, "train_loss": 3.366804599761963, "lr": 0.00024555633260673, "tps": 13931, "wall": 67840.2} {"step": 14421, "train_loss": 3.3633790016174316, "lr": 0.0002455373685408757, "tps": 13931, "wall": 67845.1} {"step": 14422, "train_loss": 3.3078441619873047, "lr": 0.00024551840418573264, "tps": 13931, "wall": 67850.1} {"step": 14423, "train_loss": 3.414130210876465, "lr": 0.00024549943954151564, "tps": 13931, "wall": 67855.0} {"step": 14424, "train_loss": 3.3671016693115234, "lr": 0.00024548047460843975, "tps": 13930, "wall": 67860.1} {"step": 14425, "train_loss": 3.3930370807647705, "lr": 0.00024546150938671964, "tps": 13930, "wall": 67865.0} {"step": 14426, "train_loss": 3.3764641284942627, "lr": 0.00024544254387657015, "tps": 13930, "wall": 67870.0} {"step": 14427, "train_loss": 3.3834948539733887, "lr": 0.00024542357807820606, "tps": 13930, "wall": 67874.9} {"step": 14428, "train_loss": 3.383826494216919, "lr": 0.00024540461199184247, "tps": 13930, "wall": 67879.9} {"step": 14429, "train_loss": 3.38808274269104, "lr": 0.00024538564561769395, "tps": 13930, "wall": 67884.8} {"step": 14430, "train_loss": 3.3205347061157227, "lr": 0.0002453666789559755, "tps": 13930, "wall": 67889.8} {"step": 14431, "train_loss": 3.336907386779785, "lr": 0.00024534771200690193, "tps": 13930, "wall": 67894.7} {"step": 14432, "train_loss": 3.4134323596954346, "lr": 0.0002453287447706881, "tps": 13930, "wall": 67899.7} {"step": 14433, "train_loss": 3.4043526649475098, "lr": 0.0002453097772475489, "tps": 13930, "wall": 67904.6} {"step": 14434, "train_loss": 3.5312857627868652, "lr": 0.0002452908094376991, "tps": 13930, "wall": 67909.6} {"step": 14435, "train_loss": 3.4621100425720215, "lr": 0.00024527184134135377, "tps": 13930, "wall": 67914.5} {"step": 14436, "train_loss": 3.365487813949585, "lr": 0.0002452528729587276, "tps": 13930, "wall": 67919.6} {"step": 14437, "train_loss": 3.3158984184265137, "lr": 0.0002452339042900355, "tps": 13930, "wall": 67924.5} {"step": 14438, "train_loss": 3.4011964797973633, "lr": 0.0002452149353354924, "tps": 13930, "wall": 67929.4} {"step": 14439, "train_loss": 3.4313528537750244, "lr": 0.0002451959660953131, "tps": 13930, "wall": 67934.4} {"step": 14440, "train_loss": 3.359950542449951, "lr": 0.00024517699656971255, "tps": 13930, "wall": 67939.4} {"step": 14441, "train_loss": 3.389505624771118, "lr": 0.0002451580267589056, "tps": 13930, "wall": 67944.3} {"step": 14442, "train_loss": 3.393470287322998, "lr": 0.0002451390566631072, "tps": 13930, "wall": 67949.3} {"step": 14443, "train_loss": 3.3586015701293945, "lr": 0.00024512008628253226, "tps": 13929, "wall": 67954.3} {"step": 14444, "train_loss": 3.4061079025268555, "lr": 0.00024510111561739544, "tps": 13929, "wall": 67959.2} {"step": 14445, "train_loss": 3.387932300567627, "lr": 0.000245082144667912, "tps": 13929, "wall": 67964.2} {"step": 14446, "train_loss": 3.311544179916382, "lr": 0.0002450631734342966, "tps": 13929, "wall": 67969.1} {"step": 14447, "train_loss": 3.4592392444610596, "lr": 0.00024504420191676427, "tps": 13929, "wall": 67974.1} {"step": 14448, "train_loss": 3.3994271755218506, "lr": 0.00024502523011552983, "tps": 13929, "wall": 67979.1} {"step": 14449, "train_loss": 3.419436454772949, "lr": 0.00024500625803080823, "tps": 13929, "wall": 67984.1} {"step": 14450, "train_loss": 3.39980411529541, "lr": 0.00024498728566281437, "tps": 13929, "wall": 67989.0} {"step": 14451, "train_loss": 3.4484825134277344, "lr": 0.00024496831301176313, "tps": 13929, "wall": 67994.0} {"step": 14452, "train_loss": 3.301036834716797, "lr": 0.0002449493400778697, "tps": 13929, "wall": 67998.9} {"step": 14453, "train_loss": 3.3417418003082275, "lr": 0.0002449303668613486, "tps": 13929, "wall": 68003.9} {"step": 14454, "train_loss": 3.3781306743621826, "lr": 0.00024491139336241496, "tps": 13929, "wall": 68008.8} {"step": 14455, "train_loss": 3.426175117492676, "lr": 0.00024489241958128375, "tps": 13929, "wall": 68013.8} {"step": 14456, "train_loss": 3.403869152069092, "lr": 0.00024487344551816993, "tps": 13929, "wall": 68018.7} {"step": 14457, "train_loss": 3.3666088581085205, "lr": 0.00024485447117328824, "tps": 13929, "wall": 68023.7} {"step": 14458, "train_loss": 3.39406418800354, "lr": 0.0002448354965468538, "tps": 13929, "wall": 68028.6} {"step": 14459, "train_loss": 3.3827919960021973, "lr": 0.0002448165216390816, "tps": 13929, "wall": 68033.6} {"step": 14460, "train_loss": 3.438615322113037, "lr": 0.00024479754645018647, "tps": 13929, "wall": 68038.6} {"step": 14461, "train_loss": 3.3875820636749268, "lr": 0.00024477857098038333, "tps": 13929, "wall": 68043.6} {"step": 14462, "train_loss": 3.4620981216430664, "lr": 0.0002447595952298872, "tps": 13928, "wall": 68048.5} {"step": 14463, "train_loss": 3.4767704010009766, "lr": 0.00024474061919891314, "tps": 13928, "wall": 68053.5} {"step": 14464, "train_loss": 3.3911547660827637, "lr": 0.0002447216428876759, "tps": 13928, "wall": 68058.4} {"step": 14465, "train_loss": 3.298020601272583, "lr": 0.00024470266629639053, "tps": 13928, "wall": 68063.4} {"step": 14466, "train_loss": 3.4315545558929443, "lr": 0.0002446836894252722, "tps": 13928, "wall": 68068.3} {"step": 14467, "train_loss": 3.4963600635528564, "lr": 0.0002446647122745355, "tps": 13928, "wall": 68073.3} {"step": 14468, "train_loss": 3.3129115104675293, "lr": 0.00024464573484439566, "tps": 13928, "wall": 68078.3} {"step": 14469, "train_loss": 3.3665008544921875, "lr": 0.0002446267571350677, "tps": 13928, "wall": 68083.2} {"step": 14470, "train_loss": 3.4142777919769287, "lr": 0.0002446077791467664, "tps": 13928, "wall": 68088.2} {"step": 14471, "train_loss": 3.478978395462036, "lr": 0.0002445888008797068, "tps": 13928, "wall": 68093.1} {"step": 14472, "train_loss": 3.352756977081299, "lr": 0.000244569822334104, "tps": 13928, "wall": 68098.2} {"step": 14473, "train_loss": 3.38852596282959, "lr": 0.00024455084351017296, "tps": 13928, "wall": 68103.1} {"step": 14474, "train_loss": 3.276817798614502, "lr": 0.0002445318644081286, "tps": 13928, "wall": 68108.1} {"step": 14475, "train_loss": 3.458458662033081, "lr": 0.00024451288502818594, "tps": 13928, "wall": 68113.0} {"step": 14476, "train_loss": 3.490152359008789, "lr": 0.00024449390537056, "tps": 13928, "wall": 68118.0} {"step": 14477, "train_loss": 3.373793601989746, "lr": 0.00024447492543546584, "tps": 13928, "wall": 68122.9} {"step": 14478, "train_loss": 3.4763150215148926, "lr": 0.00024445594522311834, "tps": 13928, "wall": 68127.9} {"step": 14479, "train_loss": 3.3259246349334717, "lr": 0.00024443696473373257, "tps": 13928, "wall": 68132.8} {"step": 14480, "train_loss": 3.3878173828125, "lr": 0.0002444179839675236, "tps": 13928, "wall": 68137.8} {"step": 14481, "train_loss": 3.4320621490478516, "lr": 0.00024439900292470623, "tps": 13928, "wall": 68142.7} {"step": 14482, "train_loss": 3.387899398803711, "lr": 0.00024438002160549575, "tps": 13927, "wall": 68147.7} {"step": 14483, "train_loss": 3.358884811401367, "lr": 0.0002443610400101071, "tps": 13927, "wall": 68152.6} {"step": 14484, "train_loss": 3.416095733642578, "lr": 0.0002443420581387552, "tps": 13927, "wall": 68157.7} {"step": 14485, "train_loss": 3.3660290241241455, "lr": 0.0002443230759916552, "tps": 13927, "wall": 68162.6} {"step": 14486, "train_loss": 3.4394896030426025, "lr": 0.00024430409356902203, "tps": 13927, "wall": 68167.6} {"step": 14487, "train_loss": 3.392946243286133, "lr": 0.0002442851108710708, "tps": 13927, "wall": 68172.5} {"step": 14488, "train_loss": 3.3257994651794434, "lr": 0.0002442661278980165, "tps": 13927, "wall": 68177.5} {"step": 14489, "train_loss": 3.3005869388580322, "lr": 0.0002442471446500742, "tps": 13927, "wall": 68182.5} {"step": 14490, "train_loss": 3.3161840438842773, "lr": 0.000244228161127459, "tps": 13927, "wall": 68187.4} {"step": 14491, "train_loss": 3.4311728477478027, "lr": 0.0002442091773303858, "tps": 13927, "wall": 68192.4} {"step": 14492, "train_loss": 3.4709858894348145, "lr": 0.00024419019325906975, "tps": 13927, "wall": 68197.3} {"step": 14493, "train_loss": 3.4019360542297363, "lr": 0.0002441712089137259, "tps": 13927, "wall": 68202.3} {"step": 14494, "train_loss": 3.4431581497192383, "lr": 0.0002441522242945693, "tps": 13927, "wall": 68207.2} {"step": 14495, "train_loss": 3.483764171600342, "lr": 0.0002441332394018149, "tps": 13927, "wall": 68212.2} {"step": 14496, "train_loss": 3.4220147132873535, "lr": 0.00024411425423567792, "tps": 13927, "wall": 68217.2} {"step": 14497, "train_loss": 3.3955752849578857, "lr": 0.0002440952687963734, "tps": 13927, "wall": 68222.2} {"step": 14498, "train_loss": 3.4470810890197754, "lr": 0.00024407628308411634, "tps": 13927, "wall": 68227.1} {"step": 14499, "train_loss": 3.4158430099487305, "lr": 0.0002440572970991218, "tps": 13927, "wall": 68232.1} {"step": 14500, "train_loss": 3.297758102416992, "lr": 0.00024403831084160498, "tps": 13927, "wall": 68237.1} {"step": 14501, "train_loss": 3.4823081493377686, "lr": 0.00024401932431178085, "tps": 13926, "wall": 68242.2} {"step": 14502, "train_loss": 3.351689338684082, "lr": 0.00024400033750986445, "tps": 13926, "wall": 68247.2} {"step": 14503, "train_loss": 3.351167678833008, "lr": 0.00024398135043607102, "tps": 13926, "wall": 68252.2} {"step": 14504, "train_loss": 3.4286303520202637, "lr": 0.0002439623630906155, "tps": 13926, "wall": 68257.1} {"step": 14505, "train_loss": 3.284637212753296, "lr": 0.00024394337547371304, "tps": 13926, "wall": 68262.1} {"step": 14506, "train_loss": 3.3921332359313965, "lr": 0.00024392438758557875, "tps": 13926, "wall": 68267.1} {"step": 14507, "train_loss": 3.352426767349243, "lr": 0.00024390539942642766, "tps": 13926, "wall": 68272.0} {"step": 14508, "train_loss": 3.30930757522583, "lr": 0.00024388641099647496, "tps": 13926, "wall": 68277.0} {"step": 14509, "train_loss": 3.4431469440460205, "lr": 0.00024386742229593568, "tps": 13926, "wall": 68282.0} {"step": 14510, "train_loss": 3.4406607151031494, "lr": 0.00024384843332502496, "tps": 13926, "wall": 68286.9} {"step": 14511, "train_loss": 3.4094769954681396, "lr": 0.00024382944408395788, "tps": 13926, "wall": 68291.9} {"step": 14512, "train_loss": 3.323869228363037, "lr": 0.00024381045457294955, "tps": 13926, "wall": 68296.8} {"step": 14513, "train_loss": 3.494762659072876, "lr": 0.00024379146479221512, "tps": 13926, "wall": 68301.8} {"step": 14514, "train_loss": 3.3755722045898438, "lr": 0.0002437724747419697, "tps": 13926, "wall": 68306.7} {"step": 14515, "train_loss": 3.4298171997070312, "lr": 0.00024375348442242842, "tps": 13926, "wall": 68311.7} {"step": 14516, "train_loss": 3.3017337322235107, "lr": 0.00024373449383380632, "tps": 13926, "wall": 68316.7} {"step": 14517, "train_loss": 3.474104404449463, "lr": 0.0002437155029763187, "tps": 13926, "wall": 68321.6} {"step": 14518, "train_loss": 3.3311362266540527, "lr": 0.00024369651185018046, "tps": 13926, "wall": 68326.6} {"step": 14519, "train_loss": 3.487445116043091, "lr": 0.00024367752045560695, "tps": 13925, "wall": 68331.6} {"step": 14520, "train_loss": 3.476865530014038, "lr": 0.00024365852879281317, "tps": 13925, "wall": 68336.5} {"step": 14521, "train_loss": 3.4520084857940674, "lr": 0.00024363953686201427, "tps": 13925, "wall": 68341.5} {"step": 14522, "train_loss": 3.34883975982666, "lr": 0.00024362054466342542, "tps": 13925, "wall": 68346.5} {"step": 14523, "train_loss": 3.3878660202026367, "lr": 0.00024360155219726185, "tps": 13925, "wall": 68351.5} {"step": 14524, "train_loss": 3.365365505218506, "lr": 0.00024358255946373847, "tps": 13925, "wall": 68356.4} {"step": 14525, "train_loss": 3.27583384513855, "lr": 0.00024356356646307065, "tps": 13925, "wall": 68361.4} {"step": 14526, "train_loss": 3.3925299644470215, "lr": 0.00024354457319547348, "tps": 13925, "wall": 68366.3} {"step": 14527, "train_loss": 3.436022996902466, "lr": 0.00024352557966116214, "tps": 13925, "wall": 68371.3} {"step": 14528, "train_loss": 3.381807804107666, "lr": 0.0002435065858603517, "tps": 13925, "wall": 68376.3} {"step": 14529, "train_loss": 3.400932788848877, "lr": 0.00024348759179325743, "tps": 13925, "wall": 68381.2} {"step": 14530, "train_loss": 3.441842555999756, "lr": 0.0002434685974600945, "tps": 13925, "wall": 68386.2} {"step": 14531, "train_loss": 3.382808208465576, "lr": 0.00024344960286107795, "tps": 13925, "wall": 68391.2} {"step": 14532, "train_loss": 3.421262741088867, "lr": 0.00024343060799642297, "tps": 13925, "wall": 68396.2} {"step": 14533, "train_loss": 3.428596258163452, "lr": 0.00024341161286634493, "tps": 13925, "wall": 68401.2} {"step": 14534, "train_loss": 3.443777322769165, "lr": 0.00024339261747105884, "tps": 13925, "wall": 68406.2} {"step": 14535, "train_loss": 3.4187698364257812, "lr": 0.00024337362181077983, "tps": 13925, "wall": 68411.1} {"step": 14536, "train_loss": 3.3799147605895996, "lr": 0.00024335462588572326, "tps": 13925, "wall": 68416.1} {"step": 14537, "train_loss": 3.437072515487671, "lr": 0.0002433356296961042, "tps": 13924, "wall": 68421.1} {"step": 14538, "train_loss": 3.5268454551696777, "lr": 0.00024331663324213788, "tps": 13924, "wall": 68426.0} {"step": 14539, "train_loss": 3.3066158294677734, "lr": 0.00024329763652403946, "tps": 13924, "wall": 68431.0} {"step": 14540, "train_loss": 3.379021167755127, "lr": 0.00024327863954202409, "tps": 13924, "wall": 68436.0} {"step": 14541, "train_loss": 3.392641067504883, "lr": 0.0002432596422963071, "tps": 13924, "wall": 68440.9} {"step": 14542, "train_loss": 3.4456052780151367, "lr": 0.00024324064478710363, "tps": 13924, "wall": 68445.9} {"step": 14543, "train_loss": 3.3259549140930176, "lr": 0.00024322164701462887, "tps": 13924, "wall": 68450.9} {"step": 14544, "train_loss": 3.421515941619873, "lr": 0.00024320264897909803, "tps": 13924, "wall": 68455.9} {"step": 14545, "train_loss": 3.4359872341156006, "lr": 0.0002431836506807263, "tps": 13924, "wall": 68460.9} {"step": 14546, "train_loss": 3.4428963661193848, "lr": 0.0002431646521197289, "tps": 13924, "wall": 68465.9} {"step": 14547, "train_loss": 3.3373968601226807, "lr": 0.00024314565329632112, "tps": 13924, "wall": 68470.8} {"step": 14548, "train_loss": 3.4023451805114746, "lr": 0.00024312665421071815, "tps": 13924, "wall": 68475.8} {"step": 14549, "train_loss": 3.508975028991699, "lr": 0.00024310765486313516, "tps": 13924, "wall": 68480.8} {"step": 14550, "train_loss": 3.3479068279266357, "lr": 0.0002430886552537874, "tps": 13924, "wall": 68485.7} {"step": 14551, "train_loss": 3.3599259853363037, "lr": 0.00024306965538289013, "tps": 13924, "wall": 68490.7} {"step": 14552, "train_loss": 3.480239152908325, "lr": 0.0002430506552506585, "tps": 13924, "wall": 68495.6} {"step": 14553, "train_loss": 3.3594212532043457, "lr": 0.0002430316548573078, "tps": 13924, "wall": 68500.6} {"step": 14554, "train_loss": 3.391369342803955, "lr": 0.00024301265420305338, "tps": 13924, "wall": 68505.6} {"step": 14555, "train_loss": 3.310300350189209, "lr": 0.00024299365328811026, "tps": 13924, "wall": 68510.5} {"step": 14556, "train_loss": 3.4142141342163086, "lr": 0.00024297465211269378, "tps": 13923, "wall": 68515.5} {"step": 14557, "train_loss": 3.3371949195861816, "lr": 0.00024295565067701923, "tps": 13923, "wall": 68520.5} {"step": 14558, "train_loss": 3.357038974761963, "lr": 0.0002429366489813019, "tps": 13923, "wall": 68525.5} {"step": 14559, "train_loss": 3.3534891605377197, "lr": 0.00024291764702575686, "tps": 13923, "wall": 68530.5} {"step": 14560, "train_loss": 3.365328550338745, "lr": 0.00024289864481059952, "tps": 13923, "wall": 68535.4} {"step": 14561, "train_loss": 3.339332342147827, "lr": 0.00024287964233604516, "tps": 13923, "wall": 68540.4} {"step": 14562, "train_loss": 3.3168368339538574, "lr": 0.0002428606396023089, "tps": 13923, "wall": 68545.3} {"step": 14563, "train_loss": 3.460113525390625, "lr": 0.00024284163660960603, "tps": 13923, "wall": 68550.2} {"step": 14564, "train_loss": 3.391378879547119, "lr": 0.00024282263335815194, "tps": 13923, "wall": 68555.2} {"step": 14565, "train_loss": 3.3722245693206787, "lr": 0.00024280362984816184, "tps": 13923, "wall": 68560.1} {"step": 14566, "train_loss": 3.3167684078216553, "lr": 0.00024278462607985093, "tps": 13923, "wall": 68565.1} {"step": 14567, "train_loss": 3.3784618377685547, "lr": 0.00024276562205343454, "tps": 13923, "wall": 68570.1} {"step": 14568, "train_loss": 3.3931939601898193, "lr": 0.000242746617769128, "tps": 13923, "wall": 68575.0} {"step": 14569, "train_loss": 3.368950843811035, "lr": 0.0002427276132271465, "tps": 13923, "wall": 68580.1} {"step": 14570, "train_loss": 3.484391927719116, "lr": 0.0002427086084277054, "tps": 13923, "wall": 68585.0} {"step": 14571, "train_loss": 3.481750726699829, "lr": 0.00024268960337101993, "tps": 13923, "wall": 68590.0} {"step": 14572, "train_loss": 3.290926456451416, "lr": 0.00024267059805730545, "tps": 13923, "wall": 68595.0} {"step": 14573, "train_loss": 3.365560531616211, "lr": 0.00024265159248677715, "tps": 13923, "wall": 68600.0} {"step": 14574, "train_loss": 3.3191471099853516, "lr": 0.00024263258665965044, "tps": 13923, "wall": 68604.9} {"step": 14575, "train_loss": 3.434479236602783, "lr": 0.00024261358057614055, "tps": 13922, "wall": 68609.9} {"step": 14576, "train_loss": 3.39070725440979, "lr": 0.00024259457423646277, "tps": 13922, "wall": 68614.8} {"step": 14577, "train_loss": 3.369518280029297, "lr": 0.00024257556764083237, "tps": 13922, "wall": 68619.8} {"step": 14578, "train_loss": 3.404564380645752, "lr": 0.00024255656078946486, "tps": 13922, "wall": 68624.7} {"step": 14579, "train_loss": 3.4654479026794434, "lr": 0.00024253755368257532, "tps": 13922, "wall": 68629.7} {"step": 14580, "train_loss": 3.399261951446533, "lr": 0.00024251854632037918, "tps": 13922, "wall": 68634.6} {"step": 14581, "train_loss": 3.342507839202881, "lr": 0.00024249953870309173, "tps": 13922, "wall": 68639.7} {"step": 14582, "train_loss": 3.4071359634399414, "lr": 0.00024248053083092828, "tps": 13922, "wall": 68644.6} {"step": 14583, "train_loss": 3.285834789276123, "lr": 0.00024246152270410414, "tps": 13922, "wall": 68649.6} {"step": 14584, "train_loss": 3.3962085247039795, "lr": 0.0002424425143228347, "tps": 13922, "wall": 68654.5} {"step": 14585, "train_loss": 3.433345317840576, "lr": 0.00024242350568733523, "tps": 13922, "wall": 68659.5} {"step": 14586, "train_loss": 3.450929880142212, "lr": 0.00024240449679782105, "tps": 13922, "wall": 68664.4} {"step": 14587, "train_loss": 3.2830560207366943, "lr": 0.00024238548765450753, "tps": 13922, "wall": 68669.4} {"step": 14588, "train_loss": 3.3480446338653564, "lr": 0.00024236647825761002, "tps": 13922, "wall": 68674.3} {"step": 14589, "train_loss": 3.3746066093444824, "lr": 0.00024234746860734384, "tps": 13922, "wall": 68679.3} {"step": 14590, "train_loss": 3.391066551208496, "lr": 0.00024232845870392425, "tps": 13922, "wall": 68684.2} {"step": 14591, "train_loss": 3.3492250442504883, "lr": 0.00024230944854756667, "tps": 13922, "wall": 68689.2} {"step": 14592, "train_loss": 3.225295305252075, "lr": 0.00024229043813848655, "tps": 13922, "wall": 68694.2} {"step": 14593, "train_loss": 3.3854849338531494, "lr": 0.00024227142747689913, "tps": 13922, "wall": 68699.2} {"step": 14594, "train_loss": 3.446568489074707, "lr": 0.00024225241656301969, "tps": 13921, "wall": 68704.2} {"step": 14595, "train_loss": 3.4254024028778076, "lr": 0.00024223340539706372, "tps": 13921, "wall": 68709.1} {"step": 14596, "train_loss": 3.4059505462646484, "lr": 0.0002422143939792465, "tps": 13921, "wall": 68714.1} {"step": 14597, "train_loss": 3.338942527770996, "lr": 0.00024219538230978348, "tps": 13921, "wall": 68719.0} {"step": 14598, "train_loss": 3.3432703018188477, "lr": 0.00024217637038888995, "tps": 13921, "wall": 68724.0} {"step": 14599, "train_loss": 3.385007381439209, "lr": 0.00024215735821678128, "tps": 13921, "wall": 68728.9} {"step": 14600, "train_loss": 3.411297559738159, "lr": 0.00024213834579367286, "tps": 13921, "wall": 68733.9} {"step": 14601, "train_loss": 3.367053508758545, "lr": 0.00024211933311978006, "tps": 13921, "wall": 68738.8} {"step": 14602, "train_loss": 3.412181854248047, "lr": 0.0002421003201953183, "tps": 13921, "wall": 68743.8} {"step": 14603, "train_loss": 3.3844621181488037, "lr": 0.00024208130702050285, "tps": 13921, "wall": 68748.7} {"step": 14604, "train_loss": 3.343782901763916, "lr": 0.00024206229359554916, "tps": 13921, "wall": 68753.7} {"step": 14605, "train_loss": 3.5087428092956543, "lr": 0.00024204327992067271, "tps": 13921, "wall": 68758.7} {"step": 14606, "train_loss": 3.3710694313049316, "lr": 0.0002420242659960887, "tps": 13921, "wall": 68763.7} {"step": 14607, "train_loss": 3.32883882522583, "lr": 0.00024200525182201265, "tps": 13921, "wall": 68768.6} {"step": 14608, "train_loss": 3.5073888301849365, "lr": 0.00024198623739865994, "tps": 13921, "wall": 68773.5} {"step": 14609, "train_loss": 3.4869184494018555, "lr": 0.0002419672227262459, "tps": 13921, "wall": 68778.5} {"step": 14610, "train_loss": 3.315746784210205, "lr": 0.00024194820780498594, "tps": 13921, "wall": 68783.5} {"step": 14611, "train_loss": 3.506568193435669, "lr": 0.00024192919263509556, "tps": 13921, "wall": 68788.4} {"step": 14612, "train_loss": 3.367459535598755, "lr": 0.0002419101772167901, "tps": 13921, "wall": 68793.4} {"step": 14613, "train_loss": 3.4454152584075928, "lr": 0.00024189116155028494, "tps": 13921, "wall": 68798.4} {"step": 14614, "train_loss": 3.30220365524292, "lr": 0.0002418721456357955, "tps": 13920, "wall": 68803.3} {"step": 14615, "train_loss": 3.4025371074676514, "lr": 0.0002418531294735372, "tps": 13920, "wall": 68808.3} {"step": 14616, "train_loss": 3.3776779174804688, "lr": 0.00024183411306372555, "tps": 13920, "wall": 68813.3} {"step": 14617, "train_loss": 3.361738920211792, "lr": 0.00024181509640657577, "tps": 13920, "wall": 68818.4} {"step": 14618, "train_loss": 3.514618158340454, "lr": 0.0002417960795023035, "tps": 13920, "wall": 68823.3} {"step": 14619, "train_loss": 3.4578540325164795, "lr": 0.000241777062351124, "tps": 13920, "wall": 68828.3} {"step": 14620, "train_loss": 3.3720545768737793, "lr": 0.00024175804495325288, "tps": 13920, "wall": 68833.3} {"step": 14621, "train_loss": 3.409762382507324, "lr": 0.00024173902730890528, "tps": 13920, "wall": 68838.2} {"step": 14622, "train_loss": 3.3952550888061523, "lr": 0.00024172000941829688, "tps": 13920, "wall": 68843.2} {"step": 14623, "train_loss": 3.392400026321411, "lr": 0.00024170099128164308, "tps": 13920, "wall": 68848.1} {"step": 14624, "train_loss": 3.429839611053467, "lr": 0.00024168197289915923, "tps": 13920, "wall": 68853.1} {"step": 14625, "train_loss": 3.4572079181671143, "lr": 0.00024166295427106082, "tps": 13920, "wall": 68858.0} {"step": 14626, "train_loss": 3.41953444480896, "lr": 0.00024164393539756332, "tps": 13920, "wall": 68863.0} {"step": 14627, "train_loss": 3.4138054847717285, "lr": 0.00024162491627888208, "tps": 13920, "wall": 68867.9} {"step": 14628, "train_loss": 3.3843302726745605, "lr": 0.00024160589691523266, "tps": 13920, "wall": 68872.9} {"step": 14629, "train_loss": 3.39506196975708, "lr": 0.00024158687730683047, "tps": 13920, "wall": 68877.9} {"step": 14630, "train_loss": 3.4927117824554443, "lr": 0.00024156785745389097, "tps": 13920, "wall": 68882.9} {"step": 14631, "train_loss": 3.294459342956543, "lr": 0.0002415488373566296, "tps": 13920, "wall": 68887.9} {"step": 14632, "train_loss": 3.452977418899536, "lr": 0.00024152981701526183, "tps": 13920, "wall": 68892.8} {"step": 14633, "train_loss": 3.4128475189208984, "lr": 0.00024151079643000317, "tps": 13919, "wall": 68897.8} {"step": 14634, "train_loss": 3.409926652908325, "lr": 0.000241491775601069, "tps": 13919, "wall": 68902.8} {"step": 14635, "train_loss": 3.4107539653778076, "lr": 0.00024147275452867485, "tps": 13919, "wall": 68907.7} {"step": 14636, "train_loss": 3.318359375, "lr": 0.00024145373321303622, "tps": 13919, "wall": 68912.7} {"step": 14637, "train_loss": 3.4108476638793945, "lr": 0.00024143471165436847, "tps": 13919, "wall": 68917.6} {"step": 14638, "train_loss": 3.3290414810180664, "lr": 0.0002414156898528872, "tps": 13919, "wall": 68922.6} {"step": 14639, "train_loss": 3.3442089557647705, "lr": 0.00024139666780880777, "tps": 13919, "wall": 68927.5} {"step": 14640, "train_loss": 3.3884613513946533, "lr": 0.00024137764552234576, "tps": 13919, "wall": 68932.5} {"step": 14641, "train_loss": 3.346621513366699, "lr": 0.00024135862299371668, "tps": 13919, "wall": 68937.5} {"step": 14642, "train_loss": 3.426325798034668, "lr": 0.0002413396002231359, "tps": 13919, "wall": 68942.5} {"step": 14643, "train_loss": 3.4698214530944824, "lr": 0.000241320577210819, "tps": 13919, "wall": 68947.4} {"step": 14644, "train_loss": 3.3142499923706055, "lr": 0.00024130155395698144, "tps": 13919, "wall": 68952.4} {"step": 14645, "train_loss": 3.413543939590454, "lr": 0.00024128253046183873, "tps": 13919, "wall": 68957.3} {"step": 14646, "train_loss": 3.386014461517334, "lr": 0.00024126350672560638, "tps": 13919, "wall": 68962.3} {"step": 14647, "train_loss": 3.261519432067871, "lr": 0.00024124448274849984, "tps": 13919, "wall": 68967.2} {"step": 14648, "train_loss": 3.3756799697875977, "lr": 0.00024122545853073462, "tps": 13919, "wall": 68972.2} {"step": 14649, "train_loss": 3.3707165718078613, "lr": 0.0002412064340725263, "tps": 13919, "wall": 68977.2} {"step": 14650, "train_loss": 3.292819023132324, "lr": 0.00024118740937409037, "tps": 13919, "wall": 68982.1} {"step": 14651, "train_loss": 3.3115005493164062, "lr": 0.00024116838443564227, "tps": 13919, "wall": 68987.1} {"step": 14652, "train_loss": 3.4482421875, "lr": 0.00024114935925739764, "tps": 13918, "wall": 68992.0} {"step": 14653, "train_loss": 3.3428797721862793, "lr": 0.0002411303338395719, "tps": 13918, "wall": 68997.0} {"step": 14654, "train_loss": 3.4656906127929688, "lr": 0.0002411113081823805, "tps": 13918, "wall": 69002.0} {"step": 14655, "train_loss": 3.408738374710083, "lr": 0.00024109228228603918, "tps": 13918, "wall": 69007.0} {"step": 14656, "train_loss": 3.432875156402588, "lr": 0.0002410732561507633, "tps": 13918, "wall": 69012.0} {"step": 14657, "train_loss": 3.2859175205230713, "lr": 0.00024105422977676843, "tps": 13918, "wall": 69016.9} {"step": 14658, "train_loss": 3.363124370574951, "lr": 0.00024103520316427011, "tps": 13918, "wall": 69021.9} {"step": 14659, "train_loss": 3.357250928878784, "lr": 0.00024101617631348384, "tps": 13918, "wall": 69026.8} {"step": 14660, "train_loss": 3.433183193206787, "lr": 0.00024099714922462523, "tps": 13918, "wall": 69031.8} {"step": 14661, "train_loss": 3.5160791873931885, "lr": 0.00024097812189790974, "tps": 13918, "wall": 69036.7} {"step": 14662, "train_loss": 3.4777092933654785, "lr": 0.000240959094333553, "tps": 13918, "wall": 69041.7} {"step": 14663, "train_loss": 3.293877601623535, "lr": 0.00024094006653177052, "tps": 13918, "wall": 69046.6} {"step": 14664, "train_loss": 3.3039002418518066, "lr": 0.00024092103849277776, "tps": 13918, "wall": 69051.6} {"step": 14665, "train_loss": 3.470362663269043, "lr": 0.00024090201021679036, "tps": 13918, "wall": 69056.5} {"step": 14666, "train_loss": 3.287287712097168, "lr": 0.00024088298170402386, "tps": 13918, "wall": 69061.5} {"step": 14667, "train_loss": 3.478423595428467, "lr": 0.00024086395295469388, "tps": 13918, "wall": 69066.5} {"step": 14668, "train_loss": 3.4053916931152344, "lr": 0.00024084492396901581, "tps": 13918, "wall": 69071.4} {"step": 14669, "train_loss": 3.375539779663086, "lr": 0.00024082589474720535, "tps": 13918, "wall": 69076.4} {"step": 14670, "train_loss": 3.3825137615203857, "lr": 0.0002408068652894781, "tps": 13918, "wall": 69081.4} {"step": 14671, "train_loss": 3.2731881141662598, "lr": 0.00024078783559604948, "tps": 13918, "wall": 69086.3} {"step": 14672, "train_loss": 3.3392863273620605, "lr": 0.00024076880566713515, "tps": 13917, "wall": 69091.3} {"step": 14673, "train_loss": 3.3238725662231445, "lr": 0.00024074977550295068, "tps": 13917, "wall": 69096.2} {"step": 14674, "train_loss": 3.391296625137329, "lr": 0.00024073074510371162, "tps": 13917, "wall": 69101.2} {"step": 14675, "train_loss": 3.4984793663024902, "lr": 0.00024071171446963355, "tps": 13917, "wall": 69106.1} {"step": 14676, "train_loss": 3.328195095062256, "lr": 0.000240692683600932, "tps": 13917, "wall": 69111.1} {"step": 14677, "train_loss": 3.2944815158843994, "lr": 0.00024067365249782273, "tps": 13917, "wall": 69116.0} {"step": 14678, "train_loss": 3.4280500411987305, "lr": 0.00024065462116052113, "tps": 13917, "wall": 69121.1} {"step": 14679, "train_loss": 3.411160469055176, "lr": 0.00024063558958924288, "tps": 13917, "wall": 69126.0} {"step": 14680, "train_loss": 3.505622386932373, "lr": 0.00024061655778420362, "tps": 13917, "wall": 69131.0} {"step": 14681, "train_loss": 3.355182647705078, "lr": 0.00024059752574561878, "tps": 13917, "wall": 69135.9} {"step": 14682, "train_loss": 3.334841728210449, "lr": 0.00024057849347370404, "tps": 13917, "wall": 69140.9} {"step": 14683, "train_loss": 3.3915181159973145, "lr": 0.00024055946096867512, "tps": 13917, "wall": 69145.9} {"step": 14684, "train_loss": 3.3179891109466553, "lr": 0.00024054042823074746, "tps": 13917, "wall": 69150.8} {"step": 14685, "train_loss": 3.368687868118286, "lr": 0.0002405213952601367, "tps": 13917, "wall": 69155.8} {"step": 14686, "train_loss": 3.388983964920044, "lr": 0.00024050236205705843, "tps": 13917, "wall": 69160.7} {"step": 14687, "train_loss": 3.5059497356414795, "lr": 0.00024048332862172838, "tps": 13917, "wall": 69165.7} {"step": 14688, "train_loss": 3.376098155975342, "lr": 0.00024046429495436203, "tps": 13917, "wall": 69170.6} {"step": 14689, "train_loss": 3.452850580215454, "lr": 0.00024044526105517506, "tps": 13917, "wall": 69175.6} {"step": 14690, "train_loss": 3.4387905597686768, "lr": 0.00024042622692438306, "tps": 13917, "wall": 69180.6} {"step": 14691, "train_loss": 3.511465072631836, "lr": 0.0002404071925622016, "tps": 13916, "wall": 69185.6} {"step": 14692, "train_loss": 3.3905773162841797, "lr": 0.00024038815796884646, "tps": 13916, "wall": 69190.5} {"step": 14693, "train_loss": 3.359557628631592, "lr": 0.00024036912314453313, "tps": 13916, "wall": 69195.5} {"step": 14694, "train_loss": 3.3836183547973633, "lr": 0.00024035008808947721, "tps": 13916, "wall": 69200.5} {"step": 14695, "train_loss": 3.550902843475342, "lr": 0.00024033105280389446, "tps": 13916, "wall": 69205.4} {"step": 14696, "train_loss": 3.4524645805358887, "lr": 0.00024031201728800036, "tps": 13916, "wall": 69210.4} {"step": 14697, "train_loss": 3.341691493988037, "lr": 0.00024029298154201075, "tps": 13916, "wall": 69215.3} {"step": 14698, "train_loss": 3.3658194541931152, "lr": 0.0002402739455661411, "tps": 13916, "wall": 69220.3} {"step": 14699, "train_loss": 3.2982895374298096, "lr": 0.00024025490936060707, "tps": 13916, "wall": 69225.2} {"step": 14700, "train_loss": 3.372858762741089, "lr": 0.00024023587292562436, "tps": 13916, "wall": 69230.2} {"step": 14701, "train_loss": 3.4801392555236816, "lr": 0.00024021683626140856, "tps": 13916, "wall": 69235.2} {"step": 14702, "train_loss": 3.3756961822509766, "lr": 0.0002401977993681753, "tps": 13916, "wall": 69240.2} {"step": 14703, "train_loss": 3.3849682807922363, "lr": 0.00024017876224614036, "tps": 13916, "wall": 69245.2} {"step": 14704, "train_loss": 3.3671884536743164, "lr": 0.00024015972489551933, "tps": 13916, "wall": 69250.1} {"step": 14705, "train_loss": 3.2561254501342773, "lr": 0.00024014068731652776, "tps": 13916, "wall": 69255.0} {"step": 14706, "train_loss": 3.2787039279937744, "lr": 0.00024012164950938143, "tps": 13916, "wall": 69260.0} {"step": 14707, "train_loss": 3.416572093963623, "lr": 0.00024010261147429596, "tps": 13916, "wall": 69265.0} {"step": 14708, "train_loss": 3.3632681369781494, "lr": 0.00024008357321148708, "tps": 13916, "wall": 69269.9} {"step": 14709, "train_loss": 3.3574342727661133, "lr": 0.00024006453472117035, "tps": 13916, "wall": 69274.9} {"step": 14710, "train_loss": 3.4703938961029053, "lr": 0.00024004549600356145, "tps": 13916, "wall": 69279.9} {"step": 14711, "train_loss": 3.357422113418579, "lr": 0.0002400264570588761, "tps": 13915, "wall": 69284.8} {"step": 14712, "train_loss": 3.369868516921997, "lr": 0.00024000741788733, "tps": 13915, "wall": 69289.8} {"step": 14713, "train_loss": 3.416227340698242, "lr": 0.0002399883784891388, "tps": 13915, "wall": 69294.7} {"step": 14714, "train_loss": 3.374371290206909, "lr": 0.0002399693388645181, "tps": 13915, "wall": 69299.7} {"step": 14715, "train_loss": 3.436516284942627, "lr": 0.00023995029901368366, "tps": 13915, "wall": 69304.7} {"step": 14716, "train_loss": 3.4614341259002686, "lr": 0.00023993125893685116, "tps": 13915, "wall": 69309.6} {"step": 14717, "train_loss": 3.4508728981018066, "lr": 0.00023991221863423631, "tps": 13915, "wall": 69314.6} {"step": 14718, "train_loss": 3.399125099182129, "lr": 0.0002398931781060548, "tps": 13915, "wall": 69319.5} {"step": 14719, "train_loss": 3.4167113304138184, "lr": 0.00023987413735252223, "tps": 13915, "wall": 69324.5} {"step": 14720, "train_loss": 3.355253219604492, "lr": 0.0002398550963738544, "tps": 13915, "wall": 69329.4} {"step": 14721, "train_loss": 3.2898354530334473, "lr": 0.00023983605517026693, "tps": 13915, "wall": 69334.4} {"step": 14722, "train_loss": 3.2948012351989746, "lr": 0.00023981701374197557, "tps": 13915, "wall": 69339.3} {"step": 14723, "train_loss": 3.375340461730957, "lr": 0.00023979797208919593, "tps": 13915, "wall": 69344.2} {"step": 14724, "train_loss": 3.3177995681762695, "lr": 0.0002397789302121439, "tps": 13915, "wall": 69349.2} {"step": 14725, "train_loss": 3.4093377590179443, "lr": 0.00023975988811103505, "tps": 13915, "wall": 69354.1} {"step": 14726, "train_loss": 3.3683278560638428, "lr": 0.0002397408457860851, "tps": 13915, "wall": 69359.1} {"step": 14727, "train_loss": 3.4416656494140625, "lr": 0.00023972180323750974, "tps": 13915, "wall": 69364.1} {"step": 14728, "train_loss": 3.3053035736083984, "lr": 0.0002397027604655248, "tps": 13915, "wall": 69369.1} {"step": 14729, "train_loss": 3.358214855194092, "lr": 0.0002396837174703459, "tps": 13915, "wall": 69374.0} {"step": 14730, "train_loss": 3.2694082260131836, "lr": 0.00023966467425218878, "tps": 13915, "wall": 69379.0} {"step": 14731, "train_loss": 3.43533992767334, "lr": 0.00023964563081126921, "tps": 13914, "wall": 69383.9} {"step": 14732, "train_loss": 3.234485626220703, "lr": 0.00023962658714780276, "tps": 13914, "wall": 69388.9} {"step": 14733, "train_loss": 3.4150896072387695, "lr": 0.00023960754326200534, "tps": 13914, "wall": 69393.8} {"step": 14734, "train_loss": 3.393465042114258, "lr": 0.0002395884991540926, "tps": 13914, "wall": 69398.7} {"step": 14735, "train_loss": 3.318317413330078, "lr": 0.0002395694548242803, "tps": 13914, "wall": 69403.7} {"step": 14736, "train_loss": 3.251356840133667, "lr": 0.00023955041027278417, "tps": 13914, "wall": 69408.6} {"step": 14737, "train_loss": 3.396730422973633, "lr": 0.00023953136549981988, "tps": 13914, "wall": 69413.6} {"step": 14738, "train_loss": 3.416210174560547, "lr": 0.0002395123205056033, "tps": 13914, "wall": 69418.6} {"step": 14739, "train_loss": 3.39719557762146, "lr": 0.00023949327529035005, "tps": 13914, "wall": 69423.5} {"step": 14740, "train_loss": 3.351396083831787, "lr": 0.0002394742298542759, "tps": 13914, "wall": 69428.5} {"step": 14741, "train_loss": 3.4191322326660156, "lr": 0.00023945518419759667, "tps": 13914, "wall": 69433.4} {"step": 14742, "train_loss": 3.319020986557007, "lr": 0.00023943613832052803, "tps": 13914, "wall": 69438.4} {"step": 14743, "train_loss": 3.310839891433716, "lr": 0.00023941709222328577, "tps": 13914, "wall": 69443.4} {"step": 14744, "train_loss": 3.4424171447753906, "lr": 0.00023939804590608561, "tps": 13914, "wall": 69448.3} {"step": 14745, "train_loss": 3.465484142303467, "lr": 0.0002393789993691434, "tps": 13914, "wall": 69453.3} {"step": 14746, "train_loss": 3.4072840213775635, "lr": 0.0002393599526126748, "tps": 13914, "wall": 69458.3} {"step": 14747, "train_loss": 3.3389220237731934, "lr": 0.0002393409056368956, "tps": 13914, "wall": 69463.2} {"step": 14748, "train_loss": 3.3947958946228027, "lr": 0.0002393218584420216, "tps": 13914, "wall": 69468.2} {"step": 14749, "train_loss": 3.524064540863037, "lr": 0.0002393028110282685, "tps": 13914, "wall": 69473.1} {"step": 14750, "train_loss": 3.443830966949463, "lr": 0.00023928376339585214, "tps": 13914, "wall": 69478.2} {"step": 14751, "train_loss": 3.4291629791259766, "lr": 0.00023926471554498827, "tps": 13913, "wall": 69483.1} {"step": 14752, "train_loss": 3.367309093475342, "lr": 0.00023924566747589266, "tps": 13913, "wall": 69488.1} {"step": 14753, "train_loss": 3.4028053283691406, "lr": 0.00023922661918878108, "tps": 13913, "wall": 69493.0} {"step": 14754, "train_loss": 3.333940029144287, "lr": 0.00023920757068386932, "tps": 13913, "wall": 69498.0} {"step": 14755, "train_loss": 3.403629779815674, "lr": 0.0002391885219613732, "tps": 13913, "wall": 69503.0} {"step": 14756, "train_loss": 3.4983465671539307, "lr": 0.00023916947302150842, "tps": 13913, "wall": 69507.9} {"step": 14757, "train_loss": 3.3462793827056885, "lr": 0.00023915042386449077, "tps": 13913, "wall": 69512.9} {"step": 14758, "train_loss": 3.3693645000457764, "lr": 0.00023913137449053617, "tps": 13913, "wall": 69517.8} {"step": 14759, "train_loss": 3.3926353454589844, "lr": 0.0002391123248998603, "tps": 13913, "wall": 69522.8} {"step": 14760, "train_loss": 3.379105567932129, "lr": 0.00023909327509267895, "tps": 13913, "wall": 69527.8} {"step": 14761, "train_loss": 3.358654022216797, "lr": 0.00023907422506920796, "tps": 13913, "wall": 69532.7} {"step": 14762, "train_loss": 3.3768205642700195, "lr": 0.00023905517482966312, "tps": 13913, "wall": 69537.8} {"step": 14763, "train_loss": 3.439074993133545, "lr": 0.00023903612437426022, "tps": 13913, "wall": 69542.8} {"step": 14764, "train_loss": 3.3710379600524902, "lr": 0.00023901707370321509, "tps": 13913, "wall": 69547.7} {"step": 14765, "train_loss": 3.3811206817626953, "lr": 0.00023899802281674356, "tps": 13913, "wall": 69552.7} {"step": 14766, "train_loss": 3.353219509124756, "lr": 0.00023897897171506132, "tps": 13913, "wall": 69557.7} {"step": 14767, "train_loss": 3.4212067127227783, "lr": 0.00023895992039838428, "tps": 13913, "wall": 69562.6} {"step": 14768, "train_loss": 3.4472157955169678, "lr": 0.00023894086886692831, "tps": 13913, "wall": 69567.6} {"step": 14769, "train_loss": 3.325740098953247, "lr": 0.00023892181712090906, "tps": 13913, "wall": 69572.5} {"step": 14770, "train_loss": 3.3225321769714355, "lr": 0.00023890276516054244, "tps": 13913, "wall": 69577.5} {"step": 14771, "train_loss": 3.3561863899230957, "lr": 0.00023888371298604432, "tps": 13912, "wall": 69582.4} {"step": 14772, "train_loss": 3.19663143157959, "lr": 0.00023886466059763048, "tps": 13912, "wall": 69587.4} {"step": 14773, "train_loss": 3.3612399101257324, "lr": 0.0002388456079955167, "tps": 13912, "wall": 69592.4} {"step": 14774, "train_loss": 3.378596782684326, "lr": 0.00023882655517991886, "tps": 13912, "wall": 69597.3} {"step": 14775, "train_loss": 3.456606149673462, "lr": 0.00023880750215105287, "tps": 13912, "wall": 69602.3} {"step": 14776, "train_loss": 3.423229932785034, "lr": 0.00023878844890913437, "tps": 13912, "wall": 69607.3} {"step": 14777, "train_loss": 3.4183859825134277, "lr": 0.00023876939545437934, "tps": 13912, "wall": 69612.2} {"step": 14778, "train_loss": 3.3285632133483887, "lr": 0.00023875034178700362, "tps": 13912, "wall": 69617.2} {"step": 14779, "train_loss": 3.4537417888641357, "lr": 0.000238731287907223, "tps": 13912, "wall": 69622.1} {"step": 14780, "train_loss": 3.401632070541382, "lr": 0.0002387122338152533, "tps": 13912, "wall": 69627.1} {"step": 14781, "train_loss": 3.3709540367126465, "lr": 0.00023869317951131044, "tps": 13912, "wall": 69632.1} {"step": 14782, "train_loss": 3.437422275543213, "lr": 0.00023867412499561024, "tps": 13912, "wall": 69637.0} {"step": 14783, "train_loss": 3.402726173400879, "lr": 0.0002386550702683685, "tps": 13912, "wall": 69642.0} {"step": 14784, "train_loss": 3.42978572845459, "lr": 0.00023863601532980112, "tps": 13912, "wall": 69646.9} {"step": 14785, "train_loss": 3.3075666427612305, "lr": 0.00023861696018012398, "tps": 13912, "wall": 69651.9} {"step": 14786, "train_loss": 3.371574640274048, "lr": 0.00023859790481955292, "tps": 13912, "wall": 69656.8} {"step": 14787, "train_loss": 3.404773235321045, "lr": 0.00023857884924830374, "tps": 13912, "wall": 69661.9} {"step": 14788, "train_loss": 3.3599681854248047, "lr": 0.00023855979346659237, "tps": 13912, "wall": 69666.8} {"step": 14789, "train_loss": 3.3473925590515137, "lr": 0.00023854073747463467, "tps": 13912, "wall": 69671.8} {"step": 14790, "train_loss": 3.4322938919067383, "lr": 0.0002385216812726465, "tps": 13912, "wall": 69676.7} {"step": 14791, "train_loss": 3.254175901412964, "lr": 0.0002385026248608437, "tps": 13911, "wall": 69681.7} {"step": 14792, "train_loss": 3.342536449432373, "lr": 0.00023848356823944213, "tps": 13911, "wall": 69686.6} {"step": 14793, "train_loss": 3.3644957542419434, "lr": 0.0002384645114086578, "tps": 13911, "wall": 69691.6} {"step": 14794, "train_loss": 3.263766050338745, "lr": 0.00023844545436870642, "tps": 13911, "wall": 69696.5} {"step": 14795, "train_loss": 3.4426050186157227, "lr": 0.00023842639711980392, "tps": 13911, "wall": 69701.5} {"step": 14796, "train_loss": 3.3579888343811035, "lr": 0.00023840733966216623, "tps": 13911, "wall": 69706.4} {"step": 14797, "train_loss": 3.362785816192627, "lr": 0.00023838828199600917, "tps": 13911, "wall": 69711.4} {"step": 14798, "train_loss": 3.466160535812378, "lr": 0.00023836922412154868, "tps": 13911, "wall": 69716.3} {"step": 14799, "train_loss": 3.433973789215088, "lr": 0.00023835016603900058, "tps": 13911, "wall": 69721.3} {"step": 14800, "train_loss": 3.3218882083892822, "lr": 0.00023833110774858086, "tps": 13911, "wall": 69726.3} {"step": 14801, "train_loss": 3.4072299003601074, "lr": 0.00023831204925050536, "tps": 13911, "wall": 69731.2} {"step": 14802, "train_loss": 3.281200647354126, "lr": 0.00023829299054498995, "tps": 13911, "wall": 69736.2} {"step": 14803, "train_loss": 3.4073877334594727, "lr": 0.00023827393163225057, "tps": 13911, "wall": 69741.1} {"step": 14804, "train_loss": 3.304819107055664, "lr": 0.00023825487251250306, "tps": 13911, "wall": 69746.1} {"step": 14805, "train_loss": 3.3827757835388184, "lr": 0.00023823581318596344, "tps": 13911, "wall": 69751.1} {"step": 14806, "train_loss": 3.3274221420288086, "lr": 0.0002382167536528475, "tps": 13911, "wall": 69756.0} {"step": 14807, "train_loss": 3.374936819076538, "lr": 0.00023819769391337118, "tps": 13911, "wall": 69761.0} {"step": 14808, "train_loss": 3.3838253021240234, "lr": 0.0002381786339677504, "tps": 13911, "wall": 69765.9} {"step": 14809, "train_loss": 3.3551177978515625, "lr": 0.00023815957381620107, "tps": 13911, "wall": 69770.9} {"step": 14810, "train_loss": 3.298314094543457, "lr": 0.00023814051345893918, "tps": 13911, "wall": 69775.8} {"step": 14811, "train_loss": 3.452626943588257, "lr": 0.00023812145289618046, "tps": 13910, "wall": 69780.9} {"step": 14812, "train_loss": 3.3575572967529297, "lr": 0.00023810239212814098, "tps": 13910, "wall": 69785.9} {"step": 14813, "train_loss": 3.341705799102783, "lr": 0.00023808333115503665, "tps": 13910, "wall": 69790.8} {"step": 14814, "train_loss": 3.325432777404785, "lr": 0.00023806426997708332, "tps": 13910, "wall": 69795.8} {"step": 14815, "train_loss": 3.398850440979004, "lr": 0.000238045208594497, "tps": 13910, "wall": 69800.7} {"step": 14816, "train_loss": 3.341953754425049, "lr": 0.00023802614700749365, "tps": 13910, "wall": 69805.7} {"step": 14817, "train_loss": 3.448509693145752, "lr": 0.000238007085216289, "tps": 13910, "wall": 69810.6} {"step": 14818, "train_loss": 3.329267740249634, "lr": 0.00023798802322109916, "tps": 13910, "wall": 69815.6} {"step": 14819, "train_loss": 3.435798406600952, "lr": 0.00023796896102214, "tps": 13910, "wall": 69820.6} {"step": 14820, "train_loss": 3.4350109100341797, "lr": 0.00023794989861962757, "tps": 13910, "wall": 69825.5} {"step": 14821, "train_loss": 3.317089557647705, "lr": 0.00023793083601377762, "tps": 13910, "wall": 69830.5} {"step": 14822, "train_loss": 3.387298583984375, "lr": 0.00023791177320480622, "tps": 13910, "wall": 69835.4} {"step": 14823, "train_loss": 3.3833439350128174, "lr": 0.0002378927101929293, "tps": 13910, "wall": 69840.4} {"step": 14824, "train_loss": 3.392209053039551, "lr": 0.00023787364697836277, "tps": 13910, "wall": 69845.4} {"step": 14825, "train_loss": 3.2561185359954834, "lr": 0.00023785458356132263, "tps": 13910, "wall": 69850.3} {"step": 14826, "train_loss": 3.406407356262207, "lr": 0.00023783551994202475, "tps": 13910, "wall": 69855.3} {"step": 14827, "train_loss": 3.4530022144317627, "lr": 0.0002378164561206852, "tps": 13910, "wall": 69860.3} {"step": 14828, "train_loss": 3.2541306018829346, "lr": 0.00023779739209751978, "tps": 13910, "wall": 69865.2} {"step": 14829, "train_loss": 3.3233563899993896, "lr": 0.00023777832787274462, "tps": 13910, "wall": 69870.2} {"step": 14830, "train_loss": 3.288548469543457, "lr": 0.0002377592634465756, "tps": 13910, "wall": 69875.1} {"step": 14831, "train_loss": 3.355802059173584, "lr": 0.00023774019881922867, "tps": 13909, "wall": 69880.1} {"step": 14832, "train_loss": 3.4391911029815674, "lr": 0.00023772113399091977, "tps": 13909, "wall": 69885.0} {"step": 14833, "train_loss": 3.3908939361572266, "lr": 0.00023770206896186493, "tps": 13909, "wall": 69890.0} {"step": 14834, "train_loss": 3.490088939666748, "lr": 0.00023768300373228014, "tps": 13909, "wall": 69894.9} {"step": 14835, "train_loss": 3.2896363735198975, "lr": 0.00023766393830238129, "tps": 13909, "wall": 69899.9} {"step": 14836, "train_loss": 3.4549880027770996, "lr": 0.00023764487267238432, "tps": 13909, "wall": 69904.9} {"step": 14837, "train_loss": 3.3528568744659424, "lr": 0.00023762580684250537, "tps": 13909, "wall": 69909.9} {"step": 14838, "train_loss": 3.4199347496032715, "lr": 0.0002376067408129603, "tps": 13909, "wall": 69914.8} {"step": 14839, "train_loss": 3.314495086669922, "lr": 0.0002375876745839651, "tps": 13909, "wall": 69919.8} {"step": 14840, "train_loss": 3.2596375942230225, "lr": 0.00023756860815573583, "tps": 13909, "wall": 69924.7} {"step": 14841, "train_loss": 3.303375005722046, "lr": 0.00023754954152848838, "tps": 13909, "wall": 69929.7} {"step": 14842, "train_loss": 3.37294864654541, "lr": 0.00023753047470243877, "tps": 13909, "wall": 69934.7} {"step": 14843, "train_loss": 3.4031314849853516, "lr": 0.00023751140767780298, "tps": 13909, "wall": 69939.6} {"step": 14844, "train_loss": 3.440019369125366, "lr": 0.000237492340454797, "tps": 13909, "wall": 69944.6} {"step": 14845, "train_loss": 3.272597312927246, "lr": 0.00023747327303363686, "tps": 13909, "wall": 69949.5} {"step": 14846, "train_loss": 3.421647071838379, "lr": 0.00023745420541453855, "tps": 13909, "wall": 69954.5} {"step": 14847, "train_loss": 3.3435142040252686, "lr": 0.00023743513759771808, "tps": 13909, "wall": 69959.5} {"step": 14848, "train_loss": 3.4882116317749023, "lr": 0.0002374160695833914, "tps": 13909, "wall": 69964.5} {"step": 14849, "train_loss": 3.3830599784851074, "lr": 0.00023739700137177452, "tps": 13909, "wall": 69969.4} {"step": 14850, "train_loss": 3.3326778411865234, "lr": 0.00023737793296308354, "tps": 13909, "wall": 69974.4} {"step": 14851, "train_loss": 3.3866219520568848, "lr": 0.00023735886435753432, "tps": 13908, "wall": 69979.3} {"step": 14852, "train_loss": 3.411892890930176, "lr": 0.000237339795555343, "tps": 13908, "wall": 69984.3} {"step": 14853, "train_loss": 3.4251739978790283, "lr": 0.0002373207265567255, "tps": 13908, "wall": 69989.2} {"step": 14854, "train_loss": 3.4835729598999023, "lr": 0.0002373016573618979, "tps": 13908, "wall": 69994.2} {"step": 14855, "train_loss": 3.419968605041504, "lr": 0.00023728258797107613, "tps": 13908, "wall": 69999.2} {"step": 14856, "train_loss": 3.2960071563720703, "lr": 0.0002372635183844763, "tps": 13908, "wall": 70004.1} {"step": 14857, "train_loss": 3.2892112731933594, "lr": 0.00023724444860231448, "tps": 13908, "wall": 70009.1} {"step": 14858, "train_loss": 3.3723466396331787, "lr": 0.0002372253786248065, "tps": 13908, "wall": 70014.0} {"step": 14859, "train_loss": 3.395375967025757, "lr": 0.00023720630845216857, "tps": 13908, "wall": 70019.1} {"step": 14860, "train_loss": 3.389890193939209, "lr": 0.00023718723808461664, "tps": 13908, "wall": 70024.0} {"step": 14861, "train_loss": 3.371858596801758, "lr": 0.0002371681675223667, "tps": 13908, "wall": 70029.0} {"step": 14862, "train_loss": 3.3375167846679688, "lr": 0.00023714909676563487, "tps": 13908, "wall": 70033.9} {"step": 14863, "train_loss": 3.4066648483276367, "lr": 0.00023713002581463713, "tps": 13908, "wall": 70038.9} {"step": 14864, "train_loss": 3.3363595008850098, "lr": 0.00023711095466958954, "tps": 13908, "wall": 70043.9} {"step": 14865, "train_loss": 3.2962100505828857, "lr": 0.0002370918833307081, "tps": 13908, "wall": 70048.8} {"step": 14866, "train_loss": 3.3807120323181152, "lr": 0.00023707281179820888, "tps": 13908, "wall": 70053.8} {"step": 14867, "train_loss": 3.4225850105285645, "lr": 0.000237053740072308, "tps": 13908, "wall": 70058.7} {"step": 14868, "train_loss": 3.4124670028686523, "lr": 0.00023703466815322134, "tps": 13908, "wall": 70063.7} {"step": 14869, "train_loss": 3.319336175918579, "lr": 0.00023701559604116508, "tps": 13908, "wall": 70068.7} {"step": 14870, "train_loss": 3.4269919395446777, "lr": 0.00023699652373635526, "tps": 13908, "wall": 70073.6} {"step": 14871, "train_loss": 3.3446669578552246, "lr": 0.00023697745123900786, "tps": 13907, "wall": 70078.6} {"step": 14872, "train_loss": 3.557685375213623, "lr": 0.00023695837854933896, "tps": 13907, "wall": 70083.5} {"step": 14873, "train_loss": 3.299578905105591, "lr": 0.00023693930566756467, "tps": 13907, "wall": 70088.5} {"step": 14874, "train_loss": 3.3667564392089844, "lr": 0.000236920232593901, "tps": 13907, "wall": 70093.5} {"step": 14875, "train_loss": 3.3681042194366455, "lr": 0.00023690115932856401, "tps": 13907, "wall": 70098.4} {"step": 14876, "train_loss": 3.411252498626709, "lr": 0.00023688208587176974, "tps": 13907, "wall": 70103.4} {"step": 14877, "train_loss": 3.47489595413208, "lr": 0.0002368630122237343, "tps": 13907, "wall": 70108.3} {"step": 14878, "train_loss": 3.384019136428833, "lr": 0.00023684393838467377, "tps": 13907, "wall": 70113.3} {"step": 14879, "train_loss": 3.4147186279296875, "lr": 0.0002368248643548042, "tps": 13907, "wall": 70118.2} {"step": 14880, "train_loss": 3.3885762691497803, "lr": 0.00023680579013434164, "tps": 13907, "wall": 70123.2} {"step": 14881, "train_loss": 3.352379560470581, "lr": 0.00023678671572350223, "tps": 13907, "wall": 70128.1} {"step": 14882, "train_loss": 3.384202003479004, "lr": 0.00023676764112250194, "tps": 13907, "wall": 70133.1} {"step": 14883, "train_loss": 3.503485918045044, "lr": 0.00023674856633155688, "tps": 13907, "wall": 70138.1} {"step": 14884, "train_loss": 3.4640090465545654, "lr": 0.00023672949135088316, "tps": 13907, "wall": 70143.1} {"step": 14885, "train_loss": 3.4403557777404785, "lr": 0.00023671041618069692, "tps": 13907, "wall": 70148.0} {"step": 14886, "train_loss": 3.3179216384887695, "lr": 0.00023669134082121413, "tps": 13907, "wall": 70153.0} {"step": 14887, "train_loss": 3.3923492431640625, "lr": 0.0002366722652726509, "tps": 13907, "wall": 70157.9} {"step": 14888, "train_loss": 3.351714611053467, "lr": 0.00023665318953522345, "tps": 13907, "wall": 70162.9} {"step": 14889, "train_loss": 3.4347586631774902, "lr": 0.00023663411360914767, "tps": 13907, "wall": 70167.8} {"step": 14890, "train_loss": 3.3542888164520264, "lr": 0.00023661503749463982, "tps": 13907, "wall": 70172.8} {"step": 14891, "train_loss": 3.499755620956421, "lr": 0.00023659596119191592, "tps": 13906, "wall": 70177.8} {"step": 14892, "train_loss": 3.3994572162628174, "lr": 0.00023657688470119203, "tps": 13906, "wall": 70182.7} {"step": 14893, "train_loss": 3.437565565109253, "lr": 0.00023655780802268428, "tps": 13906, "wall": 70187.7} {"step": 14894, "train_loss": 3.3805041313171387, "lr": 0.00023653873115660884, "tps": 13906, "wall": 70192.6} {"step": 14895, "train_loss": 3.366506814956665, "lr": 0.00023651965410318172, "tps": 13906, "wall": 70197.6} {"step": 14896, "train_loss": 3.424818992614746, "lr": 0.00023650057686261912, "tps": 13906, "wall": 70202.6} {"step": 14897, "train_loss": 3.4147820472717285, "lr": 0.00023648149943513702, "tps": 13906, "wall": 70207.6} {"step": 14898, "train_loss": 3.3700368404388428, "lr": 0.00023646242182095168, "tps": 13906, "wall": 70212.5} {"step": 14899, "train_loss": 3.336956262588501, "lr": 0.0002364433440202791, "tps": 13906, "wall": 70217.5} {"step": 14900, "train_loss": 3.439047336578369, "lr": 0.0002364242660333354, "tps": 13906, "wall": 70222.4} {"step": 14901, "train_loss": 3.294832706451416, "lr": 0.0002364051878603368, "tps": 13906, "wall": 70227.4} {"step": 14902, "train_loss": 3.363858222961426, "lr": 0.00023638610950149925, "tps": 13906, "wall": 70232.3} {"step": 14903, "train_loss": 3.389314651489258, "lr": 0.00023636703095703898, "tps": 13906, "wall": 70237.3} {"step": 14904, "train_loss": 3.2561137676239014, "lr": 0.0002363479522271721, "tps": 13906, "wall": 70242.2} {"step": 14905, "train_loss": 3.3565475940704346, "lr": 0.00023632887331211482, "tps": 13906, "wall": 70247.1} {"step": 14906, "train_loss": 3.328450918197632, "lr": 0.0002363097942120831, "tps": 13906, "wall": 70252.1} {"step": 14907, "train_loss": 3.4232606887817383, "lr": 0.00023629071492729312, "tps": 13906, "wall": 70257.1} {"step": 14908, "train_loss": 3.4449679851531982, "lr": 0.00023627163545796113, "tps": 13906, "wall": 70262.1} {"step": 14909, "train_loss": 3.411821126937866, "lr": 0.0002362525558043031, "tps": 13906, "wall": 70267.1} {"step": 14910, "train_loss": 3.4451212882995605, "lr": 0.00023623347596653525, "tps": 13906, "wall": 70272.0} {"step": 14911, "train_loss": 3.3884739875793457, "lr": 0.0002362143959448737, "tps": 13906, "wall": 70277.0} {"step": 14912, "train_loss": 3.3420345783233643, "lr": 0.00023619531573953472, "tps": 13905, "wall": 70281.9} {"step": 14913, "train_loss": 3.3369693756103516, "lr": 0.00023617623535073418, "tps": 13905, "wall": 70286.9} {"step": 14914, "train_loss": 3.359590768814087, "lr": 0.0002361571547786884, "tps": 13905, "wall": 70291.9} {"step": 14915, "train_loss": 3.490172863006592, "lr": 0.00023613807402361357, "tps": 13905, "wall": 70296.8} {"step": 14916, "train_loss": 3.41603422164917, "lr": 0.00023611899308572566, "tps": 13905, "wall": 70301.8} {"step": 14917, "train_loss": 3.4954848289489746, "lr": 0.00023609991196524099, "tps": 13905, "wall": 70306.7} {"step": 14918, "train_loss": 3.3109285831451416, "lr": 0.00023608083066237564, "tps": 13905, "wall": 70311.7} {"step": 14919, "train_loss": 3.394613027572632, "lr": 0.00023606174917734576, "tps": 13905, "wall": 70316.6} {"step": 14920, "train_loss": 3.409250020980835, "lr": 0.00023604266751036748, "tps": 13905, "wall": 70321.7} {"step": 14921, "train_loss": 3.369748592376709, "lr": 0.00023602358566165706, "tps": 13905, "wall": 70326.6} {"step": 14922, "train_loss": 3.473562717437744, "lr": 0.00023600450363143059, "tps": 13905, "wall": 70331.6} {"step": 14923, "train_loss": 3.362260580062866, "lr": 0.0002359854214199042, "tps": 13905, "wall": 70336.5} {"step": 14924, "train_loss": 3.3530492782592773, "lr": 0.0002359663390272941, "tps": 13905, "wall": 70341.5} {"step": 14925, "train_loss": 3.32438588142395, "lr": 0.00023594725645381646, "tps": 13905, "wall": 70346.4} {"step": 14926, "train_loss": 3.3396997451782227, "lr": 0.00023592817369968741, "tps": 13905, "wall": 70351.4} {"step": 14927, "train_loss": 3.285457134246826, "lr": 0.00023590909076512317, "tps": 13905, "wall": 70356.3} {"step": 14928, "train_loss": 3.4383304119110107, "lr": 0.0002358900076503399, "tps": 13905, "wall": 70361.3} {"step": 14929, "train_loss": 3.290933609008789, "lr": 0.00023587092435555375, "tps": 13905, "wall": 70366.2} {"step": 14930, "train_loss": 3.449495553970337, "lr": 0.0002358518408809809, "tps": 13905, "wall": 70371.2} {"step": 14931, "train_loss": 3.3416547775268555, "lr": 0.00023583275722683755, "tps": 13905, "wall": 70376.2} {"step": 14932, "train_loss": 3.417814254760742, "lr": 0.00023581367339333987, "tps": 13904, "wall": 70381.2} {"step": 14933, "train_loss": 3.508981704711914, "lr": 0.000235794589380704, "tps": 13904, "wall": 70386.2} {"step": 14934, "train_loss": 3.274113655090332, "lr": 0.00023577550518914618, "tps": 13904, "wall": 70391.1} {"step": 14935, "train_loss": 3.356067419052124, "lr": 0.00023575642081888267, "tps": 13904, "wall": 70396.1} {"step": 14936, "train_loss": 3.3906326293945312, "lr": 0.0002357373362701295, "tps": 13904, "wall": 70401.1} {"step": 14937, "train_loss": 3.4512596130371094, "lr": 0.00023571825154310294, "tps": 13904, "wall": 70406.0} {"step": 14938, "train_loss": 3.364102363586426, "lr": 0.0002356991666380192, "tps": 13904, "wall": 70411.0} {"step": 14939, "train_loss": 3.462210178375244, "lr": 0.0002356800815550944, "tps": 13904, "wall": 70415.9} {"step": 14940, "train_loss": 3.393848180770874, "lr": 0.00023566099629454486, "tps": 13904, "wall": 70420.9} {"step": 14941, "train_loss": 3.3715996742248535, "lr": 0.00023564191085658664, "tps": 13904, "wall": 70425.9} {"step": 14942, "train_loss": 3.3230531215667725, "lr": 0.00023562282524143603, "tps": 13904, "wall": 70430.8} {"step": 14943, "train_loss": 3.368037223815918, "lr": 0.0002356037394493092, "tps": 13904, "wall": 70435.8} {"step": 14944, "train_loss": 3.2866530418395996, "lr": 0.00023558465348042242, "tps": 13904, "wall": 70440.8} {"step": 14945, "train_loss": 3.368077278137207, "lr": 0.0002355655673349918, "tps": 13904, "wall": 70445.8} {"step": 14946, "train_loss": 3.3964457511901855, "lr": 0.0002355464810132336, "tps": 13904, "wall": 70450.7} {"step": 14947, "train_loss": 3.3928065299987793, "lr": 0.00023552739451536398, "tps": 13904, "wall": 70455.7} {"step": 14948, "train_loss": 3.3421390056610107, "lr": 0.0002355083078415992, "tps": 13904, "wall": 70460.6} {"step": 14949, "train_loss": 3.389492988586426, "lr": 0.00023548922099215553, "tps": 13904, "wall": 70465.6} {"step": 14950, "train_loss": 3.385071277618408, "lr": 0.0002354701339672491, "tps": 13904, "wall": 70470.5} {"step": 14951, "train_loss": 3.466297149658203, "lr": 0.00023545104676709616, "tps": 13904, "wall": 70475.5} {"step": 14952, "train_loss": 3.3781259059906006, "lr": 0.00023543195939191295, "tps": 13903, "wall": 70480.4} {"step": 14953, "train_loss": 3.346996307373047, "lr": 0.0002354128718419156, "tps": 13903, "wall": 70485.4} {"step": 14954, "train_loss": 3.4622573852539062, "lr": 0.00023539378411732047, "tps": 13903, "wall": 70490.3} {"step": 14955, "train_loss": 3.389538288116455, "lr": 0.00023537469621834372, "tps": 13903, "wall": 70495.3} {"step": 14956, "train_loss": 3.441473960876465, "lr": 0.00023535560814520151, "tps": 13903, "wall": 70500.3} {"step": 14957, "train_loss": 3.4046778678894043, "lr": 0.00023533651989811016, "tps": 13903, "wall": 70505.2} {"step": 14958, "train_loss": 3.386478900909424, "lr": 0.00023531743147728594, "tps": 13903, "wall": 70510.2} {"step": 14959, "train_loss": 3.3953206539154053, "lr": 0.000235298342882945, "tps": 13903, "wall": 70515.2} {"step": 14960, "train_loss": 3.344376564025879, "lr": 0.00023527925411530364, "tps": 13903, "wall": 70520.1} {"step": 14961, "train_loss": 3.3808889389038086, "lr": 0.000235260165174578, "tps": 13903, "wall": 70525.1} {"step": 14962, "train_loss": 3.3495583534240723, "lr": 0.00023524107606098435, "tps": 13903, "wall": 70530.0} {"step": 14963, "train_loss": 3.4188284873962402, "lr": 0.00023522198677473907, "tps": 13903, "wall": 70535.0} {"step": 14964, "train_loss": 3.4005086421966553, "lr": 0.0002352028973160582, "tps": 13903, "wall": 70539.9} {"step": 14965, "train_loss": 3.4988183975219727, "lr": 0.00023518380768515815, "tps": 13903, "wall": 70544.9} {"step": 14966, "train_loss": 3.3693103790283203, "lr": 0.00023516471788225513, "tps": 13903, "wall": 70549.9} {"step": 14967, "train_loss": 3.3586277961730957, "lr": 0.00023514562790756535, "tps": 13903, "wall": 70554.8} {"step": 14968, "train_loss": 3.2545104026794434, "lr": 0.000235126537761305, "tps": 13903, "wall": 70559.8} {"step": 14969, "train_loss": 3.419074058532715, "lr": 0.00023510744744369047, "tps": 13903, "wall": 70564.8} {"step": 14970, "train_loss": 3.4865503311157227, "lr": 0.000235088356954938, "tps": 13903, "wall": 70569.7} {"step": 14971, "train_loss": 3.3782289028167725, "lr": 0.00023506926629526372, "tps": 13903, "wall": 70574.7} {"step": 14972, "train_loss": 3.3189616203308105, "lr": 0.000235050175464884, "tps": 13903, "wall": 70579.7} {"step": 14973, "train_loss": 3.341984272003174, "lr": 0.00023503108446401515, "tps": 13902, "wall": 70584.6} {"step": 14974, "train_loss": 3.4107513427734375, "lr": 0.00023501199329287328, "tps": 13902, "wall": 70589.6} {"step": 14975, "train_loss": 3.413163900375366, "lr": 0.00023499290195167473, "tps": 13902, "wall": 70594.5} {"step": 14976, "train_loss": 3.3444294929504395, "lr": 0.00023497381044063585, "tps": 13902, "wall": 70599.5} {"step": 14977, "train_loss": 3.378333568572998, "lr": 0.00023495471875997282, "tps": 13902, "wall": 70604.5} {"step": 14978, "train_loss": 3.426740884780884, "lr": 0.00023493562690990184, "tps": 13902, "wall": 70609.5} {"step": 14979, "train_loss": 3.464024066925049, "lr": 0.00023491653489063935, "tps": 13902, "wall": 70614.4} {"step": 14980, "train_loss": 3.421964406967163, "lr": 0.00023489744270240154, "tps": 13902, "wall": 70619.5} {"step": 14981, "train_loss": 3.3451004028320312, "lr": 0.0002348783503454047, "tps": 13902, "wall": 70624.5} {"step": 14982, "train_loss": 3.385852336883545, "lr": 0.00023485925781986503, "tps": 13902, "wall": 70629.4} {"step": 14983, "train_loss": 3.435089111328125, "lr": 0.000234840165125999, "tps": 13902, "wall": 70634.4} {"step": 14984, "train_loss": 3.360621452331543, "lr": 0.00023482107226402267, "tps": 13902, "wall": 70639.3} {"step": 14985, "train_loss": 3.3458752632141113, "lr": 0.00023480197923415254, "tps": 13902, "wall": 70644.3} {"step": 14986, "train_loss": 3.5083820819854736, "lr": 0.00023478288603660468, "tps": 13902, "wall": 70649.3} {"step": 14987, "train_loss": 3.4884114265441895, "lr": 0.00023476379267159555, "tps": 13902, "wall": 70654.2} {"step": 14988, "train_loss": 3.323639392852783, "lr": 0.00023474469913934134, "tps": 13902, "wall": 70659.2} {"step": 14989, "train_loss": 3.3792672157287598, "lr": 0.00023472560544005836, "tps": 13902, "wall": 70664.1} {"step": 14990, "train_loss": 3.3413734436035156, "lr": 0.000234706511573963, "tps": 13902, "wall": 70669.1} {"step": 14991, "train_loss": 3.4186086654663086, "lr": 0.0002346874175412715, "tps": 13902, "wall": 70674.0} {"step": 14992, "train_loss": 3.37009859085083, "lr": 0.00023466832334220007, "tps": 13902, "wall": 70679.1} {"step": 14993, "train_loss": 3.3717384338378906, "lr": 0.0002346492289769651, "tps": 13901, "wall": 70684.0} {"step": 14994, "train_loss": 3.292323589324951, "lr": 0.00023463013444578284, "tps": 13901, "wall": 70689.0} {"step": 14995, "train_loss": 3.3433728218078613, "lr": 0.00023461103974886966, "tps": 13901, "wall": 70693.9} {"step": 14996, "train_loss": 3.4056482315063477, "lr": 0.00023459194488644177, "tps": 13901, "wall": 70698.9} {"step": 14997, "train_loss": 3.4219396114349365, "lr": 0.00023457284985871563, "tps": 13901, "wall": 70703.9} {"step": 14998, "train_loss": 3.425722599029541, "lr": 0.00023455375466590738, "tps": 13901, "wall": 70708.8} {"step": 14999, "train_loss": 3.3550188541412354, "lr": 0.00023453465930823347, "tps": 13901, "wall": 70713.8} {"step": 15000, "train_loss": 3.356438159942627, "lr": 0.00023451556378591018, "tps": 13901, "wall": 70718.8, "val_loss_monitor": 3.424423245104943, "val_loss_full": 3.4419859595496067} {"step": 15001, "train_loss": 3.457839012145996, "lr": 0.00023449646809915376, "tps": 13868, "wall": 70893.1} {"step": 15002, "train_loss": 3.4726037979125977, "lr": 0.00023447737224818052, "tps": 13868, "wall": 70898.1} {"step": 15003, "train_loss": 3.382439136505127, "lr": 0.00023445827623320685, "tps": 13868, "wall": 70903.1} {"step": 15004, "train_loss": 3.4037439823150635, "lr": 0.00023443918005444908, "tps": 13868, "wall": 70908.0} {"step": 15005, "train_loss": 3.270106077194214, "lr": 0.0002344200837121235, "tps": 13868, "wall": 70913.0} {"step": 15006, "train_loss": 3.356696128845215, "lr": 0.00023440098720644632, "tps": 13868, "wall": 70918.0} {"step": 15007, "train_loss": 3.4188990592956543, "lr": 0.0002343818905376341, "tps": 13868, "wall": 70923.0} {"step": 15008, "train_loss": 3.3812003135681152, "lr": 0.000234362793705903, "tps": 13868, "wall": 70928.0} {"step": 15009, "train_loss": 3.3425188064575195, "lr": 0.00023434369671146942, "tps": 13867, "wall": 70932.9} {"step": 15010, "train_loss": 3.467750072479248, "lr": 0.00023432459955454964, "tps": 13867, "wall": 70937.9} {"step": 15011, "train_loss": 3.3147974014282227, "lr": 0.00023430550223536004, "tps": 13867, "wall": 70942.8} {"step": 15012, "train_loss": 3.3607711791992188, "lr": 0.00023428640475411694, "tps": 13867, "wall": 70947.8} {"step": 15013, "train_loss": 3.2381296157836914, "lr": 0.00023426730711103666, "tps": 13867, "wall": 70952.8} {"step": 15014, "train_loss": 3.4069578647613525, "lr": 0.00023424820930633558, "tps": 13867, "wall": 70957.7} {"step": 15015, "train_loss": 3.391230821609497, "lr": 0.00023422911134023, "tps": 13867, "wall": 70962.7} {"step": 15016, "train_loss": 3.3656821250915527, "lr": 0.00023421001321293622, "tps": 13867, "wall": 70967.6} {"step": 15017, "train_loss": 3.4882397651672363, "lr": 0.00023419091492467073, "tps": 13867, "wall": 70972.6} {"step": 15018, "train_loss": 3.3108890056610107, "lr": 0.0002341718164756497, "tps": 13867, "wall": 70977.6} {"step": 15019, "train_loss": 3.34578800201416, "lr": 0.0002341527178660896, "tps": 13867, "wall": 70982.6} {"step": 15020, "train_loss": 3.357039451599121, "lr": 0.0002341336190962068, "tps": 13867, "wall": 70987.6} {"step": 15021, "train_loss": 3.224456310272217, "lr": 0.00023411452016621756, "tps": 13867, "wall": 70992.5} {"step": 15022, "train_loss": 3.433115005493164, "lr": 0.0002340954210763383, "tps": 13867, "wall": 70997.5} {"step": 15023, "train_loss": 3.3080344200134277, "lr": 0.00023407632182678527, "tps": 13867, "wall": 71002.4} {"step": 15024, "train_loss": 3.349400520324707, "lr": 0.00023405722241777498, "tps": 13867, "wall": 71007.4} {"step": 15025, "train_loss": 3.3620193004608154, "lr": 0.00023403812284952368, "tps": 13867, "wall": 71012.4} {"step": 15026, "train_loss": 3.419518232345581, "lr": 0.00023401902312224774, "tps": 13867, "wall": 71017.3} {"step": 15027, "train_loss": 3.351381301879883, "lr": 0.00023399992323616363, "tps": 13867, "wall": 71022.3} {"step": 15028, "train_loss": 3.364258289337158, "lr": 0.00023398082319148756, "tps": 13867, "wall": 71027.2} {"step": 15029, "train_loss": 3.473315954208374, "lr": 0.00023396172298843597, "tps": 13867, "wall": 71032.2} {"step": 15030, "train_loss": 3.428173065185547, "lr": 0.0002339426226272253, "tps": 13866, "wall": 71037.2} {"step": 15031, "train_loss": 3.4697391986846924, "lr": 0.00023392352210807179, "tps": 13866, "wall": 71042.2} {"step": 15032, "train_loss": 3.3780765533447266, "lr": 0.00023390442143119184, "tps": 13866, "wall": 71047.1} {"step": 15033, "train_loss": 3.4151055812835693, "lr": 0.00023388532059680185, "tps": 13866, "wall": 71052.1} {"step": 15034, "train_loss": 3.343099355697632, "lr": 0.00023386621960511832, "tps": 13866, "wall": 71057.0} {"step": 15035, "train_loss": 3.5034642219543457, "lr": 0.00023384711845635735, "tps": 13866, "wall": 71062.0} {"step": 15036, "train_loss": 3.368086338043213, "lr": 0.00023382801715073556, "tps": 13866, "wall": 71067.0} {"step": 15037, "train_loss": 3.3059823513031006, "lr": 0.00023380891568846926, "tps": 13866, "wall": 71071.9} {"step": 15038, "train_loss": 3.3902475833892822, "lr": 0.00023378981406977473, "tps": 13866, "wall": 71076.9} {"step": 15039, "train_loss": 3.4200522899627686, "lr": 0.00023377071229486847, "tps": 13866, "wall": 71081.8} {"step": 15040, "train_loss": 3.322861671447754, "lr": 0.00023375161036396684, "tps": 13866, "wall": 71086.8} {"step": 15041, "train_loss": 3.4444448947906494, "lr": 0.00023373250827728629, "tps": 13866, "wall": 71091.8} {"step": 15042, "train_loss": 3.258063793182373, "lr": 0.00023371340603504313, "tps": 13866, "wall": 71096.7} {"step": 15043, "train_loss": 3.330251693725586, "lr": 0.0002336943036374537, "tps": 13866, "wall": 71101.7} {"step": 15044, "train_loss": 3.430185317993164, "lr": 0.00023367520108473445, "tps": 13866, "wall": 71106.6} {"step": 15045, "train_loss": 3.4610118865966797, "lr": 0.00023365609837710185, "tps": 13866, "wall": 71111.6} {"step": 15046, "train_loss": 3.4026060104370117, "lr": 0.0002336369955147722, "tps": 13866, "wall": 71116.6} {"step": 15047, "train_loss": 3.390629768371582, "lr": 0.0002336178924979619, "tps": 13866, "wall": 71121.5} {"step": 15048, "train_loss": 3.3362245559692383, "lr": 0.00023359878932688744, "tps": 13866, "wall": 71126.5} {"step": 15049, "train_loss": 3.350118398666382, "lr": 0.00023357968600176509, "tps": 13866, "wall": 71131.4} {"step": 15050, "train_loss": 3.360166549682617, "lr": 0.00023356058252281135, "tps": 13866, "wall": 71136.4} {"step": 15051, "train_loss": 3.4395041465759277, "lr": 0.00023354147889024263, "tps": 13866, "wall": 71141.3} {"step": 15052, "train_loss": 3.4150261878967285, "lr": 0.00023352237510427523, "tps": 13865, "wall": 71146.3} {"step": 15053, "train_loss": 3.374906063079834, "lr": 0.0002335032711651257, "tps": 13865, "wall": 71151.3} {"step": 15054, "train_loss": 3.341169595718384, "lr": 0.00023348416707301035, "tps": 13865, "wall": 71156.2} {"step": 15055, "train_loss": 3.343510389328003, "lr": 0.00023346506282814563, "tps": 13865, "wall": 71161.2} {"step": 15056, "train_loss": 3.4245996475219727, "lr": 0.00023344595843074797, "tps": 13865, "wall": 71166.2} {"step": 15057, "train_loss": 3.428619861602783, "lr": 0.0002334268538810337, "tps": 13865, "wall": 71171.2} {"step": 15058, "train_loss": 3.507695198059082, "lr": 0.00023340774917921943, "tps": 13865, "wall": 71176.2} {"step": 15059, "train_loss": 3.3986308574676514, "lr": 0.00023338864432552133, "tps": 13865, "wall": 71181.1} {"step": 15060, "train_loss": 3.3809456825256348, "lr": 0.00023336953932015595, "tps": 13865, "wall": 71186.1} {"step": 15061, "train_loss": 3.3490219116210938, "lr": 0.00023335043416333978, "tps": 13865, "wall": 71191.0} {"step": 15062, "train_loss": 3.314910411834717, "lr": 0.00023333132885528914, "tps": 13865, "wall": 71196.0} {"step": 15063, "train_loss": 3.2426345348358154, "lr": 0.00023331222339622047, "tps": 13865, "wall": 71200.9} {"step": 15064, "train_loss": 3.3737003803253174, "lr": 0.0002332931177863502, "tps": 13865, "wall": 71205.9} {"step": 15065, "train_loss": 3.3416881561279297, "lr": 0.00023327401202589485, "tps": 13865, "wall": 71210.8} {"step": 15066, "train_loss": 3.449977159500122, "lr": 0.0002332549061150707, "tps": 13865, "wall": 71215.8} {"step": 15067, "train_loss": 3.4101614952087402, "lr": 0.00023323580005409428, "tps": 13865, "wall": 71220.8} {"step": 15068, "train_loss": 3.348379611968994, "lr": 0.00023321669384318198, "tps": 13865, "wall": 71225.8} {"step": 15069, "train_loss": 3.418940544128418, "lr": 0.00023319758748255027, "tps": 13865, "wall": 71230.7} {"step": 15070, "train_loss": 3.3989713191986084, "lr": 0.00023317848097241558, "tps": 13865, "wall": 71235.7} {"step": 15071, "train_loss": 3.389364719390869, "lr": 0.00023315937431299432, "tps": 13865, "wall": 71240.7} {"step": 15072, "train_loss": 3.332411766052246, "lr": 0.00023314026750450299, "tps": 13865, "wall": 71245.6} {"step": 15073, "train_loss": 3.3241729736328125, "lr": 0.00023312116054715799, "tps": 13865, "wall": 71250.6} {"step": 15074, "train_loss": 3.3719913959503174, "lr": 0.00023310205344117578, "tps": 13864, "wall": 71255.5} {"step": 15075, "train_loss": 3.3855857849121094, "lr": 0.00023308294618677283, "tps": 13864, "wall": 71260.5} {"step": 15076, "train_loss": 3.3998236656188965, "lr": 0.00023306383878416548, "tps": 13864, "wall": 71265.5} {"step": 15077, "train_loss": 3.42568039894104, "lr": 0.00023304473123357026, "tps": 13864, "wall": 71270.4} {"step": 15078, "train_loss": 3.217466354370117, "lr": 0.0002330256235352037, "tps": 13864, "wall": 71275.4} {"step": 15079, "train_loss": 3.392106533050537, "lr": 0.00023300651568928214, "tps": 13864, "wall": 71280.4} {"step": 15080, "train_loss": 3.3053855895996094, "lr": 0.00023298740769602203, "tps": 13864, "wall": 71285.4} {"step": 15081, "train_loss": 3.333357810974121, "lr": 0.00023296829955563982, "tps": 13864, "wall": 71290.3} {"step": 15082, "train_loss": 3.3212289810180664, "lr": 0.00023294919126835219, "tps": 13864, "wall": 71295.3} {"step": 15083, "train_loss": 3.4268922805786133, "lr": 0.00023293008283437522, "tps": 13864, "wall": 71300.3} {"step": 15084, "train_loss": 3.3337035179138184, "lr": 0.00023291097425392568, "tps": 13864, "wall": 71305.3} {"step": 15085, "train_loss": 3.3505866527557373, "lr": 0.0002328918655272199, "tps": 13864, "wall": 71310.2} {"step": 15086, "train_loss": 3.363318920135498, "lr": 0.0002328727566544744, "tps": 13864, "wall": 71315.2} {"step": 15087, "train_loss": 3.3485934734344482, "lr": 0.00023285364763590556, "tps": 13864, "wall": 71320.1} {"step": 15088, "train_loss": 3.4873430728912354, "lr": 0.00023283453847172992, "tps": 13864, "wall": 71325.1} {"step": 15089, "train_loss": 3.262406587600708, "lr": 0.000232815429162164, "tps": 13864, "wall": 71330.1} {"step": 15090, "train_loss": 3.324429988861084, "lr": 0.00023279631970742415, "tps": 13864, "wall": 71335.0} {"step": 15091, "train_loss": 3.320964813232422, "lr": 0.00023277721010772688, "tps": 13864, "wall": 71340.1} {"step": 15092, "train_loss": 3.3501532077789307, "lr": 0.00023275810036328868, "tps": 13864, "wall": 71345.1} {"step": 15093, "train_loss": 3.300344944000244, "lr": 0.0002327389904743261, "tps": 13864, "wall": 71350.0} {"step": 15094, "train_loss": 3.2359893321990967, "lr": 0.00023271988044105548, "tps": 13863, "wall": 71355.0} {"step": 15095, "train_loss": 3.4178237915039062, "lr": 0.00023270077026369342, "tps": 13863, "wall": 71360.0} {"step": 15096, "train_loss": 3.3283286094665527, "lr": 0.0002326816599424563, "tps": 13863, "wall": 71365.0} {"step": 15097, "train_loss": 3.3564798831939697, "lr": 0.00023266254947756064, "tps": 13863, "wall": 71369.9} {"step": 15098, "train_loss": 3.4304890632629395, "lr": 0.00023264343886922296, "tps": 13863, "wall": 71374.9} {"step": 15099, "train_loss": 3.267770767211914, "lr": 0.00023262432811765974, "tps": 13863, "wall": 71379.9} {"step": 15100, "train_loss": 3.465627431869507, "lr": 0.00023260521722308743, "tps": 13863, "wall": 71384.9} {"step": 15101, "train_loss": 3.384580135345459, "lr": 0.0002325861061857225, "tps": 13863, "wall": 71389.9} {"step": 15102, "train_loss": 3.3483216762542725, "lr": 0.0002325669950057815, "tps": 13863, "wall": 71394.8} {"step": 15103, "train_loss": 3.316484212875366, "lr": 0.00023254788368348096, "tps": 13863, "wall": 71399.8} {"step": 15104, "train_loss": 3.408048629760742, "lr": 0.00023252877221903724, "tps": 13863, "wall": 71404.8} {"step": 15105, "train_loss": 3.5132551193237305, "lr": 0.00023250966061266697, "tps": 13863, "wall": 71409.8} {"step": 15106, "train_loss": 3.3346290588378906, "lr": 0.00023249054886458653, "tps": 13863, "wall": 71414.7} {"step": 15107, "train_loss": 3.402771472930908, "lr": 0.0002324714369750125, "tps": 13863, "wall": 71419.7} {"step": 15108, "train_loss": 3.357658863067627, "lr": 0.00023245232494416133, "tps": 13863, "wall": 71424.7} {"step": 15109, "train_loss": 3.1910552978515625, "lr": 0.00023243321277224962, "tps": 13863, "wall": 71429.6} {"step": 15110, "train_loss": 3.3967537879943848, "lr": 0.0002324141004594938, "tps": 13863, "wall": 71434.6} {"step": 15111, "train_loss": 3.369847059249878, "lr": 0.0002323949880061103, "tps": 13863, "wall": 71439.6} {"step": 15112, "train_loss": 3.430835008621216, "lr": 0.00023237587541231577, "tps": 13863, "wall": 71444.5} {"step": 15113, "train_loss": 3.4287586212158203, "lr": 0.0002323567626783266, "tps": 13863, "wall": 71449.5} {"step": 15114, "train_loss": 3.4035563468933105, "lr": 0.00023233764980435938, "tps": 13863, "wall": 71454.4} {"step": 15115, "train_loss": 3.314539909362793, "lr": 0.0002323185367906306, "tps": 13862, "wall": 71459.5} {"step": 15116, "train_loss": 3.323455572128296, "lr": 0.0002322994236373568, "tps": 13862, "wall": 71464.4} {"step": 15117, "train_loss": 3.419455051422119, "lr": 0.00023228031034475444, "tps": 13862, "wall": 71469.4} {"step": 15118, "train_loss": 3.3974356651306152, "lr": 0.00023226119691303998, "tps": 13862, "wall": 71474.4} {"step": 15119, "train_loss": 3.4481863975524902, "lr": 0.00023224208334243014, "tps": 13862, "wall": 71479.4} {"step": 15120, "train_loss": 3.5054948329925537, "lr": 0.00023222296963314122, "tps": 13862, "wall": 71484.3} {"step": 15121, "train_loss": 3.3803558349609375, "lr": 0.00023220385578538993, "tps": 13862, "wall": 71489.3} {"step": 15122, "train_loss": 3.2445638179779053, "lr": 0.00023218474179939272, "tps": 13862, "wall": 71494.3} {"step": 15123, "train_loss": 3.4251651763916016, "lr": 0.00023216562767536597, "tps": 13862, "wall": 71499.2} {"step": 15124, "train_loss": 3.378997325897217, "lr": 0.00023214651341352637, "tps": 13862, "wall": 71504.2} {"step": 15125, "train_loss": 3.354963779449463, "lr": 0.00023212739901409045, "tps": 13862, "wall": 71509.2} {"step": 15126, "train_loss": 3.3419089317321777, "lr": 0.00023210828447727474, "tps": 13862, "wall": 71514.1} {"step": 15127, "train_loss": 3.365640163421631, "lr": 0.00023208916980329566, "tps": 13862, "wall": 71519.2} {"step": 15128, "train_loss": 3.363485813140869, "lr": 0.00023207005499236984, "tps": 13862, "wall": 71524.1} {"step": 15129, "train_loss": 3.3883743286132812, "lr": 0.00023205094004471373, "tps": 13862, "wall": 71529.1} {"step": 15130, "train_loss": 3.342963695526123, "lr": 0.000232031824960544, "tps": 13862, "wall": 71534.1} {"step": 15131, "train_loss": 3.3629331588745117, "lr": 0.00023201270974007704, "tps": 13862, "wall": 71539.1} {"step": 15132, "train_loss": 3.426280975341797, "lr": 0.00023199359438352946, "tps": 13862, "wall": 71544.0} {"step": 15133, "train_loss": 3.3600544929504395, "lr": 0.00023197447889111784, "tps": 13862, "wall": 71549.0} {"step": 15134, "train_loss": 3.4758920669555664, "lr": 0.00023195536326305863, "tps": 13862, "wall": 71554.0} {"step": 15135, "train_loss": 3.363865375518799, "lr": 0.00023193624749956842, "tps": 13862, "wall": 71558.9} {"step": 15136, "train_loss": 3.3778011798858643, "lr": 0.0002319171316008638, "tps": 13861, "wall": 71563.9} {"step": 15137, "train_loss": 3.3716659545898438, "lr": 0.0002318980155671612, "tps": 13861, "wall": 71568.9} {"step": 15138, "train_loss": 3.3715546131134033, "lr": 0.00023187889939867726, "tps": 13861, "wall": 71573.9} {"step": 15139, "train_loss": 3.309054136276245, "lr": 0.00023185978309562852, "tps": 13861, "wall": 71578.9} {"step": 15140, "train_loss": 3.3680455684661865, "lr": 0.00023184066665823152, "tps": 13861, "wall": 71583.9} {"step": 15141, "train_loss": 3.2824411392211914, "lr": 0.00023182155008670278, "tps": 13861, "wall": 71588.9} {"step": 15142, "train_loss": 3.362534999847412, "lr": 0.00023180243338125886, "tps": 13861, "wall": 71593.9} {"step": 15143, "train_loss": 3.213547706604004, "lr": 0.0002317833165421164, "tps": 13861, "wall": 71598.8} {"step": 15144, "train_loss": 3.390489101409912, "lr": 0.00023176419956949187, "tps": 13861, "wall": 71603.8} {"step": 15145, "train_loss": 3.4141788482666016, "lr": 0.00023174508246360186, "tps": 13861, "wall": 71608.8} {"step": 15146, "train_loss": 3.3737502098083496, "lr": 0.00023172596522466287, "tps": 13861, "wall": 71613.8} {"step": 15147, "train_loss": 3.4377269744873047, "lr": 0.0002317068478528916, "tps": 13861, "wall": 71618.7} {"step": 15148, "train_loss": 3.327080249786377, "lr": 0.00023168773034850447, "tps": 13861, "wall": 71623.7} {"step": 15149, "train_loss": 3.4013290405273438, "lr": 0.00023166861271171806, "tps": 13861, "wall": 71628.7} {"step": 15150, "train_loss": 3.468928575515747, "lr": 0.00023164949494274906, "tps": 13861, "wall": 71633.7} {"step": 15151, "train_loss": 3.3750715255737305, "lr": 0.00023163037704181392, "tps": 13861, "wall": 71638.7} {"step": 15152, "train_loss": 3.4392333030700684, "lr": 0.0002316112590091292, "tps": 13861, "wall": 71643.7} {"step": 15153, "train_loss": 3.203826427459717, "lr": 0.00023159214084491155, "tps": 13861, "wall": 71648.7} {"step": 15154, "train_loss": 3.3220105171203613, "lr": 0.0002315730225493775, "tps": 13861, "wall": 71653.7} {"step": 15155, "train_loss": 3.460308074951172, "lr": 0.00023155390412274362, "tps": 13861, "wall": 71658.6} {"step": 15156, "train_loss": 3.3325307369232178, "lr": 0.00023153478556522643, "tps": 13861, "wall": 71663.6} {"step": 15157, "train_loss": 3.396610975265503, "lr": 0.00023151566687704266, "tps": 13860, "wall": 71668.6} {"step": 15158, "train_loss": 3.4538767337799072, "lr": 0.00023149654805840872, "tps": 13860, "wall": 71673.6} {"step": 15159, "train_loss": 3.403015613555908, "lr": 0.00023147742910954126, "tps": 13860, "wall": 71678.5} {"step": 15160, "train_loss": 3.486374855041504, "lr": 0.00023145831003065697, "tps": 13860, "wall": 71683.5} {"step": 15161, "train_loss": 3.444324016571045, "lr": 0.00023143919082197224, "tps": 13860, "wall": 71688.5} {"step": 15162, "train_loss": 3.329622507095337, "lr": 0.00023142007148370373, "tps": 13860, "wall": 71693.5} {"step": 15163, "train_loss": 3.347856044769287, "lr": 0.00023140095201606804, "tps": 13860, "wall": 71698.5} {"step": 15164, "train_loss": 3.409475088119507, "lr": 0.0002313818324192818, "tps": 13860, "wall": 71703.5} {"step": 15165, "train_loss": 3.4150543212890625, "lr": 0.00023136271269356143, "tps": 13860, "wall": 71708.5} {"step": 15166, "train_loss": 3.3866987228393555, "lr": 0.00023134359283912375, "tps": 13860, "wall": 71713.5} {"step": 15167, "train_loss": 3.4516444206237793, "lr": 0.00023132447285618518, "tps": 13860, "wall": 71718.5} {"step": 15168, "train_loss": 3.521458625793457, "lr": 0.00023130535274496237, "tps": 13860, "wall": 71723.4} {"step": 15169, "train_loss": 3.3751144409179688, "lr": 0.00023128623250567195, "tps": 13860, "wall": 71728.4} {"step": 15170, "train_loss": 3.3629512786865234, "lr": 0.00023126711213853046, "tps": 13860, "wall": 71733.4} {"step": 15171, "train_loss": 3.3797736167907715, "lr": 0.00023124799164375451, "tps": 13860, "wall": 71738.4} {"step": 15172, "train_loss": 3.437005043029785, "lr": 0.00023122887102156067, "tps": 13860, "wall": 71743.3} {"step": 15173, "train_loss": 3.3967294692993164, "lr": 0.0002312097502721656, "tps": 13860, "wall": 71748.3} {"step": 15174, "train_loss": 3.3171584606170654, "lr": 0.0002311906293957859, "tps": 13860, "wall": 71753.3} {"step": 15175, "train_loss": 3.3993730545043945, "lr": 0.00023117150839263814, "tps": 13860, "wall": 71758.4} {"step": 15176, "train_loss": 3.4035165309906006, "lr": 0.00023115238726293885, "tps": 13859, "wall": 71763.4} {"step": 15177, "train_loss": 3.3342511653900146, "lr": 0.0002311332660069048, "tps": 13859, "wall": 71768.3} {"step": 15178, "train_loss": 3.3985962867736816, "lr": 0.0002311141446247525, "tps": 13859, "wall": 71773.3} {"step": 15179, "train_loss": 3.3028879165649414, "lr": 0.00023109502311669853, "tps": 13859, "wall": 71778.3} {"step": 15180, "train_loss": 3.3038434982299805, "lr": 0.0002310759014829596, "tps": 13859, "wall": 71783.3} {"step": 15181, "train_loss": 3.35477352142334, "lr": 0.00023105677972375216, "tps": 13859, "wall": 71788.3} {"step": 15182, "train_loss": 3.343884229660034, "lr": 0.00023103765783929298, "tps": 13859, "wall": 71793.2} {"step": 15183, "train_loss": 3.4225635528564453, "lr": 0.00023101853582979863, "tps": 13859, "wall": 71798.2} {"step": 15184, "train_loss": 3.3484115600585938, "lr": 0.0002309994136954857, "tps": 13859, "wall": 71803.2} {"step": 15185, "train_loss": 3.280062675476074, "lr": 0.0002309802914365708, "tps": 13859, "wall": 71808.2} {"step": 15186, "train_loss": 3.4540913105010986, "lr": 0.00023096116905327055, "tps": 13859, "wall": 71813.2} {"step": 15187, "train_loss": 3.32312273979187, "lr": 0.00023094204654580165, "tps": 13859, "wall": 71818.3} {"step": 15188, "train_loss": 3.4332125186920166, "lr": 0.0002309229239143806, "tps": 13859, "wall": 71823.2} {"step": 15189, "train_loss": 3.409921646118164, "lr": 0.0002309038011592241, "tps": 13859, "wall": 71828.2} {"step": 15190, "train_loss": 3.4225170612335205, "lr": 0.00023088467828054877, "tps": 13859, "wall": 71833.3} {"step": 15191, "train_loss": 3.363607406616211, "lr": 0.0002308655552785712, "tps": 13859, "wall": 71838.2} {"step": 15192, "train_loss": 3.3361144065856934, "lr": 0.00023084643215350793, "tps": 13859, "wall": 71843.2} {"step": 15193, "train_loss": 3.430647373199463, "lr": 0.00023082730890557583, "tps": 13859, "wall": 71848.2} {"step": 15194, "train_loss": 3.37424373626709, "lr": 0.00023080818553499133, "tps": 13859, "wall": 71853.2} {"step": 15195, "train_loss": 3.385288715362549, "lr": 0.00023078906204197113, "tps": 13859, "wall": 71858.2} {"step": 15196, "train_loss": 3.4271881580352783, "lr": 0.00023076993842673186, "tps": 13858, "wall": 71863.2} {"step": 15197, "train_loss": 3.387258529663086, "lr": 0.0002307508146894901, "tps": 13858, "wall": 71868.2} {"step": 15198, "train_loss": 3.3440804481506348, "lr": 0.00023073169083046255, "tps": 13858, "wall": 71873.2} {"step": 15199, "train_loss": 3.2899820804595947, "lr": 0.00023071256684986584, "tps": 13858, "wall": 71878.3} {"step": 15200, "train_loss": 3.4345507621765137, "lr": 0.0002306934427479166, "tps": 13858, "wall": 71883.3} {"step": 15201, "train_loss": 3.270636558532715, "lr": 0.00023067431852483145, "tps": 13858, "wall": 71888.3} {"step": 15202, "train_loss": 3.329317808151245, "lr": 0.00023065519418082704, "tps": 13858, "wall": 71893.4} {"step": 15203, "train_loss": 3.3237063884735107, "lr": 0.00023063606971612002, "tps": 13858, "wall": 71898.4} {"step": 15204, "train_loss": 3.4096336364746094, "lr": 0.00023061694513092706, "tps": 13858, "wall": 71903.4} {"step": 15205, "train_loss": 3.3809099197387695, "lr": 0.00023059782042546476, "tps": 13858, "wall": 71908.5} {"step": 15206, "train_loss": 3.260801315307617, "lr": 0.00023057869559994974, "tps": 13858, "wall": 71913.5} {"step": 15207, "train_loss": 3.402864456176758, "lr": 0.0002305595706545987, "tps": 13858, "wall": 71918.6} {"step": 15208, "train_loss": 3.3089280128479004, "lr": 0.0002305404455896283, "tps": 13858, "wall": 71923.7} {"step": 15209, "train_loss": 3.312314748764038, "lr": 0.00023052132040525506, "tps": 13858, "wall": 71928.8} {"step": 15210, "train_loss": 3.3977999687194824, "lr": 0.0002305021951016958, "tps": 13858, "wall": 71934.0} {"step": 15211, "train_loss": 3.4544107913970947, "lr": 0.0002304830696791672, "tps": 13858, "wall": 71939.2} {"step": 15212, "train_loss": 3.4030866622924805, "lr": 0.00023046394413788574, "tps": 13857, "wall": 71944.5} {"step": 15213, "train_loss": 3.4046781063079834, "lr": 0.0002304448184780681, "tps": 13857, "wall": 71949.8} {"step": 15214, "train_loss": 3.325747489929199, "lr": 0.00023042569269993103, "tps": 13857, "wall": 71955.0} {"step": 15215, "train_loss": 3.387570381164551, "lr": 0.00023040656680369117, "tps": 13857, "wall": 71960.2} {"step": 15216, "train_loss": 3.3636670112609863, "lr": 0.00023038744078956517, "tps": 13857, "wall": 71965.4} {"step": 15217, "train_loss": 3.330258846282959, "lr": 0.00023036831465776962, "tps": 13857, "wall": 71970.6} {"step": 15218, "train_loss": 3.3131377696990967, "lr": 0.0002303491884085213, "tps": 13857, "wall": 71975.8} {"step": 15219, "train_loss": 3.4225945472717285, "lr": 0.00023033006204203676, "tps": 13857, "wall": 71981.0} {"step": 15220, "train_loss": 3.3685827255249023, "lr": 0.00023031093555853275, "tps": 13857, "wall": 71986.2} {"step": 15221, "train_loss": 3.3183679580688477, "lr": 0.0002302918089582259, "tps": 13857, "wall": 71991.4} {"step": 15222, "train_loss": 3.3052563667297363, "lr": 0.0002302726822413329, "tps": 13856, "wall": 71996.6} {"step": 15223, "train_loss": 3.3687987327575684, "lr": 0.0002302535554080704, "tps": 13856, "wall": 72002.0} {"step": 15224, "train_loss": 3.347850799560547, "lr": 0.000230234428458655, "tps": 13856, "wall": 72007.1} {"step": 15225, "train_loss": 3.2990927696228027, "lr": 0.00023021530139330355, "tps": 13856, "wall": 72012.4} {"step": 15226, "train_loss": 3.3545312881469727, "lr": 0.00023019617421223253, "tps": 13856, "wall": 72017.6} {"step": 15227, "train_loss": 3.403795003890991, "lr": 0.0002301770469156587, "tps": 13856, "wall": 72022.9} {"step": 15228, "train_loss": 3.347970962524414, "lr": 0.0002301579195037988, "tps": 13856, "wall": 72028.1} {"step": 15229, "train_loss": 3.3234052658081055, "lr": 0.00023013879197686938, "tps": 13856, "wall": 72033.4} {"step": 15230, "train_loss": 3.300001859664917, "lr": 0.00023011966433508717, "tps": 13856, "wall": 72038.6} {"step": 15231, "train_loss": 3.3584835529327393, "lr": 0.00023010053657866885, "tps": 13856, "wall": 72043.9} {"step": 15232, "train_loss": 3.421687602996826, "lr": 0.00023008140870783118, "tps": 13855, "wall": 72049.1} {"step": 15233, "train_loss": 3.3517842292785645, "lr": 0.0002300622807227907, "tps": 13855, "wall": 72054.4} {"step": 15234, "train_loss": 3.443202495574951, "lr": 0.00023004315262376416, "tps": 13855, "wall": 72059.7} {"step": 15235, "train_loss": 3.3835086822509766, "lr": 0.0002300240244109683, "tps": 13855, "wall": 72065.0} {"step": 15236, "train_loss": 3.4876184463500977, "lr": 0.0002300048960846197, "tps": 13855, "wall": 72070.3} {"step": 15237, "train_loss": 3.4289467334747314, "lr": 0.00022998576764493507, "tps": 13855, "wall": 72075.5} {"step": 15238, "train_loss": 3.3983259201049805, "lr": 0.00022996663909213117, "tps": 13855, "wall": 72080.8} {"step": 15239, "train_loss": 3.402482271194458, "lr": 0.00022994751042642464, "tps": 13855, "wall": 72086.0} {"step": 15240, "train_loss": 3.332458257675171, "lr": 0.00022992838164803217, "tps": 13855, "wall": 72091.3} {"step": 15241, "train_loss": 3.418715238571167, "lr": 0.0002299092527571704, "tps": 13855, "wall": 72096.5} {"step": 15242, "train_loss": 3.3365821838378906, "lr": 0.0002298901237540562, "tps": 13854, "wall": 72101.8} {"step": 15243, "train_loss": 3.4487388134002686, "lr": 0.00022987099463890606, "tps": 13854, "wall": 72107.1} {"step": 15244, "train_loss": 3.376600980758667, "lr": 0.00022985186541193674, "tps": 13854, "wall": 72112.4} {"step": 15245, "train_loss": 3.377556800842285, "lr": 0.000229832736073365, "tps": 13854, "wall": 72117.8} {"step": 15246, "train_loss": 3.3702735900878906, "lr": 0.00022981360662340748, "tps": 13854, "wall": 72123.2} {"step": 15247, "train_loss": 3.497098684310913, "lr": 0.00022979447706228086, "tps": 13854, "wall": 72128.5} {"step": 15248, "train_loss": 3.2850022315979004, "lr": 0.00022977534739020193, "tps": 13854, "wall": 72133.8} {"step": 15249, "train_loss": 3.2817835807800293, "lr": 0.00022975621760738734, "tps": 13854, "wall": 72139.1} {"step": 15250, "train_loss": 3.47822642326355, "lr": 0.00022973708771405375, "tps": 13854, "wall": 72144.4} {"step": 15251, "train_loss": 3.3685154914855957, "lr": 0.0002297179577104179, "tps": 13853, "wall": 72149.6} {"step": 15252, "train_loss": 3.4215431213378906, "lr": 0.00022969882759669652, "tps": 13853, "wall": 72154.9} {"step": 15253, "train_loss": 3.2736735343933105, "lr": 0.0002296796973731063, "tps": 13853, "wall": 72160.1} {"step": 15254, "train_loss": 3.375432014465332, "lr": 0.00022966056703986395, "tps": 13853, "wall": 72165.3} {"step": 15255, "train_loss": 3.344747543334961, "lr": 0.00022964143659718613, "tps": 13853, "wall": 72170.6} {"step": 15256, "train_loss": 3.421863079071045, "lr": 0.00022962230604528966, "tps": 13853, "wall": 72176.0} {"step": 15257, "train_loss": 3.347975492477417, "lr": 0.0002296031753843911, "tps": 13853, "wall": 72181.5} {"step": 15258, "train_loss": 3.3374757766723633, "lr": 0.0002295840446147073, "tps": 13853, "wall": 72185.9} {"step": 15259, "train_loss": 3.413158893585205, "lr": 0.00022956491373645496, "tps": 13853, "wall": 72191.9} {"step": 15260, "train_loss": 3.2772738933563232, "lr": 0.00022954578274985075, "tps": 13852, "wall": 72197.5} {"step": 15261, "train_loss": 3.3539884090423584, "lr": 0.00022952665165511133, "tps": 13852, "wall": 72202.9} {"step": 15001, "train_loss": 3.3675849437713623, "lr": 0.00023449646809915376, "tps": 200096899, "wall": 4.9} {"step": 15002, "train_loss": 3.3552727699279785, "lr": 0.00023447737224818052, "tps": 107280863, "wall": 9.2} {"step": 15003, "train_loss": 3.3553473949432373, "lr": 0.00023445827623320685, "tps": 71720941, "wall": 13.7} {"step": 15004, "train_loss": 3.4603543281555176, "lr": 0.00023443918005444908, "tps": 53964785, "wall": 18.2} {"step": 15005, "train_loss": 3.31911563873291, "lr": 0.0002344200837121235, "tps": 43135794, "wall": 22.8} {"step": 15006, "train_loss": 3.348647117614746, "lr": 0.00023440098720644632, "tps": 35758279, "wall": 27.5} {"step": 15007, "train_loss": 3.343111515045166, "lr": 0.0002343818905376341, "tps": 30478991, "wall": 32.3} {"step": 15008, "train_loss": 3.4472413063049316, "lr": 0.000234362793705903, "tps": 26599861, "wall": 37.0} {"step": 15009, "train_loss": 3.4315896034240723, "lr": 0.00023434369671146942, "tps": 23595532, "wall": 41.7} {"step": 15010, "train_loss": 3.428272247314453, "lr": 0.00023432459955454964, "tps": 21162656, "wall": 46.5} {"step": 15011, "train_loss": 3.3374104499816895, "lr": 0.00023430550223536004, "tps": 19199201, "wall": 51.2} {"step": 15012, "train_loss": 3.4275898933410645, "lr": 0.00023428640475411694, "tps": 17555228, "wall": 56.0} {"step": 15013, "train_loss": 3.305713653564453, "lr": 0.00023426730711103666, "tps": 16161636, "wall": 60.9} {"step": 15014, "train_loss": 3.3364415168762207, "lr": 0.00023424820930633558, "tps": 14966189, "wall": 65.7} {"step": 15015, "train_loss": 3.4940459728240967, "lr": 0.00023422911134023, "tps": 13923727, "wall": 70.7} {"step": 15016, "train_loss": 3.4102649688720703, "lr": 0.00023421001321293622, "tps": 12983430, "wall": 75.8} {"step": 15017, "train_loss": 3.3035335540771484, "lr": 0.00023419091492467073, "tps": 12148938, "wall": 81.0} {"step": 15018, "train_loss": 3.4505414962768555, "lr": 0.0002341718164756497, "tps": 11401860, "wall": 86.3} {"step": 15019, "train_loss": 3.426044464111328, "lr": 0.0002341527178660896, "tps": 10732675, "wall": 91.7} {"step": 15020, "train_loss": 3.4021172523498535, "lr": 0.0002341336190962068, "tps": 10142842, "wall": 97.1} {"step": 15021, "train_loss": 3.462549924850464, "lr": 0.00023411452016621756, "tps": 9618107, "wall": 102.4} {"step": 15022, "train_loss": 3.4633092880249023, "lr": 0.0002340954210763383, "tps": 9140950, "wall": 107.7} {"step": 15023, "train_loss": 3.3776400089263916, "lr": 0.00023407632182678527, "tps": 8721564, "wall": 112.9} {"step": 15024, "train_loss": 3.3128459453582764, "lr": 0.00023405722241777498, "tps": 8340211, "wall": 118.1} {"step": 15025, "train_loss": 3.362015724182129, "lr": 0.00023403812284952368, "tps": 7987403, "wall": 123.3} {"step": 15026, "train_loss": 3.2636842727661133, "lr": 0.00023401902312224774, "tps": 7661931, "wall": 128.5} {"step": 15027, "train_loss": 3.3610024452209473, "lr": 0.00023399992323616363, "tps": 7360245, "wall": 133.8} {"step": 15028, "train_loss": 3.4675588607788086, "lr": 0.00023398082319148756, "tps": 7081183, "wall": 139.1} {"step": 15029, "train_loss": 3.3729910850524902, "lr": 0.00023396172298843597, "tps": 6823568, "wall": 144.4} {"step": 15030, "train_loss": 3.4209043979644775, "lr": 0.0002339426226272253, "tps": 6581788, "wall": 149.7} {"step": 15031, "train_loss": 3.350155830383301, "lr": 0.00023392352210807179, "tps": 6355521, "wall": 155.0} {"step": 15032, "train_loss": 3.4135751724243164, "lr": 0.00023390442143119184, "tps": 6144156, "wall": 160.3} {"step": 15033, "train_loss": 3.4140946865081787, "lr": 0.00023388532059680185, "tps": 5940961, "wall": 165.8} {"step": 15034, "train_loss": 3.2375986576080322, "lr": 0.00023386621960511832, "tps": 5748571, "wall": 171.4} {"step": 15035, "train_loss": 3.437398910522461, "lr": 0.00023384711845635735, "tps": 5571882, "wall": 176.9} {"step": 15036, "train_loss": 3.380068302154541, "lr": 0.00023382801715073556, "tps": 5399659, "wall": 182.5} {"step": 15037, "train_loss": 3.444274425506592, "lr": 0.00023380891568846926, "tps": 5230036, "wall": 188.4} {"step": 15038, "train_loss": 3.3624014854431152, "lr": 0.00023378981406977473, "tps": 5080717, "wall": 194.0} {"step": 15039, "train_loss": 3.3268818855285645, "lr": 0.00023377071229486847, "tps": 4937262, "wall": 199.6} {"step": 15040, "train_loss": 3.3552374839782715, "lr": 0.00023375161036396684, "tps": 4803030, "wall": 205.2} {"step": 15041, "train_loss": 3.332770586013794, "lr": 0.00023373250827728629, "tps": 4680302, "wall": 210.6} {"step": 15042, "train_loss": 3.4261929988861084, "lr": 0.00023371340603504313, "tps": 4566968, "wall": 215.9} {"step": 15043, "train_loss": 3.2673020362854004, "lr": 0.0002336943036374537, "tps": 4460746, "wall": 221.0} {"step": 15044, "train_loss": 3.4447073936462402, "lr": 0.00023367520108473445, "tps": 4357927, "wall": 226.3} {"step": 15045, "train_loss": 3.2891812324523926, "lr": 0.00023365609837710185, "tps": 4261058, "wall": 231.4} {"step": 15046, "train_loss": 3.4625439643859863, "lr": 0.0002336369955147722, "tps": 4168614, "wall": 236.6} {"step": 15047, "train_loss": 3.2428131103515625, "lr": 0.0002336178924979619, "tps": 4080990, "wall": 241.7} {"step": 15048, "train_loss": 3.4202632904052734, "lr": 0.00023359878932688744, "tps": 3997927, "wall": 246.7} {"step": 15049, "train_loss": 3.471238851547241, "lr": 0.00023357968600176509, "tps": 3918393, "wall": 251.7} {"step": 15050, "train_loss": 3.3830173015594482, "lr": 0.00023356058252281135, "tps": 3840858, "wall": 256.8} {"step": 15051, "train_loss": 3.300666093826294, "lr": 0.00023354147889024263, "tps": 3768790, "wall": 261.7} {"step": 15052, "train_loss": 3.390669345855713, "lr": 0.00023352237510427523, "tps": 3701001, "wall": 266.6} {"step": 15053, "train_loss": 3.4351792335510254, "lr": 0.0002335032711651257, "tps": 3631719, "wall": 271.7} {"step": 15054, "train_loss": 3.375786781311035, "lr": 0.00023348416707301035, "tps": 3565391, "wall": 276.7} {"step": 15055, "train_loss": 3.349392890930176, "lr": 0.00023346506282814563, "tps": 3502184, "wall": 281.7} {"step": 15056, "train_loss": 3.301877498626709, "lr": 0.00023344595843074797, "tps": 3441203, "wall": 286.8} {"step": 15057, "train_loss": 3.416653633117676, "lr": 0.0002334268538810337, "tps": 3381717, "wall": 291.8} {"step": 15058, "train_loss": 3.396346092224121, "lr": 0.00023340774917921943, "tps": 3323819, "wall": 296.9} {"step": 15059, "train_loss": 3.375877857208252, "lr": 0.00023338864432552133, "tps": 3270288, "wall": 301.8} {"step": 15060, "train_loss": 3.506164312362671, "lr": 0.00023336953932015595, "tps": 3219319, "wall": 306.6} {"step": 15061, "train_loss": 3.403367042541504, "lr": 0.00023335043416333978, "tps": 3169838, "wall": 311.4} {"step": 15062, "train_loss": 3.3750967979431152, "lr": 0.00023333132885528914, "tps": 3121800, "wall": 316.2} {"step": 15063, "train_loss": 3.4462907314300537, "lr": 0.00023331222339622047, "tps": 3075188, "wall": 321.0} {"step": 15064, "train_loss": 3.358680009841919, "lr": 0.0002332931177863502, "tps": 3029856, "wall": 325.9} {"step": 15065, "train_loss": 3.3676185607910156, "lr": 0.00023327401202589485, "tps": 2985890, "wall": 330.7} {"step": 15066, "train_loss": 3.4475326538085938, "lr": 0.0002332549061150707, "tps": 2943433, "wall": 335.5} {"step": 15067, "train_loss": 3.4878177642822266, "lr": 0.00023323580005409428, "tps": 2902030, "wall": 340.3} {"step": 15068, "train_loss": 3.33498215675354, "lr": 0.00023321669384318198, "tps": 2861546, "wall": 345.1} {"step": 15069, "train_loss": 3.300154685974121, "lr": 0.00023319758748255027, "tps": 2821696, "wall": 350.0} {"step": 15070, "train_loss": 3.482825517654419, "lr": 0.00023317848097241558, "tps": 2783170, "wall": 354.9} {"step": 15071, "train_loss": 3.385712146759033, "lr": 0.00023315937431299432, "tps": 2744899, "wall": 359.9} {"step": 15072, "train_loss": 3.349860668182373, "lr": 0.00023314026750450299, "tps": 2706499, "wall": 365.0} {"step": 15073, "train_loss": 3.427929401397705, "lr": 0.00023312116054715799, "tps": 2669506, "wall": 370.1} {"step": 15074, "train_loss": 3.332988739013672, "lr": 0.00023310205344117578, "tps": 2633375, "wall": 375.2} {"step": 15075, "train_loss": 3.3960442543029785, "lr": 0.00023308294618677283, "tps": 2598162, "wall": 380.3} {"step": 15076, "train_loss": 3.4167075157165527, "lr": 0.00023306383878416548, "tps": 2563367, "wall": 385.5} {"step": 15077, "train_loss": 3.3994698524475098, "lr": 0.00023304473123357026, "tps": 2528716, "wall": 390.8} {"step": 15078, "train_loss": 3.410067081451416, "lr": 0.0002330256235352037, "tps": 2494956, "wall": 396.1} {"step": 15079, "train_loss": 3.514540672302246, "lr": 0.00023300651568928214, "tps": 2462089, "wall": 401.4} {"step": 15080, "train_loss": 3.3366708755493164, "lr": 0.00023298740769602203, "tps": 2429957, "wall": 406.7} {"step": 15081, "train_loss": 3.401669979095459, "lr": 0.00023296829955563982, "tps": 2399090, "wall": 412.0} {"step": 15082, "train_loss": 3.3516273498535156, "lr": 0.00023294919126835219, "tps": 2370633, "wall": 417.0} {"step": 15083, "train_loss": 3.347747325897217, "lr": 0.00023293008283437522, "tps": 2342990, "wall": 421.9} {"step": 15084, "train_loss": 3.3952534198760986, "lr": 0.00023291097425392568, "tps": 2315808, "wall": 426.9} {"step": 15085, "train_loss": 3.4421193599700928, "lr": 0.0002328918655272199, "tps": 2289511, "wall": 431.8} {"step": 15086, "train_loss": 3.388914108276367, "lr": 0.0002328727566544744, "tps": 2263678, "wall": 436.8} {"step": 15087, "train_loss": 3.3815057277679443, "lr": 0.00023285364763590556, "tps": 2238525, "wall": 441.7} {"step": 15088, "train_loss": 3.3932087421417236, "lr": 0.00023283453847172992, "tps": 2213941, "wall": 446.7} {"step": 15089, "train_loss": 3.3948163986206055, "lr": 0.000232815429162164, "tps": 2189902, "wall": 451.6} {"step": 15090, "train_loss": 3.358440399169922, "lr": 0.00023279631970742415, "tps": 2166420, "wall": 456.5} {"step": 15091, "train_loss": 3.3147785663604736, "lr": 0.00023277721010772688, "tps": 2143297, "wall": 461.5} {"step": 15092, "train_loss": 3.404323101043701, "lr": 0.00023275810036328868, "tps": 2120230, "wall": 466.5} {"step": 15093, "train_loss": 3.3967199325561523, "lr": 0.0002327389904743261, "tps": 2098055, "wall": 471.5} {"step": 15094, "train_loss": 3.429917812347412, "lr": 0.00023271988044105548, "tps": 2076399, "wall": 476.4} {"step": 15095, "train_loss": 3.323721408843994, "lr": 0.00023270077026369342, "tps": 2054496, "wall": 481.5} {"step": 15096, "train_loss": 3.3781375885009766, "lr": 0.0002326816599424563, "tps": 2033866, "wall": 486.5} {"step": 15097, "train_loss": 3.362761974334717, "lr": 0.00023266254947756064, "tps": 2013506, "wall": 491.4} {"step": 15098, "train_loss": 3.4261441230773926, "lr": 0.00023264343886922296, "tps": 1993662, "wall": 496.3} {"step": 15099, "train_loss": 3.4601166248321533, "lr": 0.00023262432811765974, "tps": 1974255, "wall": 501.2} {"step": 15100, "train_loss": 3.3952879905700684, "lr": 0.00023260521722308743, "tps": 1955299, "wall": 506.1} {"step": 15101, "train_loss": 3.288877248764038, "lr": 0.0002325861061857225, "tps": 1936629, "wall": 511.1} {"step": 15102, "train_loss": 3.3386337757110596, "lr": 0.0002325669950057815, "tps": 1918367, "wall": 516.0} {"step": 15103, "train_loss": 3.30387544631958, "lr": 0.00023254788368348096, "tps": 1900396, "wall": 520.9} {"step": 15104, "train_loss": 3.310441017150879, "lr": 0.00023252877221903724, "tps": 1882448, "wall": 525.9} {"step": 15105, "train_loss": 3.3438172340393066, "lr": 0.00023250966061266697, "tps": 1865306, "wall": 530.7} {"step": 15106, "train_loss": 3.4280498027801514, "lr": 0.00023249054886458653, "tps": 1848291, "wall": 535.7} {"step": 15107, "train_loss": 3.313934326171875, "lr": 0.0002324714369750125, "tps": 1831740, "wall": 540.5} {"step": 15108, "train_loss": 3.454746961593628, "lr": 0.00023245232494416133, "tps": 1815388, "wall": 545.4} {"step": 15109, "train_loss": 3.353860378265381, "lr": 0.00023243321277224962, "tps": 1799366, "wall": 550.3} {"step": 15110, "train_loss": 3.391284942626953, "lr": 0.0002324141004594938, "tps": 1783582, "wall": 555.2} {"step": 15111, "train_loss": 3.3383872509002686, "lr": 0.0002323949880061103, "tps": 1768089, "wall": 560.1} {"step": 15112, "train_loss": 3.38150954246521, "lr": 0.00023237587541231577, "tps": 1752944, "wall": 565.0} {"step": 15113, "train_loss": 3.387237071990967, "lr": 0.0002323567626783266, "tps": 1736847, "wall": 570.3} {"step": 15114, "train_loss": 3.3607401847839355, "lr": 0.00023233764980435938, "tps": 1721592, "wall": 575.4} {"step": 15115, "train_loss": 3.3645505905151367, "lr": 0.0002323185367906306, "tps": 1706700, "wall": 580.4} {"step": 15116, "train_loss": 3.382455587387085, "lr": 0.0002322994236373568, "tps": 1691921, "wall": 585.6} {"step": 15117, "train_loss": 3.3904473781585693, "lr": 0.00023228031034475444, "tps": 1677506, "wall": 590.6} {"step": 15118, "train_loss": 3.3114235401153564, "lr": 0.00023226119691303998, "tps": 1662677, "wall": 595.9} {"step": 15119, "train_loss": 3.4443283081054688, "lr": 0.00023224208334243014, "tps": 1648286, "wall": 601.2} {"step": 15120, "train_loss": 3.46244478225708, "lr": 0.00023222296963314122, "tps": 1634657, "wall": 606.2} {"step": 15121, "train_loss": 3.3669281005859375, "lr": 0.00023220385578538993, "tps": 1621693, "wall": 611.1} {"step": 15122, "train_loss": 3.4234347343444824, "lr": 0.00023218474179939272, "tps": 1608871, "wall": 616.0} {"step": 15123, "train_loss": 3.377974510192871, "lr": 0.00023216562767536597, "tps": 1596342, "wall": 620.9} {"step": 15124, "train_loss": 3.3655238151550293, "lr": 0.00023214651341352637, "tps": 1583873, "wall": 625.8} {"step": 15125, "train_loss": 3.381173610687256, "lr": 0.00023212739901409045, "tps": 1571731, "wall": 630.7} {"step": 15126, "train_loss": 3.320424795150757, "lr": 0.00023210828447727474, "tps": 1559756, "wall": 635.6} {"step": 15127, "train_loss": 3.434915781021118, "lr": 0.00023208916980329566, "tps": 1547982, "wall": 640.5} {"step": 15128, "train_loss": 3.389761447906494, "lr": 0.00023207005499236984, "tps": 1536213, "wall": 645.4} {"step": 15129, "train_loss": 3.3576440811157227, "lr": 0.00023205094004471373, "tps": 1524797, "wall": 650.3} {"step": 15130, "train_loss": 3.3962478637695312, "lr": 0.000232031824960544, "tps": 1513475, "wall": 655.2} {"step": 15131, "train_loss": 3.3720285892486572, "lr": 0.00023201270974007704, "tps": 1502434, "wall": 660.1} {"step": 15132, "train_loss": 3.483656883239746, "lr": 0.00023199359438352946, "tps": 1491529, "wall": 664.9} {"step": 15133, "train_loss": 3.2598352432250977, "lr": 0.00023197447889111784, "tps": 1480755, "wall": 669.8} {"step": 15134, "train_loss": 3.271158218383789, "lr": 0.00023195536326305863, "tps": 1470141, "wall": 674.7} {"step": 15135, "train_loss": 3.2691128253936768, "lr": 0.00023193624749956842, "tps": 1459687, "wall": 679.6} {"step": 15136, "train_loss": 3.5016698837280273, "lr": 0.0002319171316008638, "tps": 1449428, "wall": 684.4} {"step": 15137, "train_loss": 3.417754650115967, "lr": 0.0002318980155671612, "tps": 1439290, "wall": 689.3} {"step": 15138, "train_loss": 3.299356698989868, "lr": 0.00023187889939867726, "tps": 1429293, "wall": 694.2} {"step": 15139, "train_loss": 3.5016345977783203, "lr": 0.00023185978309562852, "tps": 1419430, "wall": 699.0} {"step": 15140, "train_loss": 3.2791106700897217, "lr": 0.00023184066665823152, "tps": 1409718, "wall": 703.9} {"step": 15141, "train_loss": 3.406789541244507, "lr": 0.00023182155008670278, "tps": 1400047, "wall": 708.8} {"step": 15142, "train_loss": 3.367314100265503, "lr": 0.00023180243338125886, "tps": 1390593, "wall": 713.7} {"step": 15143, "train_loss": 3.478074550628662, "lr": 0.0002317833165421164, "tps": 1381271, "wall": 718.5} {"step": 15144, "train_loss": 3.5199942588806152, "lr": 0.00023176419956949187, "tps": 1372069, "wall": 723.4} {"step": 15145, "train_loss": 3.3984365463256836, "lr": 0.00023174508246360186, "tps": 1362977, "wall": 728.3} {"step": 15146, "train_loss": 3.2967963218688965, "lr": 0.00023172596522466287, "tps": 1354017, "wall": 733.1} {"step": 15147, "train_loss": 3.3512425422668457, "lr": 0.0002317068478528916, "tps": 1345147, "wall": 738.0} {"step": 15148, "train_loss": 3.3868799209594727, "lr": 0.00023168773034850447, "tps": 1336444, "wall": 742.9} {"step": 15149, "train_loss": 3.3882670402526855, "lr": 0.00023166861271171806, "tps": 1327808, "wall": 747.8} {"step": 15150, "train_loss": 3.241823673248291, "lr": 0.00023164949494274906, "tps": 1319330, "wall": 752.6} {"step": 15151, "train_loss": 3.3493196964263916, "lr": 0.00023163037704181392, "tps": 1310957, "wall": 757.5} {"step": 15152, "train_loss": 3.3942644596099854, "lr": 0.0002316112590091292, "tps": 1302666, "wall": 762.3} {"step": 15153, "train_loss": 3.4197909832000732, "lr": 0.00023159214084491155, "tps": 1294406, "wall": 767.2} {"step": 15154, "train_loss": 3.375269889831543, "lr": 0.0002315730225493775, "tps": 1286344, "wall": 772.1} {"step": 15155, "train_loss": 3.3141443729400635, "lr": 0.00023155390412274362, "tps": 1278414, "wall": 776.9} {"step": 15156, "train_loss": 3.3766934871673584, "lr": 0.00023153478556522643, "tps": 1270532, "wall": 781.8} {"step": 15157, "train_loss": 3.3438706398010254, "lr": 0.00023151566687704266, "tps": 1262778, "wall": 786.7} {"step": 15158, "train_loss": 3.4200806617736816, "lr": 0.00023149654805840872, "tps": 1255116, "wall": 791.5} {"step": 15159, "train_loss": 3.346554756164551, "lr": 0.00023147742910954126, "tps": 1247489, "wall": 796.4} {"step": 15160, "train_loss": 3.391231060028076, "lr": 0.00023145831003065697, "tps": 1240025, "wall": 801.3} {"step": 15161, "train_loss": 3.4963014125823975, "lr": 0.00023143919082197224, "tps": 1232591, "wall": 806.2} {"step": 15162, "train_loss": 3.3060669898986816, "lr": 0.00023142007148370373, "tps": 1225273, "wall": 811.0} {"step": 15163, "train_loss": 3.3935413360595703, "lr": 0.00023140095201606804, "tps": 1218054, "wall": 815.9} {"step": 15164, "train_loss": 3.3103761672973633, "lr": 0.0002313818324192818, "tps": 1210917, "wall": 820.7} {"step": 15165, "train_loss": 3.3575942516326904, "lr": 0.00023136271269356143, "tps": 1203699, "wall": 825.7} {"step": 15166, "train_loss": 3.524453639984131, "lr": 0.00023134359283912375, "tps": 1196742, "wall": 830.6} {"step": 15167, "train_loss": 3.2648308277130127, "lr": 0.00023132447285618518, "tps": 1189847, "wall": 835.4} {"step": 15168, "train_loss": 3.290846824645996, "lr": 0.00023130535274496237, "tps": 1183065, "wall": 840.3} {"step": 15169, "train_loss": 3.318739414215088, "lr": 0.00023128623250567195, "tps": 1176290, "wall": 845.2} {"step": 15170, "train_loss": 3.402500629425049, "lr": 0.00023126711213853046, "tps": 1169665, "wall": 850.0} {"step": 15171, "train_loss": 3.4132156372070312, "lr": 0.00023124799164375451, "tps": 1163076, "wall": 854.9} {"step": 15172, "train_loss": 3.440383195877075, "lr": 0.00023122887102156067, "tps": 1156565, "wall": 859.8} {"step": 15173, "train_loss": 3.2601404190063477, "lr": 0.0002312097502721656, "tps": 1150122, "wall": 864.6} {"step": 15174, "train_loss": 3.361626148223877, "lr": 0.0002311906293957859, "tps": 1143773, "wall": 869.5} {"step": 15175, "train_loss": 3.4914698600769043, "lr": 0.00023117150839263814, "tps": 1137482, "wall": 874.4} {"step": 15176, "train_loss": 3.3759937286376953, "lr": 0.00023115238726293885, "tps": 1131277, "wall": 879.2} {"step": 15177, "train_loss": 3.3822598457336426, "lr": 0.0002311332660069048, "tps": 1125155, "wall": 884.1} {"step": 15178, "train_loss": 3.352863311767578, "lr": 0.0002311141446247525, "tps": 1118961, "wall": 889.0} {"step": 15179, "train_loss": 3.3579463958740234, "lr": 0.00023109502311669853, "tps": 1112955, "wall": 893.9} {"step": 15180, "train_loss": 3.281524658203125, "lr": 0.0002310759014829596, "tps": 1107024, "wall": 898.7} {"step": 15181, "train_loss": 3.4477434158325195, "lr": 0.00023105677972375216, "tps": 1101142, "wall": 903.6} {"step": 15182, "train_loss": 3.3355302810668945, "lr": 0.00023103765783929298, "tps": 1095316, "wall": 908.4} {"step": 15183, "train_loss": 3.435917854309082, "lr": 0.00023101853582979863, "tps": 1089555, "wall": 913.3} {"step": 15184, "train_loss": 3.3745241165161133, "lr": 0.0002309994136954857, "tps": 1083833, "wall": 918.2} {"step": 15185, "train_loss": 3.402463436126709, "lr": 0.0002309802914365708, "tps": 1078191, "wall": 923.1} {"step": 15186, "train_loss": 3.4828267097473145, "lr": 0.00023096116905327055, "tps": 1072601, "wall": 927.9} {"step": 15187, "train_loss": 3.3986332416534424, "lr": 0.00023094204654580165, "tps": 1067078, "wall": 932.8} {"step": 15188, "train_loss": 3.437822103500366, "lr": 0.0002309229239143806, "tps": 1061620, "wall": 937.6} {"step": 15189, "train_loss": 3.3828065395355225, "lr": 0.0002309038011592241, "tps": 1056205, "wall": 942.5} {"step": 15190, "train_loss": 3.267902135848999, "lr": 0.00023088467828054877, "tps": 1050768, "wall": 947.5} {"step": 15191, "train_loss": 3.504542112350464, "lr": 0.0002308655552785712, "tps": 1045472, "wall": 952.3} {"step": 15192, "train_loss": 3.2964928150177, "lr": 0.00023084643215350793, "tps": 1040243, "wall": 957.2} {"step": 15193, "train_loss": 3.2573866844177246, "lr": 0.00023082730890557583, "tps": 1035047, "wall": 962.0} {"step": 15194, "train_loss": 3.3505642414093018, "lr": 0.00023080818553499133, "tps": 1029908, "wall": 966.9} {"step": 15195, "train_loss": 3.351884365081787, "lr": 0.00023078906204197113, "tps": 1024838, "wall": 971.7} {"step": 15196, "train_loss": 3.3953967094421387, "lr": 0.00023076993842673186, "tps": 1019796, "wall": 976.6} {"step": 15197, "train_loss": 3.2802767753601074, "lr": 0.0002307508146894901, "tps": 1014808, "wall": 981.5} {"step": 15198, "train_loss": 3.3600306510925293, "lr": 0.00023073169083046255, "tps": 1009856, "wall": 986.4} {"step": 15199, "train_loss": 3.4426450729370117, "lr": 0.00023071256684986584, "tps": 1004963, "wall": 991.2} {"step": 15200, "train_loss": 3.4167733192443848, "lr": 0.0002306934427479166, "tps": 1000124, "wall": 996.1} {"step": 15201, "train_loss": 3.435769557952881, "lr": 0.00023067431852483145, "tps": 995354, "wall": 1000.9} {"step": 15202, "train_loss": 3.399158000946045, "lr": 0.00023065519418082704, "tps": 990528, "wall": 1005.9} {"step": 15203, "train_loss": 3.3864426612854004, "lr": 0.00023063606971612002, "tps": 985836, "wall": 1010.7} {"step": 15204, "train_loss": 3.295793056488037, "lr": 0.00023061694513092706, "tps": 981192, "wall": 1015.6} {"step": 15205, "train_loss": 3.332763433456421, "lr": 0.00023059782042546476, "tps": 976569, "wall": 1020.5} {"step": 15206, "train_loss": 3.4019720554351807, "lr": 0.00023057869559994974, "tps": 972014, "wall": 1025.3} {"step": 15207, "train_loss": 3.348973274230957, "lr": 0.0002305595706545987, "tps": 967478, "wall": 1030.2} {"step": 15208, "train_loss": 3.2781317234039307, "lr": 0.0002305404455896283, "tps": 962985, "wall": 1035.0} {"step": 15209, "train_loss": 3.3876070976257324, "lr": 0.00023052132040525506, "tps": 958526, "wall": 1039.9} {"step": 15210, "train_loss": 3.2750697135925293, "lr": 0.0002305021951016958, "tps": 954130, "wall": 1044.8} {"step": 15211, "train_loss": 3.322183609008789, "lr": 0.0002304830696791672, "tps": 949762, "wall": 1049.7} {"step": 15212, "train_loss": 3.2892239093780518, "lr": 0.00023046394413788574, "tps": 945442, "wall": 1054.5} {"step": 15213, "train_loss": 3.3715484142303467, "lr": 0.0002304448184780681, "tps": 941116, "wall": 1059.4} {"step": 15214, "train_loss": 3.3425498008728027, "lr": 0.00023042569269993103, "tps": 936871, "wall": 1064.3} {"step": 15215, "train_loss": 3.4168264865875244, "lr": 0.00023040656680369117, "tps": 932590, "wall": 1069.3} {"step": 15216, "train_loss": 3.399604320526123, "lr": 0.00023038744078956517, "tps": 928419, "wall": 1074.1} {"step": 15217, "train_loss": 3.3376288414001465, "lr": 0.00023036831465776962, "tps": 924295, "wall": 1079.0} {"step": 15218, "train_loss": 3.337794303894043, "lr": 0.0002303491884085213, "tps": 920202, "wall": 1083.9} {"step": 15219, "train_loss": 3.338109254837036, "lr": 0.00023033006204203676, "tps": 916159, "wall": 1088.7} {"step": 15220, "train_loss": 3.4342000484466553, "lr": 0.00023031093555853275, "tps": 912141, "wall": 1093.6} {"step": 15221, "train_loss": 3.3710663318634033, "lr": 0.0002302918089582259, "tps": 908122, "wall": 1098.5} {"step": 15222, "train_loss": 3.437368631362915, "lr": 0.0002302726822413329, "tps": 904130, "wall": 1103.4} {"step": 15223, "train_loss": 3.3990590572357178, "lr": 0.0002302535554080704, "tps": 900244, "wall": 1108.3} {"step": 15224, "train_loss": 3.3927407264709473, "lr": 0.000230234428458655, "tps": 896356, "wall": 1113.2} {"step": 15225, "train_loss": 3.454123020172119, "lr": 0.00023021530139330355, "tps": 892505, "wall": 1118.0} {"step": 15226, "train_loss": 3.361663579940796, "lr": 0.00023019617421223253, "tps": 888683, "wall": 1122.9} {"step": 15227, "train_loss": 3.2551097869873047, "lr": 0.0002301770469156587, "tps": 884812, "wall": 1127.9} {"step": 15228, "train_loss": 3.419658899307251, "lr": 0.0002301579195037988, "tps": 881066, "wall": 1132.8} {"step": 15229, "train_loss": 3.4454755783081055, "lr": 0.00023013879197686938, "tps": 877353, "wall": 1137.6} {"step": 15230, "train_loss": 3.3074114322662354, "lr": 0.00023011966433508717, "tps": 873680, "wall": 1142.5} {"step": 15231, "train_loss": 3.334774971008301, "lr": 0.00023010053657866885, "tps": 870034, "wall": 1147.4} {"step": 15232, "train_loss": 3.3038864135742188, "lr": 0.00023008140870783118, "tps": 866415, "wall": 1152.2} {"step": 15233, "train_loss": 3.357062339782715, "lr": 0.0002300622807227907, "tps": 862821, "wall": 1157.1} {"step": 15234, "train_loss": 3.4670705795288086, "lr": 0.00023004315262376416, "tps": 859271, "wall": 1162.0} {"step": 15235, "train_loss": 3.3299431800842285, "lr": 0.0002300240244109683, "tps": 855740, "wall": 1166.8} {"step": 15236, "train_loss": 3.351321220397949, "lr": 0.0002300048960846197, "tps": 852230, "wall": 1171.7} {"step": 15237, "train_loss": 3.4246959686279297, "lr": 0.00022998576764493507, "tps": 848742, "wall": 1176.6} {"step": 15238, "train_loss": 3.4447755813598633, "lr": 0.00022996663909213117, "tps": 845308, "wall": 1181.5} {"step": 15239, "train_loss": 3.3082451820373535, "lr": 0.00022994751042642464, "tps": 841821, "wall": 1186.4} {"step": 15240, "train_loss": 3.4173147678375244, "lr": 0.00022992838164803217, "tps": 838450, "wall": 1191.3} {"step": 15241, "train_loss": 3.324155569076538, "lr": 0.0002299092527571704, "tps": 835090, "wall": 1196.2} {"step": 15242, "train_loss": 3.372413158416748, "lr": 0.0002298901237540562, "tps": 831771, "wall": 1201.0} {"step": 15243, "train_loss": 3.405625104904175, "lr": 0.00022987099463890606, "tps": 828465, "wall": 1205.9} {"step": 15244, "train_loss": 3.344395637512207, "lr": 0.00022985186541193674, "tps": 825190, "wall": 1210.7} {"step": 15245, "train_loss": 3.4233458042144775, "lr": 0.000229832736073365, "tps": 821926, "wall": 1215.6} {"step": 15246, "train_loss": 3.3734254837036133, "lr": 0.00022981360662340748, "tps": 818707, "wall": 1220.5} {"step": 15247, "train_loss": 3.4134702682495117, "lr": 0.00022979447706228086, "tps": 815506, "wall": 1225.4} {"step": 15248, "train_loss": 3.3341219425201416, "lr": 0.00022977534739020193, "tps": 812334, "wall": 1230.2} {"step": 15249, "train_loss": 3.434148073196411, "lr": 0.00022975621760738734, "tps": 809181, "wall": 1235.1} {"step": 15250, "train_loss": 3.416116237640381, "lr": 0.00022973708771405375, "tps": 806053, "wall": 1240.0} {"step": 15251, "train_loss": 3.317079544067383, "lr": 0.0002297179577104179, "tps": 802953, "wall": 1244.8} {"step": 15252, "train_loss": 3.2784957885742188, "lr": 0.00022969882759669652, "tps": 799842, "wall": 1249.8} {"step": 15253, "train_loss": 3.350245952606201, "lr": 0.0002296796973731063, "tps": 796796, "wall": 1254.6} {"step": 15254, "train_loss": 3.432353973388672, "lr": 0.00022966056703986395, "tps": 793757, "wall": 1259.5} {"step": 15255, "train_loss": 3.422307252883911, "lr": 0.00022964143659718613, "tps": 790742, "wall": 1264.4} {"step": 15256, "train_loss": 3.431699514389038, "lr": 0.00022962230604528966, "tps": 787761, "wall": 1269.3} {"step": 15257, "train_loss": 3.314810037612915, "lr": 0.0002296031753843911, "tps": 784775, "wall": 1274.2} {"step": 15258, "train_loss": 3.3967549800872803, "lr": 0.0002295840446147073, "tps": 781841, "wall": 1279.0} {"step": 15259, "train_loss": 3.4446563720703125, "lr": 0.00022956491373645496, "tps": 778929, "wall": 1283.9} {"step": 15260, "train_loss": 3.2233808040618896, "lr": 0.00022954578274985075, "tps": 776041, "wall": 1288.8} {"step": 15261, "train_loss": 3.3277082443237305, "lr": 0.00022952665165511133, "tps": 773165, "wall": 1293.7} {"step": 15262, "train_loss": 3.4113941192626953, "lr": 0.0002295075204524536, "tps": 770315, "wall": 1298.5} {"step": 15263, "train_loss": 3.483121395111084, "lr": 0.00022948838914209403, "tps": 767494, "wall": 1303.4} {"step": 15264, "train_loss": 3.389702796936035, "lr": 0.00022946925772424952, "tps": 764638, "wall": 1308.3} {"step": 15265, "train_loss": 3.2324507236480713, "lr": 0.00022945012619913683, "tps": 761854, "wall": 1313.2} {"step": 15266, "train_loss": 3.291679859161377, "lr": 0.00022943099456697246, "tps": 759087, "wall": 1318.1} {"step": 15267, "train_loss": 3.351043701171875, "lr": 0.00022941186282797332, "tps": 756341, "wall": 1323.0} {"step": 15268, "train_loss": 3.428417205810547, "lr": 0.0002293927309823561, "tps": 753622, "wall": 1327.8} {"step": 15269, "train_loss": 3.3453125953674316, "lr": 0.00022937359903033762, "tps": 750912, "wall": 1332.7} {"step": 15270, "train_loss": 3.3735175132751465, "lr": 0.0002293544669721344, "tps": 748222, "wall": 1337.6} {"step": 15271, "train_loss": 3.349074602127075, "lr": 0.00022933533480796325, "tps": 745559, "wall": 1342.4} {"step": 15272, "train_loss": 3.397000312805176, "lr": 0.00022931620253804097, "tps": 742906, "wall": 1347.3} {"step": 15273, "train_loss": 3.332982063293457, "lr": 0.00022929707016258424, "tps": 740274, "wall": 1352.2} {"step": 15274, "train_loss": 3.4786670207977295, "lr": 0.00022927793768180976, "tps": 737664, "wall": 1357.1} {"step": 15275, "train_loss": 3.3441669940948486, "lr": 0.00022925880509593434, "tps": 735069, "wall": 1361.9} {"step": 15276, "train_loss": 3.334480047225952, "lr": 0.00022923967240517462, "tps": 732470, "wall": 1366.9} {"step": 15277, "train_loss": 3.3839282989501953, "lr": 0.00022922053960974746, "tps": 729912, "wall": 1371.8} {"step": 15278, "train_loss": 3.3951187133789062, "lr": 0.00022920140670986948, "tps": 727367, "wall": 1376.6} {"step": 15279, "train_loss": 3.391190767288208, "lr": 0.00022918227370575752, "tps": 724858, "wall": 1381.5} {"step": 15280, "train_loss": 3.4564990997314453, "lr": 0.0002291631405976282, "tps": 722362, "wall": 1386.4} {"step": 15281, "train_loss": 3.3424623012542725, "lr": 0.0002291440073856984, "tps": 719880, "wall": 1391.2} {"step": 15282, "train_loss": 3.3748600482940674, "lr": 0.00022912487407018476, "tps": 717414, "wall": 1396.1} {"step": 15283, "train_loss": 3.3209705352783203, "lr": 0.00022910574065130402, "tps": 714963, "wall": 1401.0} {"step": 15284, "train_loss": 3.3956637382507324, "lr": 0.00022908660712927294, "tps": 712519, "wall": 1405.9} {"step": 15285, "train_loss": 3.382084369659424, "lr": 0.00022906747350430836, "tps": 710111, "wall": 1410.7} {"step": 15286, "train_loss": 3.404086112976074, "lr": 0.00022904833977662695, "tps": 707707, "wall": 1415.6} {"step": 15287, "train_loss": 3.3575973510742188, "lr": 0.0002290292059464454, "tps": 705328, "wall": 1420.5} {"step": 15288, "train_loss": 3.3734822273254395, "lr": 0.0002290100720139805, "tps": 702949, "wall": 1425.4} {"step": 15289, "train_loss": 3.3034539222717285, "lr": 0.0002289909379794491, "tps": 700596, "wall": 1430.3} {"step": 15290, "train_loss": 3.3814587593078613, "lr": 0.0002289718038430678, "tps": 698260, "wall": 1435.2} {"step": 15291, "train_loss": 3.4864554405212402, "lr": 0.0002289526696050534, "tps": 695924, "wall": 1440.1} {"step": 15292, "train_loss": 3.357517719268799, "lr": 0.00022893353526562277, "tps": 693631, "wall": 1444.9} {"step": 15293, "train_loss": 3.386347770690918, "lr": 0.0002289144008249925, "tps": 691339, "wall": 1449.8} {"step": 15294, "train_loss": 3.4084136486053467, "lr": 0.0002288952662833794, "tps": 689055, "wall": 1454.7} {"step": 15295, "train_loss": 3.358686685562134, "lr": 0.00022887613164100033, "tps": 686806, "wall": 1459.6} {"step": 15296, "train_loss": 3.384178638458252, "lr": 0.00022885699689807187, "tps": 684563, "wall": 1464.4} {"step": 15297, "train_loss": 3.392015218734741, "lr": 0.00022883786205481094, "tps": 682336, "wall": 1469.3} {"step": 15298, "train_loss": 3.453787088394165, "lr": 0.0002288187271114342, "tps": 680132, "wall": 1474.2} {"step": 15299, "train_loss": 3.450167179107666, "lr": 0.0002287995920681584, "tps": 677933, "wall": 1479.1} {"step": 15300, "train_loss": 3.272984027862549, "lr": 0.00022878045692520044, "tps": 675744, "wall": 1483.9} {"step": 15301, "train_loss": 3.4220163822174072, "lr": 0.00022876132168277692, "tps": 673542, "wall": 1488.9} {"step": 15302, "train_loss": 3.3928637504577637, "lr": 0.0002287421863411047, "tps": 671384, "wall": 1493.8} {"step": 15303, "train_loss": 3.348820209503174, "lr": 0.0002287230509004005, "tps": 669239, "wall": 1498.7} {"step": 15304, "train_loss": 3.345686435699463, "lr": 0.00022870391536088108, "tps": 667118, "wall": 1503.5} {"step": 15305, "train_loss": 3.3230931758880615, "lr": 0.00022868477972276327, "tps": 664959, "wall": 1508.5} {"step": 15306, "train_loss": 3.3346383571624756, "lr": 0.00022866564398626378, "tps": 662864, "wall": 1513.4} {"step": 15307, "train_loss": 3.324601173400879, "lr": 0.00022864650815159946, "tps": 660776, "wall": 1518.3} {"step": 15308, "train_loss": 3.3409066200256348, "lr": 0.00022862737221898702, "tps": 658703, "wall": 1523.1} {"step": 15309, "train_loss": 3.3550195693969727, "lr": 0.0002286082361886432, "tps": 656644, "wall": 1528.0} {"step": 15310, "train_loss": 3.2559518814086914, "lr": 0.00022858910006078484, "tps": 654592, "wall": 1532.9} {"step": 15311, "train_loss": 3.377290725708008, "lr": 0.00022856996383562869, "tps": 652560, "wall": 1537.8} {"step": 15312, "train_loss": 3.407198190689087, "lr": 0.0002285508275133915, "tps": 650542, "wall": 1542.6} {"step": 15313, "train_loss": 3.4287109375, "lr": 0.0002285316910942901, "tps": 648498, "wall": 1547.6} {"step": 15314, "train_loss": 3.449124813079834, "lr": 0.00022851255457854124, "tps": 646509, "wall": 1552.5} {"step": 15315, "train_loss": 3.381415843963623, "lr": 0.0002284934179663617, "tps": 644532, "wall": 1557.3} {"step": 15316, "train_loss": 3.3082408905029297, "lr": 0.0002284742812579682, "tps": 642566, "wall": 1562.2} {"step": 15317, "train_loss": 3.382455348968506, "lr": 0.00022845514445357773, "tps": 640611, "wall": 1567.1} {"step": 15318, "train_loss": 3.322052478790283, "lr": 0.00022843600755340679, "tps": 638670, "wall": 1571.9} {"step": 15319, "train_loss": 3.370959997177124, "lr": 0.00022841687055767237, "tps": 636728, "wall": 1576.8} {"step": 15320, "train_loss": 3.2936105728149414, "lr": 0.00022839773346659118, "tps": 634812, "wall": 1581.7} {"step": 15321, "train_loss": 3.4513087272644043, "lr": 0.00022837859628038, "tps": 632906, "wall": 1586.6} {"step": 15322, "train_loss": 3.383134365081787, "lr": 0.00022835945899925557, "tps": 630998, "wall": 1591.5} {"step": 15323, "train_loss": 3.3276686668395996, "lr": 0.0002283403216234348, "tps": 629112, "wall": 1596.3} {"step": 15324, "train_loss": 3.258089542388916, "lr": 0.0002283211841531344, "tps": 627245, "wall": 1601.2} {"step": 15325, "train_loss": 3.3436193466186523, "lr": 0.00022830204658857116, "tps": 625347, "wall": 1606.2} {"step": 15326, "train_loss": 3.407611131668091, "lr": 0.0002282829089299619, "tps": 623499, "wall": 1611.0} {"step": 15327, "train_loss": 3.4793968200683594, "lr": 0.00022826377117752343, "tps": 621660, "wall": 1615.9} {"step": 15328, "train_loss": 3.3461811542510986, "lr": 0.0002282446333314725, "tps": 619835, "wall": 1620.8} {"step": 15329, "train_loss": 3.2973999977111816, "lr": 0.00022822549539202585, "tps": 618017, "wall": 1625.6} {"step": 15330, "train_loss": 3.3374829292297363, "lr": 0.00022820635735940043, "tps": 616211, "wall": 1630.5} {"step": 15331, "train_loss": 3.4524803161621094, "lr": 0.00022818721923381294, "tps": 614403, "wall": 1635.4} {"step": 15332, "train_loss": 3.3188695907592773, "lr": 0.00022816808101548013, "tps": 612630, "wall": 1640.2} {"step": 15333, "train_loss": 3.343479633331299, "lr": 0.0002281489427046189, "tps": 610856, "wall": 1645.1} {"step": 15334, "train_loss": 3.2940456867218018, "lr": 0.00022812980430144607, "tps": 609091, "wall": 1650.0} {"step": 15335, "train_loss": 3.4647233486175537, "lr": 0.0002281106658061783, "tps": 607337, "wall": 1654.9} {"step": 15336, "train_loss": 3.3547840118408203, "lr": 0.0002280915272190324, "tps": 605593, "wall": 1659.7} {"step": 15337, "train_loss": 3.4157183170318604, "lr": 0.0002280723885402254, "tps": 603858, "wall": 1664.6} {"step": 15338, "train_loss": 3.43263578414917, "lr": 0.0002280532497699738, "tps": 602117, "wall": 1669.5} {"step": 15339, "train_loss": 3.3202896118164062, "lr": 0.0002280341109084946, "tps": 600391, "wall": 1674.4} {"step": 15340, "train_loss": 3.3366217613220215, "lr": 0.0002280149719560046, "tps": 598694, "wall": 1679.3} {"step": 15341, "train_loss": 3.3498518466949463, "lr": 0.00022799583291272053, "tps": 597001, "wall": 1684.2} {"step": 15342, "train_loss": 3.6256284713745117, "lr": 0.00022797669377885922, "tps": 595317, "wall": 1689.0} {"step": 15343, "train_loss": 3.3849663734436035, "lr": 0.00022795755455463752, "tps": 593638, "wall": 1693.9} {"step": 15344, "train_loss": 3.3705344200134277, "lr": 0.00022793841524027225, "tps": 591966, "wall": 1698.8} {"step": 15345, "train_loss": 3.334902286529541, "lr": 0.0002279192758359801, "tps": 590317, "wall": 1703.7} {"step": 15346, "train_loss": 3.3617141246795654, "lr": 0.00022790013634197797, "tps": 588673, "wall": 1708.6} {"step": 15347, "train_loss": 3.4093923568725586, "lr": 0.00022788099675848274, "tps": 587002, "wall": 1713.5} {"step": 15348, "train_loss": 3.31145977973938, "lr": 0.00022786185708571107, "tps": 585373, "wall": 1718.4} {"step": 15349, "train_loss": 3.3755416870117188, "lr": 0.00022784271732387987, "tps": 583751, "wall": 1723.3} {"step": 15350, "train_loss": 3.2931113243103027, "lr": 0.00022782357747320604, "tps": 582127, "wall": 1728.2} {"step": 15351, "train_loss": 3.4451112747192383, "lr": 0.0002278044375339062, "tps": 580532, "wall": 1733.1} {"step": 15352, "train_loss": 3.3383233547210693, "lr": 0.0002277852975061973, "tps": 578943, "wall": 1737.9} {"step": 15353, "train_loss": 3.42927885055542, "lr": 0.00022776615739029615, "tps": 577365, "wall": 1742.8} {"step": 15354, "train_loss": 3.4114441871643066, "lr": 0.00022774701718641956, "tps": 575793, "wall": 1747.7} {"step": 15355, "train_loss": 3.4560461044311523, "lr": 0.00022772787689478427, "tps": 574234, "wall": 1752.5} {"step": 15356, "train_loss": 3.310302734375, "lr": 0.00022770873651560715, "tps": 572679, "wall": 1757.4} {"step": 15357, "train_loss": 3.3548407554626465, "lr": 0.00022768959604910517, "tps": 571133, "wall": 1762.3} {"step": 15358, "train_loss": 3.3654184341430664, "lr": 0.00022767045549549494, "tps": 569594, "wall": 1767.2} {"step": 15359, "train_loss": 3.3397111892700195, "lr": 0.00022765131485499342, "tps": 568063, "wall": 1772.0} {"step": 15360, "train_loss": 3.3589913845062256, "lr": 0.00022763217412781735, "tps": 566543, "wall": 1776.9} {"step": 15361, "train_loss": 3.3283677101135254, "lr": 0.00022761303331418368, "tps": 565033, "wall": 1781.8} {"step": 15362, "train_loss": 3.400496006011963, "lr": 0.00022759389241430906, "tps": 563495, "wall": 1786.8} {"step": 15363, "train_loss": 3.274916648864746, "lr": 0.00022757475142841046, "tps": 561993, "wall": 1791.6} {"step": 15364, "train_loss": 3.326826333999634, "lr": 0.00022755561035670466, "tps": 560507, "wall": 1796.5} {"step": 15365, "train_loss": 3.392092704772949, "lr": 0.00022753646919940846, "tps": 559029, "wall": 1801.4} {"step": 15366, "train_loss": 3.3142523765563965, "lr": 0.00022751732795673878, "tps": 557560, "wall": 1806.2} {"step": 15367, "train_loss": 3.477353096008301, "lr": 0.0002274981866289124, "tps": 556099, "wall": 1811.1} {"step": 15368, "train_loss": 3.1969668865203857, "lr": 0.00022747904521614617, "tps": 554639, "wall": 1816.0} {"step": 15369, "train_loss": 3.2987380027770996, "lr": 0.00022745990371865688, "tps": 553194, "wall": 1820.9} {"step": 15370, "train_loss": 3.2360947132110596, "lr": 0.0002274407621366614, "tps": 551753, "wall": 1825.7} {"step": 15371, "train_loss": 3.331609010696411, "lr": 0.00022742162047037655, "tps": 550320, "wall": 1830.6} {"step": 15372, "train_loss": 3.2356133460998535, "lr": 0.0002274024787200192, "tps": 548889, "wall": 1835.5} {"step": 15373, "train_loss": 3.3680171966552734, "lr": 0.00022738333688580617, "tps": 547471, "wall": 1840.4} {"step": 15374, "train_loss": 3.257601261138916, "lr": 0.00022736419496795432, "tps": 546058, "wall": 1845.3} {"step": 15375, "train_loss": 3.277153491973877, "lr": 0.00022734505296668044, "tps": 544637, "wall": 1850.2} {"step": 15376, "train_loss": 3.4321813583374023, "lr": 0.0002273259108822014, "tps": 543243, "wall": 1855.1} {"step": 15377, "train_loss": 3.4037435054779053, "lr": 0.00022730676871473407, "tps": 541860, "wall": 1859.9} {"step": 15378, "train_loss": 3.4346866607666016, "lr": 0.00022728762646449528, "tps": 540482, "wall": 1864.8} {"step": 15379, "train_loss": 3.383223295211792, "lr": 0.00022726848413170183, "tps": 539101, "wall": 1869.7} {"step": 15380, "train_loss": 3.4650094509124756, "lr": 0.00022724934171657063, "tps": 537732, "wall": 1874.6} {"step": 15381, "train_loss": 3.2613861560821533, "lr": 0.00022723019921931848, "tps": 536369, "wall": 1879.4} {"step": 15382, "train_loss": 3.368434429168701, "lr": 0.00022721105664016224, "tps": 535002, "wall": 1884.4} {"step": 15383, "train_loss": 3.3991856575012207, "lr": 0.00022719191397931873, "tps": 533659, "wall": 1889.2} {"step": 15384, "train_loss": 3.4044876098632812, "lr": 0.00022717277123700486, "tps": 532321, "wall": 1894.1} {"step": 15385, "train_loss": 3.259944200515747, "lr": 0.0002271536284134375, "tps": 530990, "wall": 1899.0} {"step": 15386, "train_loss": 3.3669400215148926, "lr": 0.00022713448550883337, "tps": 529669, "wall": 1903.8} {"step": 15387, "train_loss": 3.3467273712158203, "lr": 0.00022711534252340939, "tps": 528333, "wall": 1908.8} {"step": 15388, "train_loss": 3.3721818923950195, "lr": 0.0002270961994573825, "tps": 527013, "wall": 1913.7} {"step": 15389, "train_loss": 3.294984817504883, "lr": 0.00022707705631096943, "tps": 525709, "wall": 1918.5} {"step": 15390, "train_loss": 3.4252898693084717, "lr": 0.00022705791308438706, "tps": 524410, "wall": 1923.4} {"step": 15391, "train_loss": 3.435009479522705, "lr": 0.0002270387697778523, "tps": 523115, "wall": 1928.3} {"step": 15392, "train_loss": 3.4040822982788086, "lr": 0.00022701962639158198, "tps": 521829, "wall": 1933.2} {"step": 15393, "train_loss": 3.305022716522217, "lr": 0.00022700048292579296, "tps": 520550, "wall": 1938.1} {"step": 15394, "train_loss": 3.3436148166656494, "lr": 0.0002269813393807021, "tps": 519275, "wall": 1943.0} {"step": 15395, "train_loss": 3.4496335983276367, "lr": 0.00022696219575652626, "tps": 518005, "wall": 1947.8} {"step": 15396, "train_loss": 3.3333215713500977, "lr": 0.00022694305205348222, "tps": 516740, "wall": 1952.7} {"step": 15397, "train_loss": 3.3888463973999023, "lr": 0.00022692390827178693, "tps": 515489, "wall": 1957.6} {"step": 15398, "train_loss": 3.3736844062805176, "lr": 0.0002269047644116573, "tps": 514244, "wall": 1962.5} {"step": 15399, "train_loss": 3.396686315536499, "lr": 0.00022688562047331007, "tps": 512981, "wall": 1967.4} {"step": 15400, "train_loss": 3.2880144119262695, "lr": 0.00022686647645696217, "tps": 511745, "wall": 1972.3} {"step": 15401, "train_loss": 3.3578317165374756, "lr": 0.00022684733236283045, "tps": 510512, "wall": 1977.2} {"step": 15402, "train_loss": 3.371140480041504, "lr": 0.00022682818819113178, "tps": 509292, "wall": 1982.1} {"step": 15403, "train_loss": 3.4064300060272217, "lr": 0.00022680904394208303, "tps": 508075, "wall": 1986.9} {"step": 15404, "train_loss": 3.439666271209717, "lr": 0.00022678989961590103, "tps": 506864, "wall": 1991.8} {"step": 15405, "train_loss": 3.3632688522338867, "lr": 0.00022677075521280275, "tps": 505659, "wall": 1996.7} {"step": 15406, "train_loss": 3.4260947704315186, "lr": 0.00022675161073300494, "tps": 504461, "wall": 2001.6} {"step": 15407, "train_loss": 3.3254923820495605, "lr": 0.0002267324661767245, "tps": 503269, "wall": 2006.4} {"step": 15408, "train_loss": 3.4075613021850586, "lr": 0.0002267133215441783, "tps": 502080, "wall": 2011.3} {"step": 15409, "train_loss": 3.4150876998901367, "lr": 0.00022669417683558334, "tps": 500880, "wall": 2016.3} {"step": 15410, "train_loss": 3.359236478805542, "lr": 0.00022667503205115632, "tps": 499709, "wall": 2021.1} {"step": 15411, "train_loss": 3.3459255695343018, "lr": 0.00022665588719111414, "tps": 498521, "wall": 2026.1} {"step": 15412, "train_loss": 3.2598209381103516, "lr": 0.00022663674225567376, "tps": 497348, "wall": 2031.0} {"step": 15413, "train_loss": 3.31905198097229, "lr": 0.00022661759724505197, "tps": 496189, "wall": 2035.9} {"step": 15414, "train_loss": 3.3252758979797363, "lr": 0.00022659845215946569, "tps": 495034, "wall": 2040.7} {"step": 15415, "train_loss": 3.499112606048584, "lr": 0.00022657930699913182, "tps": 493885, "wall": 2045.6} {"step": 15416, "train_loss": 3.4123151302337646, "lr": 0.00022656016176426716, "tps": 492742, "wall": 2050.5} {"step": 15417, "train_loss": 3.2939453125, "lr": 0.00022654101645508865, "tps": 491592, "wall": 2055.4} {"step": 15418, "train_loss": 3.2879929542541504, "lr": 0.00022652187107181316, "tps": 490459, "wall": 2060.3} {"step": 15419, "train_loss": 3.4172914028167725, "lr": 0.00022650272561465756, "tps": 489334, "wall": 2065.2} {"step": 15420, "train_loss": 3.302924871444702, "lr": 0.00022648358008383874, "tps": 488212, "wall": 2070.1} {"step": 15421, "train_loss": 3.3567514419555664, "lr": 0.00022646443447957353, "tps": 487092, "wall": 2075.0} {"step": 15422, "train_loss": 3.35666561126709, "lr": 0.00022644528880207894, "tps": 485982, "wall": 2079.8} {"step": 15423, "train_loss": 3.3551135063171387, "lr": 0.00022642614305157165, "tps": 484876, "wall": 2084.7} {"step": 15424, "train_loss": 3.4106619358062744, "lr": 0.00022640699722826875, "tps": 483760, "wall": 2089.7} {"step": 15425, "train_loss": 3.2470717430114746, "lr": 0.00022638785133238703, "tps": 482666, "wall": 2094.5} {"step": 15426, "train_loss": 3.3655834197998047, "lr": 0.00022636870536414335, "tps": 481574, "wall": 2099.4} {"step": 15427, "train_loss": 3.4655537605285645, "lr": 0.00022634955932375467, "tps": 480486, "wall": 2104.3} {"step": 15428, "train_loss": 3.4330649375915527, "lr": 0.0002263304132114378, "tps": 479405, "wall": 2109.2} {"step": 15429, "train_loss": 3.40834641456604, "lr": 0.00022631126702740971, "tps": 478330, "wall": 2114.1} {"step": 15430, "train_loss": 3.4155964851379395, "lr": 0.00022629212077188724, "tps": 477256, "wall": 2119.0} {"step": 15431, "train_loss": 3.3696067333221436, "lr": 0.00022627297444508725, "tps": 476188, "wall": 2123.8} {"step": 15432, "train_loss": 3.3391449451446533, "lr": 0.0002262538280472267, "tps": 475124, "wall": 2128.7} {"step": 15433, "train_loss": 3.3925867080688477, "lr": 0.00022623468157852242, "tps": 474069, "wall": 2133.6} {"step": 15434, "train_loss": 3.4765119552612305, "lr": 0.00022621553503919138, "tps": 473015, "wall": 2138.5} {"step": 15435, "train_loss": 3.4420528411865234, "lr": 0.00022619638842945032, "tps": 471969, "wall": 2143.4} {"step": 15436, "train_loss": 3.401601791381836, "lr": 0.00022617724174951636, "tps": 470908, "wall": 2148.4} {"step": 15437, "train_loss": 3.417642116546631, "lr": 0.00022615809499960623, "tps": 469872, "wall": 2153.2} {"step": 15438, "train_loss": 3.4057836532592773, "lr": 0.00022613894817993685, "tps": 468840, "wall": 2158.1} {"step": 15439, "train_loss": 3.3454620838165283, "lr": 0.00022611980129072512, "tps": 467814, "wall": 2163.0} {"step": 15440, "train_loss": 3.3000335693359375, "lr": 0.00022610065433218795, "tps": 466792, "wall": 2167.9} {"step": 15441, "train_loss": 3.382317066192627, "lr": 0.00022608150730454228, "tps": 465772, "wall": 2172.7} {"step": 15442, "train_loss": 3.2825276851654053, "lr": 0.00022606236020800494, "tps": 464757, "wall": 2177.6} {"step": 15443, "train_loss": 3.383382797241211, "lr": 0.00022604321304279284, "tps": 463747, "wall": 2182.5} {"step": 15444, "train_loss": 3.390911102294922, "lr": 0.00022602406580912292, "tps": 462744, "wall": 2187.4} {"step": 15445, "train_loss": 3.329580307006836, "lr": 0.000226004918507212, "tps": 461746, "wall": 2192.3} {"step": 15446, "train_loss": 3.3814098834991455, "lr": 0.00022598577113727713, "tps": 460753, "wall": 2197.1} {"step": 15447, "train_loss": 3.365675449371338, "lr": 0.00022596662369953508, "tps": 459764, "wall": 2202.0} {"step": 15448, "train_loss": 3.4467716217041016, "lr": 0.00022594747619420277, "tps": 458766, "wall": 2206.9} {"step": 15449, "train_loss": 3.416119337081909, "lr": 0.00022592832862149714, "tps": 457779, "wall": 2211.8} {"step": 15450, "train_loss": 3.328272819519043, "lr": 0.00022590918098163508, "tps": 456804, "wall": 2216.7} {"step": 15451, "train_loss": 3.467890501022339, "lr": 0.00022589003327483354, "tps": 455831, "wall": 2221.6} {"step": 15452, "train_loss": 3.4373245239257812, "lr": 0.00022587088550130933, "tps": 454859, "wall": 2226.5} {"step": 15453, "train_loss": 3.3821988105773926, "lr": 0.00022585173766127942, "tps": 453893, "wall": 2231.3} {"step": 15454, "train_loss": 3.404658794403076, "lr": 0.00022583258975496074, "tps": 452926, "wall": 2236.3} {"step": 15455, "train_loss": 3.5041980743408203, "lr": 0.00022581344178257014, "tps": 451973, "wall": 2241.1} {"step": 15456, "train_loss": 3.381300449371338, "lr": 0.00022579429374432457, "tps": 451023, "wall": 2246.0} {"step": 15457, "train_loss": 3.3858437538146973, "lr": 0.00022577514564044092, "tps": 450074, "wall": 2250.9} {"step": 15458, "train_loss": 3.3162617683410645, "lr": 0.0002257559974711361, "tps": 449130, "wall": 2255.7} {"step": 15459, "train_loss": 3.3230390548706055, "lr": 0.0002257368492366271, "tps": 448187, "wall": 2260.6} {"step": 15460, "train_loss": 3.3019886016845703, "lr": 0.0002257177009371307, "tps": 447236, "wall": 2265.6} {"step": 15461, "train_loss": 3.346090316772461, "lr": 0.00022569855257286383, "tps": 446302, "wall": 2270.5} {"step": 15462, "train_loss": 3.2929434776306152, "lr": 0.00022567940414404349, "tps": 445370, "wall": 2275.4} {"step": 15463, "train_loss": 3.3387746810913086, "lr": 0.0002256602556508866, "tps": 444449, "wall": 2280.2} {"step": 15464, "train_loss": 3.27358341217041, "lr": 0.00022564110709361003, "tps": 443528, "wall": 2285.1} {"step": 15465, "train_loss": 3.370915651321411, "lr": 0.00022562195847243061, "tps": 442614, "wall": 2290.0} {"step": 15466, "train_loss": 3.3738088607788086, "lr": 0.0002256028097875654, "tps": 441701, "wall": 2294.9} {"step": 15467, "train_loss": 3.329737663269043, "lr": 0.00022558366103923129, "tps": 440792, "wall": 2299.7} {"step": 15468, "train_loss": 3.410737991333008, "lr": 0.00022556451222764502, "tps": 439888, "wall": 2304.6} {"step": 15469, "train_loss": 3.3503031730651855, "lr": 0.00022554536335302373, "tps": 438984, "wall": 2309.5} {"step": 15470, "train_loss": 3.3693904876708984, "lr": 0.00022552621441558434, "tps": 438086, "wall": 2314.4} {"step": 15471, "train_loss": 3.324446201324463, "lr": 0.0002255070654155436, "tps": 437188, "wall": 2319.3} {"step": 15472, "train_loss": 3.435696601867676, "lr": 0.0002254879163531186, "tps": 436301, "wall": 2324.2} {"step": 15473, "train_loss": 3.360919713973999, "lr": 0.0002254687672285262, "tps": 435402, "wall": 2329.1} {"step": 15474, "train_loss": 3.34462833404541, "lr": 0.00022544961804198322, "tps": 434518, "wall": 2334.0} {"step": 15475, "train_loss": 3.3438491821289062, "lr": 0.0002254304687937067, "tps": 433635, "wall": 2338.9} {"step": 15476, "train_loss": 3.4060637950897217, "lr": 0.00022541131948391354, "tps": 432761, "wall": 2343.8} {"step": 15477, "train_loss": 3.4019827842712402, "lr": 0.00022539217011282068, "tps": 431891, "wall": 2348.7} {"step": 15478, "train_loss": 3.325533866882324, "lr": 0.00022537302068064498, "tps": 431028, "wall": 2353.5} {"step": 15479, "train_loss": 3.418755531311035, "lr": 0.00022535387118760344, "tps": 430163, "wall": 2358.4} {"step": 15480, "train_loss": 3.3426382541656494, "lr": 0.00022533472163391297, "tps": 429303, "wall": 2363.3} {"step": 15481, "train_loss": 3.3237404823303223, "lr": 0.0002253155720197905, "tps": 428447, "wall": 2368.2} {"step": 15482, "train_loss": 3.289883852005005, "lr": 0.00022529642234545287, "tps": 427594, "wall": 2373.0} {"step": 15483, "train_loss": 3.4841578006744385, "lr": 0.00022527727261111716, "tps": 426745, "wall": 2377.9} {"step": 15484, "train_loss": 3.342813730239868, "lr": 0.00022525812281700019, "tps": 425894, "wall": 2382.8} {"step": 15485, "train_loss": 3.263554573059082, "lr": 0.0002252389729633189, "tps": 425040, "wall": 2387.8} {"step": 15486, "train_loss": 3.3568170070648193, "lr": 0.00022521982305029025, "tps": 424202, "wall": 2392.6} {"step": 15487, "train_loss": 3.4036355018615723, "lr": 0.00022520067307813118, "tps": 423365, "wall": 2397.5} {"step": 15488, "train_loss": 3.4305481910705566, "lr": 0.0002251815230470586, "tps": 422531, "wall": 2402.4} {"step": 15489, "train_loss": 3.4429564476013184, "lr": 0.00022516237295728942, "tps": 421695, "wall": 2407.3} {"step": 15490, "train_loss": 3.3392348289489746, "lr": 0.00022514322280904066, "tps": 420870, "wall": 2412.2} {"step": 15491, "train_loss": 3.3975582122802734, "lr": 0.00022512407260252918, "tps": 420042, "wall": 2417.1} {"step": 15492, "train_loss": 3.362213134765625, "lr": 0.00022510492233797185, "tps": 419224, "wall": 2422.0} {"step": 15493, "train_loss": 3.34604549407959, "lr": 0.00022508577201558571, "tps": 418407, "wall": 2426.9} {"step": 15494, "train_loss": 3.4183943271636963, "lr": 0.00022506662163558776, "tps": 417597, "wall": 2431.7} {"step": 15495, "train_loss": 3.3513832092285156, "lr": 0.00022504747119819478, "tps": 416789, "wall": 2436.6} {"step": 15496, "train_loss": 3.3807826042175293, "lr": 0.0002250283207036237, "tps": 415984, "wall": 2441.5} {"step": 15497, "train_loss": 3.39517879486084, "lr": 0.0002250091701520917, "tps": 415165, "wall": 2446.4} {"step": 15498, "train_loss": 3.319831371307373, "lr": 0.0002249900195438154, "tps": 414369, "wall": 2451.3} {"step": 15499, "train_loss": 3.3807296752929688, "lr": 0.00022497086887901193, "tps": 413572, "wall": 2456.2} {"step": 15500, "train_loss": 3.38266921043396, "lr": 0.00022495171815789826, "tps": 412778, "wall": 2461.1} {"step": 15501, "train_loss": 3.433337926864624, "lr": 0.00022493256738069118, "tps": 411952, "wall": 2466.2} {"step": 15502, "train_loss": 3.3536376953125, "lr": 0.00022491341654760772, "tps": 411162, "wall": 2471.1} {"step": 15503, "train_loss": 3.2675023078918457, "lr": 0.0002248942656588648, "tps": 410381, "wall": 2475.9} {"step": 15504, "train_loss": 3.350099563598633, "lr": 0.00022487511471467944, "tps": 409601, "wall": 2480.8} {"step": 15505, "train_loss": 3.4072885513305664, "lr": 0.00022485596371526846, "tps": 408824, "wall": 2485.7} {"step": 15506, "train_loss": 3.2964394092559814, "lr": 0.00022483681266084884, "tps": 408052, "wall": 2490.5} {"step": 15507, "train_loss": 3.2800827026367188, "lr": 0.00022481766155163762, "tps": 407281, "wall": 2495.4} {"step": 15508, "train_loss": 3.189941883087158, "lr": 0.0002247985103878516, "tps": 406512, "wall": 2500.3} {"step": 15509, "train_loss": 3.3918819427490234, "lr": 0.00022477935916970782, "tps": 405744, "wall": 2505.2} {"step": 15510, "train_loss": 3.415372371673584, "lr": 0.00022476020789742322, "tps": 404969, "wall": 2510.1} {"step": 15511, "train_loss": 3.2884931564331055, "lr": 0.00022474105657121474, "tps": 404209, "wall": 2515.0} {"step": 15512, "train_loss": 3.332611560821533, "lr": 0.0002247219051912993, "tps": 403455, "wall": 2519.9} {"step": 15513, "train_loss": 3.5138559341430664, "lr": 0.0002247027537578938, "tps": 402702, "wall": 2524.8} {"step": 15514, "train_loss": 3.3511431217193604, "lr": 0.0002246836022712153, "tps": 401952, "wall": 2529.6} {"step": 15515, "train_loss": 3.3666763305664062, "lr": 0.00022466445073148075, "tps": 401205, "wall": 2534.5} {"step": 15516, "train_loss": 3.4888720512390137, "lr": 0.00022464529913890697, "tps": 400459, "wall": 2539.4} {"step": 15517, "train_loss": 3.354416847229004, "lr": 0.00022462614749371102, "tps": 399718, "wall": 2544.3} {"step": 15518, "train_loss": 3.4051387310028076, "lr": 0.00022460699579610985, "tps": 398980, "wall": 2549.1} {"step": 15519, "train_loss": 3.3592610359191895, "lr": 0.00022458784404632033, "tps": 398245, "wall": 2554.0} {"step": 15520, "train_loss": 3.321436643600464, "lr": 0.00022456869224455944, "tps": 397515, "wall": 2558.9} {"step": 15521, "train_loss": 3.3602967262268066, "lr": 0.00022454954039104424, "tps": 396782, "wall": 2563.7} {"step": 15522, "train_loss": 3.313661575317383, "lr": 0.0002245303884859916, "tps": 396045, "wall": 2568.7} {"step": 15523, "train_loss": 3.4177045822143555, "lr": 0.0002245112365296184, "tps": 395322, "wall": 2573.5} {"step": 15524, "train_loss": 3.394317626953125, "lr": 0.0002244920845221417, "tps": 394597, "wall": 2578.4} {"step": 15525, "train_loss": 3.3182156085968018, "lr": 0.00022447293246377842, "tps": 393878, "wall": 2583.3} {"step": 15526, "train_loss": 3.280496120452881, "lr": 0.00022445378035474556, "tps": 393161, "wall": 2588.2} {"step": 15527, "train_loss": 3.3991165161132812, "lr": 0.00022443462819526002, "tps": 392426, "wall": 2593.2} {"step": 15528, "train_loss": 3.2615034580230713, "lr": 0.00022441547598553877, "tps": 391710, "wall": 2598.1} {"step": 15529, "train_loss": 3.2673146724700928, "lr": 0.00022439632372579872, "tps": 390958, "wall": 2603.3} {"step": 15530, "train_loss": 3.3956949710845947, "lr": 0.0002243771714162569, "tps": 390090, "wall": 2609.2} {"step": 15531, "train_loss": 3.3280107975006104, "lr": 0.0002243580190571303, "tps": 389222, "wall": 2615.2} {"step": 15532, "train_loss": 3.373270034790039, "lr": 0.00022433886664863578, "tps": 388493, "wall": 2620.3} {"step": 15533, "train_loss": 3.4211485385894775, "lr": 0.00022431971419099034, "tps": 387776, "wall": 2625.3} {"step": 15534, "train_loss": 3.342569351196289, "lr": 0.00022430056168441093, "tps": 387053, "wall": 2630.4} {"step": 15535, "train_loss": 3.400838613510132, "lr": 0.00022428140912911454, "tps": 386360, "wall": 2635.3} {"step": 15536, "train_loss": 3.365896224975586, "lr": 0.0002242622565253181, "tps": 385663, "wall": 2640.2} {"step": 15537, "train_loss": 3.4418797492980957, "lr": 0.00022424310387323862, "tps": 384975, "wall": 2645.1} {"step": 15538, "train_loss": 3.295523166656494, "lr": 0.00022422395117309302, "tps": 384287, "wall": 2650.0} {"step": 15539, "train_loss": 3.409724235534668, "lr": 0.0002242047984250983, "tps": 383590, "wall": 2655.0} {"step": 15540, "train_loss": 3.463724136352539, "lr": 0.00022418564562947136, "tps": 382899, "wall": 2660.0} {"step": 15541, "train_loss": 3.284447193145752, "lr": 0.00022416649278642924, "tps": 382214, "wall": 2664.9} {"step": 15542, "train_loss": 3.2976365089416504, "lr": 0.0002241473398961888, "tps": 381539, "wall": 2669.8} {"step": 15543, "train_loss": 3.4339981079101562, "lr": 0.00022412818695896709, "tps": 380866, "wall": 2674.7} {"step": 15544, "train_loss": 3.329618215560913, "lr": 0.0002241090339749811, "tps": 380196, "wall": 2679.6} {"step": 15545, "train_loss": 3.404505729675293, "lr": 0.0002240898809444477, "tps": 379525, "wall": 2684.5} {"step": 15546, "train_loss": 3.4486594200134277, "lr": 0.0002240707278675839, "tps": 378855, "wall": 2689.4} {"step": 15547, "train_loss": 3.385725975036621, "lr": 0.00022405157474460668, "tps": 378193, "wall": 2694.3} {"step": 15548, "train_loss": 3.3502328395843506, "lr": 0.0002240324215757331, "tps": 377530, "wall": 2699.2} {"step": 15549, "train_loss": 3.28098201751709, "lr": 0.00022401326836117994, "tps": 376874, "wall": 2704.0} {"step": 15550, "train_loss": 3.3192501068115234, "lr": 0.00022399411510116423, "tps": 376221, "wall": 2708.9} {"step": 15551, "train_loss": 3.307805061340332, "lr": 0.00022397496179590306, "tps": 375569, "wall": 2713.8} {"step": 15552, "train_loss": 3.404966115951538, "lr": 0.00022395580844561326, "tps": 374913, "wall": 2718.7} {"step": 15553, "train_loss": 3.3656089305877686, "lr": 0.0002239366550505118, "tps": 374264, "wall": 2723.6} {"step": 15554, "train_loss": 3.3180179595947266, "lr": 0.00022391750161081575, "tps": 373613, "wall": 2728.5} {"step": 15555, "train_loss": 3.3577499389648438, "lr": 0.00022389834812674205, "tps": 372970, "wall": 2733.4} {"step": 15556, "train_loss": 3.4026432037353516, "lr": 0.00022387919459850763, "tps": 372325, "wall": 2738.3} {"step": 15557, "train_loss": 3.2740116119384766, "lr": 0.0002238600410263294, "tps": 371679, "wall": 2743.3} {"step": 15558, "train_loss": 3.2319250106811523, "lr": 0.00022384088741042457, "tps": 371029, "wall": 2748.2} {"step": 15559, "train_loss": 3.382298707962036, "lr": 0.00022382173375100987, "tps": 370383, "wall": 2753.2} {"step": 15560, "train_loss": 3.262155532836914, "lr": 0.00022380258004830235, "tps": 369744, "wall": 2758.1} {"step": 15561, "train_loss": 3.36639404296875, "lr": 0.000223783426302519, "tps": 369114, "wall": 2763.0} {"step": 15562, "train_loss": 3.3359503746032715, "lr": 0.00022376427251387683, "tps": 368467, "wall": 2768.1} {"step": 15563, "train_loss": 3.3088538646698, "lr": 0.00022374511868259277, "tps": 367827, "wall": 2773.0} {"step": 15564, "train_loss": 3.41508150100708, "lr": 0.00022372596480888378, "tps": 367187, "wall": 2778.1} {"step": 15565, "train_loss": 3.3305516242980957, "lr": 0.00022370681089296693, "tps": 366552, "wall": 2783.1} {"step": 15566, "train_loss": 3.279707193374634, "lr": 0.00022368765693505903, "tps": 365920, "wall": 2788.0} {"step": 15567, "train_loss": 3.2302260398864746, "lr": 0.0002236685029353772, "tps": 365274, "wall": 2793.1} {"step": 15568, "train_loss": 3.45947527885437, "lr": 0.00022364934889413838, "tps": 364651, "wall": 2798.1} {"step": 15569, "train_loss": 3.27644681930542, "lr": 0.00022363019481155951, "tps": 364038, "wall": 2803.0} {"step": 15570, "train_loss": 3.441120147705078, "lr": 0.00022361104068785762, "tps": 363414, "wall": 2808.0} {"step": 15571, "train_loss": 3.229661464691162, "lr": 0.00022359188652324962, "tps": 362801, "wall": 2812.9} {"step": 15572, "train_loss": 3.272782564163208, "lr": 0.00022357273231795262, "tps": 362192, "wall": 2817.8} {"step": 15573, "train_loss": 3.2378437519073486, "lr": 0.00022355357807218344, "tps": 361585, "wall": 2822.7} {"step": 15574, "train_loss": 3.445972442626953, "lr": 0.00022353442378615914, "tps": 360977, "wall": 2827.7} {"step": 15575, "train_loss": 3.3678057193756104, "lr": 0.00022351526946009674, "tps": 360377, "wall": 2832.6} {"step": 15576, "train_loss": 3.3349385261535645, "lr": 0.00022349611509421316, "tps": 359771, "wall": 2837.5} {"step": 15577, "train_loss": 3.407728672027588, "lr": 0.0002234769606887254, "tps": 359174, "wall": 2842.4} {"step": 15578, "train_loss": 3.2639007568359375, "lr": 0.00022345780624385042, "tps": 358576, "wall": 2847.3} {"step": 15579, "train_loss": 3.354741096496582, "lr": 0.00022343865175980524, "tps": 357982, "wall": 2852.2} {"step": 15580, "train_loss": 3.3913772106170654, "lr": 0.0002234194972368068, "tps": 357392, "wall": 2857.1} {"step": 15581, "train_loss": 3.3919174671173096, "lr": 0.00022340034267507214, "tps": 356800, "wall": 2862.1} {"step": 15582, "train_loss": 3.4744322299957275, "lr": 0.00022338118807481823, "tps": 356207, "wall": 2867.0} {"step": 15583, "train_loss": 3.3359193801879883, "lr": 0.000223362033436262, "tps": 355619, "wall": 2871.9} {"step": 15584, "train_loss": 3.4494760036468506, "lr": 0.00022334287875962048, "tps": 355037, "wall": 2876.8} {"step": 15585, "train_loss": 3.3090927600860596, "lr": 0.0002233237240451107, "tps": 354457, "wall": 2881.7} {"step": 15586, "train_loss": 3.314746618270874, "lr": 0.00022330456929294955, "tps": 353878, "wall": 2886.6} {"step": 15587, "train_loss": 3.402803421020508, "lr": 0.00022328541450335405, "tps": 353301, "wall": 2891.5} {"step": 15588, "train_loss": 3.237718105316162, "lr": 0.0002232662596765412, "tps": 352726, "wall": 2896.4} {"step": 15589, "train_loss": 3.3258984088897705, "lr": 0.00022324710481272798, "tps": 352150, "wall": 2901.3} {"step": 15590, "train_loss": 3.3383734226226807, "lr": 0.00022322794991213143, "tps": 351576, "wall": 2906.3} {"step": 15591, "train_loss": 3.232988119125366, "lr": 0.00022320879497496842, "tps": 351009, "wall": 2911.1} {"step": 15592, "train_loss": 3.3715949058532715, "lr": 0.00022318964000145607, "tps": 350439, "wall": 2916.1} {"step": 15593, "train_loss": 3.3003501892089844, "lr": 0.00022317048499181124, "tps": 349871, "wall": 2921.0} {"step": 15594, "train_loss": 3.4648520946502686, "lr": 0.00022315132994625106, "tps": 349295, "wall": 2926.0} {"step": 15595, "train_loss": 3.386136054992676, "lr": 0.00022313217486499235, "tps": 348733, "wall": 2930.9} {"step": 15596, "train_loss": 3.330644130706787, "lr": 0.0002231130197482523, "tps": 348172, "wall": 2935.8} {"step": 15597, "train_loss": 3.2696475982666016, "lr": 0.00022309386459624776, "tps": 347611, "wall": 2940.7} {"step": 15598, "train_loss": 3.386274814605713, "lr": 0.00022307470940919567, "tps": 347052, "wall": 2945.7} {"step": 15599, "train_loss": 3.453200101852417, "lr": 0.00022305555418731325, "tps": 346497, "wall": 2950.6} {"step": 15600, "train_loss": 3.2613749504089355, "lr": 0.0002230363989308172, "tps": 345936, "wall": 2955.5} {"step": 15601, "train_loss": 3.4683706760406494, "lr": 0.00022301724363992475, "tps": 345381, "wall": 2960.5} {"step": 15602, "train_loss": 3.3789923191070557, "lr": 0.0002229980883148528, "tps": 344832, "wall": 2965.4} {"step": 15603, "train_loss": 3.4190826416015625, "lr": 0.0002229789329558183, "tps": 344284, "wall": 2970.3} {"step": 15604, "train_loss": 3.2614870071411133, "lr": 0.00022295977756303832, "tps": 343744, "wall": 2975.1} {"step": 15605, "train_loss": 3.3452677726745605, "lr": 0.0002229406221367298, "tps": 343201, "wall": 2980.0} {"step": 15606, "train_loss": 3.352842092514038, "lr": 0.00022292146667710977, "tps": 342662, "wall": 2984.9} {"step": 15607, "train_loss": 3.352696418762207, "lr": 0.00022290231118439523, "tps": 342119, "wall": 2989.9} {"step": 15608, "train_loss": 3.297149181365967, "lr": 0.0002228831556588031, "tps": 341580, "wall": 2994.8} {"step": 15609, "train_loss": 3.4576823711395264, "lr": 0.00022286400010055045, "tps": 341047, "wall": 2999.6} {"step": 15610, "train_loss": 3.1912569999694824, "lr": 0.00022284484450985423, "tps": 340516, "wall": 3004.5} {"step": 15611, "train_loss": 3.3150668144226074, "lr": 0.00022282568888693148, "tps": 339986, "wall": 3009.4} {"step": 15612, "train_loss": 3.3309531211853027, "lr": 0.0002228065332319992, "tps": 339458, "wall": 3014.2} {"step": 15613, "train_loss": 3.359832286834717, "lr": 0.00022278737754527427, "tps": 338930, "wall": 3019.1} {"step": 15614, "train_loss": 3.416918992996216, "lr": 0.00022276822182697384, "tps": 338406, "wall": 3024.0} {"step": 15615, "train_loss": 3.3064239025115967, "lr": 0.00022274906607731488, "tps": 337884, "wall": 3028.9} {"step": 15616, "train_loss": 3.440711498260498, "lr": 0.00022272991029651432, "tps": 337365, "wall": 3033.7} {"step": 15617, "train_loss": 3.388705253601074, "lr": 0.00022271075448478914, "tps": 336847, "wall": 3038.6} {"step": 15618, "train_loss": 3.3520264625549316, "lr": 0.00022269159864235643, "tps": 336326, "wall": 3043.5} {"step": 15619, "train_loss": 3.365520477294922, "lr": 0.00022267244276943316, "tps": 335804, "wall": 3048.4} {"step": 15620, "train_loss": 3.3882999420166016, "lr": 0.0002226532868662363, "tps": 335289, "wall": 3053.3} {"step": 15621, "train_loss": 3.438821792602539, "lr": 0.0002226341309329828, "tps": 334776, "wall": 3058.2} {"step": 15622, "train_loss": 3.376065492630005, "lr": 0.0002226149749698898, "tps": 334265, "wall": 3063.0} {"step": 15623, "train_loss": 3.309948444366455, "lr": 0.00022259581897717424, "tps": 333756, "wall": 3067.9} {"step": 15624, "train_loss": 3.3136203289031982, "lr": 0.00022257666295505307, "tps": 333247, "wall": 3072.8} {"step": 15625, "train_loss": 3.3418211936950684, "lr": 0.00022255750690374328, "tps": 332737, "wall": 3077.7} {"step": 15626, "train_loss": 3.3873984813690186, "lr": 0.00022253835082346196, "tps": 332235, "wall": 3082.5} {"step": 15627, "train_loss": 3.292461395263672, "lr": 0.00022251919471442605, "tps": 331733, "wall": 3087.4} {"step": 15628, "train_loss": 3.445725679397583, "lr": 0.00022250003857685258, "tps": 331232, "wall": 3092.3} {"step": 15629, "train_loss": 3.3566606044769287, "lr": 0.00022248088241095854, "tps": 330732, "wall": 3097.1} {"step": 15630, "train_loss": 3.378284454345703, "lr": 0.0002224617262169609, "tps": 330234, "wall": 3102.0} {"step": 15631, "train_loss": 3.4197640419006348, "lr": 0.00022244256999507674, "tps": 329731, "wall": 3106.9} {"step": 15632, "train_loss": 3.3519773483276367, "lr": 0.000222423413745523, "tps": 329237, "wall": 3111.8} {"step": 15633, "train_loss": 3.334547281265259, "lr": 0.0002224042574685167, "tps": 328745, "wall": 3116.7} {"step": 15634, "train_loss": 3.326835870742798, "lr": 0.0002223851011642748, "tps": 328251, "wall": 3121.6} {"step": 15635, "train_loss": 3.332559823989868, "lr": 0.00022236594483301437, "tps": 327759, "wall": 3126.4} {"step": 15636, "train_loss": 3.44016695022583, "lr": 0.00022234678847495238, "tps": 327271, "wall": 3131.3} {"step": 15637, "train_loss": 3.3568413257598877, "lr": 0.00022232763209030588, "tps": 326783, "wall": 3136.2} {"step": 15638, "train_loss": 3.376824378967285, "lr": 0.00022230847567929177, "tps": 326296, "wall": 3141.1} {"step": 15639, "train_loss": 3.315532684326172, "lr": 0.00022228931924212714, "tps": 325812, "wall": 3145.9} {"step": 15640, "train_loss": 3.5007667541503906, "lr": 0.00022227016277902908, "tps": 325328, "wall": 3150.8} {"step": 15641, "train_loss": 3.2872846126556396, "lr": 0.00022225100629021439, "tps": 324848, "wall": 3155.7} {"step": 15642, "train_loss": 3.224949836730957, "lr": 0.00022223184977590018, "tps": 324369, "wall": 3160.5} {"step": 15643, "train_loss": 3.373284339904785, "lr": 0.00022221269323630346, "tps": 323888, "wall": 3165.4} {"step": 15644, "train_loss": 3.404489040374756, "lr": 0.00022219353667164127, "tps": 323408, "wall": 3170.3} {"step": 15645, "train_loss": 3.335310935974121, "lr": 0.00022217438008213054, "tps": 322934, "wall": 3175.2} {"step": 15646, "train_loss": 3.3606882095336914, "lr": 0.00022215522346798837, "tps": 322459, "wall": 3180.1} {"step": 15647, "train_loss": 3.311441421508789, "lr": 0.00022213606682943167, "tps": 321986, "wall": 3184.9} {"step": 15648, "train_loss": 3.4287209510803223, "lr": 0.00022211691016667747, "tps": 321516, "wall": 3189.8} {"step": 15649, "train_loss": 3.4047040939331055, "lr": 0.00022209775347994278, "tps": 321045, "wall": 3194.7} {"step": 15650, "train_loss": 3.2787399291992188, "lr": 0.00022207859676944477, "tps": 320576, "wall": 3199.6} {"step": 15651, "train_loss": 3.3990602493286133, "lr": 0.00022205944003540014, "tps": 320110, "wall": 3204.4} {"step": 15652, "train_loss": 3.3682680130004883, "lr": 0.00022204028327802613, "tps": 319646, "wall": 3209.3} {"step": 15653, "train_loss": 3.395993232727051, "lr": 0.00022202112649753964, "tps": 319183, "wall": 3214.1} {"step": 15654, "train_loss": 3.438807487487793, "lr": 0.0002220019696941578, "tps": 318722, "wall": 3219.0} {"step": 15655, "train_loss": 3.3930747509002686, "lr": 0.00022198281286809745, "tps": 318261, "wall": 3223.9} {"step": 15656, "train_loss": 3.413423538208008, "lr": 0.0002219636560195757, "tps": 317791, "wall": 3228.8} {"step": 15657, "train_loss": 3.4096004962921143, "lr": 0.0002219444991488096, "tps": 317335, "wall": 3233.7} {"step": 15658, "train_loss": 3.2945613861083984, "lr": 0.00022192534225601608, "tps": 316878, "wall": 3238.6} {"step": 15659, "train_loss": 3.373246192932129, "lr": 0.00022190618534141215, "tps": 316423, "wall": 3243.4} {"step": 15660, "train_loss": 3.296792507171631, "lr": 0.000221887028405215, "tps": 315970, "wall": 3248.3} {"step": 15661, "train_loss": 3.3086471557617188, "lr": 0.00022186787144764128, "tps": 315517, "wall": 3253.1} {"step": 15662, "train_loss": 3.356384515762329, "lr": 0.00022184871446890832, "tps": 315065, "wall": 3258.0} {"step": 15663, "train_loss": 3.318775177001953, "lr": 0.000221829557469233, "tps": 314617, "wall": 3262.9} {"step": 15664, "train_loss": 3.350503921508789, "lr": 0.0002218104004488324, "tps": 314169, "wall": 3267.7} {"step": 15665, "train_loss": 3.349257469177246, "lr": 0.00022179124340792342, "tps": 313722, "wall": 3272.6} {"step": 15666, "train_loss": 3.317556858062744, "lr": 0.00022177208634672316, "tps": 313276, "wall": 3277.5} {"step": 15667, "train_loss": 3.404977560043335, "lr": 0.00022175292926544863, "tps": 312831, "wall": 3282.3} {"step": 15668, "train_loss": 3.4505667686462402, "lr": 0.00022173377216431678, "tps": 312386, "wall": 3287.2} {"step": 15669, "train_loss": 3.3140108585357666, "lr": 0.00022171461504354468, "tps": 311943, "wall": 3292.1} {"step": 15670, "train_loss": 3.299960136413574, "lr": 0.00022169545790334932, "tps": 311497, "wall": 3297.0} {"step": 15671, "train_loss": 3.3844175338745117, "lr": 0.00022167630074394778, "tps": 311059, "wall": 3301.9} {"step": 15672, "train_loss": 3.3421401977539062, "lr": 0.00022165714356555695, "tps": 310617, "wall": 3306.8} {"step": 15673, "train_loss": 3.3201887607574463, "lr": 0.00022163798636839395, "tps": 310179, "wall": 3311.7} {"step": 15674, "train_loss": 3.393545389175415, "lr": 0.00022161882915267578, "tps": 309744, "wall": 3316.5} {"step": 15675, "train_loss": 3.331814765930176, "lr": 0.00022159967191861935, "tps": 309309, "wall": 3321.4} {"step": 15676, "train_loss": 3.340986490249634, "lr": 0.00022158051466644176, "tps": 308875, "wall": 3326.3} {"step": 15677, "train_loss": 3.294865131378174, "lr": 0.00022156135739636007, "tps": 308444, "wall": 3331.1} {"step": 15678, "train_loss": 3.314497947692871, "lr": 0.00022154220010859116, "tps": 308014, "wall": 3336.0} {"step": 15679, "train_loss": 3.4332597255706787, "lr": 0.00022152304280335217, "tps": 307586, "wall": 3340.9} {"step": 15680, "train_loss": 3.3486695289611816, "lr": 0.0002215038854808601, "tps": 307151, "wall": 3345.8} {"step": 15681, "train_loss": 3.4646503925323486, "lr": 0.00022148472814133188, "tps": 306726, "wall": 3350.7} {"step": 15682, "train_loss": 3.4019808769226074, "lr": 0.0002214655707849846, "tps": 306300, "wall": 3355.5} {"step": 15683, "train_loss": 3.286262035369873, "lr": 0.00022144641341203527, "tps": 305875, "wall": 3360.4} {"step": 15684, "train_loss": 3.2601423263549805, "lr": 0.0002214272560227009, "tps": 305453, "wall": 3365.3} {"step": 15685, "train_loss": 3.362339973449707, "lr": 0.00022140809861719848, "tps": 305030, "wall": 3370.1} {"step": 15686, "train_loss": 3.3816959857940674, "lr": 0.00022138894119574495, "tps": 304609, "wall": 3375.0} {"step": 15687, "train_loss": 3.4275989532470703, "lr": 0.00022136978375855755, "tps": 304190, "wall": 3379.9} {"step": 15688, "train_loss": 3.3841676712036133, "lr": 0.0002213506263058531, "tps": 303772, "wall": 3384.8} {"step": 15689, "train_loss": 3.300450086593628, "lr": 0.0002213314688378487, "tps": 303354, "wall": 3389.6} {"step": 15690, "train_loss": 3.388339042663574, "lr": 0.00022131231135476135, "tps": 302938, "wall": 3394.5} {"step": 15691, "train_loss": 3.269953727722168, "lr": 0.0002212931538568081, "tps": 302523, "wall": 3399.4} {"step": 15692, "train_loss": 3.4068868160247803, "lr": 0.00022127399634420592, "tps": 302109, "wall": 3404.3} {"step": 15693, "train_loss": 3.335038661956787, "lr": 0.00022125483881717175, "tps": 301691, "wall": 3409.2} {"step": 15694, "train_loss": 3.3504714965820312, "lr": 0.00022123568127592282, "tps": 301279, "wall": 3414.1} {"step": 15695, "train_loss": 3.3574841022491455, "lr": 0.00022121652372067598, "tps": 300869, "wall": 3418.9} {"step": 15696, "train_loss": 3.424834728240967, "lr": 0.00022119736615164824, "tps": 300460, "wall": 3423.8} {"step": 15697, "train_loss": 3.3122360706329346, "lr": 0.0002211782085690567, "tps": 300050, "wall": 3428.7} {"step": 15698, "train_loss": 3.278289318084717, "lr": 0.00022115905097311843, "tps": 299644, "wall": 3433.6} {"step": 15699, "train_loss": 3.388803243637085, "lr": 0.00022113989336405032, "tps": 299236, "wall": 3438.5} {"step": 15700, "train_loss": 3.3782849311828613, "lr": 0.0002211207357420694, "tps": 298834, "wall": 3443.3} {"step": 15701, "train_loss": 3.3874688148498535, "lr": 0.00022110157810739276, "tps": 298430, "wall": 3448.2} {"step": 15702, "train_loss": 3.37931752204895, "lr": 0.00022108242046023734, "tps": 298029, "wall": 3453.1} {"step": 15703, "train_loss": 3.4123880863189697, "lr": 0.0002210632628008202, "tps": 297629, "wall": 3457.9} {"step": 15704, "train_loss": 3.3244707584381104, "lr": 0.00022104410512935845, "tps": 297231, "wall": 3462.8} {"step": 15705, "train_loss": 3.342210531234741, "lr": 0.00022102494744606898, "tps": 296827, "wall": 3467.7} {"step": 15706, "train_loss": 3.455338954925537, "lr": 0.00022100578975116876, "tps": 296431, "wall": 3472.6} {"step": 15707, "train_loss": 3.3166937828063965, "lr": 0.00022098663204487502, "tps": 296035, "wall": 3477.4} {"step": 15708, "train_loss": 3.402050256729126, "lr": 0.0002209674743274046, "tps": 295640, "wall": 3482.3} {"step": 15709, "train_loss": 3.24389386177063, "lr": 0.00022094831659897458, "tps": 295247, "wall": 3487.1} {"step": 15710, "train_loss": 3.409799575805664, "lr": 0.00022092915885980202, "tps": 294854, "wall": 3492.0} {"step": 15711, "train_loss": 3.3669214248657227, "lr": 0.00022091000111010387, "tps": 294462, "wall": 3496.9} {"step": 15712, "train_loss": 3.389592409133911, "lr": 0.00022089084335009718, "tps": 294069, "wall": 3501.8} {"step": 15713, "train_loss": 3.297029972076416, "lr": 0.00022087168557999895, "tps": 293679, "wall": 3506.7} {"step": 15714, "train_loss": 3.353952646255493, "lr": 0.00022085252780002624, "tps": 293288, "wall": 3511.5} {"step": 15715, "train_loss": 3.4479293823242188, "lr": 0.00022083337001039603, "tps": 292898, "wall": 3516.5} {"step": 15716, "train_loss": 3.4257049560546875, "lr": 0.0002208142122113254, "tps": 292513, "wall": 3521.3} {"step": 15717, "train_loss": 3.317887783050537, "lr": 0.00022079505440303132, "tps": 292119, "wall": 3526.3} {"step": 15718, "train_loss": 3.384927988052368, "lr": 0.00022077589658573077, "tps": 291738, "wall": 3531.1} {"step": 15719, "train_loss": 3.2792551517486572, "lr": 0.0002207567387596409, "tps": 291356, "wall": 3536.0} {"step": 15720, "train_loss": 3.3559775352478027, "lr": 0.00022073758092497857, "tps": 290975, "wall": 3540.8} {"step": 15721, "train_loss": 3.4011449813842773, "lr": 0.00022071842308196091, "tps": 290592, "wall": 3545.7} {"step": 15722, "train_loss": 3.382441520690918, "lr": 0.00022069926523080497, "tps": 290212, "wall": 3550.6} {"step": 15723, "train_loss": 3.325709342956543, "lr": 0.00022068010737172767, "tps": 289834, "wall": 3555.4} {"step": 15724, "train_loss": 3.4000988006591797, "lr": 0.00022066094950494604, "tps": 289455, "wall": 3560.3} {"step": 15725, "train_loss": 3.3437066078186035, "lr": 0.0002206417916306772, "tps": 289078, "wall": 3565.2} {"step": 15726, "train_loss": 3.3920469284057617, "lr": 0.00022062263374913806, "tps": 288702, "wall": 3570.1} {"step": 15727, "train_loss": 3.3950655460357666, "lr": 0.00022060347586054575, "tps": 288328, "wall": 3574.9} {"step": 15728, "train_loss": 3.3437304496765137, "lr": 0.00022058431796511717, "tps": 287955, "wall": 3579.8} {"step": 15729, "train_loss": 3.3896214962005615, "lr": 0.00022056516006306942, "tps": 287582, "wall": 3584.6} {"step": 15730, "train_loss": 3.344179153442383, "lr": 0.0002205460021546195, "tps": 287207, "wall": 3589.6} {"step": 15731, "train_loss": 3.30800461769104, "lr": 0.00022052684423998448, "tps": 286837, "wall": 3594.4} {"step": 15732, "train_loss": 3.3734774589538574, "lr": 0.00022050768631938134, "tps": 286468, "wall": 3599.3} {"step": 15733, "train_loss": 3.304825782775879, "lr": 0.00022048852839302705, "tps": 286100, "wall": 3604.1} {"step": 15734, "train_loss": 3.367417812347412, "lr": 0.00022046937046113873, "tps": 285732, "wall": 3609.0} {"step": 15735, "train_loss": 3.3775317668914795, "lr": 0.0002204502125239334, "tps": 285367, "wall": 3613.9} {"step": 15736, "train_loss": 3.4327170848846436, "lr": 0.00022043105458162794, "tps": 284997, "wall": 3618.8} {"step": 15737, "train_loss": 3.359920024871826, "lr": 0.00022041189663443952, "tps": 284635, "wall": 3623.6} {"step": 15738, "train_loss": 3.324362277984619, "lr": 0.00022039273868258504, "tps": 284272, "wall": 3628.5} {"step": 15739, "train_loss": 3.3680500984191895, "lr": 0.00022037358072628168, "tps": 283908, "wall": 3633.3} {"step": 15740, "train_loss": 3.403779983520508, "lr": 0.00022035442276574637, "tps": 283548, "wall": 3638.2} {"step": 15741, "train_loss": 3.2173571586608887, "lr": 0.00022033526480119608, "tps": 283188, "wall": 3643.0} {"step": 15742, "train_loss": 3.338963508605957, "lr": 0.00022031610683284796, "tps": 282820, "wall": 3648.0} {"step": 15743, "train_loss": 3.399320125579834, "lr": 0.00022029694886091896, "tps": 282461, "wall": 3652.9} {"step": 15744, "train_loss": 3.338987350463867, "lr": 0.00022027779088562607, "tps": 282104, "wall": 3657.7} {"step": 15745, "train_loss": 3.447859048843384, "lr": 0.00022025863290718633, "tps": 281747, "wall": 3662.6} {"step": 15746, "train_loss": 3.257220506668091, "lr": 0.00022023947492581686, "tps": 281391, "wall": 3667.5} {"step": 15747, "train_loss": 3.3771889209747314, "lr": 0.00022022031694173455, "tps": 281036, "wall": 3672.3} {"step": 15748, "train_loss": 3.4979400634765625, "lr": 0.00022020115895515647, "tps": 280682, "wall": 3677.2} {"step": 15749, "train_loss": 3.361757516860962, "lr": 0.00022018200096629974, "tps": 280329, "wall": 3682.1} {"step": 15750, "train_loss": 3.3347394466400146, "lr": 0.00022016284297538116, "tps": 279977, "wall": 3686.9} {"step": 15751, "train_loss": 3.3979692459106445, "lr": 0.000220143684982618, "tps": 279626, "wall": 3691.8} {"step": 15752, "train_loss": 3.272094964981079, "lr": 0.00022012452698822715, "tps": 279276, "wall": 3696.7} {"step": 15753, "train_loss": 3.289857864379883, "lr": 0.00022010536899242554, "tps": 278927, "wall": 3701.5} {"step": 15754, "train_loss": 3.3052520751953125, "lr": 0.0002200862109954304, "tps": 278572, "wall": 3706.5} {"step": 15755, "train_loss": 3.2401187419891357, "lr": 0.00022006705299745861, "tps": 278224, "wall": 3711.3} {"step": 15756, "train_loss": 3.48482346534729, "lr": 0.00022004789499872733, "tps": 277879, "wall": 3716.2} {"step": 15757, "train_loss": 3.330735683441162, "lr": 0.00022002873699945342, "tps": 277533, "wall": 3721.1} {"step": 15758, "train_loss": 3.3358635902404785, "lr": 0.00022000957899985396, "tps": 277186, "wall": 3725.9} {"step": 15759, "train_loss": 3.3825297355651855, "lr": 0.00021999042100014608, "tps": 276844, "wall": 3730.8} {"step": 15760, "train_loss": 3.3321189880371094, "lr": 0.00021997126300054665, "tps": 276501, "wall": 3735.7} {"step": 15761, "train_loss": 3.366182327270508, "lr": 0.00021995210500127277, "tps": 276158, "wall": 3740.5} {"step": 15762, "train_loss": 3.4051332473754883, "lr": 0.00021993294700254143, "tps": 275817, "wall": 3745.4} {"step": 15763, "train_loss": 3.40264892578125, "lr": 0.00021991378900456968, "tps": 275477, "wall": 3750.3} {"step": 15764, "train_loss": 3.2362451553344727, "lr": 0.0002198946310075745, "tps": 275137, "wall": 3755.1} {"step": 15765, "train_loss": 3.3105216026306152, "lr": 0.000219875473011773, "tps": 274799, "wall": 3760.0} {"step": 15766, "train_loss": 3.377619743347168, "lr": 0.00021985631501738215, "tps": 274460, "wall": 3764.9} {"step": 15767, "train_loss": 3.342177391052246, "lr": 0.00021983715702461894, "tps": 274120, "wall": 3769.8} {"step": 15768, "train_loss": 3.3340630531311035, "lr": 0.00021981799903370038, "tps": 273784, "wall": 3774.6} {"step": 15769, "train_loss": 3.386620283126831, "lr": 0.00021979884104484355, "tps": 273450, "wall": 3779.5} {"step": 15770, "train_loss": 3.297699213027954, "lr": 0.00021977968305826555, "tps": 273116, "wall": 3784.4} {"step": 15771, "train_loss": 3.3446359634399414, "lr": 0.00021976052507418327, "tps": 272783, "wall": 3789.2} {"step": 15772, "train_loss": 3.380312442779541, "lr": 0.00021974136709281372, "tps": 272451, "wall": 3794.1} {"step": 15773, "train_loss": 3.3440606594085693, "lr": 0.00021972220911437403, "tps": 272117, "wall": 3799.0} {"step": 15774, "train_loss": 3.284203052520752, "lr": 0.00021970305113908114, "tps": 271788, "wall": 3803.8} {"step": 15775, "train_loss": 3.392465829849243, "lr": 0.0002196838931671521, "tps": 271458, "wall": 3808.7} {"step": 15776, "train_loss": 3.464716911315918, "lr": 0.00021966473519880394, "tps": 271127, "wall": 3813.6} {"step": 15777, "train_loss": 3.398634433746338, "lr": 0.00021964557723425375, "tps": 270790, "wall": 3818.6} {"step": 15778, "train_loss": 3.4368975162506104, "lr": 0.0002196264192737184, "tps": 270463, "wall": 3823.4} {"step": 15779, "train_loss": 3.2922489643096924, "lr": 0.00021960726131741503, "tps": 270133, "wall": 3828.3} {"step": 15780, "train_loss": 3.2608633041381836, "lr": 0.0002195881033655606, "tps": 269807, "wall": 3833.2} {"step": 15781, "train_loss": 3.3177337646484375, "lr": 0.00021956894541837215, "tps": 269482, "wall": 3838.1} {"step": 15782, "train_loss": 3.369267225265503, "lr": 0.0002195497874760667, "tps": 269157, "wall": 3842.9} {"step": 15783, "train_loss": 3.2747251987457275, "lr": 0.00021953062953886137, "tps": 268829, "wall": 3847.9} {"step": 15784, "train_loss": 3.422786235809326, "lr": 0.00021951147160697302, "tps": 268508, "wall": 3852.7} {"step": 15785, "train_loss": 3.2967727184295654, "lr": 0.00021949231368061876, "tps": 268185, "wall": 3857.6} {"step": 15786, "train_loss": 3.535647392272949, "lr": 0.00021947315576001554, "tps": 267865, "wall": 3862.5} {"step": 15787, "train_loss": 3.337050676345825, "lr": 0.00021945399784538053, "tps": 267543, "wall": 3867.3} {"step": 15788, "train_loss": 3.430691719055176, "lr": 0.00021943483993693065, "tps": 267224, "wall": 3872.2} {"step": 15789, "train_loss": 3.3752694129943848, "lr": 0.0002194156820348829, "tps": 266905, "wall": 3877.1} {"step": 15790, "train_loss": 3.392277479171753, "lr": 0.0002193965241394544, "tps": 266588, "wall": 3881.9} {"step": 15791, "train_loss": 3.4091641902923584, "lr": 0.00021937736625086203, "tps": 266265, "wall": 3886.9} {"step": 15792, "train_loss": 3.383291721343994, "lr": 0.0002193582083693229, "tps": 265949, "wall": 3891.8} {"step": 15793, "train_loss": 3.326080322265625, "lr": 0.00021933905049505406, "tps": 265633, "wall": 3896.6} {"step": 15794, "train_loss": 3.384394884109497, "lr": 0.00021931989262827245, "tps": 265318, "wall": 3901.5} {"step": 15795, "train_loss": 3.412874221801758, "lr": 0.00021930073476919516, "tps": 265003, "wall": 3906.4} {"step": 15796, "train_loss": 3.2898309230804443, "lr": 0.00021928157691803916, "tps": 264691, "wall": 3911.2} {"step": 15797, "train_loss": 3.4747557640075684, "lr": 0.00021926241907502153, "tps": 264377, "wall": 3916.1} {"step": 15798, "train_loss": 3.319565773010254, "lr": 0.00021924326124035922, "tps": 264064, "wall": 3921.0} {"step": 15799, "train_loss": 3.412029266357422, "lr": 0.0002192241034142693, "tps": 263753, "wall": 3925.9} {"step": 15800, "train_loss": 3.255417823791504, "lr": 0.00021920494559696878, "tps": 263444, "wall": 3930.7} {"step": 15801, "train_loss": 3.4135494232177734, "lr": 0.00021918578778867468, "tps": 263135, "wall": 3935.6} {"step": 15802, "train_loss": 3.3471145629882812, "lr": 0.00021916662998960402, "tps": 262824, "wall": 3940.5} {"step": 15803, "train_loss": 3.4265599250793457, "lr": 0.00021914747219997383, "tps": 262514, "wall": 3945.4} {"step": 15804, "train_loss": 3.4061272144317627, "lr": 0.0002191283144200011, "tps": 262203, "wall": 3950.3} {"step": 15805, "train_loss": 3.3490958213806152, "lr": 0.00021910915664990287, "tps": 261896, "wall": 3955.2} {"step": 15806, "train_loss": 3.4041588306427, "lr": 0.00021908999888989617, "tps": 261589, "wall": 3960.1} {"step": 15807, "train_loss": 3.2999255657196045, "lr": 0.00021907084114019805, "tps": 261285, "wall": 3965.0} {"step": 15808, "train_loss": 3.3442697525024414, "lr": 0.00021905168340102544, "tps": 260983, "wall": 3969.8} {"step": 15809, "train_loss": 3.35366153717041, "lr": 0.0002190325256725954, "tps": 260680, "wall": 3974.7} {"step": 15810, "train_loss": 3.4066970348358154, "lr": 0.00021901336795512503, "tps": 260375, "wall": 3979.6} {"step": 15811, "train_loss": 3.3101372718811035, "lr": 0.00021899421024883125, "tps": 260075, "wall": 3984.4} {"step": 15812, "train_loss": 3.2736761569976807, "lr": 0.0002189750525539311, "tps": 259774, "wall": 3989.3} {"step": 15813, "train_loss": 3.2490062713623047, "lr": 0.0002189558948706416, "tps": 259473, "wall": 3994.2} {"step": 15814, "train_loss": 3.3149003982543945, "lr": 0.00021893673719917983, "tps": 259173, "wall": 3999.1} {"step": 15815, "train_loss": 3.394164562225342, "lr": 0.0002189175795397627, "tps": 258874, "wall": 4003.9} {"step": 15816, "train_loss": 3.341737985610962, "lr": 0.0002188984218926073, "tps": 258573, "wall": 4008.9} {"step": 15817, "train_loss": 3.3542160987854004, "lr": 0.0002188792642579307, "tps": 258275, "wall": 4013.7} {"step": 15818, "train_loss": 3.354722261428833, "lr": 0.00021886010663594977, "tps": 257978, "wall": 4018.6} {"step": 15819, "train_loss": 3.408067226409912, "lr": 0.00021884094902688164, "tps": 257683, "wall": 4023.5} {"step": 15820, "train_loss": 3.359647035598755, "lr": 0.00021882179143094333, "tps": 257388, "wall": 4028.3} {"step": 15821, "train_loss": 3.400005578994751, "lr": 0.0002188026338483518, "tps": 257094, "wall": 4033.2} {"step": 15822, "train_loss": 3.4393117427825928, "lr": 0.00021878347627932412, "tps": 256799, "wall": 4038.1} {"step": 15823, "train_loss": 3.3812484741210938, "lr": 0.00021876431872407722, "tps": 256505, "wall": 4043.0} {"step": 15824, "train_loss": 3.505404233932495, "lr": 0.00021874516118282827, "tps": 256213, "wall": 4047.8} {"step": 15825, "train_loss": 3.38683819770813, "lr": 0.00021872600365579418, "tps": 255922, "wall": 4052.7} {"step": 15826, "train_loss": 3.2704837322235107, "lr": 0.00021870684614319193, "tps": 255631, "wall": 4057.5} {"step": 15827, "train_loss": 3.2925057411193848, "lr": 0.0002186876886452387, "tps": 255340, "wall": 4062.4} {"step": 15828, "train_loss": 3.3830833435058594, "lr": 0.00021866853116215133, "tps": 255046, "wall": 4067.4} {"step": 15829, "train_loss": 3.4601714611053467, "lr": 0.00021864937369414693, "tps": 254757, "wall": 4072.3} {"step": 15830, "train_loss": 3.3949108123779297, "lr": 0.00021863021624144246, "tps": 254469, "wall": 4077.1} {"step": 15831, "train_loss": 3.3968493938446045, "lr": 0.00021861105880425504, "tps": 254181, "wall": 4082.0} {"step": 15832, "train_loss": 3.2918860912323, "lr": 0.0002185919013828016, "tps": 253895, "wall": 4086.8} {"step": 15833, "train_loss": 3.3373944759368896, "lr": 0.00021857274397729914, "tps": 253609, "wall": 4091.7} {"step": 15834, "train_loss": 3.4393653869628906, "lr": 0.0002185535865879648, "tps": 253323, "wall": 4096.6} {"step": 15835, "train_loss": 3.3488121032714844, "lr": 0.0002185344292150154, "tps": 253038, "wall": 4101.5} {"step": 15836, "train_loss": 3.3660147190093994, "lr": 0.00021851527185866814, "tps": 252754, "wall": 4106.3} {"step": 15837, "train_loss": 3.339256763458252, "lr": 0.00021849611451913998, "tps": 252470, "wall": 4111.2} {"step": 15838, "train_loss": 3.3487048149108887, "lr": 0.00021847695719664784, "tps": 252187, "wall": 4116.1} {"step": 15839, "train_loss": 3.50343918800354, "lr": 0.00021845779989140883, "tps": 251906, "wall": 4120.9} {"step": 15840, "train_loss": 3.3722801208496094, "lr": 0.00021843864260363995, "tps": 251619, "wall": 4125.9} {"step": 15841, "train_loss": 3.4042937755584717, "lr": 0.0002184194853335583, "tps": 251340, "wall": 4130.7} {"step": 15842, "train_loss": 3.290175437927246, "lr": 0.00021840032808138072, "tps": 251060, "wall": 4135.6} {"step": 15843, "train_loss": 3.253774404525757, "lr": 0.00021838117084732427, "tps": 250781, "wall": 4140.5} {"step": 15844, "train_loss": 3.3327555656433105, "lr": 0.00021836201363160612, "tps": 250503, "wall": 4145.3} {"step": 15845, "train_loss": 3.2897019386291504, "lr": 0.00021834285643444306, "tps": 250225, "wall": 4150.2} {"step": 15846, "train_loss": 3.316596508026123, "lr": 0.00021832369925605226, "tps": 249947, "wall": 4155.1} {"step": 15847, "train_loss": 3.389169931411743, "lr": 0.0002183045420966507, "tps": 249670, "wall": 4159.9} {"step": 15848, "train_loss": 3.400139808654785, "lr": 0.00021828538495645536, "tps": 249395, "wall": 4164.8} {"step": 15849, "train_loss": 3.361654758453369, "lr": 0.00021826622783568324, "tps": 249120, "wall": 4169.7} {"step": 15850, "train_loss": 3.365431785583496, "lr": 0.0002182470707345514, "tps": 248843, "wall": 4174.6} {"step": 15851, "train_loss": 3.2851905822753906, "lr": 0.0002182279136532769, "tps": 248569, "wall": 4179.4} {"step": 15852, "train_loss": 3.362095832824707, "lr": 0.00021820875659207665, "tps": 248295, "wall": 4184.3} {"step": 15853, "train_loss": 3.434546709060669, "lr": 0.00021818959955116767, "tps": 248015, "wall": 4189.3} {"step": 15854, "train_loss": 3.4566874504089355, "lr": 0.00021817044253076703, "tps": 247742, "wall": 4194.2} {"step": 15855, "train_loss": 3.36881160736084, "lr": 0.00021815128553109175, "tps": 247471, "wall": 4199.0} {"step": 15856, "train_loss": 3.370640754699707, "lr": 0.00021813212855235876, "tps": 247201, "wall": 4203.9} {"step": 15857, "train_loss": 3.4500315189361572, "lr": 0.0002181129715947851, "tps": 246927, "wall": 4208.8} {"step": 15858, "train_loss": 3.404881000518799, "lr": 0.00021809381465858784, "tps": 246658, "wall": 4213.7} {"step": 15859, "train_loss": 3.432612419128418, "lr": 0.00021807465774398397, "tps": 246389, "wall": 4218.5} {"step": 15860, "train_loss": 3.4067177772521973, "lr": 0.00021805550085119042, "tps": 246119, "wall": 4223.4} {"step": 15861, "train_loss": 3.356961250305176, "lr": 0.00021803634398042431, "tps": 245850, "wall": 4228.3} {"step": 15862, "train_loss": 3.309497356414795, "lr": 0.0002180171871319026, "tps": 245582, "wall": 4233.2} {"step": 15863, "train_loss": 3.3806583881378174, "lr": 0.00021799803030584224, "tps": 245315, "wall": 4238.1} {"step": 15864, "train_loss": 3.420509099960327, "lr": 0.00021797887350246043, "tps": 245049, "wall": 4242.9} {"step": 15865, "train_loss": 3.338224172592163, "lr": 0.00021795971672197392, "tps": 244778, "wall": 4247.9} {"step": 15866, "train_loss": 3.4598190784454346, "lr": 0.00021794055996459993, "tps": 244513, "wall": 4252.8} {"step": 15867, "train_loss": 3.3055853843688965, "lr": 0.00021792140323055535, "tps": 244246, "wall": 4257.7} {"step": 15868, "train_loss": 3.3755722045898438, "lr": 0.00021790224652005723, "tps": 243983, "wall": 4262.6} {"step": 15869, "train_loss": 3.365419864654541, "lr": 0.00021788308983332257, "tps": 243718, "wall": 4267.4} {"step": 15870, "train_loss": 3.3432159423828125, "lr": 0.0002178639331705684, "tps": 243455, "wall": 4272.3} {"step": 15871, "train_loss": 3.3522846698760986, "lr": 0.0002178447765320117, "tps": 243193, "wall": 4277.2} {"step": 15872, "train_loss": 3.344291925430298, "lr": 0.00021782561991786947, "tps": 242931, "wall": 4282.1} {"step": 15873, "train_loss": 3.3171563148498535, "lr": 0.0002178064633283588, "tps": 242671, "wall": 4286.9} {"step": 15874, "train_loss": 3.44685697555542, "lr": 0.00021778730676369658, "tps": 242411, "wall": 4291.8} {"step": 15875, "train_loss": 3.3264126777648926, "lr": 0.0002177681502240999, "tps": 242151, "wall": 4296.7} {"step": 15876, "train_loss": 3.4079060554504395, "lr": 0.00021774899370978568, "tps": 241893, "wall": 4301.5} {"step": 15877, "train_loss": 3.3436436653137207, "lr": 0.00021772983722097097, "tps": 241628, "wall": 4306.5} {"step": 15878, "train_loss": 3.365816831588745, "lr": 0.00021771068075787287, "tps": 241370, "wall": 4311.4} {"step": 15879, "train_loss": 3.2563533782958984, "lr": 0.00021769152432070827, "tps": 241114, "wall": 4316.3} {"step": 15880, "train_loss": 3.304342746734619, "lr": 0.0002176723679096942, "tps": 240858, "wall": 4321.1} {"step": 15881, "train_loss": 3.359701633453369, "lr": 0.00021765321152504767, "tps": 240601, "wall": 4326.0} {"step": 15882, "train_loss": 3.258561611175537, "lr": 0.00021763405516698567, "tps": 240346, "wall": 4330.9} {"step": 15883, "train_loss": 3.4208195209503174, "lr": 0.00021761489883572526, "tps": 240090, "wall": 4335.8} {"step": 15884, "train_loss": 3.3971505165100098, "lr": 0.00021759574253148335, "tps": 239835, "wall": 4340.6} {"step": 15885, "train_loss": 3.389788866043091, "lr": 0.00021757658625447704, "tps": 239582, "wall": 4345.5} {"step": 15886, "train_loss": 3.3404953479766846, "lr": 0.00021755743000492333, "tps": 239328, "wall": 4350.4} {"step": 15887, "train_loss": 3.377140998840332, "lr": 0.0002175382737830391, "tps": 239076, "wall": 4355.2} {"step": 15888, "train_loss": 3.3029139041900635, "lr": 0.0002175191175890415, "tps": 238824, "wall": 4360.1} {"step": 15889, "train_loss": 3.2751572132110596, "lr": 0.00021749996142314743, "tps": 238571, "wall": 4365.0} {"step": 15890, "train_loss": 3.353111982345581, "lr": 0.00021748080528557394, "tps": 238316, "wall": 4370.0} {"step": 15891, "train_loss": 3.5511107444763184, "lr": 0.00021746164917653808, "tps": 238065, "wall": 4374.8} {"step": 15892, "train_loss": 3.2932639122009277, "lr": 0.00021744249309625673, "tps": 237816, "wall": 4379.7} {"step": 15893, "train_loss": 3.3066415786743164, "lr": 0.00021742333704494695, "tps": 237567, "wall": 4384.6} {"step": 15894, "train_loss": 3.3970515727996826, "lr": 0.00021740418102282578, "tps": 237318, "wall": 4389.4} {"step": 15895, "train_loss": 3.300226926803589, "lr": 0.0002173850250301102, "tps": 237070, "wall": 4394.3} {"step": 15896, "train_loss": 3.4592745304107666, "lr": 0.00021736586906701718, "tps": 236823, "wall": 4399.2} {"step": 15897, "train_loss": 3.4722347259521484, "lr": 0.00021734671313376373, "tps": 236576, "wall": 4404.0} {"step": 15898, "train_loss": 3.3475661277770996, "lr": 0.00021732755723056685, "tps": 236329, "wall": 4408.9} {"step": 15899, "train_loss": 3.360032081604004, "lr": 0.00021730840135764359, "tps": 236084, "wall": 4413.8} {"step": 15900, "train_loss": 3.3848347663879395, "lr": 0.00021728924551521085, "tps": 235840, "wall": 4418.6} {"step": 15901, "train_loss": 3.37001371383667, "lr": 0.00021727008970348575, "tps": 235594, "wall": 4423.5} {"step": 15902, "train_loss": 3.423879384994507, "lr": 0.00021725093392268514, "tps": 235346, "wall": 4428.4} {"step": 15903, "train_loss": 3.4129843711853027, "lr": 0.00021723177817302615, "tps": 235102, "wall": 4433.3} {"step": 15904, "train_loss": 3.4080240726470947, "lr": 0.0002172126224547257, "tps": 234860, "wall": 4438.2} {"step": 15905, "train_loss": 3.391191005706787, "lr": 0.00021719346676800084, "tps": 234618, "wall": 4443.0} {"step": 15906, "train_loss": 3.328223466873169, "lr": 0.00021717431111306854, "tps": 234376, "wall": 4447.9} {"step": 15907, "train_loss": 3.301375150680542, "lr": 0.0002171551554901458, "tps": 234135, "wall": 4452.7} {"step": 15908, "train_loss": 3.3354763984680176, "lr": 0.0002171359998994496, "tps": 233895, "wall": 4457.6} {"step": 15909, "train_loss": 3.3510994911193848, "lr": 0.00021711684434119698, "tps": 233654, "wall": 4462.5} {"step": 15910, "train_loss": 3.3514814376831055, "lr": 0.00021709768881560484, "tps": 233414, "wall": 4467.3} {"step": 15911, "train_loss": 3.3156681060791016, "lr": 0.00021707853332289024, "tps": 233174, "wall": 4472.2} {"step": 15912, "train_loss": 3.3395397663116455, "lr": 0.0002170593778632702, "tps": 232936, "wall": 4477.1} {"step": 15913, "train_loss": 3.3870725631713867, "lr": 0.0002170402224369617, "tps": 232698, "wall": 4481.9} {"step": 15914, "train_loss": 3.4042880535125732, "lr": 0.00021702106704418167, "tps": 232456, "wall": 4486.9} {"step": 15915, "train_loss": 3.346757411956787, "lr": 0.00021700191168514725, "tps": 232219, "wall": 4491.8} {"step": 15916, "train_loss": 3.362051010131836, "lr": 0.00021698275636007527, "tps": 231981, "wall": 4496.6} {"step": 15917, "train_loss": 3.364349365234375, "lr": 0.00021696360106918276, "tps": 231746, "wall": 4501.5} {"step": 15918, "train_loss": 3.429513692855835, "lr": 0.00021694444581268684, "tps": 231511, "wall": 4506.3} {"step": 15919, "train_loss": 3.2862870693206787, "lr": 0.0002169252905908043, "tps": 231275, "wall": 4511.2} {"step": 15920, "train_loss": 3.319549083709717, "lr": 0.00021690613540375226, "tps": 231041, "wall": 4516.1} {"step": 15921, "train_loss": 3.3373215198516846, "lr": 0.0002168869802517477, "tps": 230807, "wall": 4520.9} {"step": 15922, "train_loss": 3.3021507263183594, "lr": 0.00021686782513500764, "tps": 230573, "wall": 4525.8} {"step": 15923, "train_loss": 3.30557918548584, "lr": 0.00021684867005374896, "tps": 230339, "wall": 4530.7} {"step": 15924, "train_loss": 3.3967549800872803, "lr": 0.00021682951500818874, "tps": 230107, "wall": 4535.5} {"step": 15925, "train_loss": 3.4235246181488037, "lr": 0.00021681035999854395, "tps": 229876, "wall": 4540.4} {"step": 15926, "train_loss": 3.349656581878662, "lr": 0.0002167912050250316, "tps": 229645, "wall": 4545.2} {"step": 15927, "train_loss": 3.435185432434082, "lr": 0.0002167720500878686, "tps": 229411, "wall": 4550.2} {"step": 15928, "train_loss": 3.2573766708374023, "lr": 0.00021675289518727212, "tps": 229180, "wall": 4555.0} {"step": 15929, "train_loss": 3.373008966445923, "lr": 0.00021673374032345888, "tps": 228951, "wall": 4559.9} {"step": 15930, "train_loss": 3.358643054962158, "lr": 0.00021671458549664605, "tps": 228721, "wall": 4564.7} {"step": 15931, "train_loss": 3.318793535232544, "lr": 0.00021669543070705055, "tps": 228493, "wall": 4569.6} {"step": 15932, "train_loss": 3.3621697425842285, "lr": 0.0002166762759548894, "tps": 228264, "wall": 4574.4} {"step": 15933, "train_loss": 3.377203941345215, "lr": 0.00021665712124037962, "tps": 228034, "wall": 4579.4} {"step": 15934, "train_loss": 3.321779251098633, "lr": 0.00021663796656373808, "tps": 227806, "wall": 4584.2} {"step": 15935, "train_loss": 3.271421432495117, "lr": 0.00021661881192518186, "tps": 227579, "wall": 4589.1} {"step": 15936, "train_loss": 3.4196348190307617, "lr": 0.0002165996573249279, "tps": 227353, "wall": 4593.9} {"step": 15937, "train_loss": 3.4347176551818848, "lr": 0.00021658050276319332, "tps": 227126, "wall": 4598.8} {"step": 15938, "train_loss": 3.279947519302368, "lr": 0.00021656134824019483, "tps": 226900, "wall": 4603.7} {"step": 15939, "train_loss": 3.51542592048645, "lr": 0.00021654219375614968, "tps": 226673, "wall": 4608.6} {"step": 15940, "train_loss": 3.3966221809387207, "lr": 0.0002165230393112747, "tps": 226448, "wall": 4613.5} {"step": 15941, "train_loss": 3.3214097023010254, "lr": 0.00021650388490578694, "tps": 226223, "wall": 4618.3} {"step": 15942, "train_loss": 3.332789421081543, "lr": 0.00021648473053990333, "tps": 225999, "wall": 4623.2} {"step": 15943, "train_loss": 3.335054636001587, "lr": 0.00021646557621384096, "tps": 225776, "wall": 4628.1} {"step": 15944, "train_loss": 3.3918581008911133, "lr": 0.00021644642192781665, "tps": 225552, "wall": 4632.9} {"step": 15945, "train_loss": 3.422327756881714, "lr": 0.00021642726768204747, "tps": 225330, "wall": 4637.8} {"step": 15946, "train_loss": 3.3999533653259277, "lr": 0.00021640811347675042, "tps": 225108, "wall": 4642.7} {"step": 15947, "train_loss": 3.328138828277588, "lr": 0.0002163889593121425, "tps": 224886, "wall": 4647.5} {"step": 15948, "train_loss": 3.498173236846924, "lr": 0.00021636980518844058, "tps": 224665, "wall": 4652.4} {"step": 15949, "train_loss": 3.380591630935669, "lr": 0.00021635065110586172, "tps": 224445, "wall": 4657.3} {"step": 15950, "train_loss": 3.36757230758667, "lr": 0.00021633149706462291, "tps": 224224, "wall": 4662.1} {"step": 15951, "train_loss": 3.397224187850952, "lr": 0.00021631234306494106, "tps": 224001, "wall": 4667.1} {"step": 15952, "train_loss": 3.3034815788269043, "lr": 0.00021629318910703317, "tps": 223781, "wall": 4672.0} {"step": 15953, "train_loss": 3.3692374229431152, "lr": 0.0002162740351911163, "tps": 223562, "wall": 4676.8} {"step": 15954, "train_loss": 3.3892154693603516, "lr": 0.00021625488131740732, "tps": 223343, "wall": 4681.7} {"step": 15955, "train_loss": 3.283298969268799, "lr": 0.00021623572748612321, "tps": 223125, "wall": 4686.6} {"step": 15956, "train_loss": 3.2647554874420166, "lr": 0.00021621657369748105, "tps": 222908, "wall": 4691.4} {"step": 15957, "train_loss": 3.301565408706665, "lr": 0.00021619741995169774, "tps": 222690, "wall": 4696.3} {"step": 15958, "train_loss": 3.427661895751953, "lr": 0.00021617826624899022, "tps": 222473, "wall": 4701.2} {"step": 15959, "train_loss": 3.2826974391937256, "lr": 0.00021615911258957552, "tps": 222257, "wall": 4706.0} {"step": 15960, "train_loss": 3.3196868896484375, "lr": 0.00021613995897367064, "tps": 222042, "wall": 4710.9} {"step": 15961, "train_loss": 3.2425272464752197, "lr": 0.0002161208054014925, "tps": 221826, "wall": 4715.8} {"step": 15962, "train_loss": 3.2656774520874023, "lr": 0.00021610165187325805, "tps": 221611, "wall": 4720.6} {"step": 15963, "train_loss": 3.327888011932373, "lr": 0.00021608249838918432, "tps": 221395, "wall": 4725.5} {"step": 15964, "train_loss": 3.277083396911621, "lr": 0.00021606334494948825, "tps": 221180, "wall": 4730.5} {"step": 15965, "train_loss": 3.3671512603759766, "lr": 0.00021604419155438683, "tps": 220966, "wall": 4735.3} {"step": 15966, "train_loss": 3.373054027557373, "lr": 0.00021602503820409706, "tps": 220752, "wall": 4740.2} {"step": 15967, "train_loss": 3.3648691177368164, "lr": 0.00021600588489883586, "tps": 220539, "wall": 4745.1} {"step": 15968, "train_loss": 3.3420462608337402, "lr": 0.00021598673163882018, "tps": 220327, "wall": 4749.9} {"step": 15969, "train_loss": 3.380439281463623, "lr": 0.000215967578424267, "tps": 220115, "wall": 4754.8} {"step": 15970, "train_loss": 3.325399875640869, "lr": 0.00021594842525539339, "tps": 219904, "wall": 4759.7} {"step": 15971, "train_loss": 3.414844512939453, "lr": 0.00021592927213241617, "tps": 219693, "wall": 4764.5} {"step": 15972, "train_loss": 3.2720580101013184, "lr": 0.00021591011905555237, "tps": 219482, "wall": 4769.4} {"step": 15973, "train_loss": 3.3761978149414062, "lr": 0.00021589096602501898, "tps": 219272, "wall": 4774.3} {"step": 15974, "train_loss": 3.342987060546875, "lr": 0.00021587181304103296, "tps": 219062, "wall": 4779.2} {"step": 15975, "train_loss": 3.3393807411193848, "lr": 0.00021585266010381123, "tps": 218853, "wall": 4784.0} {"step": 15976, "train_loss": 3.3270702362060547, "lr": 0.00021583350721357083, "tps": 218641, "wall": 4789.0} {"step": 15977, "train_loss": 3.4047696590423584, "lr": 0.0002158143543705287, "tps": 218433, "wall": 4793.8} {"step": 15978, "train_loss": 3.28541898727417, "lr": 0.00021579520157490175, "tps": 218225, "wall": 4798.7} {"step": 15979, "train_loss": 3.3844027519226074, "lr": 0.000215776048826907, "tps": 218018, "wall": 4803.6} {"step": 15980, "train_loss": 3.322357177734375, "lr": 0.00021575689612676145, "tps": 217811, "wall": 4808.4} {"step": 15981, "train_loss": 3.3704864978790283, "lr": 0.00021573774347468194, "tps": 217604, "wall": 4813.3} {"step": 15982, "train_loss": 3.2761330604553223, "lr": 0.0002157185908708855, "tps": 217398, "wall": 4818.2} {"step": 15983, "train_loss": 3.36625599861145, "lr": 0.00021569943831558912, "tps": 217192, "wall": 4823.0} {"step": 15984, "train_loss": 3.3919670581817627, "lr": 0.00021568028580900975, "tps": 216987, "wall": 4827.9} {"step": 15985, "train_loss": 3.3648483753204346, "lr": 0.0002156611333513643, "tps": 216782, "wall": 4832.8} {"step": 15986, "train_loss": 3.261866569519043, "lr": 0.00021564198094286977, "tps": 216578, "wall": 4837.6} {"step": 15987, "train_loss": 3.2250754833221436, "lr": 0.00021562282858374315, "tps": 216374, "wall": 4842.5} {"step": 15988, "train_loss": 3.357863187789917, "lr": 0.00021560367627420135, "tps": 216168, "wall": 4847.4} {"step": 15989, "train_loss": 3.4219679832458496, "lr": 0.0002155845240144613, "tps": 215964, "wall": 4852.3} {"step": 15990, "train_loss": 3.3493728637695312, "lr": 0.00021556537180474005, "tps": 215762, "wall": 4857.1} {"step": 15991, "train_loss": 3.3581292629241943, "lr": 0.0002155462196452545, "tps": 215558, "wall": 4862.0} {"step": 15992, "train_loss": 3.391899824142456, "lr": 0.0002155270675362216, "tps": 215356, "wall": 4866.9} {"step": 15993, "train_loss": 3.3671162128448486, "lr": 0.00021550791547785832, "tps": 215155, "wall": 4871.8} {"step": 15994, "train_loss": 3.3649635314941406, "lr": 0.00021548876347038168, "tps": 214954, "wall": 4876.6} {"step": 15995, "train_loss": 3.345458507537842, "lr": 0.00021546961151400852, "tps": 214752, "wall": 4881.5} {"step": 15996, "train_loss": 3.2848312854766846, "lr": 0.0002154504596089558, "tps": 214552, "wall": 4886.4} {"step": 15997, "train_loss": 3.3627970218658447, "lr": 0.00021543130775544058, "tps": 214351, "wall": 4891.2} {"step": 15998, "train_loss": 3.272606134414673, "lr": 0.00021541215595367974, "tps": 214152, "wall": 4896.1} {"step": 15999, "train_loss": 3.2719039916992188, "lr": 0.00021539300420389022, "tps": 213951, "wall": 4901.0} {"step": 16000, "train_loss": 3.3468406200408936, "lr": 0.00021537385250628902, "tps": 213749, "wall": 4905.9, "val_loss_monitor": 3.406688105974617} {"step": 16001, "train_loss": 3.2903106212615967, "lr": 0.00021535470086109308, "tps": 211505, "wall": 4958.3} {"step": 16002, "train_loss": 3.4141016006469727, "lr": 0.00021533554926851935, "tps": 211310, "wall": 4963.2} {"step": 16003, "train_loss": 3.3430585861206055, "lr": 0.00021531639772878473, "tps": 211112, "wall": 4968.1} {"step": 16004, "train_loss": 3.346071720123291, "lr": 0.00021529724624210625, "tps": 210917, "wall": 4973.0} {"step": 16005, "train_loss": 3.1809539794921875, "lr": 0.0002152780948087008, "tps": 210723, "wall": 4977.9} {"step": 16006, "train_loss": 3.332352638244629, "lr": 0.0002152589434287853, "tps": 210529, "wall": 4982.8} {"step": 16007, "train_loss": 3.3963069915771484, "lr": 0.00021523979210257683, "tps": 210336, "wall": 4987.7} {"step": 16008, "train_loss": 3.492130756378174, "lr": 0.0002152206408302922, "tps": 210144, "wall": 4992.6} {"step": 16009, "train_loss": 3.3162522315979004, "lr": 0.00021520148961214842, "tps": 209951, "wall": 4997.5} {"step": 16010, "train_loss": 3.3701324462890625, "lr": 0.00021518233844836245, "tps": 209759, "wall": 5002.4} {"step": 16011, "train_loss": 3.4376282691955566, "lr": 0.00021516318733915118, "tps": 209567, "wall": 5007.3} {"step": 16012, "train_loss": 3.3648176193237305, "lr": 0.00021514403628473158, "tps": 209377, "wall": 5012.1} {"step": 16013, "train_loss": 3.299529552459717, "lr": 0.00021512488528532063, "tps": 209186, "wall": 5017.0} {"step": 16014, "train_loss": 3.379199981689453, "lr": 0.00021510573434113526, "tps": 208996, "wall": 5021.9} {"step": 16015, "train_loss": 3.4195125102996826, "lr": 0.00021508658345239235, "tps": 208802, "wall": 5026.9} {"step": 16016, "train_loss": 3.3797950744628906, "lr": 0.00021506743261930886, "tps": 208612, "wall": 5031.8} {"step": 16017, "train_loss": 3.400657892227173, "lr": 0.00021504828184210179, "tps": 208424, "wall": 5036.6} {"step": 16018, "train_loss": 3.3218741416931152, "lr": 0.00021502913112098814, "tps": 208235, "wall": 5041.5} {"step": 16019, "train_loss": 3.350435256958008, "lr": 0.0002150099804561846, "tps": 208047, "wall": 5046.4} {"step": 16020, "train_loss": 3.3815343379974365, "lr": 0.00021499082984790838, "tps": 207860, "wall": 5051.2} {"step": 16021, "train_loss": 3.4273204803466797, "lr": 0.00021497167929637628, "tps": 207671, "wall": 5056.2} {"step": 16022, "train_loss": 3.443614959716797, "lr": 0.00021495252880180532, "tps": 207483, "wall": 5061.0} {"step": 16023, "train_loss": 3.291083812713623, "lr": 0.0002149333783644123, "tps": 207296, "wall": 5065.9} {"step": 16024, "train_loss": 3.4405035972595215, "lr": 0.0002149142279844143, "tps": 207109, "wall": 5070.8} {"step": 16025, "train_loss": 3.239487648010254, "lr": 0.0002148950776620282, "tps": 206924, "wall": 5075.7} {"step": 16026, "train_loss": 3.380115509033203, "lr": 0.00021487592739747094, "tps": 206739, "wall": 5080.5} {"step": 16027, "train_loss": 3.359989643096924, "lr": 0.0002148567771909594, "tps": 206552, "wall": 5085.4} {"step": 16028, "train_loss": 3.3608956336975098, "lr": 0.0002148376270427106, "tps": 206365, "wall": 5090.4} {"step": 16029, "train_loss": 3.384009838104248, "lr": 0.00021481847695294147, "tps": 206180, "wall": 5095.3} {"step": 16030, "train_loss": 3.454972267150879, "lr": 0.00021479932692186884, "tps": 205996, "wall": 5100.1} {"step": 16031, "train_loss": 3.359016180038452, "lr": 0.0002147801769497098, "tps": 205808, "wall": 5105.1} {"step": 16032, "train_loss": 3.363464832305908, "lr": 0.00021476102703668116, "tps": 205626, "wall": 5109.9} {"step": 16033, "train_loss": 3.44014310836792, "lr": 0.00021474187718299988, "tps": 205443, "wall": 5114.8} {"step": 16034, "train_loss": 3.303687572479248, "lr": 0.0002147227273888829, "tps": 205260, "wall": 5119.7} {"step": 16035, "train_loss": 3.3975210189819336, "lr": 0.0002147035776545472, "tps": 205077, "wall": 5124.6} {"step": 16036, "train_loss": 3.410458564758301, "lr": 0.00021468442798020955, "tps": 204895, "wall": 5129.4} {"step": 16037, "train_loss": 3.3755786418914795, "lr": 0.00021466527836608705, "tps": 204713, "wall": 5134.3} {"step": 16038, "train_loss": 3.4185173511505127, "lr": 0.0002146461288123966, "tps": 204532, "wall": 5139.2} {"step": 16039, "train_loss": 3.330522298812866, "lr": 0.00021462697931935506, "tps": 204352, "wall": 5144.0} {"step": 16040, "train_loss": 3.30886173248291, "lr": 0.0002146078298871794, "tps": 204169, "wall": 5149.0} {"step": 16041, "train_loss": 3.3407983779907227, "lr": 0.00021458868051608653, "tps": 203989, "wall": 5153.8} {"step": 16042, "train_loss": 3.260725259780884, "lr": 0.00021456953120629337, "tps": 203809, "wall": 5158.7} {"step": 16043, "train_loss": 3.3793163299560547, "lr": 0.00021455038195801685, "tps": 203629, "wall": 5163.6} {"step": 16044, "train_loss": 3.292628049850464, "lr": 0.0002145312327714739, "tps": 203451, "wall": 5168.4} {"step": 16045, "train_loss": 3.332819938659668, "lr": 0.00021451208364688148, "tps": 203272, "wall": 5173.3} {"step": 16046, "train_loss": 3.2267117500305176, "lr": 0.0002144929345844564, "tps": 203093, "wall": 5178.2} {"step": 16047, "train_loss": 3.3898792266845703, "lr": 0.0002144737855844157, "tps": 202914, "wall": 5183.1} {"step": 16048, "train_loss": 3.3240151405334473, "lr": 0.00021445463664697626, "tps": 202737, "wall": 5187.9} {"step": 16049, "train_loss": 3.335667848587036, "lr": 0.000214435487772355, "tps": 202559, "wall": 5192.8} {"step": 16050, "train_loss": 3.3439278602600098, "lr": 0.00021441633896076884, "tps": 202382, "wall": 5197.7} {"step": 16051, "train_loss": 3.378347635269165, "lr": 0.00021439719021243468, "tps": 202205, "wall": 5202.6} {"step": 16052, "train_loss": 3.3405203819274902, "lr": 0.00021437804152756943, "tps": 202026, "wall": 5207.5} {"step": 16053, "train_loss": 3.4111013412475586, "lr": 0.00021435889290639004, "tps": 201849, "wall": 5212.4} {"step": 16054, "train_loss": 3.4447927474975586, "lr": 0.00021433974434911343, "tps": 201673, "wall": 5217.2} {"step": 16055, "train_loss": 3.3132643699645996, "lr": 0.00021432059585595653, "tps": 201498, "wall": 5222.1} {"step": 16056, "train_loss": 3.394108295440674, "lr": 0.0002143014474271362, "tps": 201322, "wall": 5227.0} {"step": 16057, "train_loss": 3.3567001819610596, "lr": 0.00021428229906286932, "tps": 201148, "wall": 5231.9} {"step": 16058, "train_loss": 3.3995137214660645, "lr": 0.00021426315076337297, "tps": 200973, "wall": 5236.7} {"step": 16059, "train_loss": 3.367359161376953, "lr": 0.0002142440025288639, "tps": 200798, "wall": 5241.6} {"step": 16060, "train_loss": 3.334862232208252, "lr": 0.0002142248543595591, "tps": 200625, "wall": 5246.5} {"step": 16061, "train_loss": 3.259598970413208, "lr": 0.00021420570625567544, "tps": 200452, "wall": 5251.3} {"step": 16062, "train_loss": 3.3643174171447754, "lr": 0.00021418655821742988, "tps": 200278, "wall": 5256.2} {"step": 16063, "train_loss": 3.234006404876709, "lr": 0.00021416741024503927, "tps": 200106, "wall": 5261.0} {"step": 16064, "train_loss": 3.3092637062072754, "lr": 0.0002141482623387206, "tps": 199930, "wall": 5266.0} {"step": 16065, "train_loss": 3.3595752716064453, "lr": 0.00021412911449869074, "tps": 199759, "wall": 5270.8} {"step": 16066, "train_loss": 3.34059739112854, "lr": 0.00021410996672516653, "tps": 199587, "wall": 5275.7} {"step": 16067, "train_loss": 3.3155834674835205, "lr": 0.0002140908190183649, "tps": 199416, "wall": 5280.6} {"step": 16068, "train_loss": 3.4328041076660156, "lr": 0.00021407167137850287, "tps": 199245, "wall": 5285.4} {"step": 16069, "train_loss": 3.3553500175476074, "lr": 0.00021405252380579727, "tps": 199074, "wall": 5290.3} {"step": 16070, "train_loss": 3.3052759170532227, "lr": 0.000214033376300465, "tps": 198904, "wall": 5295.2} {"step": 16071, "train_loss": 3.3475732803344727, "lr": 0.00021401422886272288, "tps": 198734, "wall": 5300.0} {"step": 16072, "train_loss": 3.326918363571167, "lr": 0.00021399508149278802, "tps": 198564, "wall": 5304.9} {"step": 16073, "train_loss": 3.307292938232422, "lr": 0.00021397593419087715, "tps": 198395, "wall": 5309.7} {"step": 16074, "train_loss": 3.343424081802368, "lr": 0.00021395678695720717, "tps": 198226, "wall": 5314.6} {"step": 16075, "train_loss": 3.355404853820801, "lr": 0.00021393763979199513, "tps": 198057, "wall": 5319.5} {"step": 16076, "train_loss": 3.3185224533081055, "lr": 0.0002139184926954578, "tps": 197889, "wall": 5324.3} {"step": 16077, "train_loss": 3.4013471603393555, "lr": 0.0002138993456678121, "tps": 197718, "wall": 5329.2} {"step": 16078, "train_loss": 3.3784589767456055, "lr": 0.00021388019870927492, "tps": 197550, "wall": 5334.1} {"step": 16079, "train_loss": 3.3512518405914307, "lr": 0.00021386105182006322, "tps": 197383, "wall": 5338.9} {"step": 16080, "train_loss": 3.2841506004333496, "lr": 0.00021384190500039384, "tps": 197216, "wall": 5343.8} {"step": 16081, "train_loss": 3.298590660095215, "lr": 0.00021382275825048366, "tps": 197049, "wall": 5348.7} {"step": 16082, "train_loss": 3.2275686264038086, "lr": 0.0002138036115705497, "tps": 196882, "wall": 5353.5} {"step": 16083, "train_loss": 3.376380681991577, "lr": 0.0002137844649608087, "tps": 196716, "wall": 5358.4} {"step": 16084, "train_loss": 3.378798246383667, "lr": 0.0002137653184214776, "tps": 196550, "wall": 5363.2} {"step": 16085, "train_loss": 3.3051328659057617, "lr": 0.00021374617195277335, "tps": 196384, "wall": 5368.1} {"step": 16086, "train_loss": 3.3752248287200928, "lr": 0.00021372702555491277, "tps": 196220, "wall": 5372.9} {"step": 16087, "train_loss": 3.4279592037200928, "lr": 0.00021370787922811278, "tps": 196054, "wall": 5377.8} {"step": 16088, "train_loss": 3.305382490158081, "lr": 0.00021368873297259033, "tps": 195889, "wall": 5382.7} {"step": 16089, "train_loss": 3.3562934398651123, "lr": 0.0002136695867885622, "tps": 195723, "wall": 5387.6} {"step": 16090, "train_loss": 3.4712729454040527, "lr": 0.00021365044067624535, "tps": 195559, "wall": 5392.4} {"step": 16091, "train_loss": 3.3255486488342285, "lr": 0.00021363129463585666, "tps": 195395, "wall": 5397.3} {"step": 16092, "train_loss": 3.4176025390625, "lr": 0.00021361214866761304, "tps": 195232, "wall": 5402.1} {"step": 16093, "train_loss": 3.330319404602051, "lr": 0.00021359300277173126, "tps": 195069, "wall": 5407.0} {"step": 16094, "train_loss": 3.3802120685577393, "lr": 0.00021357385694842834, "tps": 194906, "wall": 5411.8} {"step": 16095, "train_loss": 3.377474784851074, "lr": 0.00021355471119792116, "tps": 194743, "wall": 5416.7} {"step": 16096, "train_loss": 3.3283307552337646, "lr": 0.00021353556552042652, "tps": 194580, "wall": 5421.6} {"step": 16097, "train_loss": 3.3353066444396973, "lr": 0.0002135164199161614, "tps": 194418, "wall": 5426.4} {"step": 16098, "train_loss": 3.448390007019043, "lr": 0.00021349727438534254, "tps": 194256, "wall": 5431.3} {"step": 16099, "train_loss": 3.348693609237671, "lr": 0.0002134781289281869, "tps": 194095, "wall": 5436.1} {"step": 16100, "train_loss": 3.3848390579223633, "lr": 0.00021345898354491145, "tps": 193933, "wall": 5441.0} {"step": 16101, "train_loss": 3.3374624252319336, "lr": 0.00021343983823573291, "tps": 193769, "wall": 5446.0} {"step": 16102, "train_loss": 3.1517205238342285, "lr": 0.00021342069300086825, "tps": 193609, "wall": 5450.8} {"step": 16103, "train_loss": 3.3012802600860596, "lr": 0.0002134015478405344, "tps": 193449, "wall": 5455.7} {"step": 16104, "train_loss": 3.3396317958831787, "lr": 0.00021338240275494812, "tps": 193289, "wall": 5460.5} {"step": 16105, "train_loss": 3.3637094497680664, "lr": 0.00021336325774432634, "tps": 193128, "wall": 5465.4} {"step": 16106, "train_loss": 3.2944843769073486, "lr": 0.0002133441128088859, "tps": 192969, "wall": 5470.2} {"step": 16107, "train_loss": 3.3079559803009033, "lr": 0.00021332496794884383, "tps": 192809, "wall": 5475.1} {"step": 16108, "train_loss": 3.242400646209717, "lr": 0.00021330582316441676, "tps": 192650, "wall": 5480.0} {"step": 16109, "train_loss": 3.255368232727051, "lr": 0.00021328667845582172, "tps": 192491, "wall": 5484.8} {"step": 16110, "train_loss": 3.3232574462890625, "lr": 0.0002132675338232756, "tps": 192333, "wall": 5489.7} {"step": 16111, "train_loss": 3.347022533416748, "lr": 0.00021324838926699516, "tps": 192175, "wall": 5494.6} {"step": 16112, "train_loss": 3.28820538520813, "lr": 0.00021322924478719735, "tps": 192017, "wall": 5499.4} {"step": 16113, "train_loss": 3.2961740493774414, "lr": 0.00021321010038409904, "tps": 191859, "wall": 5504.3} {"step": 16114, "train_loss": 3.3041932582855225, "lr": 0.0002131909560579171, "tps": 191698, "wall": 5509.2} {"step": 16115, "train_loss": 3.3925793170928955, "lr": 0.00021317181180886832, "tps": 191541, "wall": 5514.1} {"step": 16116, "train_loss": 3.4419422149658203, "lr": 0.00021315266763716962, "tps": 191384, "wall": 5518.9} {"step": 16117, "train_loss": 3.4008076190948486, "lr": 0.00021313352354303792, "tps": 191228, "wall": 5523.8} {"step": 16118, "train_loss": 3.3315887451171875, "lr": 0.00021311437952669003, "tps": 191072, "wall": 5528.7} {"step": 16119, "train_loss": 3.2868731021881104, "lr": 0.00021309523558834278, "tps": 190916, "wall": 5533.5} {"step": 16120, "train_loss": 3.296583414077759, "lr": 0.0002130760917282131, "tps": 190758, "wall": 5538.4} {"step": 16121, "train_loss": 3.4065566062927246, "lr": 0.00021305694794651787, "tps": 190603, "wall": 5543.3} {"step": 16122, "train_loss": 3.386280059814453, "lr": 0.0002130378042434739, "tps": 190448, "wall": 5548.1} {"step": 16123, "train_loss": 3.4493117332458496, "lr": 0.00021301866061929797, "tps": 190292, "wall": 5553.0} {"step": 16124, "train_loss": 3.3854763507843018, "lr": 0.00021299951707420714, "tps": 190138, "wall": 5557.9} {"step": 16125, "train_loss": 3.458404779434204, "lr": 0.00021298037360841806, "tps": 189983, "wall": 5562.8} {"step": 16126, "train_loss": 3.4356744289398193, "lr": 0.00021296123022214775, "tps": 189826, "wall": 5567.7} {"step": 16127, "train_loss": 3.3931331634521484, "lr": 0.00021294208691561303, "tps": 189672, "wall": 5572.6} {"step": 16128, "train_loss": 3.369709014892578, "lr": 0.00021292294368903067, "tps": 189518, "wall": 5577.4} {"step": 16129, "train_loss": 3.284975290298462, "lr": 0.0002129038005426176, "tps": 189365, "wall": 5582.3} {"step": 16130, "train_loss": 3.3224244117736816, "lr": 0.00021288465747659068, "tps": 189211, "wall": 5587.2} {"step": 16131, "train_loss": 3.286087989807129, "lr": 0.00021286551449116673, "tps": 189058, "wall": 5592.1} {"step": 16132, "train_loss": 3.52976131439209, "lr": 0.00021284637158656264, "tps": 188906, "wall": 5596.9} {"step": 16133, "train_loss": 3.360110282897949, "lr": 0.00021282722876299524, "tps": 188752, "wall": 5601.8} {"step": 16134, "train_loss": 3.3637051582336426, "lr": 0.00021280808602068137, "tps": 188601, "wall": 5606.7} {"step": 16135, "train_loss": 3.492581605911255, "lr": 0.0002127889433598379, "tps": 188448, "wall": 5611.5} {"step": 16136, "train_loss": 3.354729652404785, "lr": 0.00021276980078068161, "tps": 188297, "wall": 5616.4} {"step": 16137, "train_loss": 3.3730311393737793, "lr": 0.0002127506582834295, "tps": 188146, "wall": 5621.3} {"step": 16138, "train_loss": 3.378957748413086, "lr": 0.0002127315158682982, "tps": 187992, "wall": 5626.2} {"step": 16139, "train_loss": 3.2570371627807617, "lr": 0.00021271237353550482, "tps": 187841, "wall": 5631.1} {"step": 16140, "train_loss": 3.354811191558838, "lr": 0.00021269323128526594, "tps": 187691, "wall": 5635.9} {"step": 16141, "train_loss": 3.317817449569702, "lr": 0.00021267408911779863, "tps": 187540, "wall": 5640.8} {"step": 16142, "train_loss": 3.3688533306121826, "lr": 0.00021265494703331963, "tps": 187390, "wall": 5645.7} {"step": 16143, "train_loss": 3.2594685554504395, "lr": 0.00021263580503204574, "tps": 187240, "wall": 5650.5} {"step": 16144, "train_loss": 3.3611984252929688, "lr": 0.00021261666311419387, "tps": 187092, "wall": 5655.4} {"step": 16145, "train_loss": 3.4306447505950928, "lr": 0.00021259752127998085, "tps": 186943, "wall": 5660.2} {"step": 16146, "train_loss": 3.3423664569854736, "lr": 0.0002125783795296235, "tps": 186792, "wall": 5665.2} {"step": 16147, "train_loss": 3.3520078659057617, "lr": 0.00021255923786333872, "tps": 186644, "wall": 5670.0} {"step": 16148, "train_loss": 3.353149890899658, "lr": 0.00021254009628134322, "tps": 186494, "wall": 5674.9} {"step": 16149, "train_loss": 3.434246063232422, "lr": 0.0002125209547838539, "tps": 186345, "wall": 5679.8} {"step": 16150, "train_loss": 3.297914505004883, "lr": 0.0002125018133710876, "tps": 186198, "wall": 5684.6} {"step": 16151, "train_loss": 3.3339054584503174, "lr": 0.00021248267204326124, "tps": 186046, "wall": 5689.6} {"step": 16152, "train_loss": 3.35526442527771, "lr": 0.00021246353080059155, "tps": 185899, "wall": 5694.5} {"step": 16153, "train_loss": 3.3869612216949463, "lr": 0.0002124443896432954, "tps": 185752, "wall": 5699.3} {"step": 16154, "train_loss": 3.3744473457336426, "lr": 0.00021242524857158964, "tps": 185606, "wall": 5704.2} {"step": 16155, "train_loss": 3.366262912750244, "lr": 0.000212406107585691, "tps": 185459, "wall": 5709.1} {"step": 16156, "train_loss": 3.3727645874023438, "lr": 0.0002123869666858164, "tps": 185313, "wall": 5713.9} {"step": 16157, "train_loss": 3.41335391998291, "lr": 0.00021236782587218272, "tps": 185166, "wall": 5718.8} {"step": 16158, "train_loss": 3.338562250137329, "lr": 0.00021234868514500668, "tps": 185019, "wall": 5723.7} {"step": 16159, "train_loss": 3.2428536415100098, "lr": 0.00021232954450450508, "tps": 184873, "wall": 5728.6} {"step": 16160, "train_loss": 3.3968522548675537, "lr": 0.00021231040395089487, "tps": 184728, "wall": 5733.4} {"step": 16161, "train_loss": 3.323822259902954, "lr": 0.00021229126348439286, "tps": 184582, "wall": 5738.3} {"step": 16162, "train_loss": 3.4468815326690674, "lr": 0.00021227212310521578, "tps": 184437, "wall": 5743.2} {"step": 16163, "train_loss": 3.342430591583252, "lr": 0.00021225298281358056, "tps": 184290, "wall": 5748.1} {"step": 16164, "train_loss": 3.3611154556274414, "lr": 0.00021223384260970395, "tps": 184145, "wall": 5753.0} {"step": 16165, "train_loss": 3.345294952392578, "lr": 0.00021221470249380278, "tps": 184001, "wall": 5757.9} {"step": 16166, "train_loss": 3.2747323513031006, "lr": 0.00021219556246609384, "tps": 183857, "wall": 5762.7} {"step": 16167, "train_loss": 3.3123767375946045, "lr": 0.00021217642252679403, "tps": 183713, "wall": 5767.6} {"step": 16168, "train_loss": 3.2647714614868164, "lr": 0.00021215728267612015, "tps": 183570, "wall": 5772.4} {"step": 16169, "train_loss": 3.34059476852417, "lr": 0.00021213814291428897, "tps": 183427, "wall": 5777.3} {"step": 16170, "train_loss": 3.2431163787841797, "lr": 0.00021211900324151733, "tps": 183284, "wall": 5782.2} {"step": 16171, "train_loss": 3.3828728199005127, "lr": 0.00021209986365802207, "tps": 183140, "wall": 5787.1} {"step": 16172, "train_loss": 3.28469181060791, "lr": 0.00021208072416401997, "tps": 182997, "wall": 5791.9} {"step": 16173, "train_loss": 3.4024481773376465, "lr": 0.00021206158475972782, "tps": 182855, "wall": 5796.8} {"step": 16174, "train_loss": 3.4084956645965576, "lr": 0.00021204244544536255, "tps": 182713, "wall": 5801.7} {"step": 16175, "train_loss": 3.3004417419433594, "lr": 0.00021202330622114085, "tps": 182568, "wall": 5806.6} {"step": 16176, "train_loss": 3.348620891571045, "lr": 0.00021200416708727952, "tps": 182428, "wall": 5811.5} {"step": 16177, "train_loss": 3.327716827392578, "lr": 0.00021198502804399544, "tps": 182287, "wall": 5816.3} {"step": 16178, "train_loss": 3.339413642883301, "lr": 0.00021196588909150546, "tps": 182146, "wall": 5821.2} {"step": 16179, "train_loss": 3.295109748840332, "lr": 0.0002119467502300262, "tps": 182005, "wall": 5826.0} {"step": 16180, "train_loss": 3.2555277347564697, "lr": 0.0002119276114597747, "tps": 181864, "wall": 5830.9} {"step": 16181, "train_loss": 3.3759448528289795, "lr": 0.0002119084727809676, "tps": 181724, "wall": 5835.8} {"step": 16182, "train_loss": 3.2733092308044434, "lr": 0.00021188933419382178, "tps": 181584, "wall": 5840.6} {"step": 16183, "train_loss": 3.340559482574463, "lr": 0.00021187019569855403, "tps": 181444, "wall": 5845.5} {"step": 16184, "train_loss": 3.257375478744507, "lr": 0.00021185105729538113, "tps": 181304, "wall": 5850.4} {"step": 16185, "train_loss": 3.2782795429229736, "lr": 0.00021183191898451988, "tps": 181165, "wall": 5855.2} {"step": 16186, "train_loss": 3.4244675636291504, "lr": 0.0002118127807661871, "tps": 181025, "wall": 5860.1} {"step": 16187, "train_loss": 3.3366618156433105, "lr": 0.0002117936426405996, "tps": 180887, "wall": 5865.0} {"step": 16188, "train_loss": 3.2211251258850098, "lr": 0.00021177450460797416, "tps": 180747, "wall": 5869.9} {"step": 16189, "train_loss": 3.475247621536255, "lr": 0.00021175536666852757, "tps": 180608, "wall": 5874.7} {"step": 16190, "train_loss": 3.417328119277954, "lr": 0.00021173622882247664, "tps": 180470, "wall": 5879.6} {"step": 16191, "train_loss": 3.3074464797973633, "lr": 0.0002117170910700381, "tps": 180332, "wall": 5884.5} {"step": 16192, "train_loss": 3.293403148651123, "lr": 0.00021169795341142886, "tps": 180194, "wall": 5889.3} {"step": 16193, "train_loss": 3.3108370304107666, "lr": 0.00021167881584686563, "tps": 180057, "wall": 5894.2} {"step": 16194, "train_loss": 3.3724782466888428, "lr": 0.00021165967837656524, "tps": 179920, "wall": 5899.0} {"step": 16195, "train_loss": 3.3613319396972656, "lr": 0.00021164054100074447, "tps": 179783, "wall": 5903.9} {"step": 16196, "train_loss": 3.3948187828063965, "lr": 0.00021162140371962012, "tps": 179646, "wall": 5908.8} {"step": 16197, "train_loss": 3.4199745655059814, "lr": 0.0002116022665334089, "tps": 179510, "wall": 5913.6} {"step": 16198, "train_loss": 3.29491925239563, "lr": 0.0002115831294423277, "tps": 179373, "wall": 5918.5} {"step": 16199, "train_loss": 3.4658031463623047, "lr": 0.00021156399244659326, "tps": 179237, "wall": 5923.3} {"step": 16200, "train_loss": 3.4162373542785645, "lr": 0.0002115448555464224, "tps": 179099, "wall": 5928.3} {"step": 16201, "train_loss": 3.461440086364746, "lr": 0.00021152571874203183, "tps": 178963, "wall": 5933.1} {"step": 16202, "train_loss": 3.3223068714141846, "lr": 0.00021150658203363838, "tps": 178828, "wall": 5938.0} {"step": 16203, "train_loss": 3.373685836791992, "lr": 0.0002114874454214588, "tps": 178692, "wall": 5942.9} {"step": 16204, "train_loss": 3.411921977996826, "lr": 0.00021146830890570993, "tps": 178557, "wall": 5947.7} {"step": 16205, "train_loss": 3.418057680130005, "lr": 0.00021144917248660855, "tps": 178422, "wall": 5952.6} {"step": 16206, "train_loss": 3.369255304336548, "lr": 0.00021143003616437138, "tps": 178288, "wall": 5957.4} {"step": 16207, "train_loss": 3.3287429809570312, "lr": 0.0002114108999392152, "tps": 178153, "wall": 5962.3} {"step": 16208, "train_loss": 3.4053847789764404, "lr": 0.00021139176381135686, "tps": 178019, "wall": 5967.2} {"step": 16209, "train_loss": 3.3278756141662598, "lr": 0.00021137262778101308, "tps": 177885, "wall": 5972.0} {"step": 16210, "train_loss": 3.290902614593506, "lr": 0.00021135349184840058, "tps": 177751, "wall": 5976.9} {"step": 16211, "train_loss": 3.332948684692383, "lr": 0.00021133435601373627, "tps": 177618, "wall": 5981.8} {"step": 16212, "train_loss": 3.330406665802002, "lr": 0.00021131522027723678, "tps": 177482, "wall": 5986.7} {"step": 16213, "train_loss": 3.365665912628174, "lr": 0.00021129608463911893, "tps": 177349, "wall": 5991.6} {"step": 16214, "train_loss": 3.395028591156006, "lr": 0.00021127694909959957, "tps": 177217, "wall": 5996.4} {"step": 16215, "train_loss": 3.345259189605713, "lr": 0.0002112578136588954, "tps": 177084, "wall": 6001.3} {"step": 16216, "train_loss": 3.3331589698791504, "lr": 0.00021123867831722315, "tps": 176948, "wall": 6006.3} {"step": 16217, "train_loss": 3.385132312774658, "lr": 0.00021121954307479963, "tps": 176816, "wall": 6011.1} {"step": 16218, "train_loss": 3.3993759155273438, "lr": 0.00021120040793184166, "tps": 176683, "wall": 6016.0} {"step": 16219, "train_loss": 3.291395902633667, "lr": 0.00021118127288856587, "tps": 176552, "wall": 6020.8} {"step": 16220, "train_loss": 3.3240222930908203, "lr": 0.00021116213794518908, "tps": 176420, "wall": 6025.7} {"step": 16221, "train_loss": 3.357940435409546, "lr": 0.00021114300310192815, "tps": 176288, "wall": 6030.6} {"step": 16222, "train_loss": 3.3362951278686523, "lr": 0.00021112386835899974, "tps": 176157, "wall": 6035.4} {"step": 16223, "train_loss": 3.4116172790527344, "lr": 0.00021110473371662057, "tps": 176026, "wall": 6040.3} {"step": 16224, "train_loss": 3.3709373474121094, "lr": 0.0002110855991750075, "tps": 175895, "wall": 6045.2} {"step": 16225, "train_loss": 3.392033100128174, "lr": 0.00021106646473437727, "tps": 175763, "wall": 6050.1} {"step": 16226, "train_loss": 3.359884262084961, "lr": 0.0002110473303949466, "tps": 175632, "wall": 6055.0} {"step": 16227, "train_loss": 3.3608927726745605, "lr": 0.0002110281961569322, "tps": 175503, "wall": 6059.8} {"step": 16228, "train_loss": 3.5895981788635254, "lr": 0.00021100906202055098, "tps": 175373, "wall": 6064.7} {"step": 16229, "train_loss": 3.300290822982788, "lr": 0.0002109899279860195, "tps": 175243, "wall": 6069.6} {"step": 16230, "train_loss": 3.3574576377868652, "lr": 0.00021097079405355462, "tps": 175113, "wall": 6074.4} {"step": 16231, "train_loss": 3.2936203479766846, "lr": 0.00021095166022337312, "tps": 174984, "wall": 6079.3} {"step": 16232, "train_loss": 3.340574264526367, "lr": 0.0002109325264956917, "tps": 174855, "wall": 6084.1} {"step": 16233, "train_loss": 3.2289881706237793, "lr": 0.00021091339287072707, "tps": 174726, "wall": 6089.0} {"step": 16234, "train_loss": 3.3427278995513916, "lr": 0.000210894259348696, "tps": 174597, "wall": 6093.9} {"step": 16235, "train_loss": 3.3411264419555664, "lr": 0.0002108751259298153, "tps": 174468, "wall": 6098.8} {"step": 16236, "train_loss": 3.369657039642334, "lr": 0.00021085599261430168, "tps": 174340, "wall": 6103.6} {"step": 16237, "train_loss": 3.393643379211426, "lr": 0.0002108368594023718, "tps": 174210, "wall": 6108.6} {"step": 16238, "train_loss": 3.4301528930664062, "lr": 0.00021081772629424252, "tps": 174082, "wall": 6113.4} {"step": 16239, "train_loss": 3.2633724212646484, "lr": 0.00021079859329013054, "tps": 173954, "wall": 6118.3} {"step": 16240, "train_loss": 3.3379292488098145, "lr": 0.00021077946039025256, "tps": 173826, "wall": 6123.2} {"step": 16241, "train_loss": 3.333785057067871, "lr": 0.00021076032759482537, "tps": 173699, "wall": 6128.0} {"step": 16242, "train_loss": 3.3790907859802246, "lr": 0.00021074119490406573, "tps": 173573, "wall": 6132.9} {"step": 16243, "train_loss": 3.3643412590026855, "lr": 0.0002107220623181903, "tps": 173446, "wall": 6137.7} {"step": 16244, "train_loss": 3.3757572174072266, "lr": 0.0002107029298374158, "tps": 173319, "wall": 6142.6} {"step": 16245, "train_loss": 3.341250419616699, "lr": 0.0002106837974619591, "tps": 173193, "wall": 6147.5} {"step": 16246, "train_loss": 3.501589298248291, "lr": 0.00021066466519203676, "tps": 173067, "wall": 6152.3} {"step": 16247, "train_loss": 3.477320432662964, "lr": 0.00021064553302786566, "tps": 172941, "wall": 6157.2} {"step": 16248, "train_loss": 3.4518933296203613, "lr": 0.00021062640096966247, "tps": 172815, "wall": 6162.0} {"step": 16249, "train_loss": 3.396921157836914, "lr": 0.0002106072690176439, "tps": 172687, "wall": 6167.0} {"step": 16250, "train_loss": 3.3146872520446777, "lr": 0.0002105881371720267, "tps": 172562, "wall": 6171.8} {"step": 16251, "train_loss": 3.422008991241455, "lr": 0.0002105690054330275, "tps": 172436, "wall": 6176.7} {"step": 16252, "train_loss": 3.3987715244293213, "lr": 0.00021054987380086324, "tps": 172311, "wall": 6181.6} {"step": 16253, "train_loss": 3.382418155670166, "lr": 0.0002105307422757505, "tps": 172186, "wall": 6186.5} {"step": 16254, "train_loss": 3.3305418491363525, "lr": 0.00021051161085790598, "tps": 172061, "wall": 6191.3} {"step": 16255, "train_loss": 3.338771343231201, "lr": 0.0002104924795475465, "tps": 171937, "wall": 6196.2} {"step": 16256, "train_loss": 3.294602870941162, "lr": 0.0002104733483448887, "tps": 171812, "wall": 6201.1} {"step": 16257, "train_loss": 3.3377182483673096, "lr": 0.00021045421725014932, "tps": 171688, "wall": 6205.9} {"step": 16258, "train_loss": 3.2862730026245117, "lr": 0.00021043508626354505, "tps": 171564, "wall": 6210.8} {"step": 16259, "train_loss": 3.4363083839416504, "lr": 0.00021041595538529273, "tps": 171441, "wall": 6215.6} {"step": 16260, "train_loss": 3.345883369445801, "lr": 0.0002103968246156089, "tps": 171317, "wall": 6220.5} {"step": 16261, "train_loss": 3.3761792182922363, "lr": 0.00021037769395471035, "tps": 171194, "wall": 6225.4} {"step": 16262, "train_loss": 3.3846919536590576, "lr": 0.00021035856340281388, "tps": 171069, "wall": 6230.3} {"step": 16263, "train_loss": 3.3063130378723145, "lr": 0.00021033943296013612, "tps": 170946, "wall": 6235.1} {"step": 16264, "train_loss": 3.3223419189453125, "lr": 0.0002103203026268937, "tps": 170823, "wall": 6240.0} {"step": 16265, "train_loss": 3.2263095378875732, "lr": 0.00021030117240330352, "tps": 170701, "wall": 6244.9} {"step": 16266, "train_loss": 3.34651517868042, "lr": 0.00021028204228958216, "tps": 170579, "wall": 6249.7} {"step": 16267, "train_loss": 3.3343331813812256, "lr": 0.00021026291228594634, "tps": 170457, "wall": 6254.6} {"step": 16268, "train_loss": 3.2189269065856934, "lr": 0.00021024378239261276, "tps": 170334, "wall": 6259.5} {"step": 16269, "train_loss": 3.265331268310547, "lr": 0.00021022465260979814, "tps": 170213, "wall": 6264.3} {"step": 16270, "train_loss": 3.4530282020568848, "lr": 0.0002102055229377192, "tps": 170091, "wall": 6269.2} {"step": 16271, "train_loss": 3.2857134342193604, "lr": 0.00021018639337659262, "tps": 169970, "wall": 6274.0} {"step": 16272, "train_loss": 3.356301784515381, "lr": 0.00021016726392663509, "tps": 169848, "wall": 6278.9} {"step": 16273, "train_loss": 3.393296480178833, "lr": 0.00021014813458806333, "tps": 169727, "wall": 6283.8} {"step": 16274, "train_loss": 3.3997700214385986, "lr": 0.0002101290053610941, "tps": 169604, "wall": 6288.7} {"step": 16275, "train_loss": 3.37520170211792, "lr": 0.0002101098762459439, "tps": 169484, "wall": 6293.6} {"step": 16276, "train_loss": 3.4099621772766113, "lr": 0.00021009074724282964, "tps": 169363, "wall": 6298.4} {"step": 16277, "train_loss": 3.388240337371826, "lr": 0.00021007161835196792, "tps": 169243, "wall": 6303.3} {"step": 16278, "train_loss": 3.4190165996551514, "lr": 0.00021005248957357546, "tps": 169123, "wall": 6308.2} {"step": 16279, "train_loss": 3.317387819290161, "lr": 0.0002100333609078689, "tps": 169003, "wall": 6313.0} {"step": 16280, "train_loss": 3.43865966796875, "lr": 0.00021001423235506502, "tps": 168884, "wall": 6317.9} {"step": 16281, "train_loss": 3.281275510787964, "lr": 0.0002099951039153804, "tps": 168763, "wall": 6322.8} {"step": 16282, "train_loss": 3.313664436340332, "lr": 0.0002099759755890318, "tps": 168645, "wall": 6327.6} {"step": 16283, "train_loss": 3.3012919425964355, "lr": 0.00020995684737623588, "tps": 168526, "wall": 6332.5} {"step": 16284, "train_loss": 3.3717703819274902, "lr": 0.0002099377192772094, "tps": 168406, "wall": 6337.4} {"step": 16285, "train_loss": 3.29727840423584, "lr": 0.00020991859129216892, "tps": 168287, "wall": 6342.2} {"step": 16286, "train_loss": 3.376394271850586, "lr": 0.0002098994634213312, "tps": 168167, "wall": 6347.2} {"step": 16287, "train_loss": 3.3342976570129395, "lr": 0.00020988033566491293, "tps": 168048, "wall": 6352.0} {"step": 16288, "train_loss": 3.319582462310791, "lr": 0.00020986120802313072, "tps": 167930, "wall": 6356.9} {"step": 16289, "train_loss": 3.382175922393799, "lr": 0.0002098420804962013, "tps": 167812, "wall": 6361.7} {"step": 16290, "train_loss": 3.3992371559143066, "lr": 0.00020982295308434137, "tps": 167694, "wall": 6366.6} {"step": 16291, "train_loss": 3.3375167846679688, "lr": 0.00020980382578776756, "tps": 167577, "wall": 6371.5} {"step": 16292, "train_loss": 3.306488275527954, "lr": 0.00020978469860669655, "tps": 167459, "wall": 6376.3} {"step": 16293, "train_loss": 3.3762118816375732, "lr": 0.00020976557154134504, "tps": 167342, "wall": 6381.2} {"step": 16294, "train_loss": 3.345456838607788, "lr": 0.00020974644459192973, "tps": 167224, "wall": 6386.1} {"step": 16295, "train_loss": 3.3195502758026123, "lr": 0.00020972731775866716, "tps": 167107, "wall": 6390.9} {"step": 16296, "train_loss": 3.3426637649536133, "lr": 0.00020970819104177416, "tps": 166990, "wall": 6395.8} {"step": 16297, "train_loss": 3.3547616004943848, "lr": 0.00020968906444146734, "tps": 166872, "wall": 6400.7} {"step": 16298, "train_loss": 3.331080436706543, "lr": 0.00020966993795796333, "tps": 166756, "wall": 6405.6} {"step": 16299, "train_loss": 3.290449619293213, "lr": 0.00020965081159147876, "tps": 166638, "wall": 6410.5} {"step": 16300, "train_loss": 3.3309082984924316, "lr": 0.00020963168534223042, "tps": 166522, "wall": 6415.4} {"step": 16301, "train_loss": 3.4088962078094482, "lr": 0.00020961255921043496, "tps": 166406, "wall": 6420.2} {"step": 16302, "train_loss": 3.213150978088379, "lr": 0.00020959343319630887, "tps": 166290, "wall": 6425.1} {"step": 16303, "train_loss": 3.3542113304138184, "lr": 0.00020957430730006901, "tps": 166175, "wall": 6430.0} {"step": 16304, "train_loss": 3.4496655464172363, "lr": 0.00020955518152193198, "tps": 166059, "wall": 6434.8} {"step": 16305, "train_loss": 3.317896604537964, "lr": 0.0002095360558621144, "tps": 165944, "wall": 6439.7} {"step": 16306, "train_loss": 3.290081739425659, "lr": 0.0002095169303208329, "tps": 165828, "wall": 6444.6} {"step": 16307, "train_loss": 3.4032909870147705, "lr": 0.00020949780489830423, "tps": 165714, "wall": 6449.4} {"step": 16308, "train_loss": 3.3588309288024902, "lr": 0.00020947867959474498, "tps": 165599, "wall": 6454.3} {"step": 16309, "train_loss": 3.326707601547241, "lr": 0.0002094595544103718, "tps": 165484, "wall": 6459.2} {"step": 16310, "train_loss": 3.3479084968566895, "lr": 0.00020944042934540135, "tps": 165369, "wall": 6464.0} {"step": 16311, "train_loss": 3.270798683166504, "lr": 0.00020942130440005033, "tps": 165254, "wall": 6469.0} {"step": 16312, "train_loss": 3.3871402740478516, "lr": 0.00020940217957453533, "tps": 165140, "wall": 6473.8} {"step": 16313, "train_loss": 3.3075926303863525, "lr": 0.000209383054869073, "tps": 165026, "wall": 6478.7} {"step": 16314, "train_loss": 3.366962194442749, "lr": 0.00020936393028388005, "tps": 164912, "wall": 6483.5} {"step": 16315, "train_loss": 3.4292216300964355, "lr": 0.000209344805819173, "tps": 164799, "wall": 6488.4} {"step": 16316, "train_loss": 3.304459571838379, "lr": 0.0002093256814751686, "tps": 164686, "wall": 6493.3} {"step": 16317, "train_loss": 3.4377870559692383, "lr": 0.00020930655725208346, "tps": 164570, "wall": 6498.2} {"step": 16318, "train_loss": 3.4091405868530273, "lr": 0.00020928743315013423, "tps": 164458, "wall": 6503.1} {"step": 16319, "train_loss": 3.2921221256256104, "lr": 0.0002092683091695375, "tps": 164345, "wall": 6507.9} {"step": 16320, "train_loss": 3.457955837249756, "lr": 0.00020924918531050994, "tps": 164232, "wall": 6512.8} {"step": 16321, "train_loss": 3.364912271499634, "lr": 0.0002092300615732682, "tps": 164119, "wall": 6517.7} {"step": 16322, "train_loss": 3.415491819381714, "lr": 0.00020921093795802894, "tps": 164006, "wall": 6522.6} {"step": 16323, "train_loss": 3.418391704559326, "lr": 0.00020919181446500874, "tps": 163893, "wall": 6527.5} {"step": 16324, "train_loss": 3.311990261077881, "lr": 0.00020917269109442424, "tps": 163781, "wall": 6532.3} {"step": 16325, "train_loss": 3.3759336471557617, "lr": 0.00020915356784649206, "tps": 163669, "wall": 6537.2} {"step": 16326, "train_loss": 3.417555332183838, "lr": 0.0002091344447214289, "tps": 163557, "wall": 6542.1} {"step": 16327, "train_loss": 3.3094913959503174, "lr": 0.0002091153217194513, "tps": 163445, "wall": 6546.9} {"step": 16328, "train_loss": 3.3312132358551025, "lr": 0.000209096198840776, "tps": 163334, "wall": 6551.8} {"step": 16329, "train_loss": 3.509120464324951, "lr": 0.00020907707608561947, "tps": 163223, "wall": 6556.7} {"step": 16330, "train_loss": 3.321579933166504, "lr": 0.00020905795345419842, "tps": 163112, "wall": 6561.5} {"step": 16331, "train_loss": 3.4473257064819336, "lr": 0.0002090388309467295, "tps": 163000, "wall": 6566.4} {"step": 16332, "train_loss": 3.4061217308044434, "lr": 0.00020901970856342924, "tps": 162890, "wall": 6571.3} {"step": 16333, "train_loss": 3.336869716644287, "lr": 0.00020900058630451436, "tps": 162779, "wall": 6576.2} {"step": 16334, "train_loss": 3.290029525756836, "lr": 0.00020898146417020144, "tps": 162669, "wall": 6581.0} {"step": 16335, "train_loss": 3.284816265106201, "lr": 0.00020896234216070706, "tps": 162556, "wall": 6586.0} {"step": 16336, "train_loss": 3.3087360858917236, "lr": 0.00020894322027624785, "tps": 162446, "wall": 6590.8} {"step": 16337, "train_loss": 3.37943696975708, "lr": 0.00020892409851704048, "tps": 162336, "wall": 6595.7} {"step": 16338, "train_loss": 3.3109328746795654, "lr": 0.00020890497688330154, "tps": 162227, "wall": 6600.6} {"step": 16339, "train_loss": 3.3810195922851562, "lr": 0.00020888585537524756, "tps": 162117, "wall": 6605.4} {"step": 16340, "train_loss": 3.2106456756591797, "lr": 0.00020886673399309524, "tps": 162008, "wall": 6610.3} {"step": 16341, "train_loss": 3.348686933517456, "lr": 0.0002088476127370612, "tps": 161899, "wall": 6615.2} {"step": 16342, "train_loss": 3.4451422691345215, "lr": 0.00020882849160736196, "tps": 161790, "wall": 6620.0} {"step": 16343, "train_loss": 3.4799342155456543, "lr": 0.00020880937060421416, "tps": 161680, "wall": 6624.9} {"step": 16344, "train_loss": 3.2845370769500732, "lr": 0.00020879024972783445, "tps": 161572, "wall": 6629.8} {"step": 16345, "train_loss": 3.3255202770233154, "lr": 0.0002087711289784394, "tps": 161463, "wall": 6634.6} {"step": 16346, "train_loss": 3.3424739837646484, "lr": 0.00020875200835624553, "tps": 161355, "wall": 6639.5} {"step": 16347, "train_loss": 3.420409679412842, "lr": 0.00020873288786146956, "tps": 161247, "wall": 6644.4} {"step": 16348, "train_loss": 3.307373046875, "lr": 0.00020871376749432812, "tps": 161137, "wall": 6649.3} {"step": 16349, "train_loss": 3.430945873260498, "lr": 0.00020869464725503764, "tps": 161029, "wall": 6654.1} {"step": 16350, "train_loss": 3.296860694885254, "lr": 0.00020867552714381486, "tps": 160922, "wall": 6659.0} {"step": 16351, "train_loss": 3.430971145629883, "lr": 0.00020865640716087635, "tps": 160814, "wall": 6663.9} {"step": 16352, "train_loss": 3.405729293823242, "lr": 0.0002086372873064386, "tps": 160706, "wall": 6668.7} {"step": 16353, "train_loss": 3.2249341011047363, "lr": 0.0002086181675807183, "tps": 160599, "wall": 6673.6} {"step": 16354, "train_loss": 3.455951690673828, "lr": 0.00020859904798393197, "tps": 160492, "wall": 6678.4} {"step": 16355, "train_loss": 3.3764960765838623, "lr": 0.00020857992851629632, "tps": 160384, "wall": 6683.4} {"step": 16356, "train_loss": 3.3018734455108643, "lr": 0.00020856080917802783, "tps": 160278, "wall": 6688.2} {"step": 16357, "train_loss": 3.321411609649658, "lr": 0.0002085416899693431, "tps": 160171, "wall": 6693.1} {"step": 16358, "train_loss": 3.2894511222839355, "lr": 0.00020852257089045873, "tps": 160064, "wall": 6697.9} {"step": 16359, "train_loss": 3.3619236946105957, "lr": 0.00020850345194159132, "tps": 159958, "wall": 6702.8} {"step": 16360, "train_loss": 3.412588596343994, "lr": 0.00020848433312295738, "tps": 159851, "wall": 6707.7} {"step": 16361, "train_loss": 3.3677380084991455, "lr": 0.00020846521443477364, "tps": 159745, "wall": 6712.6} {"step": 16362, "train_loss": 3.331538438796997, "lr": 0.00020844609587725645, "tps": 159638, "wall": 6717.4} {"step": 16363, "train_loss": 3.3797879219055176, "lr": 0.00020842697745062258, "tps": 159533, "wall": 6722.3} {"step": 16364, "train_loss": 3.2968907356262207, "lr": 0.00020840785915508846, "tps": 159427, "wall": 6727.2} {"step": 16365, "train_loss": 3.331143379211426, "lr": 0.00020838874099087087, "tps": 159322, "wall": 6732.0} {"step": 16366, "train_loss": 3.37247896194458, "lr": 0.00020836962295818615, "tps": 159216, "wall": 6736.9} {"step": 16367, "train_loss": 3.3356499671936035, "lr": 0.000208350505057251, "tps": 159111, "wall": 6741.8} {"step": 16368, "train_loss": 3.4162073135375977, "lr": 0.00020833138728828198, "tps": 159005, "wall": 6746.7} {"step": 16369, "train_loss": 3.3992559909820557, "lr": 0.0002083122696514956, "tps": 158900, "wall": 6751.5} {"step": 16370, "train_loss": 3.269005060195923, "lr": 0.00020829315214710846, "tps": 158796, "wall": 6756.4} {"step": 16371, "train_loss": 3.300257444381714, "lr": 0.00020827403477533717, "tps": 158691, "wall": 6761.3} {"step": 16372, "train_loss": 3.290553092956543, "lr": 0.00020825491753639818, "tps": 158584, "wall": 6766.2} {"step": 16373, "train_loss": 3.351137399673462, "lr": 0.00020823580043050814, "tps": 158480, "wall": 6771.1} {"step": 16374, "train_loss": 3.395622968673706, "lr": 0.00020821668345788363, "tps": 158376, "wall": 6776.0} {"step": 16375, "train_loss": 3.385154962539673, "lr": 0.00020819756661874116, "tps": 158271, "wall": 6780.8} {"step": 16376, "train_loss": 3.303544521331787, "lr": 0.00020817844991329726, "tps": 158168, "wall": 6785.7} {"step": 16377, "train_loss": 3.350048065185547, "lr": 0.00020815933334176855, "tps": 158064, "wall": 6790.6} {"step": 16378, "train_loss": 3.373640775680542, "lr": 0.00020814021690437158, "tps": 157961, "wall": 6795.4} {"step": 16379, "train_loss": 3.3178091049194336, "lr": 0.00020812110060132279, "tps": 157857, "wall": 6800.3} {"step": 16380, "train_loss": 3.377774238586426, "lr": 0.00020810198443283885, "tps": 157754, "wall": 6805.2} {"step": 16381, "train_loss": 3.3935160636901855, "lr": 0.00020808286839913627, "tps": 157651, "wall": 6810.0} {"step": 16382, "train_loss": 3.3184642791748047, "lr": 0.00020806375250043165, "tps": 157548, "wall": 6814.9} {"step": 16383, "train_loss": 3.3485076427459717, "lr": 0.00020804463673694144, "tps": 157445, "wall": 6819.8} {"step": 16384, "train_loss": 3.2909603118896484, "lr": 0.00020802552110888223, "tps": 157342, "wall": 6824.7} {"step": 16385, "train_loss": 3.3696281909942627, "lr": 0.00020800640561647061, "tps": 157238, "wall": 6829.6} {"step": 16386, "train_loss": 3.4023947715759277, "lr": 0.00020798729025992306, "tps": 157134, "wall": 6834.5} {"step": 16387, "train_loss": 3.4650075435638428, "lr": 0.00020796817503945607, "tps": 157032, "wall": 6839.4} {"step": 16388, "train_loss": 3.2953150272369385, "lr": 0.00020794905995528634, "tps": 156930, "wall": 6844.2} {"step": 16389, "train_loss": 3.450150728225708, "lr": 0.00020792994500763023, "tps": 156828, "wall": 6849.1} {"step": 16390, "train_loss": 3.365664005279541, "lr": 0.0002079108301967044, "tps": 156726, "wall": 6854.0} {"step": 16391, "train_loss": 3.3537392616271973, "lr": 0.0002078917155227253, "tps": 156625, "wall": 6858.8} {"step": 16392, "train_loss": 3.355468988418579, "lr": 0.0002078726009859096, "tps": 156523, "wall": 6863.7} {"step": 16393, "train_loss": 3.3083741664886475, "lr": 0.00020785348658647365, "tps": 156422, "wall": 6868.6} {"step": 16394, "train_loss": 3.351566791534424, "lr": 0.00020783437232463404, "tps": 156321, "wall": 6873.4} {"step": 16395, "train_loss": 3.375427722930908, "lr": 0.00020781525820060738, "tps": 156220, "wall": 6878.3} {"step": 16396, "train_loss": 3.403409957885742, "lr": 0.0002077961442146101, "tps": 156119, "wall": 6883.1} {"step": 16397, "train_loss": 3.3593130111694336, "lr": 0.00020777703036685874, "tps": 156017, "wall": 6888.1} {"step": 16398, "train_loss": 3.3166961669921875, "lr": 0.00020775791665756993, "tps": 155916, "wall": 6892.9} {"step": 16399, "train_loss": 3.3241517543792725, "lr": 0.00020773880308696003, "tps": 155815, "wall": 6897.8} {"step": 16400, "train_loss": 3.3657665252685547, "lr": 0.00020771968965524563, "tps": 155715, "wall": 6902.7} {"step": 16401, "train_loss": 3.3844287395477295, "lr": 0.00020770057636264322, "tps": 155613, "wall": 6907.6} {"step": 16402, "train_loss": 3.322539806365967, "lr": 0.0002076814632093694, "tps": 155513, "wall": 6912.5} {"step": 16403, "train_loss": 3.391857147216797, "lr": 0.00020766235019564064, "tps": 155413, "wall": 6917.4} {"step": 16404, "train_loss": 3.307760238647461, "lr": 0.0002076432373216734, "tps": 155314, "wall": 6922.2} {"step": 16405, "train_loss": 3.3166186809539795, "lr": 0.0002076241245876843, "tps": 155214, "wall": 6927.1} {"step": 16406, "train_loss": 3.271026611328125, "lr": 0.00020760501199388972, "tps": 155115, "wall": 6931.9} {"step": 16407, "train_loss": 3.2789649963378906, "lr": 0.00020758589954050628, "tps": 155016, "wall": 6936.8} {"step": 16408, "train_loss": 3.445013999938965, "lr": 0.0002075667872277504, "tps": 154917, "wall": 6941.6} {"step": 16409, "train_loss": 3.366084098815918, "lr": 0.00020754767505583869, "tps": 154816, "wall": 6946.6} {"step": 16410, "train_loss": 3.341919422149658, "lr": 0.0002075285630249875, "tps": 154717, "wall": 6951.4} {"step": 16411, "train_loss": 3.4599640369415283, "lr": 0.00020750945113541346, "tps": 154619, "wall": 6956.3} {"step": 16412, "train_loss": 3.413025379180908, "lr": 0.00020749033938733308, "tps": 154521, "wall": 6961.1} {"step": 16413, "train_loss": 3.2573461532592773, "lr": 0.00020747122778096277, "tps": 154422, "wall": 6966.0} {"step": 16414, "train_loss": 3.407025098800659, "lr": 0.00020745211631651906, "tps": 154324, "wall": 6970.9} {"step": 16415, "train_loss": 3.3318848609924316, "lr": 0.00020743300499421853, "tps": 154226, "wall": 6975.7} {"step": 16416, "train_loss": 3.350008487701416, "lr": 0.00020741389381427752, "tps": 154127, "wall": 6980.6} {"step": 16417, "train_loss": 3.3349742889404297, "lr": 0.0002073947827769126, "tps": 154029, "wall": 6985.5} {"step": 16418, "train_loss": 3.4450488090515137, "lr": 0.0002073756718823403, "tps": 153932, "wall": 6990.3} {"step": 16419, "train_loss": 3.2684292793273926, "lr": 0.00020735656113077705, "tps": 153834, "wall": 6995.2} {"step": 16420, "train_loss": 3.3014378547668457, "lr": 0.00020733745052243938, "tps": 153736, "wall": 7000.1} {"step": 16421, "train_loss": 3.3498196601867676, "lr": 0.0002073183400575437, "tps": 153639, "wall": 7004.9} {"step": 16422, "train_loss": 3.330706834793091, "lr": 0.00020729922973630665, "tps": 153541, "wall": 7009.8} {"step": 16423, "train_loss": 3.2817740440368652, "lr": 0.00020728011955894454, "tps": 153443, "wall": 7014.7} {"step": 16424, "train_loss": 3.297325611114502, "lr": 0.00020726100952567396, "tps": 153346, "wall": 7019.6} {"step": 16425, "train_loss": 3.3320350646972656, "lr": 0.00020724189963671134, "tps": 153249, "wall": 7024.4} {"step": 16426, "train_loss": 3.3418617248535156, "lr": 0.00020722278989227313, "tps": 153153, "wall": 7029.3} {"step": 16427, "train_loss": 3.2771592140197754, "lr": 0.00020720368029257587, "tps": 153057, "wall": 7034.1} {"step": 16428, "train_loss": 3.407163619995117, "lr": 0.00020718457083783603, "tps": 152960, "wall": 7039.0} {"step": 16429, "train_loss": 3.32057523727417, "lr": 0.0002071654615282701, "tps": 152864, "wall": 7043.9} {"step": 16430, "train_loss": 3.422961711883545, "lr": 0.00020714635236409446, "tps": 152768, "wall": 7048.7} {"step": 16431, "train_loss": 3.343040943145752, "lr": 0.00020712724334552563, "tps": 152672, "wall": 7053.6} {"step": 16432, "train_loss": 3.406623363494873, "lr": 0.0002071081344727801, "tps": 152576, "wall": 7058.4} {"step": 16433, "train_loss": 3.34617018699646, "lr": 0.00020708902574607434, "tps": 152481, "wall": 7063.3} {"step": 16434, "train_loss": 3.3670363426208496, "lr": 0.00020706991716562483, "tps": 152384, "wall": 7068.2} {"step": 16435, "train_loss": 3.358792781829834, "lr": 0.00020705080873164797, "tps": 152288, "wall": 7073.1} {"step": 16436, "train_loss": 3.349404811859131, "lr": 0.00020703170044436016, "tps": 152192, "wall": 7078.0} {"step": 16437, "train_loss": 3.318655252456665, "lr": 0.00020701259230397807, "tps": 152097, "wall": 7082.8} {"step": 16438, "train_loss": 3.3203535079956055, "lr": 0.00020699348431071796, "tps": 152002, "wall": 7087.7} {"step": 16439, "train_loss": 3.2565460205078125, "lr": 0.00020697437646479642, "tps": 151907, "wall": 7092.6} {"step": 16440, "train_loss": 3.306156635284424, "lr": 0.00020695526876642983, "tps": 151812, "wall": 7097.4} {"step": 16441, "train_loss": 3.149531364440918, "lr": 0.0002069361612158346, "tps": 151715, "wall": 7102.4} {"step": 16442, "train_loss": 3.339505434036255, "lr": 0.00020691705381322727, "tps": 151613, "wall": 7107.6} {"step": 16443, "train_loss": 3.344731569290161, "lr": 0.00020689794655882432, "tps": 151519, "wall": 7112.5} {"step": 16444, "train_loss": 3.2280192375183105, "lr": 0.0002068788394528421, "tps": 151425, "wall": 7117.3} {"step": 16445, "train_loss": 3.3649258613586426, "lr": 0.0002068597324954971, "tps": 151330, "wall": 7122.2} {"step": 16446, "train_loss": 3.347980260848999, "lr": 0.00020684062568700572, "tps": 151234, "wall": 7127.1} {"step": 16447, "train_loss": 3.3717808723449707, "lr": 0.00020682151902758452, "tps": 151140, "wall": 7132.0} {"step": 16448, "train_loss": 3.3559317588806152, "lr": 0.00020680241251744982, "tps": 151046, "wall": 7136.9} {"step": 16449, "train_loss": 3.172811985015869, "lr": 0.00020678330615681812, "tps": 150952, "wall": 7141.7} {"step": 16450, "train_loss": 3.2716779708862305, "lr": 0.00020676419994590582, "tps": 150859, "wall": 7146.6} {"step": 16451, "train_loss": 3.3486173152923584, "lr": 0.00020674509388492939, "tps": 150765, "wall": 7151.5} {"step": 16452, "train_loss": 3.3057806491851807, "lr": 0.00020672598797410525, "tps": 150672, "wall": 7156.3} {"step": 16453, "train_loss": 3.325942039489746, "lr": 0.00020670688221364984, "tps": 150579, "wall": 7161.2} {"step": 16454, "train_loss": 3.128721237182617, "lr": 0.00020668777660377962, "tps": 150485, "wall": 7166.1} {"step": 16455, "train_loss": 3.395545721054077, "lr": 0.00020666867114471095, "tps": 150393, "wall": 7170.9} {"step": 16456, "train_loss": 3.2557406425476074, "lr": 0.0002066495658366603, "tps": 150300, "wall": 7175.8} {"step": 16457, "train_loss": 3.311941385269165, "lr": 0.00020663046067984412, "tps": 150207, "wall": 7180.7} {"step": 16458, "train_loss": 3.423717498779297, "lr": 0.0002066113556744788, "tps": 150115, "wall": 7185.5} {"step": 16459, "train_loss": 3.4196574687957764, "lr": 0.00020659225082078072, "tps": 150021, "wall": 7190.4} {"step": 16460, "train_loss": 3.398892402648926, "lr": 0.00020657314611896633, "tps": 149929, "wall": 7195.3} {"step": 16461, "train_loss": 3.323349952697754, "lr": 0.00020655404156925212, "tps": 149836, "wall": 7200.2} {"step": 16462, "train_loss": 3.444685459136963, "lr": 0.00020653493717185444, "tps": 149744, "wall": 7205.1} {"step": 16463, "train_loss": 3.282323122024536, "lr": 0.0002065158329269897, "tps": 149653, "wall": 7209.9} {"step": 16464, "train_loss": 3.282972574234009, "lr": 0.00020649672883487442, "tps": 149561, "wall": 7214.8} {"step": 16465, "train_loss": 3.3555073738098145, "lr": 0.00020647762489572484, "tps": 149469, "wall": 7219.6} {"step": 16466, "train_loss": 3.400256633758545, "lr": 0.00020645852110975747, "tps": 149377, "wall": 7224.5} {"step": 16467, "train_loss": 3.3409929275512695, "lr": 0.00020643941747718874, "tps": 149286, "wall": 7229.3} {"step": 16468, "train_loss": 3.4411699771881104, "lr": 0.00020642031399823498, "tps": 149195, "wall": 7234.2} {"step": 16469, "train_loss": 3.364136219024658, "lr": 0.00020640121067311265, "tps": 149104, "wall": 7239.1} {"step": 16470, "train_loss": 3.2950031757354736, "lr": 0.00020638210750203816, "tps": 149013, "wall": 7243.9} {"step": 16471, "train_loss": 3.285243511199951, "lr": 0.00020636300448522788, "tps": 148920, "wall": 7248.9} {"step": 16472, "train_loss": 3.3451316356658936, "lr": 0.00020634390162289825, "tps": 148830, "wall": 7253.7} {"step": 16473, "train_loss": 3.249950408935547, "lr": 0.0002063247989152656, "tps": 148739, "wall": 7258.6} {"step": 16474, "train_loss": 3.4258995056152344, "lr": 0.0002063056963625464, "tps": 148648, "wall": 7263.5} {"step": 16475, "train_loss": 3.435439109802246, "lr": 0.00020628659396495697, "tps": 148558, "wall": 7268.3} {"step": 16476, "train_loss": 3.298733711242676, "lr": 0.00020626749172271378, "tps": 148468, "wall": 7273.2} {"step": 16477, "train_loss": 3.293165683746338, "lr": 0.00020624838963603318, "tps": 148378, "wall": 7278.0} {"step": 16478, "train_loss": 3.421041250228882, "lr": 0.00020622928770513155, "tps": 148288, "wall": 7282.9} {"step": 16479, "train_loss": 3.3868696689605713, "lr": 0.0002062101859302253, "tps": 148198, "wall": 7287.8} {"step": 16480, "train_loss": 3.2993245124816895, "lr": 0.0002061910843115308, "tps": 148108, "wall": 7292.6} {"step": 16481, "train_loss": 3.3174281120300293, "lr": 0.00020617198284926454, "tps": 148018, "wall": 7297.5} {"step": 16482, "train_loss": 3.2999939918518066, "lr": 0.0002061528815436427, "tps": 147928, "wall": 7302.4} {"step": 16483, "train_loss": 3.2552502155303955, "lr": 0.00020613378039488177, "tps": 147837, "wall": 7307.3} {"step": 16484, "train_loss": 3.2595643997192383, "lr": 0.00020611467940319814, "tps": 147748, "wall": 7312.2} {"step": 16485, "train_loss": 3.33494234085083, "lr": 0.0002060955785688082, "tps": 147659, "wall": 7317.0} {"step": 16486, "train_loss": 3.3126590251922607, "lr": 0.00020607647789192828, "tps": 147570, "wall": 7321.9} {"step": 16487, "train_loss": 3.2337377071380615, "lr": 0.00020605737737277476, "tps": 147481, "wall": 7326.7} {"step": 16488, "train_loss": 3.2492220401763916, "lr": 0.00020603827701156405, "tps": 147392, "wall": 7331.6} {"step": 16489, "train_loss": 3.3583972454071045, "lr": 0.00020601917680851246, "tps": 147303, "wall": 7336.5} {"step": 16490, "train_loss": 3.379161834716797, "lr": 0.0002060000767638364, "tps": 147215, "wall": 7341.3} {"step": 16491, "train_loss": 3.3787500858306885, "lr": 0.0002059809768777523, "tps": 147125, "wall": 7346.2} {"step": 16492, "train_loss": 3.2303524017333984, "lr": 0.00020596187715047636, "tps": 147037, "wall": 7351.1} {"step": 16493, "train_loss": 3.3839008808135986, "lr": 0.0002059427775822251, "tps": 146948, "wall": 7356.0} {"step": 16494, "train_loss": 3.2370986938476562, "lr": 0.0002059236781732148, "tps": 146860, "wall": 7360.8} {"step": 16495, "train_loss": 3.3863677978515625, "lr": 0.00020590457892366178, "tps": 146773, "wall": 7365.7} {"step": 16496, "train_loss": 3.248382091522217, "lr": 0.00020588547983378251, "tps": 146683, "wall": 7370.6} {"step": 16497, "train_loss": 3.29180645942688, "lr": 0.00020586638090379323, "tps": 146595, "wall": 7375.5} {"step": 16498, "train_loss": 3.3609848022460938, "lr": 0.00020584728213391041, "tps": 146508, "wall": 7380.3} {"step": 16499, "train_loss": 3.3616678714752197, "lr": 0.00020582818352435033, "tps": 146420, "wall": 7385.2} {"step": 16500, "train_loss": 3.1825878620147705, "lr": 0.00020580908507532932, "tps": 146333, "wall": 7390.0} {"step": 16501, "train_loss": 3.3154711723327637, "lr": 0.0002057899867870638, "tps": 146241, "wall": 7395.1} {"step": 16502, "train_loss": 3.298302173614502, "lr": 0.0002057708886597701, "tps": 146154, "wall": 7400.0} {"step": 16503, "train_loss": 3.3852286338806152, "lr": 0.0002057517906936645, "tps": 146066, "wall": 7404.9} {"step": 16504, "train_loss": 3.30830717086792, "lr": 0.00020573269288896338, "tps": 145979, "wall": 7409.7} {"step": 16505, "train_loss": 3.2367160320281982, "lr": 0.00020571359524588313, "tps": 145892, "wall": 7414.6} {"step": 16506, "train_loss": 3.2157952785491943, "lr": 0.00020569449776464, "tps": 145805, "wall": 7419.5} {"step": 16507, "train_loss": 3.318629503250122, "lr": 0.00020567540044545037, "tps": 145718, "wall": 7424.4} {"step": 16508, "train_loss": 3.3447020053863525, "lr": 0.00020565630328853063, "tps": 145630, "wall": 7429.3} {"step": 16509, "train_loss": 3.405878782272339, "lr": 0.00020563720629409704, "tps": 145544, "wall": 7434.2} {"step": 16510, "train_loss": 3.2911133766174316, "lr": 0.00020561810946236592, "tps": 145457, "wall": 7439.0} {"step": 16511, "train_loss": 3.344360589981079, "lr": 0.0002055990127935537, "tps": 145370, "wall": 7443.9} {"step": 16512, "train_loss": 3.4029312133789062, "lr": 0.0002055799162878766, "tps": 145285, "wall": 7448.8} {"step": 16513, "train_loss": 3.452857732772827, "lr": 0.000205560819945551, "tps": 145199, "wall": 7453.6} {"step": 16514, "train_loss": 3.3469204902648926, "lr": 0.0002055417237667932, "tps": 145112, "wall": 7458.5} {"step": 16515, "train_loss": 3.404132604598999, "lr": 0.00020552262775181955, "tps": 145026, "wall": 7463.4} {"step": 16516, "train_loss": 3.3257813453674316, "lr": 0.00020550353190084634, "tps": 144941, "wall": 7468.3} {"step": 16517, "train_loss": 3.3529632091522217, "lr": 0.0002054844362140899, "tps": 144855, "wall": 7473.1} {"step": 16518, "train_loss": 3.426370620727539, "lr": 0.0002054653406917666, "tps": 144768, "wall": 7478.1} {"step": 16519, "train_loss": 3.2240681648254395, "lr": 0.0002054462453340926, "tps": 144683, "wall": 7482.9} {"step": 16520, "train_loss": 3.367464542388916, "lr": 0.0002054271501412844, "tps": 144596, "wall": 7487.9} {"step": 16521, "train_loss": 3.4130282402038574, "lr": 0.00020540805511355824, "tps": 144511, "wall": 7492.7} {"step": 16522, "train_loss": 3.2901363372802734, "lr": 0.00020538896025113043, "tps": 144425, "wall": 7497.6} {"step": 16523, "train_loss": 3.3594119548797607, "lr": 0.00020536986555421725, "tps": 144341, "wall": 7502.5} {"step": 16524, "train_loss": 3.3727922439575195, "lr": 0.000205350771023035, "tps": 144256, "wall": 7507.3} {"step": 16525, "train_loss": 3.240346908569336, "lr": 0.00020533167665780005, "tps": 144171, "wall": 7512.2} {"step": 16526, "train_loss": 3.199289321899414, "lr": 0.00020531258245872863, "tps": 144087, "wall": 7517.1} {"step": 16527, "train_loss": 3.270159959793091, "lr": 0.00020529348842603703, "tps": 144002, "wall": 7521.9} {"step": 16528, "train_loss": 3.3417720794677734, "lr": 0.00020527439455994166, "tps": 143918, "wall": 7526.8} {"step": 16529, "train_loss": 3.4424941539764404, "lr": 0.0002052553008606587, "tps": 143833, "wall": 7531.7} {"step": 16530, "train_loss": 3.3806581497192383, "lr": 0.00020523620732840452, "tps": 143749, "wall": 7536.6} {"step": 16531, "train_loss": 3.3594536781311035, "lr": 0.00020521711396339539, "tps": 143665, "wall": 7541.4} {"step": 16532, "train_loss": 3.3326594829559326, "lr": 0.0002051980207658476, "tps": 143579, "wall": 7546.4} {"step": 16533, "train_loss": 3.344907760620117, "lr": 0.00020517892773597738, "tps": 143496, "wall": 7551.2} {"step": 16534, "train_loss": 3.2940852642059326, "lr": 0.00020515983487400105, "tps": 143412, "wall": 7556.1} {"step": 16535, "train_loss": 3.385310649871826, "lr": 0.000205140742180135, "tps": 143329, "wall": 7560.9} {"step": 16536, "train_loss": 3.270113468170166, "lr": 0.0002051216496545954, "tps": 143245, "wall": 7565.8} {"step": 16537, "train_loss": 3.339261531829834, "lr": 0.0002051025572975985, "tps": 143162, "wall": 7570.7} {"step": 16538, "train_loss": 3.339369535446167, "lr": 0.00020508346510936072, "tps": 143078, "wall": 7575.5} {"step": 16539, "train_loss": 3.322507858276367, "lr": 0.0002050643730900982, "tps": 142995, "wall": 7580.4} {"step": 16540, "train_loss": 3.2740726470947266, "lr": 0.00020504528124002728, "tps": 142912, "wall": 7585.3} {"step": 16541, "train_loss": 3.322843551635742, "lr": 0.0002050261895593642, "tps": 142829, "wall": 7590.1} {"step": 16542, "train_loss": 3.4074325561523438, "lr": 0.00020500709804832526, "tps": 142746, "wall": 7595.0} {"step": 16543, "train_loss": 3.346628427505493, "lr": 0.00020498800670712677, "tps": 142663, "wall": 7599.9} {"step": 16544, "train_loss": 3.319366455078125, "lr": 0.00020496891553598495, "tps": 142580, "wall": 7604.8} {"step": 16545, "train_loss": 3.3400814533233643, "lr": 0.00020494982453511603, "tps": 142495, "wall": 7609.8} {"step": 16546, "train_loss": 3.293443441390991, "lr": 0.00020493073370473632, "tps": 142413, "wall": 7614.6} {"step": 16547, "train_loss": 3.3972508907318115, "lr": 0.00020491164304506208, "tps": 142330, "wall": 7619.5} {"step": 16548, "train_loss": 3.317251682281494, "lr": 0.0002048925525563096, "tps": 142248, "wall": 7624.4} {"step": 16549, "train_loss": 3.4126651287078857, "lr": 0.00020487346223869505, "tps": 142166, "wall": 7629.2} {"step": 16550, "train_loss": 3.3823137283325195, "lr": 0.00020485437209243475, "tps": 142084, "wall": 7634.1} {"step": 16551, "train_loss": 3.377253770828247, "lr": 0.0002048352821177449, "tps": 142002, "wall": 7639.0} {"step": 16552, "train_loss": 3.351367950439453, "lr": 0.0002048161923148419, "tps": 141920, "wall": 7643.8} {"step": 16553, "train_loss": 3.3863418102264404, "lr": 0.00020479710268394178, "tps": 141838, "wall": 7648.7} {"step": 16554, "train_loss": 3.350541114807129, "lr": 0.00020477801322526097, "tps": 141757, "wall": 7653.6} {"step": 16555, "train_loss": 3.373408794403076, "lr": 0.00020475892393901566, "tps": 141675, "wall": 7658.4} {"step": 16556, "train_loss": 3.411916732788086, "lr": 0.00020473983482542204, "tps": 141594, "wall": 7663.3} {"step": 16557, "train_loss": 3.306891441345215, "lr": 0.00020472074588469643, "tps": 141512, "wall": 7668.2} {"step": 16558, "train_loss": 3.3323252201080322, "lr": 0.00020470165711705506, "tps": 141430, "wall": 7673.1} {"step": 16559, "train_loss": 3.4078056812286377, "lr": 0.0002046825685227141, "tps": 141349, "wall": 7677.9} {"step": 16560, "train_loss": 3.291538715362549, "lr": 0.00020466348010188986, "tps": 141268, "wall": 7682.8} {"step": 16561, "train_loss": 3.2588300704956055, "lr": 0.0002046443918547985, "tps": 141187, "wall": 7687.7} {"step": 16562, "train_loss": 3.321655750274658, "lr": 0.00020462530378165635, "tps": 141107, "wall": 7692.5} {"step": 16563, "train_loss": 3.261474609375, "lr": 0.0002046062158826796, "tps": 141026, "wall": 7697.4} {"step": 16564, "train_loss": 3.387031078338623, "lr": 0.0002045871281580844, "tps": 140945, "wall": 7702.3} {"step": 16565, "train_loss": 3.3562674522399902, "lr": 0.00020456804060808712, "tps": 140864, "wall": 7707.2} {"step": 16566, "train_loss": 3.2581491470336914, "lr": 0.00020454895323290386, "tps": 140784, "wall": 7712.1} {"step": 16567, "train_loss": 3.366989850997925, "lr": 0.00020452986603275092, "tps": 140704, "wall": 7716.9} {"step": 16568, "train_loss": 3.368321180343628, "lr": 0.00020451077900784448, "tps": 140623, "wall": 7721.8} {"step": 16569, "train_loss": 3.3666739463806152, "lr": 0.0002044916921584008, "tps": 140542, "wall": 7726.7} {"step": 16570, "train_loss": 3.2866134643554688, "lr": 0.00020447260548463604, "tps": 140462, "wall": 7731.6} {"step": 16571, "train_loss": 3.3605737686157227, "lr": 0.0002044535189867664, "tps": 140382, "wall": 7736.4} {"step": 16572, "train_loss": 3.3687386512756348, "lr": 0.0002044344326650083, "tps": 140302, "wall": 7741.3} {"step": 16573, "train_loss": 3.3714208602905273, "lr": 0.00020441534651957763, "tps": 140223, "wall": 7746.2} {"step": 16574, "train_loss": 3.3518176078796387, "lr": 0.00020439626055069078, "tps": 140143, "wall": 7751.0} {"step": 16575, "train_loss": 3.4197793006896973, "lr": 0.000204377174758564, "tps": 140064, "wall": 7755.9} {"step": 16576, "train_loss": 3.401665687561035, "lr": 0.0002043580891434134, "tps": 139984, "wall": 7760.8} {"step": 16577, "train_loss": 3.4002022743225098, "lr": 0.00020433900370545516, "tps": 139905, "wall": 7765.7} {"step": 16578, "train_loss": 3.3616936206817627, "lr": 0.0002043199184449056, "tps": 139826, "wall": 7770.5} {"step": 16579, "train_loss": 3.3194875717163086, "lr": 0.00020430083336198088, "tps": 139747, "wall": 7775.4} {"step": 16580, "train_loss": 3.3692777156829834, "lr": 0.00020428174845689708, "tps": 139667, "wall": 7780.3} {"step": 16581, "train_loss": 3.341993808746338, "lr": 0.00020426266372987052, "tps": 139588, "wall": 7785.1} {"step": 16582, "train_loss": 3.3207335472106934, "lr": 0.00020424357918111738, "tps": 139509, "wall": 7790.0} {"step": 16583, "train_loss": 3.3513236045837402, "lr": 0.00020422449481085378, "tps": 139430, "wall": 7794.9} {"step": 16584, "train_loss": 3.396989345550537, "lr": 0.000204205410619296, "tps": 139352, "wall": 7799.8} {"step": 16585, "train_loss": 3.376521110534668, "lr": 0.0002041863266066602, "tps": 139273, "wall": 7804.6} {"step": 16586, "train_loss": 3.339028835296631, "lr": 0.0002041672427731625, "tps": 139194, "wall": 7809.6} {"step": 16587, "train_loss": 3.462028980255127, "lr": 0.00020414815911901912, "tps": 139116, "wall": 7814.4} {"step": 16588, "train_loss": 3.343761920928955, "lr": 0.00020412907564444627, "tps": 139037, "wall": 7819.3} {"step": 16589, "train_loss": 3.2952494621276855, "lr": 0.00020410999234966016, "tps": 138959, "wall": 7824.1} {"step": 16590, "train_loss": 3.3964431285858154, "lr": 0.00020409090923487685, "tps": 138881, "wall": 7829.0} {"step": 16591, "train_loss": 3.4701333045959473, "lr": 0.0002040718263003126, "tps": 138804, "wall": 7833.9} {"step": 16592, "train_loss": 3.3204805850982666, "lr": 0.0002040527435461836, "tps": 138726, "wall": 7838.7} {"step": 16593, "train_loss": 3.3614001274108887, "lr": 0.00020403366097270596, "tps": 138648, "wall": 7843.6} {"step": 16594, "train_loss": 3.3430328369140625, "lr": 0.0002040145785800958, "tps": 138569, "wall": 7848.5} {"step": 16595, "train_loss": 3.343130111694336, "lr": 0.00020399549636856943, "tps": 138492, "wall": 7853.4} {"step": 16596, "train_loss": 3.2605457305908203, "lr": 0.00020397641433834296, "tps": 138414, "wall": 7858.3} {"step": 16597, "train_loss": 3.3269665241241455, "lr": 0.00020395733248963248, "tps": 138337, "wall": 7863.1} {"step": 16598, "train_loss": 3.38447642326355, "lr": 0.00020393825082265426, "tps": 138260, "wall": 7868.0} {"step": 16599, "train_loss": 3.399064064025879, "lr": 0.00020391916933762438, "tps": 138182, "wall": 7872.9} {"step": 16600, "train_loss": 3.4363136291503906, "lr": 0.00020390008803475903, "tps": 138105, "wall": 7877.8} {"step": 16601, "train_loss": 3.3265700340270996, "lr": 0.00020388100691427435, "tps": 138028, "wall": 7882.6} {"step": 16602, "train_loss": 3.3727564811706543, "lr": 0.00020386192597638653, "tps": 137951, "wall": 7887.5} {"step": 16603, "train_loss": 3.2957231998443604, "lr": 0.00020384284522131165, "tps": 137874, "wall": 7892.4} {"step": 16604, "train_loss": 3.4824600219726562, "lr": 0.00020382376464926592, "tps": 137797, "wall": 7897.3} {"step": 16605, "train_loss": 3.3122878074645996, "lr": 0.00020380468426046543, "tps": 137721, "wall": 7902.1} {"step": 16606, "train_loss": 3.3164420127868652, "lr": 0.0002037856040551263, "tps": 137643, "wall": 7907.1} {"step": 16607, "train_loss": 3.323558807373047, "lr": 0.0002037665240334648, "tps": 137567, "wall": 7911.9} {"step": 16608, "train_loss": 3.386918783187866, "lr": 0.000203747444195697, "tps": 137490, "wall": 7916.8} {"step": 16609, "train_loss": 3.279547929763794, "lr": 0.00020372836454203897, "tps": 137414, "wall": 7921.7} {"step": 16610, "train_loss": 3.4060709476470947, "lr": 0.00020370928507270692, "tps": 137338, "wall": 7926.5} {"step": 16611, "train_loss": 3.2753701210021973, "lr": 0.000203690205787917, "tps": 137262, "wall": 7931.4} {"step": 16612, "train_loss": 3.330801010131836, "lr": 0.00020367112668788528, "tps": 137186, "wall": 7936.2} {"step": 16613, "train_loss": 3.3765125274658203, "lr": 0.00020365204777282792, "tps": 137111, "wall": 7941.1} {"step": 16614, "train_loss": 3.322558879852295, "lr": 0.0002036329690429611, "tps": 137034, "wall": 7946.0} {"step": 16615, "train_loss": 3.2894091606140137, "lr": 0.00020361389049850087, "tps": 136959, "wall": 7950.9} {"step": 16616, "train_loss": 3.23874568939209, "lr": 0.0002035948121396633, "tps": 136883, "wall": 7955.7} {"step": 16617, "train_loss": 3.281388759613037, "lr": 0.0002035757339666647, "tps": 136808, "wall": 7960.6} {"step": 16618, "train_loss": 3.3778505325317383, "lr": 0.000203556655979721, "tps": 136733, "wall": 7965.4} {"step": 16619, "train_loss": 3.3438920974731445, "lr": 0.00020353757817904842, "tps": 136657, "wall": 7970.4} {"step": 16620, "train_loss": 3.4275288581848145, "lr": 0.00020351850056486302, "tps": 136582, "wall": 7975.2} {"step": 16621, "train_loss": 3.3362722396850586, "lr": 0.00020349942313738098, "tps": 136506, "wall": 7980.1} {"step": 16622, "train_loss": 3.2989492416381836, "lr": 0.00020348034589681832, "tps": 136430, "wall": 7985.0} {"step": 16623, "train_loss": 3.293358087539673, "lr": 0.00020346126884339123, "tps": 136355, "wall": 7989.9} {"step": 16624, "train_loss": 3.2941131591796875, "lr": 0.00020344219197731577, "tps": 136280, "wall": 7994.8} {"step": 16625, "train_loss": 3.2304279804229736, "lr": 0.00020342311529880807, "tps": 136206, "wall": 7999.6} {"step": 16626, "train_loss": 3.3506879806518555, "lr": 0.00020340403880808418, "tps": 136132, "wall": 8004.5} {"step": 16627, "train_loss": 3.468048572540283, "lr": 0.00020338496250536027, "tps": 136057, "wall": 8009.4} {"step": 16628, "train_loss": 3.341158390045166, "lr": 0.0002033658863908524, "tps": 135983, "wall": 8014.2} {"step": 16629, "train_loss": 3.3552238941192627, "lr": 0.00020334681046477662, "tps": 135908, "wall": 8019.1} {"step": 16630, "train_loss": 3.288747787475586, "lr": 0.00020332773472734914, "tps": 135834, "wall": 8023.9} {"step": 16631, "train_loss": 3.409414291381836, "lr": 0.00020330865917878596, "tps": 135759, "wall": 8028.9} {"step": 16632, "train_loss": 3.3932442665100098, "lr": 0.00020328958381930318, "tps": 135685, "wall": 8033.7} {"step": 16633, "train_loss": 3.376488447189331, "lr": 0.0002032705086491169, "tps": 135611, "wall": 8038.6} {"step": 16634, "train_loss": 3.313723564147949, "lr": 0.00020325143366844325, "tps": 135537, "wall": 8043.5} {"step": 16635, "train_loss": 3.3559470176696777, "lr": 0.00020323235887749822, "tps": 135463, "wall": 8048.3} {"step": 16636, "train_loss": 3.157188653945923, "lr": 0.0002032132842764979, "tps": 135390, "wall": 8053.2} {"step": 16637, "train_loss": 3.40449595451355, "lr": 0.00020319420986565848, "tps": 135316, "wall": 8058.1} {"step": 16638, "train_loss": 3.2809696197509766, "lr": 0.00020317513564519591, "tps": 135242, "wall": 8062.9} {"step": 16639, "train_loss": 3.3661818504333496, "lr": 0.0002031560616153263, "tps": 135169, "wall": 8067.8} {"step": 16640, "train_loss": 3.3525876998901367, "lr": 0.00020313698777626576, "tps": 135096, "wall": 8072.7} {"step": 16641, "train_loss": 3.3382186889648438, "lr": 0.00020311791412823036, "tps": 135022, "wall": 8077.5} {"step": 16642, "train_loss": 3.3607258796691895, "lr": 0.0002030988406714361, "tps": 134949, "wall": 8082.4} {"step": 16643, "train_loss": 3.3290047645568848, "lr": 0.0002030797674060991, "tps": 134875, "wall": 8087.3} {"step": 16644, "train_loss": 3.370619773864746, "lr": 0.00020306069433243543, "tps": 134802, "wall": 8092.2} {"step": 16645, "train_loss": 3.395573616027832, "lr": 0.0002030416214506611, "tps": 134729, "wall": 8097.1} {"step": 16646, "train_loss": 3.3506505489349365, "lr": 0.00020302254876099224, "tps": 134656, "wall": 8101.9} {"step": 16647, "train_loss": 3.2847492694854736, "lr": 0.0002030034762636448, "tps": 134583, "wall": 8106.8} {"step": 16648, "train_loss": 3.379483222961426, "lr": 0.000202984403958835, "tps": 134511, "wall": 8111.7} {"step": 16649, "train_loss": 3.376166820526123, "lr": 0.0002029653318467787, "tps": 134438, "wall": 8116.5} {"step": 16650, "train_loss": 3.4183902740478516, "lr": 0.00020294625992769207, "tps": 134366, "wall": 8121.4} {"step": 16651, "train_loss": 3.4738950729370117, "lr": 0.00020292718820179116, "tps": 134292, "wall": 8126.3} {"step": 16652, "train_loss": 3.3644907474517822, "lr": 0.00020290811666929197, "tps": 134220, "wall": 8131.2} {"step": 16653, "train_loss": 3.3979289531707764, "lr": 0.00020288904533041056, "tps": 134148, "wall": 8136.0} {"step": 16654, "train_loss": 3.3584814071655273, "lr": 0.00020286997418536297, "tps": 134076, "wall": 8140.9} {"step": 16655, "train_loss": 3.322542667388916, "lr": 0.0002028509032343652, "tps": 134004, "wall": 8145.8} {"step": 16656, "train_loss": 3.269566059112549, "lr": 0.00020283183247763335, "tps": 133931, "wall": 8150.7} {"step": 16657, "train_loss": 3.261111259460449, "lr": 0.0002028127619153834, "tps": 133859, "wall": 8155.5} {"step": 16658, "train_loss": 3.2900290489196777, "lr": 0.0002027936915478315, "tps": 133787, "wall": 8160.4} {"step": 16659, "train_loss": 3.3542330265045166, "lr": 0.00020277462137519353, "tps": 133716, "wall": 8165.3} {"step": 16660, "train_loss": 3.2698380947113037, "lr": 0.0002027555513976856, "tps": 133644, "wall": 8170.1} {"step": 16661, "train_loss": 3.373307704925537, "lr": 0.0002027364816155237, "tps": 133573, "wall": 8175.0} {"step": 16662, "train_loss": 3.4142069816589355, "lr": 0.0002027174120289239, "tps": 133501, "wall": 8179.9} {"step": 16663, "train_loss": 3.3971753120422363, "lr": 0.00020269834263810218, "tps": 133430, "wall": 8184.7} {"step": 16664, "train_loss": 3.3314576148986816, "lr": 0.00020267927344327458, "tps": 133359, "wall": 8189.6} {"step": 16665, "train_loss": 3.4431509971618652, "lr": 0.00020266020444465705, "tps": 133287, "wall": 8194.5} {"step": 16666, "train_loss": 3.35947322845459, "lr": 0.00020264113564246575, "tps": 133216, "wall": 8199.3} {"step": 16667, "train_loss": 3.2644662857055664, "lr": 0.0002026220670369165, "tps": 133145, "wall": 8204.2} {"step": 16668, "train_loss": 3.3842482566833496, "lr": 0.00020260299862822555, "tps": 133074, "wall": 8209.1} {"step": 16669, "train_loss": 3.330557346343994, "lr": 0.00020258393041660866, "tps": 133003, "wall": 8214.0} {"step": 16670, "train_loss": 3.3896846771240234, "lr": 0.00020256486240228196, "tps": 132932, "wall": 8218.8} {"step": 16671, "train_loss": 3.3161520957946777, "lr": 0.0002025457945854615, "tps": 132862, "wall": 8223.7} {"step": 16672, "train_loss": 3.314600944519043, "lr": 0.00020252672696636318, "tps": 132791, "wall": 8228.5} {"step": 16673, "train_loss": 3.2957537174224854, "lr": 0.00020250765954520303, "tps": 132721, "wall": 8233.4} {"step": 16674, "train_loss": 3.3075432777404785, "lr": 0.00020248859232219709, "tps": 132650, "wall": 8238.3} {"step": 16675, "train_loss": 3.3327999114990234, "lr": 0.00020246952529756132, "tps": 132580, "wall": 8243.2} {"step": 16676, "train_loss": 3.4004316329956055, "lr": 0.00020245045847151172, "tps": 132509, "wall": 8248.0} {"step": 16677, "train_loss": 3.2368197441101074, "lr": 0.00020243139184426422, "tps": 132439, "wall": 8252.9} {"step": 16678, "train_loss": 3.381448268890381, "lr": 0.00020241232541603492, "tps": 132369, "wall": 8257.8} {"step": 16679, "train_loss": 3.2952375411987305, "lr": 0.00020239325918703976, "tps": 132299, "wall": 8262.6} {"step": 16680, "train_loss": 3.2238306999206543, "lr": 0.00020237419315749468, "tps": 132228, "wall": 8267.6} {"step": 16681, "train_loss": 3.3519322872161865, "lr": 0.00020235512732761572, "tps": 132158, "wall": 8272.4} {"step": 16682, "train_loss": 3.344015598297119, "lr": 0.00020233606169761884, "tps": 132088, "wall": 8277.3} {"step": 16683, "train_loss": 3.3484132289886475, "lr": 0.00020231699626771993, "tps": 132018, "wall": 8282.2} {"step": 16684, "train_loss": 3.223512649536133, "lr": 0.0002022979310381351, "tps": 131949, "wall": 8287.0} {"step": 16685, "train_loss": 3.40556001663208, "lr": 0.00020227886600908027, "tps": 131879, "wall": 8291.9} {"step": 16686, "train_loss": 3.364142894744873, "lr": 0.0002022598011807714, "tps": 131809, "wall": 8296.8} {"step": 16687, "train_loss": 3.3755292892456055, "lr": 0.00020224073655342447, "tps": 131740, "wall": 8301.7} {"step": 16688, "train_loss": 3.3382363319396973, "lr": 0.00020222167212725545, "tps": 131670, "wall": 8306.6} {"step": 16689, "train_loss": 3.358297348022461, "lr": 0.0002022026079024802, "tps": 131601, "wall": 8311.4} {"step": 16690, "train_loss": 3.359226942062378, "lr": 0.0002021835438793149, "tps": 131532, "wall": 8316.3} {"step": 16691, "train_loss": 3.3420684337615967, "lr": 0.0002021644800579753, "tps": 131463, "wall": 8321.1} {"step": 16692, "train_loss": 3.3843576908111572, "lr": 0.00020214541643867744, "tps": 131394, "wall": 8326.0} {"step": 16693, "train_loss": 3.326751232147217, "lr": 0.00020212635302163724, "tps": 131324, "wall": 8330.9} {"step": 16694, "train_loss": 3.3520925045013428, "lr": 0.00020210728980707074, "tps": 131255, "wall": 8335.8} {"step": 16695, "train_loss": 3.382857322692871, "lr": 0.00020208822679519382, "tps": 131187, "wall": 8340.7} {"step": 16696, "train_loss": 3.3174448013305664, "lr": 0.00020206916398622245, "tps": 131118, "wall": 8345.5} {"step": 16697, "train_loss": 3.395364284515381, "lr": 0.00020205010138037253, "tps": 131050, "wall": 8350.4} {"step": 16698, "train_loss": 3.411761999130249, "lr": 0.00020203103897786003, "tps": 130981, "wall": 8355.3} {"step": 16699, "train_loss": 3.3444442749023438, "lr": 0.00020201197677890091, "tps": 130912, "wall": 8360.2} {"step": 16700, "train_loss": 3.3407678604125977, "lr": 0.00020199291478371106, "tps": 130844, "wall": 8365.0} {"step": 16701, "train_loss": 3.311655044555664, "lr": 0.00020197385299250647, "tps": 130776, "wall": 8369.9} {"step": 16702, "train_loss": 3.4005000591278076, "lr": 0.00020195479140550307, "tps": 130708, "wall": 8374.8} {"step": 16703, "train_loss": 3.3777918815612793, "lr": 0.00020193573002291672, "tps": 130640, "wall": 8379.6} {"step": 16704, "train_loss": 3.460878372192383, "lr": 0.00020191666884496342, "tps": 130572, "wall": 8384.5} {"step": 16705, "train_loss": 3.3871281147003174, "lr": 0.00020189760787185909, "tps": 130502, "wall": 8389.4} {"step": 16706, "train_loss": 3.3632020950317383, "lr": 0.00020187854710381959, "tps": 130434, "wall": 8394.3} {"step": 16707, "train_loss": 3.2810611724853516, "lr": 0.00020185948654106092, "tps": 130367, "wall": 8399.2} {"step": 16708, "train_loss": 3.4289472103118896, "lr": 0.000201840426183799, "tps": 130299, "wall": 8404.0} {"step": 16709, "train_loss": 3.2773032188415527, "lr": 0.00020182136603224965, "tps": 130231, "wall": 8408.9} {"step": 16710, "train_loss": 3.4351682662963867, "lr": 0.0002018023060866289, "tps": 130164, "wall": 8413.8} {"step": 16711, "train_loss": 3.3746628761291504, "lr": 0.00020178324634715256, "tps": 130096, "wall": 8418.6} {"step": 16712, "train_loss": 3.407219171524048, "lr": 0.00020176418681403665, "tps": 130029, "wall": 8423.5} {"step": 16713, "train_loss": 3.3567841053009033, "lr": 0.000201745127487497, "tps": 129961, "wall": 8428.4} {"step": 16714, "train_loss": 3.365834951400757, "lr": 0.0002017260683677495, "tps": 129894, "wall": 8433.3} {"step": 16715, "train_loss": 3.2908167839050293, "lr": 0.00020170700945501015, "tps": 129826, "wall": 8438.2} {"step": 16716, "train_loss": 3.300476312637329, "lr": 0.00020168795074949474, "tps": 129759, "wall": 8443.0} {"step": 16717, "train_loss": 3.2386834621429443, "lr": 0.00020166889225141921, "tps": 129691, "wall": 8448.0} {"step": 16718, "train_loss": 3.367506504058838, "lr": 0.00020164983396099947, "tps": 129624, "wall": 8452.9} {"step": 16719, "train_loss": 3.3143973350524902, "lr": 0.0002016307758784514, "tps": 129557, "wall": 8457.8} {"step": 16720, "train_loss": 3.1945667266845703, "lr": 0.00020161171800399088, "tps": 129490, "wall": 8462.6} {"step": 16721, "train_loss": 3.2896580696105957, "lr": 0.00020159266033783384, "tps": 129423, "wall": 8467.5} {"step": 16722, "train_loss": 3.379737377166748, "lr": 0.00020157360288019618, "tps": 129356, "wall": 8472.4} {"step": 16723, "train_loss": 3.24259877204895, "lr": 0.00020155454563129368, "tps": 129290, "wall": 8477.2} {"step": 16724, "train_loss": 3.4742584228515625, "lr": 0.00020153548859134227, "tps": 129223, "wall": 8482.1} {"step": 16725, "train_loss": 3.192183256149292, "lr": 0.00020151643176055792, "tps": 129156, "wall": 8487.0} {"step": 16726, "train_loss": 3.468919515609741, "lr": 0.00020149737513915636, "tps": 129090, "wall": 8491.9} {"step": 16727, "train_loss": 3.3384904861450195, "lr": 0.00020147831872735354, "tps": 129024, "wall": 8496.7} {"step": 16728, "train_loss": 3.3788323402404785, "lr": 0.00020145926252536538, "tps": 128957, "wall": 8501.6} {"step": 16729, "train_loss": 3.3226213455200195, "lr": 0.00020144020653340764, "tps": 128890, "wall": 8506.6} {"step": 16730, "train_loss": 3.293337821960449, "lr": 0.00020142115075169628, "tps": 128824, "wall": 8511.4} {"step": 16731, "train_loss": 3.4078123569488525, "lr": 0.00020140209518044712, "tps": 128758, "wall": 8516.3} {"step": 16732, "train_loss": 3.33752703666687, "lr": 0.00020138303981987604, "tps": 128692, "wall": 8521.2} {"step": 16733, "train_loss": 3.4476125240325928, "lr": 0.0002013639846701989, "tps": 128627, "wall": 8526.0} {"step": 16734, "train_loss": 3.3759870529174805, "lr": 0.00020134492973163153, "tps": 128561, "wall": 8530.9} {"step": 16735, "train_loss": 3.376059055328369, "lr": 0.00020132587500438983, "tps": 128495, "wall": 8535.8} {"step": 16736, "train_loss": 3.324439525604248, "lr": 0.00020130682048868955, "tps": 128430, "wall": 8540.6} {"step": 16737, "train_loss": 3.355894088745117, "lr": 0.00020128776618474667, "tps": 128364, "wall": 8545.5} {"step": 16738, "train_loss": 3.336369514465332, "lr": 0.00020126871209277702, "tps": 128298, "wall": 8550.4} {"step": 16739, "train_loss": 3.3322510719299316, "lr": 0.0002012496582129964, "tps": 128233, "wall": 8555.3} {"step": 16740, "train_loss": 3.371471643447876, "lr": 0.00020123060454562067, "tps": 128167, "wall": 8560.2} {"step": 16741, "train_loss": 3.319572687149048, "lr": 0.0002012115510908656, "tps": 128102, "wall": 8565.1} {"step": 16742, "train_loss": 3.32912015914917, "lr": 0.00020119249784894717, "tps": 128036, "wall": 8570.0} {"step": 16743, "train_loss": 3.3510899543762207, "lr": 0.00020117344482008113, "tps": 127971, "wall": 8574.9} {"step": 16744, "train_loss": 3.334929943084717, "lr": 0.00020115439200448328, "tps": 127906, "wall": 8579.7} {"step": 16745, "train_loss": 3.3548121452331543, "lr": 0.00020113533940236956, "tps": 127841, "wall": 8584.6} {"step": 16746, "train_loss": 3.2269766330718994, "lr": 0.0002011162870139557, "tps": 127776, "wall": 8589.5} {"step": 16747, "train_loss": 3.3816399574279785, "lr": 0.00020109723483945758, "tps": 127711, "wall": 8594.3} {"step": 16748, "train_loss": 3.2318944931030273, "lr": 0.00020107818287909096, "tps": 127646, "wall": 8599.2} {"step": 16749, "train_loss": 3.338097333908081, "lr": 0.0002010591311330718, "tps": 127581, "wall": 8604.1} {"step": 16750, "train_loss": 3.3325209617614746, "lr": 0.00020104007960161573, "tps": 127517, "wall": 8609.0} {"step": 16751, "train_loss": 3.298647165298462, "lr": 0.0002010210282849387, "tps": 127452, "wall": 8613.9} {"step": 16752, "train_loss": 3.330803394317627, "lr": 0.00020100197718325654, "tps": 127388, "wall": 8618.7} {"step": 16753, "train_loss": 3.381779193878174, "lr": 0.00020098292629678493, "tps": 127323, "wall": 8623.6} {"step": 16754, "train_loss": 3.4915337562561035, "lr": 0.0002009638756257398, "tps": 127258, "wall": 8628.6} {"step": 16755, "train_loss": 3.3851568698883057, "lr": 0.0002009448251703369, "tps": 127193, "wall": 8633.4} {"step": 16756, "train_loss": 3.3013620376586914, "lr": 0.00020092577493079205, "tps": 127129, "wall": 8638.3} {"step": 16757, "train_loss": 3.3362650871276855, "lr": 0.0002009067249073211, "tps": 127065, "wall": 8643.2} {"step": 16758, "train_loss": 3.324725866317749, "lr": 0.00020088767510013976, "tps": 127001, "wall": 8648.1} {"step": 16759, "train_loss": 3.3985278606414795, "lr": 0.00020086862550946388, "tps": 126937, "wall": 8652.9} {"step": 16760, "train_loss": 3.321727752685547, "lr": 0.00020084957613550924, "tps": 126873, "wall": 8657.8} {"step": 16761, "train_loss": 3.428849220275879, "lr": 0.00020083052697849162, "tps": 126809, "wall": 8662.7} {"step": 16762, "train_loss": 3.2808127403259277, "lr": 0.00020081147803862684, "tps": 126745, "wall": 8667.6} {"step": 16763, "train_loss": 3.35164737701416, "lr": 0.0002007924293161307, "tps": 126681, "wall": 8672.5} {"step": 16764, "train_loss": 3.352612018585205, "lr": 0.0002007733808112189, "tps": 126618, "wall": 8677.3} {"step": 16765, "train_loss": 3.3048763275146484, "lr": 0.00020075433252410733, "tps": 126554, "wall": 8682.2} {"step": 16766, "train_loss": 3.4085941314697266, "lr": 0.00020073528445501175, "tps": 126490, "wall": 8687.2} {"step": 16767, "train_loss": 3.380375862121582, "lr": 0.00020071623660414788, "tps": 126427, "wall": 8692.0} {"step": 16768, "train_loss": 3.317939519882202, "lr": 0.0002006971889717315, "tps": 126363, "wall": 8696.9} {"step": 16769, "train_loss": 3.426225423812866, "lr": 0.00020067814155797845, "tps": 126300, "wall": 8701.8} {"step": 16770, "train_loss": 3.356248378753662, "lr": 0.0002006590943631044, "tps": 126237, "wall": 8706.7} {"step": 16771, "train_loss": 3.216248035430908, "lr": 0.0002006400473873253, "tps": 126174, "wall": 8711.5} {"step": 16772, "train_loss": 3.2852752208709717, "lr": 0.0002006210006308567, "tps": 126110, "wall": 8716.4} {"step": 16773, "train_loss": 3.429490327835083, "lr": 0.00020060195409391446, "tps": 126048, "wall": 8721.3} {"step": 16774, "train_loss": 3.2811384201049805, "lr": 0.00020058290777671432, "tps": 125985, "wall": 8726.1} {"step": 16775, "train_loss": 3.369784355163574, "lr": 0.00020056386167947206, "tps": 125922, "wall": 8731.0} {"step": 16776, "train_loss": 3.2581214904785156, "lr": 0.00020054481580240342, "tps": 125859, "wall": 8735.9} {"step": 16777, "train_loss": 3.317821979522705, "lr": 0.0002005257701457242, "tps": 125796, "wall": 8740.8} {"step": 16778, "train_loss": 3.337869882583618, "lr": 0.00020050672470965007, "tps": 125734, "wall": 8745.7} {"step": 16779, "train_loss": 3.2524285316467285, "lr": 0.0002004876794943968, "tps": 125670, "wall": 8750.6} {"step": 16780, "train_loss": 3.2537927627563477, "lr": 0.00020046863450018019, "tps": 125608, "wall": 8755.5} {"step": 16781, "train_loss": 3.4190187454223633, "lr": 0.00020044958972721593, "tps": 125545, "wall": 8760.3} {"step": 16782, "train_loss": 3.3444595336914062, "lr": 0.00020043054517571976, "tps": 125483, "wall": 8765.2} {"step": 16783, "train_loss": 3.4667696952819824, "lr": 0.00020041150084590745, "tps": 125421, "wall": 8770.1} {"step": 16784, "train_loss": 3.388763427734375, "lr": 0.00020039245673799476, "tps": 125358, "wall": 8775.0} {"step": 16785, "train_loss": 3.376919984817505, "lr": 0.00020037341285219728, "tps": 125296, "wall": 8779.8} {"step": 16786, "train_loss": 3.195044994354248, "lr": 0.00020035436918873088, "tps": 125234, "wall": 8784.7} {"step": 16787, "train_loss": 3.4152374267578125, "lr": 0.00020033532574781132, "tps": 125172, "wall": 8789.6} {"step": 16788, "train_loss": 3.382221221923828, "lr": 0.0002003162825296542, "tps": 125110, "wall": 8794.5} {"step": 16789, "train_loss": 3.424842119216919, "lr": 0.0002002972395344753, "tps": 125048, "wall": 8799.3} {"step": 16790, "train_loss": 3.314018726348877, "lr": 0.0002002781967624903, "tps": 124986, "wall": 8804.2} {"step": 16791, "train_loss": 3.3757481575012207, "lr": 0.000200259154213915, "tps": 124924, "wall": 8809.2} {"step": 16792, "train_loss": 3.3472490310668945, "lr": 0.00020024011188896505, "tps": 124863, "wall": 8814.0} {"step": 16793, "train_loss": 3.3030617237091064, "lr": 0.0002002210697878562, "tps": 124801, "wall": 8818.9} {"step": 16794, "train_loss": 3.362107753753662, "lr": 0.00020020202791080417, "tps": 124740, "wall": 8823.8} {"step": 16795, "train_loss": 3.4216995239257812, "lr": 0.00020018298625802455, "tps": 124678, "wall": 8828.6} {"step": 16796, "train_loss": 3.3045525550842285, "lr": 0.00020016394482973317, "tps": 124617, "wall": 8833.5} {"step": 16797, "train_loss": 3.3393051624298096, "lr": 0.0002001449036261457, "tps": 124556, "wall": 8838.4} {"step": 16798, "train_loss": 3.232541561126709, "lr": 0.0002001258626474779, "tps": 124495, "wall": 8843.2} {"step": 16799, "train_loss": 3.283764362335205, "lr": 0.0002001068218939453, "tps": 124434, "wall": 8848.1} {"step": 16800, "train_loss": 3.2525744438171387, "lr": 0.00020008778136576373, "tps": 124373, "wall": 8853.0} {"step": 16801, "train_loss": 3.30926513671875, "lr": 0.0002000687410631489, "tps": 124312, "wall": 8857.8} {"step": 16802, "train_loss": 3.377945899963379, "lr": 0.00020004970098631638, "tps": 124251, "wall": 8862.7} {"step": 16803, "train_loss": 3.2772622108459473, "lr": 0.00020003066113548194, "tps": 124189, "wall": 8867.6} {"step": 16804, "train_loss": 3.379314661026001, "lr": 0.00020001162151086135, "tps": 124128, "wall": 8872.5} {"step": 16805, "train_loss": 3.3040080070495605, "lr": 0.00019999258211267007, "tps": 124068, "wall": 8877.4} {"step": 16806, "train_loss": 3.3825981616973877, "lr": 0.00019997354294112394, "tps": 124007, "wall": 8882.2} {"step": 16807, "train_loss": 3.4043164253234863, "lr": 0.0001999545039964386, "tps": 123946, "wall": 8887.1} {"step": 16808, "train_loss": 3.245145320892334, "lr": 0.00019993546527882975, "tps": 123886, "wall": 8892.0} {"step": 16809, "train_loss": 3.335545063018799, "lr": 0.00019991642678851302, "tps": 123825, "wall": 8896.8} {"step": 16810, "train_loss": 3.2935853004455566, "lr": 0.00019989738852570406, "tps": 123765, "wall": 8901.7} {"step": 16811, "train_loss": 3.481093406677246, "lr": 0.00019987835049061864, "tps": 123704, "wall": 8906.6} {"step": 16812, "train_loss": 3.3617424964904785, "lr": 0.00019985931268347228, "tps": 123644, "wall": 8911.5} {"step": 16813, "train_loss": 3.2688982486724854, "lr": 0.00019984027510448074, "tps": 123584, "wall": 8916.3} {"step": 16814, "train_loss": 3.261141777038574, "lr": 0.00019982123775385971, "tps": 123524, "wall": 8921.2} {"step": 16815, "train_loss": 3.3517489433288574, "lr": 0.00019980220063182472, "tps": 123463, "wall": 8926.1} {"step": 16816, "train_loss": 3.405224323272705, "lr": 0.0001997831637385915, "tps": 123402, "wall": 8931.1} {"step": 16817, "train_loss": 3.4199891090393066, "lr": 0.00019976412707437571, "tps": 123343, "wall": 8935.9} {"step": 16818, "train_loss": 3.431039571762085, "lr": 0.000199745090639393, "tps": 123283, "wall": 8940.8} {"step": 16819, "train_loss": 3.302375555038452, "lr": 0.00019972605443385896, "tps": 123223, "wall": 8945.6} {"step": 16820, "train_loss": 3.427216053009033, "lr": 0.00019970701845798932, "tps": 123164, "wall": 8950.5} {"step": 16821, "train_loss": 3.3936269283294678, "lr": 0.00019968798271199965, "tps": 123104, "wall": 8955.4} {"step": 16822, "train_loss": 3.3366756439208984, "lr": 0.0001996689471961056, "tps": 123044, "wall": 8960.3} {"step": 16823, "train_loss": 3.321653366088867, "lr": 0.0001996499119105228, "tps": 122985, "wall": 8965.1} {"step": 16824, "train_loss": 3.300837993621826, "lr": 0.00019963087685546694, "tps": 122925, "wall": 8970.0} {"step": 16825, "train_loss": 3.302598237991333, "lr": 0.0001996118420311536, "tps": 122866, "wall": 8974.8} {"step": 16826, "train_loss": 3.3912336826324463, "lr": 0.0001995928074377984, "tps": 122807, "wall": 8979.7} {"step": 16827, "train_loss": 3.28043270111084, "lr": 0.00019957377307561699, "tps": 122747, "wall": 8984.6} {"step": 16828, "train_loss": 3.212812662124634, "lr": 0.000199554738944825, "tps": 122687, "wall": 8989.5} {"step": 16829, "train_loss": 3.336604356765747, "lr": 0.00019953570504563798, "tps": 122628, "wall": 8994.4} {"step": 16830, "train_loss": 3.3615424633026123, "lr": 0.00019951667137827164, "tps": 122570, "wall": 8999.2} {"step": 16831, "train_loss": 3.2378320693969727, "lr": 0.0001994976379429416, "tps": 122511, "wall": 9004.1} {"step": 16832, "train_loss": 3.3488593101501465, "lr": 0.00019947860473986336, "tps": 122452, "wall": 9009.0} {"step": 16833, "train_loss": 3.4130163192749023, "lr": 0.00019945957176925258, "tps": 122393, "wall": 9013.8} {"step": 16834, "train_loss": 3.3857815265655518, "lr": 0.00019944053903132495, "tps": 122334, "wall": 9018.7} {"step": 16835, "train_loss": 3.395183563232422, "lr": 0.00019942150652629598, "tps": 122275, "wall": 9023.6} {"step": 16836, "train_loss": 3.4137775897979736, "lr": 0.0001994024742543813, "tps": 122217, "wall": 9028.4} {"step": 16837, "train_loss": 3.3140928745269775, "lr": 0.00019938344221579648, "tps": 122158, "wall": 9033.3} {"step": 16838, "train_loss": 3.4123637676239014, "lr": 0.00019936441041075716, "tps": 122099, "wall": 9038.2} {"step": 16839, "train_loss": 3.295041084289551, "lr": 0.00019934537883947894, "tps": 122041, "wall": 9043.1} {"step": 16840, "train_loss": 3.2820932865142822, "lr": 0.00019932634750217734, "tps": 121982, "wall": 9048.0} {"step": 16841, "train_loss": 3.398805856704712, "lr": 0.00019930731639906802, "tps": 121923, "wall": 9052.8} {"step": 16842, "train_loss": 3.4153223037719727, "lr": 0.00019928828553036652, "tps": 121865, "wall": 9057.7} {"step": 16843, "train_loss": 3.340573310852051, "lr": 0.00019926925489628845, "tps": 121807, "wall": 9062.6} {"step": 16844, "train_loss": 3.2876172065734863, "lr": 0.0001992502244970494, "tps": 121749, "wall": 9067.4} {"step": 16845, "train_loss": 3.4186151027679443, "lr": 0.0001992311943328649, "tps": 121691, "wall": 9072.3} {"step": 16846, "train_loss": 3.424806833267212, "lr": 0.0001992121644039506, "tps": 121633, "wall": 9077.2} {"step": 16847, "train_loss": 3.3427765369415283, "lr": 0.00019919313471052194, "tps": 121575, "wall": 9082.0} {"step": 16848, "train_loss": 3.3243918418884277, "lr": 0.00019917410525279467, "tps": 121517, "wall": 9086.9} {"step": 16849, "train_loss": 3.2952771186828613, "lr": 0.0001991550760309842, "tps": 121459, "wall": 9091.8} {"step": 16850, "train_loss": 3.3393287658691406, "lr": 0.00019913604704530617, "tps": 121401, "wall": 9096.6} {"step": 16851, "train_loss": 3.390707492828369, "lr": 0.0001991170182959762, "tps": 121344, "wall": 9101.5} {"step": 16852, "train_loss": 3.3149073123931885, "lr": 0.00019909798978320965, "tps": 121285, "wall": 9106.4} {"step": 16853, "train_loss": 3.3535335063934326, "lr": 0.0001990789615072223, "tps": 121228, "wall": 9111.3} {"step": 16854, "train_loss": 3.2634594440460205, "lr": 0.00019905993346822952, "tps": 121170, "wall": 9116.1} {"step": 16855, "train_loss": 3.408936023712158, "lr": 0.00019904090566644708, "tps": 121113, "wall": 9121.0} {"step": 16856, "train_loss": 3.4291868209838867, "lr": 0.00019902187810209027, "tps": 121055, "wall": 9125.9} {"step": 16857, "train_loss": 3.2197980880737305, "lr": 0.0001990028507753748, "tps": 120998, "wall": 9130.7} {"step": 16858, "train_loss": 3.28951096534729, "lr": 0.0001989838236865162, "tps": 120941, "wall": 9135.6} {"step": 16859, "train_loss": 3.410886287689209, "lr": 0.00019896479683572996, "tps": 120884, "wall": 9140.5} {"step": 16860, "train_loss": 3.2416489124298096, "lr": 0.00019894577022323162, "tps": 120826, "wall": 9145.3} {"step": 16861, "train_loss": 3.4053874015808105, "lr": 0.00019892674384923672, "tps": 120769, "wall": 9150.2} {"step": 16862, "train_loss": 3.3422598838806152, "lr": 0.0001989077177139609, "tps": 120712, "wall": 9155.1} {"step": 16863, "train_loss": 3.3523306846618652, "lr": 0.0001988886918176195, "tps": 120655, "wall": 9159.9} {"step": 16864, "train_loss": 3.3386547565460205, "lr": 0.00019886966616042818, "tps": 120598, "wall": 9164.8} {"step": 16865, "train_loss": 3.3235116004943848, "lr": 0.00019885064074260243, "tps": 120540, "wall": 9169.8} {"step": 16866, "train_loss": 3.2619733810424805, "lr": 0.00019883161556435774, "tps": 120483, "wall": 9174.6} {"step": 16867, "train_loss": 3.275474786758423, "lr": 0.00019881259062590968, "tps": 120427, "wall": 9179.5} {"step": 16868, "train_loss": 3.382869005203247, "lr": 0.00019879356592747373, "tps": 120370, "wall": 9184.4} {"step": 16869, "train_loss": 3.261115789413452, "lr": 0.0001987745414692654, "tps": 120313, "wall": 9189.2} {"step": 16870, "train_loss": 3.344297170639038, "lr": 0.00019875551725150023, "tps": 120257, "wall": 9194.1} {"step": 16871, "train_loss": 3.3318018913269043, "lr": 0.00019873649327439366, "tps": 120200, "wall": 9199.0} {"step": 16872, "train_loss": 3.25295352935791, "lr": 0.00019871746953816134, "tps": 120144, "wall": 9203.8} {"step": 16873, "train_loss": 3.287261486053467, "lr": 0.00019869844604301863, "tps": 120087, "wall": 9208.7} {"step": 16874, "train_loss": 3.2734663486480713, "lr": 0.00019867942278918105, "tps": 120031, "wall": 9213.6} {"step": 16875, "train_loss": 3.415198802947998, "lr": 0.00019866039977686417, "tps": 119975, "wall": 9218.4} {"step": 16876, "train_loss": 3.2727298736572266, "lr": 0.00019864137700628337, "tps": 119919, "wall": 9223.3} {"step": 16877, "train_loss": 3.4020986557006836, "lr": 0.00019862235447765426, "tps": 119861, "wall": 9228.3} {"step": 16878, "train_loss": 3.413348436355591, "lr": 0.0001986033321911923, "tps": 119805, "wall": 9233.1} {"step": 16879, "train_loss": 3.354635000228882, "lr": 0.0001985843101471129, "tps": 119749, "wall": 9238.0} {"step": 16880, "train_loss": 3.369424343109131, "lr": 0.00019856528834563157, "tps": 119693, "wall": 9242.9} {"step": 16881, "train_loss": 3.4632480144500732, "lr": 0.00019854626678696385, "tps": 119637, "wall": 9247.7} {"step": 16882, "train_loss": 3.300550699234009, "lr": 0.00019852724547132517, "tps": 119582, "wall": 9252.6} {"step": 16883, "train_loss": 3.3576502799987793, "lr": 0.00019850822439893104, "tps": 119526, "wall": 9257.5} {"step": 16884, "train_loss": 3.346710205078125, "lr": 0.00019848920356999687, "tps": 119470, "wall": 9262.3} {"step": 16885, "train_loss": 3.4957995414733887, "lr": 0.0001984701829847382, "tps": 119414, "wall": 9267.2} {"step": 16886, "train_loss": 3.325895309448242, "lr": 0.00019845116264337044, "tps": 119359, "wall": 9272.1} {"step": 16887, "train_loss": 3.3561816215515137, "lr": 0.00019843214254610904, "tps": 119303, "wall": 9276.9} {"step": 16888, "train_loss": 3.408388137817383, "lr": 0.00019841312269316955, "tps": 119248, "wall": 9281.8} {"step": 16889, "train_loss": 3.3537869453430176, "lr": 0.0001983941030847674, "tps": 119191, "wall": 9286.7} {"step": 16890, "train_loss": 3.3297057151794434, "lr": 0.00019837508372111797, "tps": 119136, "wall": 9291.6} {"step": 16891, "train_loss": 3.246366262435913, "lr": 0.00019835606460243677, "tps": 119081, "wall": 9296.5} {"step": 16892, "train_loss": 3.3673975467681885, "lr": 0.00019833704572893925, "tps": 119026, "wall": 9301.3} {"step": 16893, "train_loss": 3.35880708694458, "lr": 0.0001983180271008408, "tps": 118970, "wall": 9306.2} {"step": 16894, "train_loss": 3.392622470855713, "lr": 0.000198299008718357, "tps": 118915, "wall": 9311.0} {"step": 16895, "train_loss": 3.35400390625, "lr": 0.00019827999058170316, "tps": 118860, "wall": 9315.9} {"step": 16896, "train_loss": 3.481308937072754, "lr": 0.00019826097269109476, "tps": 118805, "wall": 9320.8} {"step": 16897, "train_loss": 3.358945369720459, "lr": 0.0001982419550467472, "tps": 118751, "wall": 9325.6} {"step": 16898, "train_loss": 3.280449390411377, "lr": 0.00019822293764887596, "tps": 118696, "wall": 9330.5} {"step": 16899, "train_loss": 3.426708221435547, "lr": 0.00019820392049769653, "tps": 118641, "wall": 9335.3} {"step": 16900, "train_loss": 3.3667991161346436, "lr": 0.0001981849035934242, "tps": 118586, "wall": 9340.2} {"step": 16901, "train_loss": 3.2453296184539795, "lr": 0.0001981658869362745, "tps": 118532, "wall": 9345.1} {"step": 16902, "train_loss": 3.323629379272461, "lr": 0.0001981468705264628, "tps": 118476, "wall": 9350.0} {"step": 16903, "train_loss": 3.4406373500823975, "lr": 0.00019812785436420453, "tps": 118421, "wall": 9354.9} {"step": 16904, "train_loss": 3.3167219161987305, "lr": 0.00019810883844971507, "tps": 118367, "wall": 9359.8} {"step": 16905, "train_loss": 3.3141424655914307, "lr": 0.00019808982278320998, "tps": 118312, "wall": 9364.6} {"step": 16906, "train_loss": 3.2654271125793457, "lr": 0.00019807080736490446, "tps": 118258, "wall": 9369.5} {"step": 16907, "train_loss": 3.3345513343811035, "lr": 0.00019805179219501407, "tps": 118203, "wall": 9374.3} {"step": 16908, "train_loss": 3.3430113792419434, "lr": 0.00019803277727375415, "tps": 118149, "wall": 9379.2} {"step": 16909, "train_loss": 3.4340546131134033, "lr": 0.00019801376260134013, "tps": 118095, "wall": 9384.1} {"step": 16910, "train_loss": 3.322765588760376, "lr": 0.0001979947481779874, "tps": 118040, "wall": 9389.0} {"step": 16911, "train_loss": 3.2535345554351807, "lr": 0.0001979757340039113, "tps": 117986, "wall": 9393.8} {"step": 16912, "train_loss": 3.3271408081054688, "lr": 0.00019795672007932736, "tps": 117932, "wall": 9398.7} {"step": 16913, "train_loss": 3.4279637336730957, "lr": 0.0001979377064044508, "tps": 117878, "wall": 9403.6} {"step": 16914, "train_loss": 3.298611640930176, "lr": 0.00019791869297949713, "tps": 117823, "wall": 9408.5} {"step": 16915, "train_loss": 3.348949909210205, "lr": 0.00019789967980468173, "tps": 117769, "wall": 9413.4} {"step": 16916, "train_loss": 3.280156135559082, "lr": 0.00019788066688021996, "tps": 117715, "wall": 9418.2} {"step": 16917, "train_loss": 3.2981555461883545, "lr": 0.00019786165420632715, "tps": 117662, "wall": 9423.1} {"step": 16918, "train_loss": 3.306245803833008, "lr": 0.00019784264178321869, "tps": 117608, "wall": 9427.9} {"step": 16919, "train_loss": 3.212803840637207, "lr": 0.0001978236296111101, "tps": 117554, "wall": 9432.8} {"step": 16920, "train_loss": 3.3382728099823, "lr": 0.00019780461769021654, "tps": 117501, "wall": 9437.6} {"step": 16921, "train_loss": 3.3339972496032715, "lr": 0.00019778560602075345, "tps": 117447, "wall": 9442.5} {"step": 16922, "train_loss": 3.3597190380096436, "lr": 0.0001977665946029363, "tps": 117394, "wall": 9447.4} {"step": 16923, "train_loss": 3.319988489151001, "lr": 0.00019774758343698033, "tps": 117340, "wall": 9452.2} {"step": 16924, "train_loss": 3.2771363258361816, "lr": 0.00019772857252310094, "tps": 117287, "wall": 9457.1} {"step": 16925, "train_loss": 3.227261543273926, "lr": 0.00019770956186151347, "tps": 117233, "wall": 9462.0} {"step": 16926, "train_loss": 3.2464680671691895, "lr": 0.0001976905514524333, "tps": 117179, "wall": 9466.9} {"step": 16927, "train_loss": 3.30946683883667, "lr": 0.00019767154129607576, "tps": 117126, "wall": 9471.8} {"step": 16928, "train_loss": 3.327775478363037, "lr": 0.00019765253139265623, "tps": 117073, "wall": 9476.6} {"step": 16929, "train_loss": 3.377744674682617, "lr": 0.00019763352174239005, "tps": 117020, "wall": 9481.5} {"step": 16930, "train_loss": 3.391033172607422, "lr": 0.00019761451234549248, "tps": 116967, "wall": 9486.3} {"step": 16931, "train_loss": 3.3167192935943604, "lr": 0.00019759550320217896, "tps": 116914, "wall": 9491.2} {"step": 16932, "train_loss": 3.292630910873413, "lr": 0.00019757649431266484, "tps": 116861, "wall": 9496.0} {"step": 16933, "train_loss": 3.3317341804504395, "lr": 0.00019755748567716532, "tps": 116808, "wall": 9500.9} {"step": 16934, "train_loss": 3.447822093963623, "lr": 0.00019753847729589582, "tps": 116755, "wall": 9505.8} {"step": 16935, "train_loss": 3.390737295150757, "lr": 0.00019751946916907173, "tps": 116702, "wall": 9510.7} {"step": 16936, "train_loss": 3.3177597522735596, "lr": 0.00019750046129690828, "tps": 116649, "wall": 9515.5} {"step": 16937, "train_loss": 3.39758563041687, "lr": 0.00019748145367962084, "tps": 116597, "wall": 9520.4} {"step": 16938, "train_loss": 3.358341693878174, "lr": 0.00019746244631742464, "tps": 116544, "wall": 9525.2} {"step": 16939, "train_loss": 3.3865554332733154, "lr": 0.00019744343921053518, "tps": 116491, "wall": 9530.1} {"step": 16940, "train_loss": 3.3730320930480957, "lr": 0.00019742443235916765, "tps": 116438, "wall": 9535.0} {"step": 16941, "train_loss": 3.251209259033203, "lr": 0.00019740542576353733, "tps": 116386, "wall": 9539.9} {"step": 16942, "train_loss": 3.322895050048828, "lr": 0.00019738641942385955, "tps": 116333, "wall": 9544.7} {"step": 16943, "train_loss": 3.2996373176574707, "lr": 0.00019736741334034963, "tps": 116281, "wall": 9549.6} {"step": 16944, "train_loss": 3.259204626083374, "lr": 0.00019734840751322295, "tps": 116229, "wall": 9554.5} {"step": 16945, "train_loss": 3.2793145179748535, "lr": 0.00019732940194269464, "tps": 116176, "wall": 9559.3} {"step": 16946, "train_loss": 3.2963435649871826, "lr": 0.0001973103966289801, "tps": 116124, "wall": 9564.2} {"step": 16947, "train_loss": 3.2720353603363037, "lr": 0.0001972913915722947, "tps": 116072, "wall": 9569.1} {"step": 16948, "train_loss": 3.358224391937256, "lr": 0.00019727238677285356, "tps": 116019, "wall": 9574.0} {"step": 16949, "train_loss": 3.332791805267334, "lr": 0.00019725338223087205, "tps": 115967, "wall": 9578.8} {"step": 16950, "train_loss": 3.4001383781433105, "lr": 0.00019723437794656547, "tps": 115915, "wall": 9583.7} {"step": 16951, "train_loss": 3.2902865409851074, "lr": 0.00019721537392014917, "tps": 115862, "wall": 9588.6} {"step": 16952, "train_loss": 3.3687305450439453, "lr": 0.00019719637015183829, "tps": 115810, "wall": 9593.5} {"step": 16953, "train_loss": 3.216169595718384, "lr": 0.0001971773666418481, "tps": 115759, "wall": 9598.4} {"step": 16954, "train_loss": 3.3036036491394043, "lr": 0.00019715836339039404, "tps": 115707, "wall": 9603.2} {"step": 16955, "train_loss": 3.284813404083252, "lr": 0.00019713936039769122, "tps": 115654, "wall": 9608.1} {"step": 16956, "train_loss": 3.317915439605713, "lr": 0.00019712035766395497, "tps": 115603, "wall": 9613.0} {"step": 16957, "train_loss": 3.3020944595336914, "lr": 0.0001971013551894005, "tps": 115551, "wall": 9617.9} {"step": 16958, "train_loss": 3.3592302799224854, "lr": 0.0001970823529742432, "tps": 115499, "wall": 9622.8} {"step": 16959, "train_loss": 3.3005170822143555, "lr": 0.0001970633510186982, "tps": 115447, "wall": 9627.6} {"step": 16960, "train_loss": 3.3366830348968506, "lr": 0.00019704434932298076, "tps": 115396, "wall": 9632.5} {"step": 16961, "train_loss": 3.3231730461120605, "lr": 0.00019702534788730626, "tps": 115344, "wall": 9637.4} {"step": 16962, "train_loss": 3.4318084716796875, "lr": 0.0001970063467118898, "tps": 115293, "wall": 9642.2} {"step": 16963, "train_loss": 3.276857376098633, "lr": 0.00019698734579694672, "tps": 115241, "wall": 9647.2} {"step": 16964, "train_loss": 3.330385684967041, "lr": 0.00019696834514269223, "tps": 115190, "wall": 9652.0} {"step": 16965, "train_loss": 3.307339668273926, "lr": 0.00019694934474934157, "tps": 115139, "wall": 9656.9} {"step": 16966, "train_loss": 3.352346658706665, "lr": 0.00019693034461710997, "tps": 115087, "wall": 9661.7} {"step": 16967, "train_loss": 3.359788417816162, "lr": 0.00019691134474621267, "tps": 115036, "wall": 9666.6} {"step": 16968, "train_loss": 3.216015338897705, "lr": 0.0001968923451368649, "tps": 114985, "wall": 9671.5} {"step": 16969, "train_loss": 3.319517135620117, "lr": 0.00019687334578928192, "tps": 114934, "wall": 9676.3} {"step": 16970, "train_loss": 3.2556967735290527, "lr": 0.00019685434670367892, "tps": 114883, "wall": 9681.2} {"step": 16971, "train_loss": 3.4146647453308105, "lr": 0.00019683534788027113, "tps": 114832, "wall": 9686.1} {"step": 16972, "train_loss": 3.2616686820983887, "lr": 0.0001968163493192738, "tps": 114781, "wall": 9691.0} {"step": 16973, "train_loss": 3.4576334953308105, "lr": 0.00019679735102090206, "tps": 114730, "wall": 9695.8} {"step": 16974, "train_loss": 3.3358378410339355, "lr": 0.00019677835298537123, "tps": 114679, "wall": 9700.7} {"step": 16975, "train_loss": 3.3367857933044434, "lr": 0.00019675935521289644, "tps": 114628, "wall": 9705.6} {"step": 16976, "train_loss": 3.3351802825927734, "lr": 0.00019674035770369294, "tps": 114577, "wall": 9710.5} {"step": 16977, "train_loss": 3.2651658058166504, "lr": 0.00019672136045797593, "tps": 114526, "wall": 9715.4} {"step": 16978, "train_loss": 3.4086716175079346, "lr": 0.00019670236347596066, "tps": 114476, "wall": 9720.2} {"step": 16979, "train_loss": 3.2776410579681396, "lr": 0.0001966833667578622, "tps": 114426, "wall": 9725.1} {"step": 16980, "train_loss": 3.3560380935668945, "lr": 0.00019666437030389585, "tps": 114375, "wall": 9729.9} {"step": 16981, "train_loss": 3.2857964038848877, "lr": 0.00019664537411427681, "tps": 114325, "wall": 9734.8} {"step": 16982, "train_loss": 3.3786001205444336, "lr": 0.00019662637818922019, "tps": 114275, "wall": 9739.6} {"step": 16983, "train_loss": 3.314082384109497, "lr": 0.00019660738252894126, "tps": 114224, "wall": 9744.5} {"step": 16984, "train_loss": 3.2956504821777344, "lr": 0.00019658838713365514, "tps": 114174, "wall": 9749.4} {"step": 16985, "train_loss": 3.283252000808716, "lr": 0.00019656939200357701, "tps": 114124, "wall": 9754.2} {"step": 16986, "train_loss": 3.4054372310638428, "lr": 0.00019655039713892212, "tps": 114074, "wall": 9759.1} {"step": 16987, "train_loss": 3.4074525833129883, "lr": 0.00019653140253990558, "tps": 114024, "wall": 9763.9} {"step": 16988, "train_loss": 3.4168879985809326, "lr": 0.0001965124082067426, "tps": 113973, "wall": 9768.9} {"step": 16989, "train_loss": 3.389997959136963, "lr": 0.0001964934141396483, "tps": 113923, "wall": 9773.7} {"step": 16990, "train_loss": 3.2753233909606934, "lr": 0.0001964744203388379, "tps": 113873, "wall": 9778.6} {"step": 16991, "train_loss": 3.3704473972320557, "lr": 0.00019645542680452656, "tps": 113823, "wall": 9783.5} {"step": 16992, "train_loss": 3.2990427017211914, "lr": 0.00019643643353692937, "tps": 113773, "wall": 9788.3} {"step": 16993, "train_loss": 3.3613991737365723, "lr": 0.00019641744053626155, "tps": 113723, "wall": 9793.2} {"step": 16994, "train_loss": 3.3009819984436035, "lr": 0.00019639844780273825, "tps": 113674, "wall": 9798.0} {"step": 16995, "train_loss": 3.2891335487365723, "lr": 0.00019637945533657462, "tps": 113624, "wall": 9802.9} {"step": 16996, "train_loss": 3.3955297470092773, "lr": 0.0001963604631379858, "tps": 113575, "wall": 9807.7} {"step": 16997, "train_loss": 3.265977621078491, "lr": 0.0001963414712071869, "tps": 113525, "wall": 9812.6} {"step": 16998, "train_loss": 3.4439449310302734, "lr": 0.00019632247954439312, "tps": 113475, "wall": 9817.5} {"step": 16999, "train_loss": 3.3439674377441406, "lr": 0.00019630348814981952, "tps": 113426, "wall": 9822.4} {"step": 17000, "train_loss": 3.3753457069396973, "lr": 0.00019628449702368137, "tps": 113375, "wall": 9827.3, "val_loss_monitor": 3.3910849638580665} {"step": 17001, "train_loss": 3.2657759189605713, "lr": 0.00019626550616619367, "tps": 112783, "wall": 9879.5} {"step": 17002, "train_loss": 3.2845442295074463, "lr": 0.00019624651557757162, "tps": 112734, "wall": 9884.4} {"step": 17003, "train_loss": 3.245662212371826, "lr": 0.0001962275252580303, "tps": 112685, "wall": 9889.3} {"step": 17004, "train_loss": 3.3417341709136963, "lr": 0.00019620853520778487, "tps": 112636, "wall": 9894.2} {"step": 17005, "train_loss": 3.2682273387908936, "lr": 0.0001961895454270505, "tps": 112587, "wall": 9899.0} {"step": 17006, "train_loss": 3.429157257080078, "lr": 0.0001961705559160422, "tps": 112538, "wall": 9903.9} {"step": 17007, "train_loss": 3.414687156677246, "lr": 0.0001961515666749751, "tps": 112489, "wall": 9908.8} {"step": 17008, "train_loss": 3.3732407093048096, "lr": 0.0001961325777040644, "tps": 112440, "wall": 9913.7} {"step": 17009, "train_loss": 3.34649658203125, "lr": 0.0001961135890035251, "tps": 112392, "wall": 9918.6} {"step": 17010, "train_loss": 3.2561628818511963, "lr": 0.00019609460057357238, "tps": 112343, "wall": 9923.4} {"step": 17011, "train_loss": 3.3641715049743652, "lr": 0.00019607561241442127, "tps": 112294, "wall": 9928.3} {"step": 17012, "train_loss": 3.1591148376464844, "lr": 0.000196056624526287, "tps": 112246, "wall": 9933.2} {"step": 17013, "train_loss": 3.3445215225219727, "lr": 0.00019603763690938456, "tps": 112198, "wall": 9938.0} {"step": 17014, "train_loss": 3.3247156143188477, "lr": 0.00019601864956392905, "tps": 112149, "wall": 9942.9} {"step": 17015, "train_loss": 3.2756781578063965, "lr": 0.0001959996624901356, "tps": 112100, "wall": 9947.8} {"step": 17016, "train_loss": 3.257746934890747, "lr": 0.0001959806756882192, "tps": 112052, "wall": 9952.7} {"step": 17017, "train_loss": 3.279475688934326, "lr": 0.00019596168915839507, "tps": 112004, "wall": 9957.6} {"step": 17018, "train_loss": 3.2529234886169434, "lr": 0.00019594270290087824, "tps": 111955, "wall": 9962.5} {"step": 17019, "train_loss": 3.3364152908325195, "lr": 0.0001959237169158837, "tps": 111907, "wall": 9967.4} {"step": 17020, "train_loss": 3.3628287315368652, "lr": 0.00019590473120362667, "tps": 111859, "wall": 9972.3} {"step": 17021, "train_loss": 3.4844775199890137, "lr": 0.0001958857457643221, "tps": 111811, "wall": 9977.1} {"step": 17022, "train_loss": 3.339055299758911, "lr": 0.00019586676059818513, "tps": 111763, "wall": 9982.0} {"step": 17023, "train_loss": 3.453418493270874, "lr": 0.0001958477757054308, "tps": 111715, "wall": 9986.8} {"step": 17024, "train_loss": 3.3437581062316895, "lr": 0.00019582879108627417, "tps": 111667, "wall": 9991.7} {"step": 17025, "train_loss": 3.3520989418029785, "lr": 0.00019580980674093032, "tps": 111619, "wall": 9996.6} {"step": 17026, "train_loss": 3.3971173763275146, "lr": 0.00019579082266961426, "tps": 111571, "wall": 10001.5} {"step": 17027, "train_loss": 3.2899229526519775, "lr": 0.00019577183887254109, "tps": 111522, "wall": 10006.4} {"step": 17028, "train_loss": 3.302060604095459, "lr": 0.00019575285534992584, "tps": 111475, "wall": 10011.3} {"step": 17029, "train_loss": 3.3300094604492188, "lr": 0.00019573387210198356, "tps": 111427, "wall": 10016.2} {"step": 17030, "train_loss": 3.323413610458374, "lr": 0.00019571488912892925, "tps": 111379, "wall": 10021.1} {"step": 17031, "train_loss": 3.3093972206115723, "lr": 0.000195695906430978, "tps": 111332, "wall": 10025.9} {"step": 17032, "train_loss": 3.453240394592285, "lr": 0.00019567692400834487, "tps": 111284, "wall": 10030.8} {"step": 17033, "train_loss": 3.341296672821045, "lr": 0.00019565794186124485, "tps": 111237, "wall": 10035.7} {"step": 17034, "train_loss": 3.268756628036499, "lr": 0.00019563895998989296, "tps": 111189, "wall": 10040.5} {"step": 17035, "train_loss": 3.330442190170288, "lr": 0.00019561997839450426, "tps": 111142, "wall": 10045.4} {"step": 17036, "train_loss": 3.3737382888793945, "lr": 0.00019560099707529376, "tps": 111095, "wall": 10050.3} {"step": 17037, "train_loss": 3.242711067199707, "lr": 0.00019558201603247653, "tps": 111048, "wall": 10055.1} {"step": 17038, "train_loss": 3.3443562984466553, "lr": 0.00019556303526626744, "tps": 111000, "wall": 10060.0} {"step": 17039, "train_loss": 3.329072952270508, "lr": 0.00019554405477688173, "tps": 110953, "wall": 10064.9} {"step": 17040, "train_loss": 3.308100461959839, "lr": 0.0001955250745645342, "tps": 110905, "wall": 10069.8} {"step": 17041, "train_loss": 3.3462061882019043, "lr": 0.00019550609462944, "tps": 110858, "wall": 10074.7} {"step": 17042, "train_loss": 3.260983943939209, "lr": 0.0001954871149718141, "tps": 110811, "wall": 10079.5} {"step": 17043, "train_loss": 3.3378515243530273, "lr": 0.00019546813559187144, "tps": 110764, "wall": 10084.4} {"step": 17044, "train_loss": 3.2350680828094482, "lr": 0.00019544915648982706, "tps": 110718, "wall": 10089.2} {"step": 17045, "train_loss": 3.3617160320281982, "lr": 0.00019543017766589604, "tps": 110671, "wall": 10094.1} {"step": 17046, "train_loss": 3.3321259021759033, "lr": 0.0001954111991202932, "tps": 110624, "wall": 10098.9} {"step": 17047, "train_loss": 3.295248031616211, "lr": 0.00019539222085323367, "tps": 110577, "wall": 10103.8} {"step": 17048, "train_loss": 3.3082363605499268, "lr": 0.00019537324286493242, "tps": 110531, "wall": 10108.7} {"step": 17049, "train_loss": 3.36674165725708, "lr": 0.0001953542651556044, "tps": 110484, "wall": 10113.5} {"step": 17050, "train_loss": 3.307499885559082, "lr": 0.00019533528772546456, "tps": 110438, "wall": 10118.4} {"step": 17051, "train_loss": 3.435382127761841, "lr": 0.0001953163105747279, "tps": 110391, "wall": 10123.3} {"step": 17052, "train_loss": 3.313479423522949, "lr": 0.0001952973337036095, "tps": 110344, "wall": 10128.2} {"step": 17053, "train_loss": 3.2848408222198486, "lr": 0.00019527835711232415, "tps": 110297, "wall": 10133.0} {"step": 17054, "train_loss": 3.3632073402404785, "lr": 0.00019525938080108696, "tps": 110251, "wall": 10137.9} {"step": 17055, "train_loss": 3.352775812149048, "lr": 0.0001952404047701128, "tps": 110204, "wall": 10142.8} {"step": 17056, "train_loss": 3.376729965209961, "lr": 0.00019522142901961674, "tps": 110158, "wall": 10147.6} {"step": 17057, "train_loss": 3.2060983180999756, "lr": 0.0001952024535498136, "tps": 110112, "wall": 10152.5} {"step": 17058, "train_loss": 3.317005157470703, "lr": 0.00019518347836091843, "tps": 110065, "wall": 10157.4} {"step": 17059, "train_loss": 3.431969165802002, "lr": 0.00019516450345314617, "tps": 110019, "wall": 10162.2} {"step": 17060, "train_loss": 3.288187026977539, "lr": 0.00019514552882671175, "tps": 109973, "wall": 10167.1} {"step": 17061, "train_loss": 3.4251818656921387, "lr": 0.00019512655448183014, "tps": 109927, "wall": 10172.0} {"step": 17062, "train_loss": 3.227710247039795, "lr": 0.00019510758041871632, "tps": 109880, "wall": 10176.9} {"step": 17063, "train_loss": 3.3527204990386963, "lr": 0.00019508860663758508, "tps": 109834, "wall": 10181.7} {"step": 17064, "train_loss": 3.362942695617676, "lr": 0.00019506963313865145, "tps": 109787, "wall": 10186.7} {"step": 17065, "train_loss": 3.247910499572754, "lr": 0.0001950506599221304, "tps": 109741, "wall": 10191.5} {"step": 17066, "train_loss": 3.39133882522583, "lr": 0.00019503168698823683, "tps": 109696, "wall": 10196.4} {"step": 17067, "train_loss": 3.371464729309082, "lr": 0.0001950127143371857, "tps": 109650, "wall": 10201.3} {"step": 17068, "train_loss": 3.3961691856384277, "lr": 0.0001949937419691918, "tps": 109604, "wall": 10206.1} {"step": 17069, "train_loss": 3.281385660171509, "lr": 0.00019497476988447022, "tps": 109558, "wall": 10211.0} {"step": 17070, "train_loss": 3.402904510498047, "lr": 0.00019495579808323578, "tps": 109512, "wall": 10215.8} {"step": 17071, "train_loss": 3.4045114517211914, "lr": 0.0001949368265657034, "tps": 109467, "wall": 10220.7} {"step": 17072, "train_loss": 3.320199728012085, "lr": 0.00019491785533208802, "tps": 109421, "wall": 10225.6} {"step": 17073, "train_loss": 3.3535265922546387, "lr": 0.00019489888438260452, "tps": 109375, "wall": 10230.4} {"step": 17074, "train_loss": 3.38714861869812, "lr": 0.0001948799137174678, "tps": 109330, "wall": 10235.3} {"step": 17075, "train_loss": 3.2975525856018066, "lr": 0.00019486094333689277, "tps": 109284, "wall": 10240.2} {"step": 17076, "train_loss": 3.3163654804229736, "lr": 0.0001948419732410944, "tps": 109239, "wall": 10245.0} {"step": 17077, "train_loss": 3.29341983795166, "lr": 0.0001948230034302875, "tps": 109193, "wall": 10250.0} {"step": 17078, "train_loss": 3.472825765609741, "lr": 0.00019480403390468692, "tps": 109147, "wall": 10254.8} {"step": 17079, "train_loss": 3.299405574798584, "lr": 0.00019478506466450766, "tps": 109102, "wall": 10259.7} {"step": 17080, "train_loss": 3.28680419921875, "lr": 0.00019476609570996453, "tps": 109057, "wall": 10264.5} {"step": 17081, "train_loss": 3.3614883422851562, "lr": 0.00019474712704127244, "tps": 109012, "wall": 10269.4} {"step": 17082, "train_loss": 3.2797858715057373, "lr": 0.00019472815865864625, "tps": 108966, "wall": 10274.2} {"step": 17083, "train_loss": 3.2618908882141113, "lr": 0.00019470919056230085, "tps": 108921, "wall": 10279.1} {"step": 17084, "train_loss": 3.3903934955596924, "lr": 0.0001946902227524511, "tps": 108876, "wall": 10284.0} {"step": 17085, "train_loss": 3.3232438564300537, "lr": 0.0001946712552293119, "tps": 108831, "wall": 10288.8} {"step": 17086, "train_loss": 3.3236727714538574, "lr": 0.00019465228799309808, "tps": 108786, "wall": 10293.7} {"step": 17087, "train_loss": 3.205645799636841, "lr": 0.00019463332104402455, "tps": 108741, "wall": 10298.5} {"step": 17088, "train_loss": 3.38765025138855, "lr": 0.00019461435438230607, "tps": 108696, "wall": 10303.4} {"step": 17089, "train_loss": 3.4225146770477295, "lr": 0.0001945953880081576, "tps": 108651, "wall": 10308.3} {"step": 17090, "train_loss": 3.319119453430176, "lr": 0.0001945764219217939, "tps": 108606, "wall": 10313.1} {"step": 17091, "train_loss": 3.3073525428771973, "lr": 0.0001945574561234299, "tps": 108561, "wall": 10318.0} {"step": 17092, "train_loss": 3.43825364112854, "lr": 0.00019453849061328038, "tps": 108517, "wall": 10322.8} {"step": 17093, "train_loss": 3.326061725616455, "lr": 0.0001945195253915603, "tps": 108472, "wall": 10327.7} {"step": 17094, "train_loss": 3.351003885269165, "lr": 0.00019450056045848432, "tps": 108427, "wall": 10332.6} {"step": 17095, "train_loss": 3.391052722930908, "lr": 0.00019448159581426743, "tps": 108383, "wall": 10337.4} {"step": 17096, "train_loss": 3.35508131980896, "lr": 0.00019446263145912442, "tps": 108338, "wall": 10342.3} {"step": 17097, "train_loss": 3.318483829498291, "lr": 0.00019444366739327005, "tps": 108293, "wall": 10347.2} {"step": 17098, "train_loss": 3.3668947219848633, "lr": 0.0001944247036169192, "tps": 108249, "wall": 10352.0} {"step": 17099, "train_loss": 3.2716517448425293, "lr": 0.00019440574013028674, "tps": 108204, "wall": 10356.9} {"step": 17100, "train_loss": 3.3211848735809326, "lr": 0.00019438677693358738, "tps": 108160, "wall": 10361.7} {"step": 17101, "train_loss": 3.3248534202575684, "lr": 0.00019436781402703602, "tps": 108115, "wall": 10366.7} {"step": 17102, "train_loss": 3.376124858856201, "lr": 0.00019434885141084745, "tps": 108071, "wall": 10371.5} {"step": 17103, "train_loss": 3.338486671447754, "lr": 0.00019432988908523648, "tps": 108026, "wall": 10376.4} {"step": 17104, "train_loss": 3.317793607711792, "lr": 0.00019431092705041793, "tps": 107982, "wall": 10381.3} {"step": 17105, "train_loss": 3.3673548698425293, "lr": 0.00019429196530660657, "tps": 107938, "wall": 10386.1} {"step": 17106, "train_loss": 3.3217763900756836, "lr": 0.00019427300385401725, "tps": 107894, "wall": 10391.0} {"step": 17107, "train_loss": 3.2166199684143066, "lr": 0.0001942540426928647, "tps": 107850, "wall": 10395.8} {"step": 17108, "train_loss": 3.2522342205047607, "lr": 0.0001942350818233638, "tps": 107805, "wall": 10400.7} {"step": 17109, "train_loss": 3.3548712730407715, "lr": 0.00019421612124572923, "tps": 107761, "wall": 10405.5} {"step": 17110, "train_loss": 3.361056327819824, "lr": 0.00019419716096017586, "tps": 107717, "wall": 10410.4} {"step": 17111, "train_loss": 3.2753663063049316, "lr": 0.00019417820096691846, "tps": 107673, "wall": 10415.3} {"step": 17112, "train_loss": 3.333019495010376, "lr": 0.00019415924126617174, "tps": 107629, "wall": 10420.1} {"step": 17113, "train_loss": 3.3617002964019775, "lr": 0.00019414028185815054, "tps": 107586, "wall": 10425.0} {"step": 17114, "train_loss": 3.291698694229126, "lr": 0.0001941213227430697, "tps": 107541, "wall": 10429.9} {"step": 17115, "train_loss": 3.381129741668701, "lr": 0.00019410236392114385, "tps": 107497, "wall": 10434.8} {"step": 17116, "train_loss": 3.241360902786255, "lr": 0.00019408340539258783, "tps": 107453, "wall": 10439.7} {"step": 17117, "train_loss": 3.3271334171295166, "lr": 0.00019406444715761639, "tps": 107409, "wall": 10444.6} {"step": 17118, "train_loss": 3.467423439025879, "lr": 0.00019404548921644432, "tps": 107365, "wall": 10449.4} {"step": 17119, "train_loss": 3.26021146774292, "lr": 0.0001940265315692863, "tps": 107322, "wall": 10454.3} {"step": 17120, "train_loss": 3.383026123046875, "lr": 0.0001940075742163572, "tps": 107278, "wall": 10459.1} {"step": 17121, "train_loss": 3.337515115737915, "lr": 0.0001939886171578717, "tps": 107235, "wall": 10464.0} {"step": 17122, "train_loss": 3.2157795429229736, "lr": 0.0001939696603940445, "tps": 107191, "wall": 10468.9} {"step": 17123, "train_loss": 3.3184123039245605, "lr": 0.00019395070392509042, "tps": 107147, "wall": 10473.8} {"step": 17124, "train_loss": 3.3242268562316895, "lr": 0.00019393174775122422, "tps": 107104, "wall": 10478.6} {"step": 17125, "train_loss": 3.3381171226501465, "lr": 0.0001939127918726605, "tps": 107060, "wall": 10483.5} {"step": 17126, "train_loss": 3.3254261016845703, "lr": 0.00019389383628961416, "tps": 107017, "wall": 10488.4} {"step": 17127, "train_loss": 3.3238000869750977, "lr": 0.00019387488100229983, "tps": 106973, "wall": 10493.2} {"step": 17128, "train_loss": 3.3287549018859863, "lr": 0.0001938559260109323, "tps": 106930, "wall": 10498.1} {"step": 17129, "train_loss": 3.291022300720215, "lr": 0.0001938369713157262, "tps": 106887, "wall": 10502.9} {"step": 17130, "train_loss": 3.3729639053344727, "lr": 0.00019381801691689633, "tps": 106843, "wall": 10507.8} {"step": 17131, "train_loss": 3.3916726112365723, "lr": 0.0001937990628146574, "tps": 106800, "wall": 10512.7} {"step": 17132, "train_loss": 3.3370609283447266, "lr": 0.00019378010900922407, "tps": 106757, "wall": 10517.5} {"step": 17133, "train_loss": 3.2306103706359863, "lr": 0.00019376115550081107, "tps": 106714, "wall": 10522.4} {"step": 17134, "train_loss": 3.2903990745544434, "lr": 0.00019374220228963318, "tps": 106671, "wall": 10527.3} {"step": 17135, "train_loss": 3.3540334701538086, "lr": 0.00019372324937590496, "tps": 106628, "wall": 10532.1} {"step": 17136, "train_loss": 3.333522319793701, "lr": 0.00019370429675984126, "tps": 106585, "wall": 10537.0} {"step": 17137, "train_loss": 3.4503917694091797, "lr": 0.0001936853444416567, "tps": 106542, "wall": 10541.8} {"step": 17138, "train_loss": 3.4180920124053955, "lr": 0.00019366639242156594, "tps": 106498, "wall": 10546.8} {"step": 17139, "train_loss": 3.341458320617676, "lr": 0.00019364744069978377, "tps": 106455, "wall": 10551.7} {"step": 17140, "train_loss": 3.288456439971924, "lr": 0.00019362848927652478, "tps": 106413, "wall": 10556.5} {"step": 17141, "train_loss": 3.265460968017578, "lr": 0.0001936095381520037, "tps": 106370, "wall": 10561.3} {"step": 17142, "train_loss": 3.339373826980591, "lr": 0.0001935905873264352, "tps": 106328, "wall": 10566.2} {"step": 17143, "train_loss": 3.2708778381347656, "lr": 0.00019357163680003395, "tps": 106285, "wall": 10571.1} {"step": 17144, "train_loss": 3.3711462020874023, "lr": 0.0001935526865730146, "tps": 106242, "wall": 10575.9} {"step": 17145, "train_loss": 3.3092041015625, "lr": 0.0001935337366455919, "tps": 106199, "wall": 10580.8} {"step": 17146, "train_loss": 3.356553077697754, "lr": 0.00019351478701798045, "tps": 106157, "wall": 10585.7} {"step": 17147, "train_loss": 3.5110273361206055, "lr": 0.0001934958376903949, "tps": 106114, "wall": 10590.6} {"step": 17148, "train_loss": 3.3749544620513916, "lr": 0.00019347688866304998, "tps": 106072, "wall": 10595.4} {"step": 17149, "train_loss": 3.2959160804748535, "lr": 0.00019345793993616025, "tps": 106029, "wall": 10600.3} {"step": 17150, "train_loss": 3.307342529296875, "lr": 0.00019343899150994044, "tps": 105987, "wall": 10605.1} {"step": 17151, "train_loss": 3.243788242340088, "lr": 0.00019342004338460518, "tps": 105944, "wall": 10610.0} {"step": 17152, "train_loss": 3.394350528717041, "lr": 0.00019340109556036908, "tps": 105901, "wall": 10614.9} {"step": 17153, "train_loss": 3.342771291732788, "lr": 0.00019338214803744678, "tps": 105859, "wall": 10619.8} {"step": 17154, "train_loss": 3.4001660346984863, "lr": 0.000193363200816053, "tps": 105817, "wall": 10624.6} {"step": 17155, "train_loss": 3.3138418197631836, "lr": 0.00019334425389640235, "tps": 105775, "wall": 10629.5} {"step": 17156, "train_loss": 3.364017963409424, "lr": 0.0001933253072787094, "tps": 105732, "wall": 10634.4} {"step": 17157, "train_loss": 3.346795082092285, "lr": 0.0001933063609631888, "tps": 105690, "wall": 10639.2} {"step": 17158, "train_loss": 3.2519237995147705, "lr": 0.00019328741495005521, "tps": 105648, "wall": 10644.1} {"step": 17159, "train_loss": 3.355551242828369, "lr": 0.0001932684692395232, "tps": 105606, "wall": 10648.9} {"step": 17160, "train_loss": 3.3174490928649902, "lr": 0.0001932495238318074, "tps": 105564, "wall": 10653.8} {"step": 17161, "train_loss": 3.4007186889648438, "lr": 0.00019323057872712248, "tps": 105522, "wall": 10658.7} {"step": 17162, "train_loss": 3.324282169342041, "lr": 0.000193211633925683, "tps": 105480, "wall": 10663.5} {"step": 17163, "train_loss": 3.3363897800445557, "lr": 0.00019319268942770358, "tps": 105437, "wall": 10668.5} {"step": 17164, "train_loss": 3.3347678184509277, "lr": 0.00019317374523339882, "tps": 105395, "wall": 10673.4} {"step": 17165, "train_loss": 3.3278088569641113, "lr": 0.0001931548013429833, "tps": 105353, "wall": 10678.2} {"step": 17166, "train_loss": 3.3521718978881836, "lr": 0.00019313585775667172, "tps": 105312, "wall": 10683.1} {"step": 17167, "train_loss": 3.263232946395874, "lr": 0.0001931169144746785, "tps": 105270, "wall": 10687.9} {"step": 17168, "train_loss": 3.3114662170410156, "lr": 0.0001930979714972184, "tps": 105228, "wall": 10692.8} {"step": 17169, "train_loss": 3.2889857292175293, "lr": 0.00019307902882450596, "tps": 105186, "wall": 10697.7} {"step": 17170, "train_loss": 3.2625842094421387, "lr": 0.00019306008645675565, "tps": 105145, "wall": 10702.5} {"step": 17171, "train_loss": 3.4037723541259766, "lr": 0.00019304114439418216, "tps": 105103, "wall": 10707.4} {"step": 17172, "train_loss": 3.3350257873535156, "lr": 0.0001930222026370001, "tps": 105061, "wall": 10712.3} {"step": 17173, "train_loss": 3.2906086444854736, "lr": 0.00019300326118542395, "tps": 105019, "wall": 10717.2} {"step": 17174, "train_loss": 3.3999738693237305, "lr": 0.0001929843200396683, "tps": 104978, "wall": 10722.1} {"step": 17175, "train_loss": 3.258223056793213, "lr": 0.00019296537919994778, "tps": 104935, "wall": 10727.0} {"step": 17176, "train_loss": 3.358353614807129, "lr": 0.00019294643866647686, "tps": 104894, "wall": 10731.8} {"step": 17177, "train_loss": 3.3601906299591064, "lr": 0.00019292749843947014, "tps": 104853, "wall": 10736.7} {"step": 17178, "train_loss": 3.3042900562286377, "lr": 0.00019290855851914222, "tps": 104811, "wall": 10741.6} {"step": 17179, "train_loss": 3.363009452819824, "lr": 0.00019288961890570762, "tps": 104770, "wall": 10746.4} {"step": 17180, "train_loss": 3.327317714691162, "lr": 0.00019287067959938083, "tps": 104729, "wall": 10751.3} {"step": 17181, "train_loss": 3.2430388927459717, "lr": 0.00019285174060037648, "tps": 104688, "wall": 10756.1} {"step": 17182, "train_loss": 3.322638750076294, "lr": 0.00019283280190890914, "tps": 104647, "wall": 10761.0} {"step": 17183, "train_loss": 3.262291193008423, "lr": 0.0001928138635251932, "tps": 104605, "wall": 10765.9} {"step": 17184, "train_loss": 3.369442939758301, "lr": 0.0001927949254494433, "tps": 104564, "wall": 10770.7} {"step": 17185, "train_loss": 3.378528356552124, "lr": 0.00019277598768187404, "tps": 104523, "wall": 10775.6} {"step": 17186, "train_loss": 3.362135648727417, "lr": 0.00019275705022269978, "tps": 104482, "wall": 10780.5} {"step": 17187, "train_loss": 3.238015651702881, "lr": 0.00019273811307213512, "tps": 104441, "wall": 10785.3} {"step": 17188, "train_loss": 3.339843988418579, "lr": 0.0001927191762303947, "tps": 104399, "wall": 10790.2} {"step": 17189, "train_loss": 3.3914716243743896, "lr": 0.00019270023969769281, "tps": 104358, "wall": 10795.1} {"step": 17190, "train_loss": 3.33760929107666, "lr": 0.0001926813034742441, "tps": 104318, "wall": 10799.9} {"step": 17191, "train_loss": 3.3238773345947266, "lr": 0.00019266236756026306, "tps": 104277, "wall": 10804.8} {"step": 17192, "train_loss": 3.368654727935791, "lr": 0.00019264343195596423, "tps": 104236, "wall": 10809.7} {"step": 17193, "train_loss": 3.3682711124420166, "lr": 0.0001926244966615621, "tps": 104195, "wall": 10814.5} {"step": 17194, "train_loss": 3.3507611751556396, "lr": 0.00019260556167727112, "tps": 104154, "wall": 10819.4} {"step": 17195, "train_loss": 3.293264627456665, "lr": 0.00019258662700330582, "tps": 104114, "wall": 10824.2} {"step": 17196, "train_loss": 3.311936855316162, "lr": 0.0001925676926398807, "tps": 104073, "wall": 10829.1} {"step": 17197, "train_loss": 3.3963539600372314, "lr": 0.00019254875858721023, "tps": 104032, "wall": 10834.0} {"step": 17198, "train_loss": 3.267455577850342, "lr": 0.0001925298248455089, "tps": 103992, "wall": 10838.8} {"step": 17199, "train_loss": 3.4024500846862793, "lr": 0.00019251089141499126, "tps": 103951, "wall": 10843.7} {"step": 17200, "train_loss": 3.258662700653076, "lr": 0.00019249195829587165, "tps": 103910, "wall": 10848.6} {"step": 17201, "train_loss": 3.321779727935791, "lr": 0.00019247302548836465, "tps": 103869, "wall": 10853.5} {"step": 17202, "train_loss": 3.3908863067626953, "lr": 0.00019245409299268476, "tps": 103829, "wall": 10858.4} {"step": 17203, "train_loss": 3.3602969646453857, "lr": 0.00019243516080904636, "tps": 103788, "wall": 10863.2} {"step": 17204, "train_loss": 3.340087413787842, "lr": 0.0001924162289376639, "tps": 103748, "wall": 10868.1} {"step": 17205, "train_loss": 3.3433780670166016, "lr": 0.00019239729737875196, "tps": 103708, "wall": 10872.9} {"step": 17206, "train_loss": 3.3418660163879395, "lr": 0.0001923783661325249, "tps": 103667, "wall": 10877.8} {"step": 17207, "train_loss": 3.311046600341797, "lr": 0.0001923594351991972, "tps": 103627, "wall": 10882.7} {"step": 17208, "train_loss": 3.276966094970703, "lr": 0.00019234050457898332, "tps": 103587, "wall": 10887.5} {"step": 17209, "train_loss": 3.3134050369262695, "lr": 0.00019232157427209772, "tps": 103547, "wall": 10892.4} {"step": 17210, "train_loss": 3.306408405303955, "lr": 0.00019230264427875477, "tps": 103507, "wall": 10897.2} {"step": 17211, "train_loss": 3.2901759147644043, "lr": 0.00019228371459916902, "tps": 103466, "wall": 10902.1} {"step": 17212, "train_loss": 3.361673355102539, "lr": 0.00019226478523355484, "tps": 103426, "wall": 10907.0} {"step": 17213, "train_loss": 3.386298656463623, "lr": 0.00019224585618212662, "tps": 103385, "wall": 10911.9} {"step": 17214, "train_loss": 3.2612576484680176, "lr": 0.00019222692744509892, "tps": 103345, "wall": 10916.8} {"step": 17215, "train_loss": 3.315021514892578, "lr": 0.00019220799902268607, "tps": 103305, "wall": 10921.6} {"step": 17216, "train_loss": 3.3680660724639893, "lr": 0.00019218907091510246, "tps": 103265, "wall": 10926.5} {"step": 17217, "train_loss": 3.300913095474243, "lr": 0.0001921701431225626, "tps": 103226, "wall": 10931.3} {"step": 17218, "train_loss": 3.354071617126465, "lr": 0.00019215121564528084, "tps": 103186, "wall": 10936.2} {"step": 17219, "train_loss": 3.2683260440826416, "lr": 0.00019213228848347167, "tps": 103146, "wall": 10941.1} {"step": 17220, "train_loss": 3.294536590576172, "lr": 0.00019211336163734937, "tps": 103106, "wall": 10945.9} {"step": 17221, "train_loss": 3.413085699081421, "lr": 0.00019209443510712846, "tps": 103066, "wall": 10950.8} {"step": 17222, "train_loss": 3.264101505279541, "lr": 0.00019207550889302334, "tps": 103026, "wall": 10955.7} {"step": 17223, "train_loss": 3.1586673259735107, "lr": 0.00019205658299524826, "tps": 102986, "wall": 10960.6} {"step": 17224, "train_loss": 3.275463581085205, "lr": 0.00019203765741401777, "tps": 102947, "wall": 10965.4} {"step": 17225, "train_loss": 3.3077335357666016, "lr": 0.00019201873214954622, "tps": 102907, "wall": 10970.3} {"step": 17226, "train_loss": 3.369502067565918, "lr": 0.000191999807202048, "tps": 102867, "wall": 10975.2} {"step": 17227, "train_loss": 3.2550559043884277, "lr": 0.00019198088257173747, "tps": 102827, "wall": 10980.1} {"step": 17228, "train_loss": 3.476168394088745, "lr": 0.00019196195825882896, "tps": 102787, "wall": 10984.9} {"step": 17229, "train_loss": 3.293915271759033, "lr": 0.00019194303426353702, "tps": 102748, "wall": 10989.8} {"step": 17230, "train_loss": 3.2883100509643555, "lr": 0.0001919241105860758, "tps": 102708, "wall": 10994.7} {"step": 17231, "train_loss": 3.2689547538757324, "lr": 0.00019190518722665982, "tps": 102669, "wall": 10999.5} {"step": 17232, "train_loss": 3.196402072906494, "lr": 0.00019188626418550344, "tps": 102630, "wall": 11004.4} {"step": 17233, "train_loss": 3.1794443130493164, "lr": 0.00019186734146282088, "tps": 102590, "wall": 11009.3} {"step": 17234, "train_loss": 3.396472692489624, "lr": 0.00019184841905882664, "tps": 102550, "wall": 11014.2} {"step": 17235, "train_loss": 3.3618767261505127, "lr": 0.00019182949697373506, "tps": 102511, "wall": 11019.0} {"step": 17236, "train_loss": 3.294060707092285, "lr": 0.00019181057520776043, "tps": 102471, "wall": 11023.9} {"step": 17237, "train_loss": 3.3896079063415527, "lr": 0.00019179165376111718, "tps": 102431, "wall": 11028.9} {"step": 17238, "train_loss": 3.3828835487365723, "lr": 0.00019177273263401952, "tps": 102392, "wall": 11033.7} {"step": 17239, "train_loss": 3.390678644180298, "lr": 0.00019175381182668196, "tps": 102353, "wall": 11038.6} {"step": 17240, "train_loss": 3.396651268005371, "lr": 0.0001917348913393187, "tps": 102314, "wall": 11043.5} {"step": 17241, "train_loss": 3.322943687438965, "lr": 0.00019171597117214413, "tps": 102275, "wall": 11048.3} {"step": 17242, "train_loss": 3.346259117126465, "lr": 0.00019169705132537253, "tps": 102236, "wall": 11053.2} {"step": 17243, "train_loss": 3.401595115661621, "lr": 0.00019167813179921833, "tps": 102197, "wall": 11058.1} {"step": 17244, "train_loss": 3.3656840324401855, "lr": 0.00019165921259389572, "tps": 102157, "wall": 11063.0} {"step": 17245, "train_loss": 3.2504947185516357, "lr": 0.0001916402937096191, "tps": 102118, "wall": 11067.8} {"step": 17246, "train_loss": 3.3025808334350586, "lr": 0.0001916213751466028, "tps": 102079, "wall": 11072.7} {"step": 17247, "train_loss": 3.377473831176758, "lr": 0.0001916024569050611, "tps": 102040, "wall": 11077.6} {"step": 17248, "train_loss": 3.3207969665527344, "lr": 0.00019158353898520827, "tps": 102002, "wall": 11082.4} {"step": 17249, "train_loss": 3.3575923442840576, "lr": 0.0001915646213872587, "tps": 101962, "wall": 11087.4} {"step": 17250, "train_loss": 3.280118703842163, "lr": 0.00019154570411142658, "tps": 101923, "wall": 11092.2} {"step": 17251, "train_loss": 3.360302209854126, "lr": 0.00019152678715792627, "tps": 101885, "wall": 11097.1} {"step": 17252, "train_loss": 3.173055648803711, "lr": 0.0001915078705269721, "tps": 101846, "wall": 11102.0} {"step": 17253, "train_loss": 3.2693166732788086, "lr": 0.0001914889542187783, "tps": 101807, "wall": 11106.8} {"step": 17254, "train_loss": 3.4063467979431152, "lr": 0.00019147003823355912, "tps": 101768, "wall": 11111.7} {"step": 17255, "train_loss": 3.398989677429199, "lr": 0.0001914511225715289, "tps": 101730, "wall": 11116.5} {"step": 17256, "train_loss": 3.3770740032196045, "lr": 0.00019143220723290196, "tps": 101691, "wall": 11121.4} {"step": 17257, "train_loss": 3.2292940616607666, "lr": 0.0001914132922178925, "tps": 101653, "wall": 11126.2} {"step": 17258, "train_loss": 3.388505220413208, "lr": 0.00019139437752671476, "tps": 101614, "wall": 11131.1} {"step": 17259, "train_loss": 3.3441317081451416, "lr": 0.00019137546315958312, "tps": 101576, "wall": 11136.0} {"step": 17260, "train_loss": 3.2018065452575684, "lr": 0.0001913565491167118, "tps": 101537, "wall": 11140.8} {"step": 17261, "train_loss": 3.2924041748046875, "lr": 0.00019133763539831496, "tps": 101499, "wall": 11145.7} {"step": 17262, "train_loss": 3.3329083919525146, "lr": 0.00019131872200460695, "tps": 101460, "wall": 11150.6} {"step": 17263, "train_loss": 3.3332417011260986, "lr": 0.0001912998089358021, "tps": 101422, "wall": 11155.5} {"step": 17264, "train_loss": 3.4417147636413574, "lr": 0.00019128089619211452, "tps": 101383, "wall": 11160.4} {"step": 17265, "train_loss": 3.3355090618133545, "lr": 0.00019126198377375844, "tps": 101345, "wall": 11165.2} {"step": 17266, "train_loss": 3.283886194229126, "lr": 0.00019124307168094827, "tps": 101307, "wall": 11170.1} {"step": 17267, "train_loss": 3.3316690921783447, "lr": 0.00019122415991389805, "tps": 101269, "wall": 11174.9} {"step": 17268, "train_loss": 3.363888740539551, "lr": 0.00019120524847282213, "tps": 101231, "wall": 11179.8} {"step": 17269, "train_loss": 3.307302951812744, "lr": 0.00019118633735793478, "tps": 101193, "wall": 11184.6} {"step": 17270, "train_loss": 3.4135348796844482, "lr": 0.00019116742656945005, "tps": 101154, "wall": 11189.5} {"step": 17271, "train_loss": 3.389921188354492, "lr": 0.00019114851610758232, "tps": 101116, "wall": 11194.4} {"step": 17272, "train_loss": 3.2684531211853027, "lr": 0.00019112960597254578, "tps": 101078, "wall": 11199.2} {"step": 17273, "train_loss": 3.3429832458496094, "lr": 0.0001911106961645546, "tps": 101040, "wall": 11204.1} {"step": 17274, "train_loss": 3.349400758743286, "lr": 0.00019109178668382301, "tps": 101002, "wall": 11209.0} {"step": 17275, "train_loss": 3.24556040763855, "lr": 0.00019107287753056525, "tps": 100964, "wall": 11213.9} {"step": 17276, "train_loss": 3.269716739654541, "lr": 0.00019105396870499548, "tps": 100926, "wall": 11218.7} {"step": 17277, "train_loss": 3.35799241065979, "lr": 0.00019103506020732796, "tps": 100888, "wall": 11223.6} {"step": 17278, "train_loss": 3.246168851852417, "lr": 0.00019101615203777686, "tps": 100850, "wall": 11228.4} {"step": 17279, "train_loss": 3.3858704566955566, "lr": 0.00019099724419655627, "tps": 100812, "wall": 11233.3} {"step": 17280, "train_loss": 3.3222131729125977, "lr": 0.00019097833668388047, "tps": 100775, "wall": 11238.2} {"step": 17281, "train_loss": 3.259200096130371, "lr": 0.0001909594294999637, "tps": 100737, "wall": 11243.0} {"step": 17282, "train_loss": 3.335094928741455, "lr": 0.00019094052264502005, "tps": 100699, "wall": 11247.9} {"step": 17283, "train_loss": 3.315699338912964, "lr": 0.00019092161611926375, "tps": 100661, "wall": 11252.8} {"step": 17284, "train_loss": 3.2835655212402344, "lr": 0.000190902709922909, "tps": 100624, "wall": 11257.6} {"step": 17285, "train_loss": 3.397428512573242, "lr": 0.00019088380405616983, "tps": 100586, "wall": 11262.5} {"step": 17286, "train_loss": 3.3418822288513184, "lr": 0.00019086489851926052, "tps": 100548, "wall": 11267.4} {"step": 17287, "train_loss": 3.286349296569824, "lr": 0.00019084599331239526, "tps": 100511, "wall": 11272.2} {"step": 17288, "train_loss": 3.381199598312378, "lr": 0.00019082708843578815, "tps": 100473, "wall": 11277.1} {"step": 17289, "train_loss": 3.2584667205810547, "lr": 0.0001908081838896534, "tps": 100436, "wall": 11281.9} {"step": 17290, "train_loss": 3.2184340953826904, "lr": 0.000190789279674205, "tps": 100399, "wall": 11286.8} {"step": 17291, "train_loss": 3.2565083503723145, "lr": 0.00019077037578965739, "tps": 100361, "wall": 11291.6} {"step": 17292, "train_loss": 3.3659887313842773, "lr": 0.00019075147223622443, "tps": 100324, "wall": 11296.5} {"step": 17293, "train_loss": 3.3000235557556152, "lr": 0.00019073256901412034, "tps": 100286, "wall": 11301.4} {"step": 17294, "train_loss": 3.3277859687805176, "lr": 0.00019071366612355938, "tps": 100249, "wall": 11306.2} {"step": 17295, "train_loss": 3.3618228435516357, "lr": 0.00019069476356475557, "tps": 100212, "wall": 11311.1} {"step": 17296, "train_loss": 3.3121275901794434, "lr": 0.00019067586133792306, "tps": 100174, "wall": 11316.0} {"step": 17297, "train_loss": 3.3464865684509277, "lr": 0.00019065695944327592, "tps": 100137, "wall": 11320.9} {"step": 17298, "train_loss": 3.350285530090332, "lr": 0.00019063805788102842, "tps": 100099, "wall": 11325.8} {"step": 17299, "train_loss": 3.3533432483673096, "lr": 0.00019061915665139455, "tps": 100061, "wall": 11330.7} {"step": 17300, "train_loss": 3.355618953704834, "lr": 0.00019060025575458846, "tps": 100024, "wall": 11335.6} {"step": 17301, "train_loss": 3.2996628284454346, "lr": 0.00019058135519082434, "tps": 99987, "wall": 11340.4} {"step": 17302, "train_loss": 3.233447551727295, "lr": 0.00019056245496031613, "tps": 99950, "wall": 11345.3} {"step": 17303, "train_loss": 3.3041014671325684, "lr": 0.00019054355506327802, "tps": 99913, "wall": 11350.1} {"step": 17304, "train_loss": 3.2675204277038574, "lr": 0.00019052465549992414, "tps": 99876, "wall": 11355.0} {"step": 17305, "train_loss": 3.3879454135894775, "lr": 0.00019050575627046858, "tps": 99839, "wall": 11359.8} {"step": 17306, "train_loss": 3.3442037105560303, "lr": 0.00019048685737512537, "tps": 99803, "wall": 11364.7} {"step": 17307, "train_loss": 3.326262950897217, "lr": 0.00019046795881410859, "tps": 99766, "wall": 11369.6} {"step": 17308, "train_loss": 3.2947311401367188, "lr": 0.00019044906058763246, "tps": 99729, "wall": 11374.4} {"step": 17309, "train_loss": 3.416714906692505, "lr": 0.00019043016269591097, "tps": 99692, "wall": 11379.3} {"step": 17310, "train_loss": 3.2999320030212402, "lr": 0.00019041126513915814, "tps": 99655, "wall": 11384.1} {"step": 17311, "train_loss": 3.307245969772339, "lr": 0.00019039236791758816, "tps": 99618, "wall": 11389.1} {"step": 17312, "train_loss": 3.2918643951416016, "lr": 0.000190373471031415, "tps": 99581, "wall": 11393.9} {"step": 17313, "train_loss": 3.324019432067871, "lr": 0.00019035457448085273, "tps": 99544, "wall": 11398.8} {"step": 17314, "train_loss": 3.334007978439331, "lr": 0.00019033567826611547, "tps": 99508, "wall": 11403.6} {"step": 17315, "train_loss": 3.3464279174804688, "lr": 0.00019031678238741733, "tps": 99470, "wall": 11408.6} {"step": 17316, "train_loss": 3.395275592803955, "lr": 0.00019029788684497216, "tps": 99434, "wall": 11413.4} {"step": 17317, "train_loss": 3.2935562133789062, "lr": 0.00019027899163899417, "tps": 99397, "wall": 11418.3} {"step": 17318, "train_loss": 3.397148609161377, "lr": 0.00019026009676969744, "tps": 99361, "wall": 11423.1} {"step": 17319, "train_loss": 3.363534450531006, "lr": 0.0001902412022372959, "tps": 99324, "wall": 11428.0} {"step": 17320, "train_loss": 3.234065055847168, "lr": 0.0001902223080420036, "tps": 99288, "wall": 11432.8} {"step": 17321, "train_loss": 3.2920069694519043, "lr": 0.00019020341418403468, "tps": 99251, "wall": 11437.7} {"step": 17322, "train_loss": 3.368450164794922, "lr": 0.00019018452066360303, "tps": 99215, "wall": 11442.6} {"step": 17323, "train_loss": 3.3086748123168945, "lr": 0.00019016562748092275, "tps": 99178, "wall": 11447.5} {"step": 17324, "train_loss": 3.339923620223999, "lr": 0.00019014673463620786, "tps": 99141, "wall": 11452.4} {"step": 17325, "train_loss": 3.315263032913208, "lr": 0.0001901278421296724, "tps": 99105, "wall": 11457.2} {"step": 17326, "train_loss": 3.382561445236206, "lr": 0.0001901089499615303, "tps": 99069, "wall": 11462.1} {"step": 17327, "train_loss": 3.2711329460144043, "lr": 0.00019009005813199568, "tps": 99033, "wall": 11467.0} {"step": 17328, "train_loss": 3.34073543548584, "lr": 0.00019007116664128252, "tps": 98996, "wall": 11471.8} {"step": 17329, "train_loss": 3.3965861797332764, "lr": 0.00019005227548960475, "tps": 98960, "wall": 11476.7} {"step": 17330, "train_loss": 3.3154890537261963, "lr": 0.00019003338467717647, "tps": 98924, "wall": 11481.5} {"step": 17331, "train_loss": 3.2912914752960205, "lr": 0.00019001449420421156, "tps": 98888, "wall": 11486.4} {"step": 17332, "train_loss": 3.3341665267944336, "lr": 0.00018999560407092418, "tps": 98851, "wall": 11491.3} {"step": 17333, "train_loss": 3.2995195388793945, "lr": 0.00018997671427752817, "tps": 98815, "wall": 11496.1} {"step": 17334, "train_loss": 3.277428150177002, "lr": 0.00018995782482423757, "tps": 98779, "wall": 11501.0} {"step": 17335, "train_loss": 3.2496893405914307, "lr": 0.00018993893571126632, "tps": 98743, "wall": 11505.9} {"step": 17336, "train_loss": 3.2961533069610596, "lr": 0.00018992004693882847, "tps": 98706, "wall": 11510.8} {"step": 17337, "train_loss": 3.3368964195251465, "lr": 0.00018990115850713797, "tps": 98670, "wall": 11515.7} {"step": 17338, "train_loss": 3.310878038406372, "lr": 0.00018988227041640877, "tps": 98634, "wall": 11520.6} {"step": 17339, "train_loss": 3.373074531555176, "lr": 0.00018986338266685482, "tps": 98598, "wall": 11525.5} {"step": 17340, "train_loss": 3.3733744621276855, "lr": 0.00018984449525869006, "tps": 98559, "wall": 11530.7} {"step": 17341, "train_loss": 3.2385752201080322, "lr": 0.00018982560819212854, "tps": 98521, "wall": 11535.8} {"step": 17342, "train_loss": 3.275604724884033, "lr": 0.0001898067214673842, "tps": 98485, "wall": 11540.7} {"step": 17343, "train_loss": 3.308861255645752, "lr": 0.00018978783508467092, "tps": 98447, "wall": 11545.8} {"step": 17344, "train_loss": 3.3773937225341797, "lr": 0.00018976894904420264, "tps": 98411, "wall": 11550.7} {"step": 17345, "train_loss": 3.3858795166015625, "lr": 0.0001897500633461934, "tps": 98375, "wall": 11555.6} {"step": 17346, "train_loss": 3.3484151363372803, "lr": 0.00018973117799085706, "tps": 98338, "wall": 11560.6} {"step": 17347, "train_loss": 3.2520835399627686, "lr": 0.00018971229297840751, "tps": 98302, "wall": 11565.5} {"step": 17348, "train_loss": 3.3595221042633057, "lr": 0.00018969340830905882, "tps": 98265, "wall": 11570.5} {"step": 17349, "train_loss": 3.3358397483825684, "lr": 0.00018967452398302483, "tps": 98230, "wall": 11575.4} {"step": 17350, "train_loss": 3.3265581130981445, "lr": 0.00018965564000051943, "tps": 98192, "wall": 11580.4} {"step": 17351, "train_loss": 3.285012722015381, "lr": 0.00018963675636175662, "tps": 98155, "wall": 11585.5} {"step": 17352, "train_loss": 3.353008270263672, "lr": 0.00018961787306695028, "tps": 98118, "wall": 11590.5} {"step": 17353, "train_loss": 3.2557592391967773, "lr": 0.0001895989901163143, "tps": 98082, "wall": 11595.4} {"step": 17354, "train_loss": 3.3405909538269043, "lr": 0.00018958010751006258, "tps": 98046, "wall": 11600.3} {"step": 17355, "train_loss": 3.3264684677124023, "lr": 0.0001895612252484091, "tps": 98010, "wall": 11605.3} {"step": 17356, "train_loss": 3.3367204666137695, "lr": 0.0001895423433315677, "tps": 97974, "wall": 11610.3} {"step": 17357, "train_loss": 3.243957042694092, "lr": 0.00018952346175975224, "tps": 97938, "wall": 11615.2} {"step": 17358, "train_loss": 3.333989381790161, "lr": 0.00018950458053317669, "tps": 97902, "wall": 11620.1} {"step": 17359, "train_loss": 3.214799404144287, "lr": 0.0001894856996520549, "tps": 97866, "wall": 11625.1} {"step": 17360, "train_loss": 3.4339144229888916, "lr": 0.00018946681911660072, "tps": 97830, "wall": 11630.1} {"step": 17361, "train_loss": 3.223294734954834, "lr": 0.0001894479389270281, "tps": 97794, "wall": 11634.9} {"step": 17362, "train_loss": 3.276998996734619, "lr": 0.00018942905908355092, "tps": 97759, "wall": 11639.8} {"step": 17363, "train_loss": 3.2589175701141357, "lr": 0.00018941017958638292, "tps": 97724, "wall": 11644.6} {"step": 17364, "train_loss": 3.3483707904815674, "lr": 0.00018939130043573813, "tps": 97689, "wall": 11649.5} {"step": 17365, "train_loss": 3.2998409271240234, "lr": 0.00018937242163183035, "tps": 97653, "wall": 11654.4} {"step": 17366, "train_loss": 3.3143787384033203, "lr": 0.00018935354317487337, "tps": 97618, "wall": 11659.3} {"step": 17367, "train_loss": 3.4287681579589844, "lr": 0.00018933466506508112, "tps": 97583, "wall": 11664.1} {"step": 17368, "train_loss": 3.3242015838623047, "lr": 0.00018931578730266746, "tps": 97548, "wall": 11669.0} {"step": 17369, "train_loss": 3.251260995864868, "lr": 0.00018929690988784629, "tps": 97513, "wall": 11673.9} {"step": 17370, "train_loss": 3.2574374675750732, "lr": 0.0001892780328208313, "tps": 97478, "wall": 11678.7} {"step": 17371, "train_loss": 3.405008554458618, "lr": 0.00018925915610183643, "tps": 97443, "wall": 11683.6} {"step": 17372, "train_loss": 3.385695457458496, "lr": 0.00018924027973107554, "tps": 97407, "wall": 11688.6} {"step": 17373, "train_loss": 3.438668966293335, "lr": 0.00018922140370876238, "tps": 97373, "wall": 11693.4} {"step": 17374, "train_loss": 3.2478981018066406, "lr": 0.00018920252803511086, "tps": 97338, "wall": 11698.3} {"step": 17375, "train_loss": 3.374343156814575, "lr": 0.00018918365271033478, "tps": 97303, "wall": 11703.1} {"step": 17376, "train_loss": 3.2410237789154053, "lr": 0.00018916477773464786, "tps": 97268, "wall": 11708.0} {"step": 17377, "train_loss": 3.355717182159424, "lr": 0.00018914590310826408, "tps": 97233, "wall": 11712.8} {"step": 17378, "train_loss": 3.3564257621765137, "lr": 0.00018912702883139716, "tps": 97199, "wall": 11717.7} {"step": 17379, "train_loss": 3.267411231994629, "lr": 0.000189108154904261, "tps": 97163, "wall": 11722.7} {"step": 17380, "train_loss": 3.3571572303771973, "lr": 0.00018908928132706923, "tps": 97127, "wall": 11727.6} {"step": 17381, "train_loss": 3.3976504802703857, "lr": 0.00018907040810003576, "tps": 97092, "wall": 11732.6} {"step": 17382, "train_loss": 3.401625633239746, "lr": 0.0001890515352233744, "tps": 97057, "wall": 11737.5} {"step": 17383, "train_loss": 3.356781482696533, "lr": 0.00018903266269729895, "tps": 97022, "wall": 11742.4} {"step": 17384, "train_loss": 3.3925750255584717, "lr": 0.0001890137905220232, "tps": 96987, "wall": 11747.3} {"step": 17385, "train_loss": 3.374851703643799, "lr": 0.00018899491869776082, "tps": 96952, "wall": 11752.2} {"step": 17386, "train_loss": 3.3944406509399414, "lr": 0.00018897604722472577, "tps": 96918, "wall": 11757.1} {"step": 17387, "train_loss": 3.2779812812805176, "lr": 0.00018895717610313163, "tps": 96883, "wall": 11761.9} {"step": 17388, "train_loss": 3.3179595470428467, "lr": 0.00018893830533319234, "tps": 96848, "wall": 11766.8} {"step": 17389, "train_loss": 3.300410747528076, "lr": 0.00018891943491512164, "tps": 96813, "wall": 11771.8} {"step": 17390, "train_loss": 3.3387818336486816, "lr": 0.00018890056484913324, "tps": 96778, "wall": 11776.7} {"step": 17391, "train_loss": 3.402834415435791, "lr": 0.0001888816951354409, "tps": 96744, "wall": 11781.6} {"step": 17392, "train_loss": 3.4702677726745605, "lr": 0.0001888628257742584, "tps": 96708, "wall": 11786.6} {"step": 17393, "train_loss": 3.3322596549987793, "lr": 0.0001888439567657995, "tps": 96674, "wall": 11791.5} {"step": 17394, "train_loss": 3.221024751663208, "lr": 0.00018882508811027794, "tps": 96639, "wall": 11796.4} {"step": 17395, "train_loss": 3.4132351875305176, "lr": 0.00018880621980790747, "tps": 96604, "wall": 11801.3} {"step": 17396, "train_loss": 3.2610692977905273, "lr": 0.00018878735185890187, "tps": 96570, "wall": 11806.2} {"step": 17397, "train_loss": 3.32816481590271, "lr": 0.0001887684842634748, "tps": 96535, "wall": 11811.1} {"step": 17398, "train_loss": 3.301396369934082, "lr": 0.00018874961702184, "tps": 96501, "wall": 11816.0} {"step": 17399, "train_loss": 3.1956162452697754, "lr": 0.0001887307501342113, "tps": 96466, "wall": 11821.0} {"step": 17400, "train_loss": 3.249152660369873, "lr": 0.0001887118836008023, "tps": 96432, "wall": 11825.9} {"step": 17401, "train_loss": 3.4154486656188965, "lr": 0.0001886930174218268, "tps": 96397, "wall": 11830.8} {"step": 17402, "train_loss": 3.3633155822753906, "lr": 0.00018867415159749847, "tps": 96363, "wall": 11835.6} {"step": 17403, "train_loss": 3.356588840484619, "lr": 0.00018865528612803107, "tps": 96329, "wall": 11840.5} {"step": 17404, "train_loss": 3.297313690185547, "lr": 0.00018863642101363826, "tps": 96294, "wall": 11845.4} {"step": 17405, "train_loss": 3.435403347015381, "lr": 0.00018861755625453375, "tps": 96260, "wall": 11850.3} {"step": 17406, "train_loss": 3.2724695205688477, "lr": 0.00018859869185093136, "tps": 96226, "wall": 11855.2} {"step": 17407, "train_loss": 3.370943307876587, "lr": 0.00018857982780304462, "tps": 96192, "wall": 11860.1} {"step": 17408, "train_loss": 3.3794069290161133, "lr": 0.00018856096411108727, "tps": 96158, "wall": 11865.0} {"step": 17409, "train_loss": 3.361100673675537, "lr": 0.00018854210077527307, "tps": 96123, "wall": 11870.0} {"step": 17410, "train_loss": 3.3211216926574707, "lr": 0.00018852323779581557, "tps": 96089, "wall": 11874.9} {"step": 17411, "train_loss": 3.3337178230285645, "lr": 0.0001885043751729286, "tps": 96055, "wall": 11879.7} {"step": 17412, "train_loss": 3.2156970500946045, "lr": 0.00018848551290682574, "tps": 96021, "wall": 11884.6} {"step": 17413, "train_loss": 3.1924867630004883, "lr": 0.00018846665099772074, "tps": 95987, "wall": 11889.5} {"step": 17414, "train_loss": 3.2976109981536865, "lr": 0.00018844778944582718, "tps": 95953, "wall": 11894.4} {"step": 17415, "train_loss": 3.451744318008423, "lr": 0.00018842892825135881, "tps": 95919, "wall": 11899.3} {"step": 17416, "train_loss": 3.370917797088623, "lr": 0.00018841006741452927, "tps": 95885, "wall": 11904.2} {"step": 17417, "train_loss": 3.321047782897949, "lr": 0.00018839120693555216, "tps": 95852, "wall": 11909.0} {"step": 17418, "train_loss": 3.365015745162964, "lr": 0.00018837234681464112, "tps": 95817, "wall": 11914.0} {"step": 17419, "train_loss": 3.2346041202545166, "lr": 0.00018835348705200993, "tps": 95783, "wall": 11919.0} {"step": 17420, "train_loss": 3.268275499343872, "lr": 0.0001883346276478721, "tps": 95745, "wall": 11924.3} {"step": 17421, "train_loss": 3.297943115234375, "lr": 0.00018831576860244126, "tps": 95709, "wall": 11929.5} {"step": 17422, "train_loss": 3.401134490966797, "lr": 0.00018829690991593122, "tps": 95674, "wall": 11934.6} {"step": 17423, "train_loss": 3.479508638381958, "lr": 0.00018827805158855548, "tps": 95638, "wall": 11939.7} {"step": 17424, "train_loss": 3.37491512298584, "lr": 0.00018825919362052763, "tps": 95603, "wall": 11944.8} {"step": 17425, "train_loss": 3.3183670043945312, "lr": 0.00018824033601206138, "tps": 95566, "wall": 11950.2} {"step": 17426, "train_loss": 3.3024258613586426, "lr": 0.00018822147876337036, "tps": 95525, "wall": 11955.9} {"step": 17427, "train_loss": 3.4034156799316406, "lr": 0.0001882026218746681, "tps": 95491, "wall": 11960.9} {"step": 17428, "train_loss": 3.3743462562561035, "lr": 0.00018818376534616827, "tps": 95457, "wall": 11965.9} {"step": 17429, "train_loss": 3.3178839683532715, "lr": 0.00018816490917808446, "tps": 95422, "wall": 11970.9} {"step": 17430, "train_loss": 3.2676501274108887, "lr": 0.0001881460533706303, "tps": 95388, "wall": 11975.8} {"step": 17431, "train_loss": 3.3344409465789795, "lr": 0.00018812719792401933, "tps": 95355, "wall": 11980.7} {"step": 17432, "train_loss": 3.294613838195801, "lr": 0.0001881083428384652, "tps": 95322, "wall": 11985.6} {"step": 17433, "train_loss": 3.363522529602051, "lr": 0.00018808948811418157, "tps": 95287, "wall": 11990.6} {"step": 17434, "train_loss": 3.290909767150879, "lr": 0.00018807063375138187, "tps": 95253, "wall": 11995.5} {"step": 17435, "train_loss": 3.3682773113250732, "lr": 0.00018805177975027973, "tps": 95220, "wall": 12000.5} {"step": 17436, "train_loss": 3.2052438259124756, "lr": 0.00018803292611108886, "tps": 95186, "wall": 12005.4} {"step": 17437, "train_loss": 3.320765972137451, "lr": 0.00018801407283402263, "tps": 95152, "wall": 12010.3} {"step": 17438, "train_loss": 3.3927955627441406, "lr": 0.00018799521991929473, "tps": 95119, "wall": 12015.3} {"step": 17439, "train_loss": 3.3578524589538574, "lr": 0.00018797636736711873, "tps": 95086, "wall": 12020.1} {"step": 17440, "train_loss": 3.2695181369781494, "lr": 0.0001879575151777082, "tps": 95051, "wall": 12025.1} {"step": 17441, "train_loss": 3.3799643516540527, "lr": 0.00018793866335127665, "tps": 95018, "wall": 12030.1} {"step": 17442, "train_loss": 3.315807342529297, "lr": 0.00018791981188803764, "tps": 94984, "wall": 12035.0} {"step": 17443, "train_loss": 3.342355489730835, "lr": 0.0001879009607882048, "tps": 94951, "wall": 12039.9} {"step": 17444, "train_loss": 3.40059232711792, "lr": 0.00018788211005199156, "tps": 94917, "wall": 12044.9} {"step": 17445, "train_loss": 3.2531309127807617, "lr": 0.0001878632596796115, "tps": 94884, "wall": 12049.9} {"step": 17446, "train_loss": 3.3769989013671875, "lr": 0.00018784440967127824, "tps": 94850, "wall": 12054.8} {"step": 17447, "train_loss": 3.349003314971924, "lr": 0.0001878255600272052, "tps": 94818, "wall": 12059.6} {"step": 17448, "train_loss": 3.3652150630950928, "lr": 0.00018780671074760598, "tps": 94784, "wall": 12064.5} {"step": 17449, "train_loss": 3.4175305366516113, "lr": 0.00018778786183269405, "tps": 94750, "wall": 12069.6} {"step": 17450, "train_loss": 3.227898120880127, "lr": 0.00018776901328268296, "tps": 94717, "wall": 12074.5} {"step": 17451, "train_loss": 3.350660800933838, "lr": 0.00018775016509778626, "tps": 94683, "wall": 12079.5} {"step": 17452, "train_loss": 3.2640600204467773, "lr": 0.0001877313172782174, "tps": 94650, "wall": 12084.4} {"step": 17453, "train_loss": 3.318655014038086, "lr": 0.00018771246982418992, "tps": 94617, "wall": 12089.3} {"step": 17454, "train_loss": 3.367643117904663, "lr": 0.00018769362273591736, "tps": 94584, "wall": 12094.3} {"step": 17455, "train_loss": 3.286402702331543, "lr": 0.00018767477601361318, "tps": 94551, "wall": 12099.2} {"step": 17456, "train_loss": 3.3251760005950928, "lr": 0.00018765592965749091, "tps": 94518, "wall": 12104.1} {"step": 17457, "train_loss": 3.2928779125213623, "lr": 0.00018763708366776393, "tps": 94484, "wall": 12109.2} {"step": 17458, "train_loss": 3.413097858428955, "lr": 0.00018761823804464594, "tps": 94450, "wall": 12114.2} {"step": 17459, "train_loss": 3.442290782928467, "lr": 0.00018759939278835023, "tps": 94418, "wall": 12119.0} {"step": 17460, "train_loss": 3.2631874084472656, "lr": 0.00018758054789909037, "tps": 94385, "wall": 12123.9} {"step": 17461, "train_loss": 3.31839656829834, "lr": 0.0001875617033770798, "tps": 94353, "wall": 12128.8} {"step": 17462, "train_loss": 3.2938437461853027, "lr": 0.00018754285922253203, "tps": 94320, "wall": 12133.7} {"step": 17463, "train_loss": 3.235521078109741, "lr": 0.00018752401543566048, "tps": 94288, "wall": 12138.5} {"step": 17464, "train_loss": 3.37980055809021, "lr": 0.00018750517201667863, "tps": 94255, "wall": 12143.5} {"step": 17465, "train_loss": 3.389366388320923, "lr": 0.0001874863289658, "tps": 94222, "wall": 12148.4} {"step": 17466, "train_loss": 3.3177976608276367, "lr": 0.00018746748628323796, "tps": 94190, "wall": 12153.3} {"step": 17467, "train_loss": 3.2935991287231445, "lr": 0.00018744864396920597, "tps": 94157, "wall": 12158.1} {"step": 17468, "train_loss": 3.333510398864746, "lr": 0.00018742980202391757, "tps": 94125, "wall": 12163.0} {"step": 17469, "train_loss": 3.398930311203003, "lr": 0.00018741096044758607, "tps": 94092, "wall": 12167.9} {"step": 17470, "train_loss": 3.4239630699157715, "lr": 0.00018739211924042505, "tps": 94060, "wall": 12172.8} {"step": 17471, "train_loss": 3.4057252407073975, "lr": 0.00018737327840264784, "tps": 94028, "wall": 12177.7} {"step": 17472, "train_loss": 3.4358506202697754, "lr": 0.0001873544379344679, "tps": 93995, "wall": 12182.5} {"step": 17473, "train_loss": 3.309762954711914, "lr": 0.00018733559783609859, "tps": 93963, "wall": 12187.4} {"step": 17474, "train_loss": 3.372777223587036, "lr": 0.00018731675810775342, "tps": 93931, "wall": 12192.3} {"step": 17475, "train_loss": 3.340977668762207, "lr": 0.00018729791874964584, "tps": 93899, "wall": 12197.2} {"step": 17476, "train_loss": 3.33191180229187, "lr": 0.00018727907976198913, "tps": 93867, "wall": 12202.1} {"step": 17477, "train_loss": 3.3822503089904785, "lr": 0.0001872602411449968, "tps": 93834, "wall": 12207.0} {"step": 17478, "train_loss": 3.4133527278900146, "lr": 0.00018724140289888224, "tps": 93802, "wall": 12211.8} {"step": 17479, "train_loss": 3.337449789047241, "lr": 0.00018722256502385885, "tps": 93770, "wall": 12216.7} {"step": 17480, "train_loss": 3.291747808456421, "lr": 0.00018720372752014001, "tps": 93738, "wall": 12221.6} {"step": 17481, "train_loss": 3.3896708488464355, "lr": 0.0001871848903879391, "tps": 93705, "wall": 12226.6} {"step": 17482, "train_loss": 3.3226659297943115, "lr": 0.00018716605362746957, "tps": 93673, "wall": 12231.5} {"step": 17483, "train_loss": 3.291022777557373, "lr": 0.00018714721723894472, "tps": 93641, "wall": 12236.4} {"step": 17484, "train_loss": 3.203535795211792, "lr": 0.00018712838122257798, "tps": 93609, "wall": 12241.3} {"step": 17485, "train_loss": 3.3544387817382812, "lr": 0.00018710954557858275, "tps": 93577, "wall": 12246.2} {"step": 17486, "train_loss": 3.3636956214904785, "lr": 0.00018709071030717232, "tps": 93545, "wall": 12251.1} {"step": 17487, "train_loss": 3.3101677894592285, "lr": 0.0001870718754085601, "tps": 93513, "wall": 12256.0} {"step": 17488, "train_loss": 3.3902978897094727, "lr": 0.00018705304088295952, "tps": 93481, "wall": 12260.9} {"step": 17489, "train_loss": 3.239612579345703, "lr": 0.00018703420673058378, "tps": 93448, "wall": 12265.8} {"step": 17490, "train_loss": 3.1816956996917725, "lr": 0.00018701537295164638, "tps": 93416, "wall": 12270.7} {"step": 17491, "train_loss": 3.3018741607666016, "lr": 0.00018699653954636062, "tps": 93384, "wall": 12275.6} {"step": 17492, "train_loss": 3.2942919731140137, "lr": 0.00018697770651493985, "tps": 93352, "wall": 12280.5} {"step": 17493, "train_loss": 3.322507381439209, "lr": 0.0001869588738575974, "tps": 93321, "wall": 12285.4} {"step": 17494, "train_loss": 3.353661298751831, "lr": 0.00018694004157454664, "tps": 93287, "wall": 12290.6} {"step": 17495, "train_loss": 3.288378953933716, "lr": 0.00018692120966600086, "tps": 93253, "wall": 12295.7} {"step": 17496, "train_loss": 3.2713775634765625, "lr": 0.0001869023781321734, "tps": 93221, "wall": 12300.6} {"step": 17497, "train_loss": 3.2668726444244385, "lr": 0.00018688354697327756, "tps": 93188, "wall": 12305.7} {"step": 17498, "train_loss": 3.355776786804199, "lr": 0.00018686471618952676, "tps": 93156, "wall": 12310.7} {"step": 17499, "train_loss": 3.315666913986206, "lr": 0.0001868458857811342, "tps": 93124, "wall": 12315.6} {"step": 17500, "train_loss": 3.355318784713745, "lr": 0.00018682705574831325, "tps": 93092, "wall": 12320.6} {"step": 17501, "train_loss": 3.272576093673706, "lr": 0.00018680822609127716, "tps": 93058, "wall": 12325.7} {"step": 17502, "train_loss": 3.363001823425293, "lr": 0.0001867893968102394, "tps": 93026, "wall": 12330.7} {"step": 17503, "train_loss": 3.3530921936035156, "lr": 0.00018677056790541302, "tps": 92990, "wall": 12336.1} {"step": 17504, "train_loss": 3.3458356857299805, "lr": 0.00018675173937701152, "tps": 92955, "wall": 12341.4} {"step": 17505, "train_loss": 3.344515800476074, "lr": 0.00018673291122524814, "tps": 92923, "wall": 12346.4} {"step": 17506, "train_loss": 3.38914155960083, "lr": 0.00018671408345033607, "tps": 92889, "wall": 12351.7} {"step": 17507, "train_loss": 3.3103771209716797, "lr": 0.0001866952560524887, "tps": 92856, "wall": 12356.7} {"step": 17508, "train_loss": 3.2267580032348633, "lr": 0.00018667642903191927, "tps": 92822, "wall": 12362.0} {"step": 17509, "train_loss": 3.4123172760009766, "lr": 0.00018665760238884108, "tps": 92790, "wall": 12367.0} {"step": 17510, "train_loss": 3.3352644443511963, "lr": 0.00018663877612346726, "tps": 92757, "wall": 12372.0} {"step": 17511, "train_loss": 3.2570626735687256, "lr": 0.0001866199502360113, "tps": 92725, "wall": 12377.0} {"step": 17512, "train_loss": 3.3712804317474365, "lr": 0.00018660112472668633, "tps": 92693, "wall": 12382.1} {"step": 17513, "train_loss": 3.2829020023345947, "lr": 0.0001865822995957056, "tps": 92661, "wall": 12387.0} {"step": 17514, "train_loss": 3.226144552230835, "lr": 0.0001865634748432824, "tps": 92628, "wall": 12392.1} {"step": 17515, "train_loss": 3.3495841026306152, "lr": 0.00018654465046962998, "tps": 92595, "wall": 12397.3} {"step": 17516, "train_loss": 3.3384857177734375, "lr": 0.00018652582647496154, "tps": 92562, "wall": 12402.4} {"step": 17517, "train_loss": 3.2979230880737305, "lr": 0.00018650700285949038, "tps": 92528, "wall": 12407.6} {"step": 17518, "train_loss": 3.290286064147949, "lr": 0.00018648817962342972, "tps": 92495, "wall": 12412.8} {"step": 17519, "train_loss": 3.367502450942993, "lr": 0.00018646935676699275, "tps": 92462, "wall": 12417.9} {"step": 17520, "train_loss": 3.298563241958618, "lr": 0.0001864505342903927, "tps": 92430, "wall": 12423.0} {"step": 17521, "train_loss": 3.2995314598083496, "lr": 0.0001864317121938428, "tps": 92397, "wall": 12428.1} {"step": 17522, "train_loss": 3.3382551670074463, "lr": 0.0001864128904775564, "tps": 92364, "wall": 12433.2} {"step": 17523, "train_loss": 3.3569068908691406, "lr": 0.00018639406914174646, "tps": 92331, "wall": 12438.3} {"step": 17524, "train_loss": 3.3485209941864014, "lr": 0.00018637524818662632, "tps": 92298, "wall": 12443.6} {"step": 17525, "train_loss": 3.3615808486938477, "lr": 0.00018635642761240928, "tps": 92264, "wall": 12448.8} {"step": 17526, "train_loss": 3.3185670375823975, "lr": 0.0001863376074193084, "tps": 92232, "wall": 12453.9} {"step": 17527, "train_loss": 3.336087942123413, "lr": 0.0001863187876075369, "tps": 92200, "wall": 12458.9} {"step": 17528, "train_loss": 3.390155076980591, "lr": 0.000186299968177308, "tps": 92168, "wall": 12463.9} {"step": 17529, "train_loss": 3.2675933837890625, "lr": 0.00018628114912883493, "tps": 92135, "wall": 12469.1} {"step": 17530, "train_loss": 3.379810094833374, "lr": 0.0001862623304623308, "tps": 92103, "wall": 12474.2} {"step": 17531, "train_loss": 3.3605360984802246, "lr": 0.0001862435121780088, "tps": 92069, "wall": 12479.5} {"step": 17532, "train_loss": 3.324617385864258, "lr": 0.00018622469427608218, "tps": 92036, "wall": 12484.6} {"step": 17533, "train_loss": 3.218501329421997, "lr": 0.000186205876756764, "tps": 92004, "wall": 12489.7} {"step": 17534, "train_loss": 3.3118410110473633, "lr": 0.0001861870596202675, "tps": 91972, "wall": 12494.7} {"step": 17535, "train_loss": 3.296708106994629, "lr": 0.0001861682428668058, "tps": 91941, "wall": 12499.7} {"step": 17536, "train_loss": 3.3176491260528564, "lr": 0.0001861494264965921, "tps": 91909, "wall": 12504.8} {"step": 17537, "train_loss": 3.3796374797821045, "lr": 0.0001861306105098395, "tps": 91877, "wall": 12509.8} {"step": 17538, "train_loss": 3.359532117843628, "lr": 0.00018611179490676114, "tps": 91845, "wall": 12514.9} {"step": 17539, "train_loss": 3.259920120239258, "lr": 0.00018609297968757028, "tps": 91814, "wall": 12519.8} {"step": 17540, "train_loss": 3.3375425338745117, "lr": 0.00018607416485247991, "tps": 91783, "wall": 12524.7} {"step": 17541, "train_loss": 3.20115065574646, "lr": 0.00018605535040170325, "tps": 91751, "wall": 12529.8} {"step": 17542, "train_loss": 3.3282275199890137, "lr": 0.00018603653633545347, "tps": 91720, "wall": 12534.8} {"step": 17543, "train_loss": 3.41239857673645, "lr": 0.0001860177226539436, "tps": 91689, "wall": 12539.8} {"step": 17544, "train_loss": 3.3868260383605957, "lr": 0.00018599890935738685, "tps": 91657, "wall": 12544.8} {"step": 17545, "train_loss": 3.451934814453125, "lr": 0.00018598009644599627, "tps": 91626, "wall": 12549.8} {"step": 17546, "train_loss": 3.2603249549865723, "lr": 0.00018596128391998497, "tps": 91595, "wall": 12554.8} {"step": 17547, "train_loss": 3.3837833404541016, "lr": 0.0001859424717795661, "tps": 91563, "wall": 12559.8} {"step": 17548, "train_loss": 3.2454702854156494, "lr": 0.00018592366002495277, "tps": 91532, "wall": 12564.8} {"step": 17549, "train_loss": 3.412114143371582, "lr": 0.00018590484865635808, "tps": 91501, "wall": 12569.9} {"step": 17550, "train_loss": 3.3422751426696777, "lr": 0.00018588603767399504, "tps": 91470, "wall": 12574.8} {"step": 17551, "train_loss": 3.261014461517334, "lr": 0.00018586722707807684, "tps": 91439, "wall": 12579.7} {"step": 17552, "train_loss": 3.396178960800171, "lr": 0.0001858484168688166, "tps": 91409, "wall": 12584.7} {"step": 17553, "train_loss": 3.2866294384002686, "lr": 0.00018582960704642724, "tps": 91376, "wall": 12589.8} {"step": 17554, "train_loss": 3.3904428482055664, "lr": 0.000185810797611122, "tps": 91345, "wall": 12594.8} {"step": 17555, "train_loss": 3.370100736618042, "lr": 0.00018579198856311387, "tps": 91314, "wall": 12599.9} {"step": 17556, "train_loss": 3.2961034774780273, "lr": 0.00018577317990261597, "tps": 91282, "wall": 12605.0} {"step": 17557, "train_loss": 3.2979938983917236, "lr": 0.00018575437162984132, "tps": 91251, "wall": 12610.0} {"step": 17558, "train_loss": 3.285618543624878, "lr": 0.000185735563745003, "tps": 91219, "wall": 12615.1} {"step": 17559, "train_loss": 3.221741199493408, "lr": 0.0001857167562483141, "tps": 91186, "wall": 12620.4} {"step": 17560, "train_loss": 3.2845401763916016, "lr": 0.0001856979491399876, "tps": 91154, "wall": 12625.5} {"step": 17561, "train_loss": 3.3179609775543213, "lr": 0.0001856791424202366, "tps": 91123, "wall": 12630.6} {"step": 17562, "train_loss": 3.413419008255005, "lr": 0.00018566033608927418, "tps": 91091, "wall": 12635.7} {"step": 17563, "train_loss": 3.2922871112823486, "lr": 0.0001856415301473133, "tps": 91060, "wall": 12640.8} {"step": 17564, "train_loss": 3.332669496536255, "lr": 0.00018562272459456697, "tps": 91029, "wall": 12645.8} {"step": 17565, "train_loss": 3.3513543605804443, "lr": 0.00018560391943124832, "tps": 90996, "wall": 12651.1} {"step": 17566, "train_loss": 3.344022512435913, "lr": 0.00018558511465757032, "tps": 90962, "wall": 12656.5} {"step": 17567, "train_loss": 3.3421201705932617, "lr": 0.00018556631027374603, "tps": 90930, "wall": 12661.8} {"step": 17568, "train_loss": 3.3943095207214355, "lr": 0.00018554750627998838, "tps": 90899, "wall": 12666.8} {"step": 17569, "train_loss": 3.370237350463867, "lr": 0.00018552870267651055, "tps": 90867, "wall": 12671.9} {"step": 17570, "train_loss": 3.308946132659912, "lr": 0.00018550989946352532, "tps": 90837, "wall": 12676.9} {"step": 17571, "train_loss": 3.3610925674438477, "lr": 0.0001854910966412459, "tps": 90806, "wall": 12681.9} {"step": 17572, "train_loss": 3.2413179874420166, "lr": 0.00018547229420988516, "tps": 90776, "wall": 12686.8} {"step": 17573, "train_loss": 3.4232449531555176, "lr": 0.0001854534921696562, "tps": 90746, "wall": 12691.7} {"step": 17574, "train_loss": 3.36183500289917, "lr": 0.00018543469052077188, "tps": 90716, "wall": 12696.7} {"step": 17575, "train_loss": 3.297287940979004, "lr": 0.00018541588926344527, "tps": 90685, "wall": 12701.7} {"step": 17576, "train_loss": 3.2900962829589844, "lr": 0.00018539708839788936, "tps": 90653, "wall": 12706.9} {"step": 17577, "train_loss": 3.291285991668701, "lr": 0.0001853782879243171, "tps": 90622, "wall": 12712.0} {"step": 17578, "train_loss": 3.31108021736145, "lr": 0.00018535948784294143, "tps": 90592, "wall": 12717.0} {"step": 17579, "train_loss": 3.272960662841797, "lr": 0.00018534068815397544, "tps": 90562, "wall": 12721.9} {"step": 17580, "train_loss": 3.2828850746154785, "lr": 0.00018532188885763188, "tps": 90532, "wall": 12726.8} {"step": 17581, "train_loss": 3.3318986892700195, "lr": 0.00018530308995412393, "tps": 90502, "wall": 12731.7} {"step": 17582, "train_loss": 3.397409439086914, "lr": 0.00018528429144366442, "tps": 90473, "wall": 12736.6} {"step": 17583, "train_loss": 3.395796060562134, "lr": 0.00018526549332646637, "tps": 90443, "wall": 12741.4} {"step": 17584, "train_loss": 3.362020492553711, "lr": 0.0001852466956027427, "tps": 90413, "wall": 12746.4} {"step": 17585, "train_loss": 3.324455499649048, "lr": 0.00018522789827270627, "tps": 90384, "wall": 12751.3} {"step": 17586, "train_loss": 3.328965663909912, "lr": 0.00018520910133657017, "tps": 90354, "wall": 12756.2} {"step": 17587, "train_loss": 3.228252410888672, "lr": 0.00018519030479454717, "tps": 90325, "wall": 12761.1} {"step": 17588, "train_loss": 3.332909345626831, "lr": 0.00018517150864685037, "tps": 90295, "wall": 12766.0} {"step": 17589, "train_loss": 3.302372932434082, "lr": 0.00018515271289369257, "tps": 90265, "wall": 12771.0} {"step": 17590, "train_loss": 3.4538049697875977, "lr": 0.00018513391753528669, "tps": 90236, "wall": 12775.9} {"step": 17591, "train_loss": 3.3557136058807373, "lr": 0.00018511512257184568, "tps": 90206, "wall": 12780.8} {"step": 17592, "train_loss": 3.2622900009155273, "lr": 0.00018509632800358246, "tps": 90175, "wall": 12785.9} {"step": 17593, "train_loss": 3.4077258110046387, "lr": 0.00018507753383071, "tps": 90144, "wall": 12791.0} {"step": 17594, "train_loss": 3.295046806335449, "lr": 0.00018505874005344102, "tps": 90113, "wall": 12796.1} {"step": 17595, "train_loss": 3.235826015472412, "lr": 0.00018503994667198854, "tps": 90083, "wall": 12801.1} {"step": 17596, "train_loss": 3.3196804523468018, "lr": 0.00018502115368656548, "tps": 90050, "wall": 12806.5} {"step": 17597, "train_loss": 3.3992621898651123, "lr": 0.0001850023610973847, "tps": 90018, "wall": 12811.8} {"step": 17598, "train_loss": 3.418405294418335, "lr": 0.00018498356890465903, "tps": 89986, "wall": 12817.1} {"step": 17599, "train_loss": 3.3495278358459473, "lr": 0.00018496477710860135, "tps": 89954, "wall": 12822.4} {"step": 17600, "train_loss": 3.3903145790100098, "lr": 0.00018494598570942462, "tps": 89922, "wall": 12827.7} {"step": 17601, "train_loss": 3.335000514984131, "lr": 0.00018492719470734165, "tps": 89890, "wall": 12833.0} {"step": 17602, "train_loss": 3.315647602081299, "lr": 0.0001849084041025653, "tps": 89858, "wall": 12838.3} {"step": 17603, "train_loss": 3.2689974308013916, "lr": 0.0001848896138953085, "tps": 89826, "wall": 12843.7} {"step": 17604, "train_loss": 3.4091079235076904, "lr": 0.00018487082408578397, "tps": 89793, "wall": 12849.0} {"step": 17605, "train_loss": 3.3757266998291016, "lr": 0.0001848520346742047, "tps": 89763, "wall": 12854.1} {"step": 17606, "train_loss": 3.3684849739074707, "lr": 0.0001848332456607835, "tps": 89732, "wall": 12859.2} {"step": 17607, "train_loss": 3.334359645843506, "lr": 0.00018481445704573312, "tps": 89701, "wall": 12864.4} {"step": 17608, "train_loss": 3.4047770500183105, "lr": 0.00018479566882926652, "tps": 89671, "wall": 12869.5} {"step": 17609, "train_loss": 3.2639002799987793, "lr": 0.0001847768810115965, "tps": 89638, "wall": 12874.9} {"step": 17610, "train_loss": 3.2735774517059326, "lr": 0.00018475809359293587, "tps": 89608, "wall": 12880.0} {"step": 17611, "train_loss": 3.3201069831848145, "lr": 0.00018473930657349747, "tps": 89578, "wall": 12885.0} {"step": 17612, "train_loss": 3.262441873550415, "lr": 0.00018472051995349409, "tps": 89547, "wall": 12890.2} {"step": 17613, "train_loss": 3.362765312194824, "lr": 0.00018470173373313862, "tps": 89517, "wall": 12895.2} {"step": 17614, "train_loss": 3.3333723545074463, "lr": 0.00018468294791264378, "tps": 89487, "wall": 12900.3} {"step": 17615, "train_loss": 3.320171594619751, "lr": 0.00018466416249222247, "tps": 89457, "wall": 12905.3} {"step": 17616, "train_loss": 3.270460605621338, "lr": 0.00018464537747208738, "tps": 89428, "wall": 12910.4} {"step": 17617, "train_loss": 3.2533750534057617, "lr": 0.0001846265928524513, "tps": 89398, "wall": 12915.4} {"step": 17618, "train_loss": 3.3398852348327637, "lr": 0.00018460780863352723, "tps": 89368, "wall": 12920.4} {"step": 17619, "train_loss": 3.397042751312256, "lr": 0.00018458902481552776, "tps": 89338, "wall": 12925.5} {"step": 17620, "train_loss": 3.4594521522521973, "lr": 0.00018457024139866568, "tps": 89308, "wall": 12930.5} {"step": 17621, "train_loss": 3.284205436706543, "lr": 0.0001845514583831539, "tps": 89278, "wall": 12935.6} {"step": 17622, "train_loss": 3.2928271293640137, "lr": 0.00018453267576920505, "tps": 89249, "wall": 12940.6} {"step": 17623, "train_loss": 3.2877583503723145, "lr": 0.000184513893557032, "tps": 89219, "wall": 12945.7} {"step": 17624, "train_loss": 3.2297208309173584, "lr": 0.0001844951117468475, "tps": 89190, "wall": 12950.6} {"step": 17625, "train_loss": 3.3303215503692627, "lr": 0.00018447633033886427, "tps": 89161, "wall": 12955.5} {"step": 17626, "train_loss": 3.2325916290283203, "lr": 0.0001844575493332951, "tps": 89132, "wall": 12960.5} {"step": 17627, "train_loss": 3.3269810676574707, "lr": 0.00018443876873035274, "tps": 89102, "wall": 12965.6} {"step": 17628, "train_loss": 3.327228546142578, "lr": 0.0001844199885302499, "tps": 89071, "wall": 12970.9} {"step": 17629, "train_loss": 3.351290702819824, "lr": 0.0001844012087331994, "tps": 89040, "wall": 12976.0} {"step": 17630, "train_loss": 3.285264730453491, "lr": 0.0001843824293394139, "tps": 89011, "wall": 12981.1} {"step": 17631, "train_loss": 3.3455116748809814, "lr": 0.00018436365034910624, "tps": 88982, "wall": 12986.1} {"step": 17632, "train_loss": 3.3453855514526367, "lr": 0.000184344871762489, "tps": 88952, "wall": 12991.1} {"step": 17633, "train_loss": 3.2599568367004395, "lr": 0.00018432609357977496, "tps": 88922, "wall": 12996.2} {"step": 17634, "train_loss": 3.2469851970672607, "lr": 0.0001843073158011769, "tps": 88893, "wall": 13001.3} {"step": 17635, "train_loss": 3.349043130874634, "lr": 0.00018428853842690753, "tps": 88863, "wall": 13006.3} {"step": 17636, "train_loss": 3.220297336578369, "lr": 0.00018426976145717946, "tps": 88833, "wall": 13011.5} {"step": 17637, "train_loss": 3.3609681129455566, "lr": 0.0001842509848922055, "tps": 88804, "wall": 13016.6} {"step": 17638, "train_loss": 3.2898333072662354, "lr": 0.00018423220873219832, "tps": 88774, "wall": 13021.6} {"step": 17639, "train_loss": 3.4324145317077637, "lr": 0.00018421343297737064, "tps": 88745, "wall": 13026.7} {"step": 17640, "train_loss": 3.216468095779419, "lr": 0.00018419465762793506, "tps": 88715, "wall": 13031.7} {"step": 17641, "train_loss": 3.385809898376465, "lr": 0.00018417588268410437, "tps": 88685, "wall": 13036.9} {"step": 17642, "train_loss": 3.1963748931884766, "lr": 0.0001841571081460913, "tps": 88656, "wall": 13042.0} {"step": 17643, "train_loss": 3.2230334281921387, "lr": 0.00018413833401410834, "tps": 88626, "wall": 13047.1} {"step": 17644, "train_loss": 3.340747356414795, "lr": 0.0001841195602883683, "tps": 88597, "wall": 13052.1} {"step": 17645, "train_loss": 3.307084798812866, "lr": 0.00018410078696908384, "tps": 88567, "wall": 13057.2} {"step": 17646, "train_loss": 3.2357428073883057, "lr": 0.0001840820140564676, "tps": 88537, "wall": 13062.4} {"step": 17647, "train_loss": 3.3054614067077637, "lr": 0.00018406324155073223, "tps": 88507, "wall": 13067.6} {"step": 17648, "train_loss": 3.2408628463745117, "lr": 0.00018404446945209042, "tps": 88478, "wall": 13072.7} {"step": 17649, "train_loss": 3.333242416381836, "lr": 0.0001840256977607548, "tps": 88448, "wall": 13077.8} {"step": 17650, "train_loss": 3.3217201232910156, "lr": 0.00018400692647693801, "tps": 88418, "wall": 13082.9} {"step": 17651, "train_loss": 3.4397101402282715, "lr": 0.0001839881556008527, "tps": 88389, "wall": 13088.0} {"step": 17652, "train_loss": 3.281856060028076, "lr": 0.0001839693851327116, "tps": 88359, "wall": 13093.1} {"step": 17653, "train_loss": 3.233607292175293, "lr": 0.00018395061507272712, "tps": 88330, "wall": 13098.2} {"step": 17654, "train_loss": 3.345386505126953, "lr": 0.00018393184542111213, "tps": 88300, "wall": 13103.5} {"step": 17655, "train_loss": 3.273712158203125, "lr": 0.0001839130761780791, "tps": 88270, "wall": 13108.6} {"step": 17656, "train_loss": 3.298689126968384, "lr": 0.0001838943073438407, "tps": 88241, "wall": 13113.7} {"step": 17657, "train_loss": 3.287656307220459, "lr": 0.00018387553891860954, "tps": 88211, "wall": 13118.9} {"step": 17658, "train_loss": 3.4003944396972656, "lr": 0.00018385677090259822, "tps": 88181, "wall": 13124.1} {"step": 17659, "train_loss": 3.315016746520996, "lr": 0.00018383800329601938, "tps": 88149, "wall": 13129.5} {"step": 17660, "train_loss": 3.2756755352020264, "lr": 0.0001838192360990856, "tps": 88119, "wall": 13134.7} {"step": 17661, "train_loss": 3.3207693099975586, "lr": 0.00018380046931200942, "tps": 88091, "wall": 13139.8} {"step": 17662, "train_loss": 3.336273193359375, "lr": 0.00018378170293500352, "tps": 88061, "wall": 13144.9} {"step": 17663, "train_loss": 3.2764811515808105, "lr": 0.0001837629369682804, "tps": 88032, "wall": 13150.0} {"step": 17664, "train_loss": 3.251283645629883, "lr": 0.00018374417141205275, "tps": 88004, "wall": 13154.9} {"step": 17665, "train_loss": 3.297628402709961, "lr": 0.0001837254062665331, "tps": 87976, "wall": 13159.9} {"step": 17666, "train_loss": 3.352032423019409, "lr": 0.00018370664153193392, "tps": 87948, "wall": 13164.8} {"step": 17667, "train_loss": 3.3895819187164307, "lr": 0.00018368787720846795, "tps": 87920, "wall": 13169.7} {"step": 17668, "train_loss": 3.346280813217163, "lr": 0.00018366911329634758, "tps": 87891, "wall": 13174.8} {"step": 17669, "train_loss": 3.2488622665405273, "lr": 0.0001836503497957856, "tps": 87863, "wall": 13179.7} {"step": 17670, "train_loss": 3.284457206726074, "lr": 0.00018363158670699434, "tps": 87836, "wall": 13184.6} {"step": 17671, "train_loss": 3.407996416091919, "lr": 0.00018361282403018642, "tps": 87806, "wall": 13189.8} {"step": 17672, "train_loss": 3.3928098678588867, "lr": 0.00018359406176557448, "tps": 87778, "wall": 13194.8} {"step": 17673, "train_loss": 3.3986666202545166, "lr": 0.00018357529991337086, "tps": 87749, "wall": 13199.9} {"step": 17674, "train_loss": 3.4458017349243164, "lr": 0.0001835565384737883, "tps": 87719, "wall": 13205.1} {"step": 17675, "train_loss": 3.358567714691162, "lr": 0.00018353777744703923, "tps": 87689, "wall": 13210.4} {"step": 17676, "train_loss": 3.2825186252593994, "lr": 0.00018351901683333615, "tps": 87660, "wall": 13215.6} {"step": 17677, "train_loss": 3.354464530944824, "lr": 0.00018350025663289166, "tps": 87630, "wall": 13220.8} {"step": 17678, "train_loss": 3.2186243534088135, "lr": 0.0001834814968459182, "tps": 87600, "wall": 13226.0} {"step": 17679, "train_loss": 3.3301596641540527, "lr": 0.00018346273747262836, "tps": 87572, "wall": 13231.1} {"step": 17680, "train_loss": 3.3274483680725098, "lr": 0.00018344397851323462, "tps": 87544, "wall": 13236.0} {"step": 17681, "train_loss": 3.3746023178100586, "lr": 0.00018342521996794937, "tps": 87516, "wall": 13241.0} {"step": 17682, "train_loss": 3.3507397174835205, "lr": 0.00018340646183698532, "tps": 87488, "wall": 13246.0} {"step": 17683, "train_loss": 3.3382933139801025, "lr": 0.00018338770412055483, "tps": 87460, "wall": 13251.0} {"step": 17684, "train_loss": 3.3991641998291016, "lr": 0.00018336894681887035, "tps": 87433, "wall": 13255.9} {"step": 17685, "train_loss": 3.30720591545105, "lr": 0.00018335018993214446, "tps": 87404, "wall": 13261.0} {"step": 17686, "train_loss": 3.306913137435913, "lr": 0.00018333143346058962, "tps": 87376, "wall": 13266.0} {"step": 17687, "train_loss": 3.219637632369995, "lr": 0.0001833126774044182, "tps": 87348, "wall": 13271.0} {"step": 17688, "train_loss": 3.4089651107788086, "lr": 0.00018329392176384283, "tps": 87320, "wall": 13276.0} {"step": 17689, "train_loss": 3.34548020362854, "lr": 0.0001832751665390759, "tps": 87292, "wall": 13281.0} {"step": 17690, "train_loss": 3.432929515838623, "lr": 0.0001832564117303299, "tps": 87263, "wall": 13286.1} {"step": 17691, "train_loss": 3.380455493927002, "lr": 0.00018323765733781717, "tps": 87234, "wall": 13291.3} {"step": 17692, "train_loss": 3.436784029006958, "lr": 0.00018321890336175036, "tps": 87205, "wall": 13296.4} {"step": 17693, "train_loss": 3.3884215354919434, "lr": 0.00018320014980234168, "tps": 87178, "wall": 13301.4} {"step": 17694, "train_loss": 3.310281753540039, "lr": 0.00018318139665980372, "tps": 87150, "wall": 13306.4} {"step": 17695, "train_loss": 3.388911008834839, "lr": 0.0001831626439343489, "tps": 87122, "wall": 13311.4} {"step": 17696, "train_loss": 3.4072437286376953, "lr": 0.00018314389162618974, "tps": 87095, "wall": 13316.3} {"step": 17697, "train_loss": 3.2502591609954834, "lr": 0.00018312513973553845, "tps": 87067, "wall": 13321.3} {"step": 17698, "train_loss": 3.303375720977783, "lr": 0.00018310638826260763, "tps": 87040, "wall": 13326.2} {"step": 17699, "train_loss": 3.3623266220092773, "lr": 0.0001830876372076096, "tps": 87013, "wall": 13331.1} {"step": 17700, "train_loss": 3.3301706314086914, "lr": 0.00018306888657075682, "tps": 86986, "wall": 13336.0} {"step": 17701, "train_loss": 3.2786824703216553, "lr": 0.00018305013635226173, "tps": 86958, "wall": 13341.0} {"step": 17702, "train_loss": 3.327747344970703, "lr": 0.00018303138655233667, "tps": 86931, "wall": 13346.0} {"step": 17703, "train_loss": 3.3017659187316895, "lr": 0.0001830126371711941, "tps": 86903, "wall": 13351.0} {"step": 17704, "train_loss": 3.3503684997558594, "lr": 0.00018299388820904627, "tps": 86876, "wall": 13356.0} {"step": 17705, "train_loss": 3.336015224456787, "lr": 0.00018297513966610576, "tps": 86847, "wall": 13361.1} {"step": 17706, "train_loss": 3.2309775352478027, "lr": 0.00018295639154258488, "tps": 86819, "wall": 13366.2} {"step": 17707, "train_loss": 3.4273757934570312, "lr": 0.00018293764383869597, "tps": 86791, "wall": 13371.3} {"step": 17708, "train_loss": 3.299398183822632, "lr": 0.00018291889655465147, "tps": 86763, "wall": 13376.3} {"step": 17709, "train_loss": 3.3085250854492188, "lr": 0.00018290014969066367, "tps": 86735, "wall": 13381.4} {"step": 17710, "train_loss": 3.295705556869507, "lr": 0.00018288140324694498, "tps": 86707, "wall": 13386.5} {"step": 17711, "train_loss": 3.366152286529541, "lr": 0.0001828626572237078, "tps": 86679, "wall": 13391.5} {"step": 17712, "train_loss": 3.3711109161376953, "lr": 0.00018284391162116443, "tps": 86651, "wall": 13396.6} {"step": 17713, "train_loss": 3.3276686668395996, "lr": 0.00018282516643952724, "tps": 86623, "wall": 13401.7} {"step": 17714, "train_loss": 3.360186815261841, "lr": 0.0001828064216790086, "tps": 86595, "wall": 13406.8} {"step": 17715, "train_loss": 3.2436347007751465, "lr": 0.00018278767733982077, "tps": 86568, "wall": 13411.8} {"step": 17716, "train_loss": 3.3379197120666504, "lr": 0.00018276893342217618, "tps": 86541, "wall": 13416.7} {"step": 17717, "train_loss": 3.4464564323425293, "lr": 0.00018275018992628712, "tps": 86515, "wall": 13421.6} {"step": 17718, "train_loss": 3.345109462738037, "lr": 0.00018273144685236595, "tps": 86488, "wall": 13426.4} {"step": 17719, "train_loss": 3.242582321166992, "lr": 0.00018271270420062497, "tps": 86461, "wall": 13431.4} {"step": 17720, "train_loss": 3.3351330757141113, "lr": 0.00018269396197127642, "tps": 86435, "wall": 13436.2} {"step": 17721, "train_loss": 3.2385096549987793, "lr": 0.00018267522016453275, "tps": 86408, "wall": 13441.1} {"step": 17722, "train_loss": 3.287080764770508, "lr": 0.00018265647878060618, "tps": 86382, "wall": 13446.0} {"step": 17723, "train_loss": 3.3914027214050293, "lr": 0.00018263773781970906, "tps": 86356, "wall": 13450.8} {"step": 17724, "train_loss": 3.3301303386688232, "lr": 0.00018261899728205366, "tps": 86329, "wall": 13455.7} {"step": 17725, "train_loss": 3.334275245666504, "lr": 0.00018260025716785227, "tps": 86303, "wall": 13460.6} {"step": 17726, "train_loss": 3.257774829864502, "lr": 0.0001825815174773172, "tps": 86276, "wall": 13465.4} {"step": 17727, "train_loss": 3.3259735107421875, "lr": 0.0001825627782106607, "tps": 86250, "wall": 13470.3} {"step": 17728, "train_loss": 3.2887380123138428, "lr": 0.0001825440393680951, "tps": 86223, "wall": 13475.3} {"step": 17729, "train_loss": 3.2607357501983643, "lr": 0.00018252530094983266, "tps": 86197, "wall": 13480.1} {"step": 17730, "train_loss": 3.29301118850708, "lr": 0.00018250656295608564, "tps": 86170, "wall": 13485.0} {"step": 17731, "train_loss": 3.378998279571533, "lr": 0.00018248782538706623, "tps": 86143, "wall": 13490.1} {"step": 17732, "train_loss": 3.361205577850342, "lr": 0.00018246908824298683, "tps": 86116, "wall": 13495.0} {"step": 17733, "train_loss": 3.366891622543335, "lr": 0.00018245035152405966, "tps": 86090, "wall": 13499.9} {"step": 17734, "train_loss": 3.3135323524475098, "lr": 0.00018243161523049688, "tps": 86063, "wall": 13504.9} {"step": 17735, "train_loss": 3.3221654891967773, "lr": 0.0001824128793625108, "tps": 86037, "wall": 13509.8} {"step": 17736, "train_loss": 3.3257503509521484, "lr": 0.00018239414392031366, "tps": 86010, "wall": 13514.7} {"step": 17737, "train_loss": 3.3077034950256348, "lr": 0.00018237540890411768, "tps": 85983, "wall": 13519.7} {"step": 17738, "train_loss": 3.251652479171753, "lr": 0.00018235667431413513, "tps": 85957, "wall": 13524.6} {"step": 17739, "train_loss": 3.2382161617279053, "lr": 0.0001823379401505782, "tps": 85930, "wall": 13529.6} {"step": 17740, "train_loss": 3.3537373542785645, "lr": 0.00018231920641365913, "tps": 85904, "wall": 13534.5} {"step": 17741, "train_loss": 3.4158735275268555, "lr": 0.00018230047310359012, "tps": 85877, "wall": 13539.6} {"step": 17742, "train_loss": 3.3708105087280273, "lr": 0.00018228174022058338, "tps": 85849, "wall": 13544.6} {"step": 17743, "train_loss": 3.327631950378418, "lr": 0.00018226300776485118, "tps": 85821, "wall": 13549.8} {"step": 17744, "train_loss": 3.3586912155151367, "lr": 0.00018224427573660564, "tps": 85794, "wall": 13554.8} {"step": 17745, "train_loss": 3.271519184112549, "lr": 0.00018222554413605894, "tps": 85768, "wall": 13559.8} {"step": 17746, "train_loss": 3.3787412643432617, "lr": 0.00018220681296342338, "tps": 85741, "wall": 13564.7} {"step": 17747, "train_loss": 3.291718006134033, "lr": 0.00018218808221891108, "tps": 85715, "wall": 13569.6} {"step": 17748, "train_loss": 3.314547300338745, "lr": 0.00018216935190273418, "tps": 85689, "wall": 13574.6} {"step": 17749, "train_loss": 3.273172616958618, "lr": 0.00018215062201510493, "tps": 85663, "wall": 13579.5} {"step": 17750, "train_loss": 3.2139153480529785, "lr": 0.0001821318925562355, "tps": 85637, "wall": 13584.4} {"step": 17751, "train_loss": 3.2956881523132324, "lr": 0.00018211316352633806, "tps": 85611, "wall": 13589.3} {"step": 17752, "train_loss": 3.3004775047302246, "lr": 0.0001820944349256247, "tps": 85584, "wall": 13594.3} {"step": 17753, "train_loss": 3.2973389625549316, "lr": 0.0001820757067543077, "tps": 85558, "wall": 13599.2} {"step": 17754, "train_loss": 3.2527966499328613, "lr": 0.0001820569790125991, "tps": 85531, "wall": 13604.2} {"step": 17755, "train_loss": 3.339655876159668, "lr": 0.00018203825170071104, "tps": 85505, "wall": 13609.1} {"step": 17756, "train_loss": 3.39605712890625, "lr": 0.00018201952481885583, "tps": 85480, "wall": 13614.0} {"step": 17757, "train_loss": 3.2423465251922607, "lr": 0.00018200079836724542, "tps": 85453, "wall": 13618.9} {"step": 17758, "train_loss": 3.3801703453063965, "lr": 0.000181982072346092, "tps": 85427, "wall": 13623.8} {"step": 17759, "train_loss": 3.3225598335266113, "lr": 0.0001819633467556078, "tps": 85401, "wall": 13628.7} {"step": 17760, "train_loss": 3.276278495788574, "lr": 0.00018194462159600488, "tps": 85376, "wall": 13633.6} {"step": 17761, "train_loss": 3.3348031044006348, "lr": 0.00018192589686749525, "tps": 85350, "wall": 13638.5} {"step": 17762, "train_loss": 3.3558058738708496, "lr": 0.00018190717257029118, "tps": 85324, "wall": 13643.4} {"step": 17763, "train_loss": 3.1958000659942627, "lr": 0.00018188844870460473, "tps": 85298, "wall": 13648.3} {"step": 17764, "train_loss": 3.321524143218994, "lr": 0.00018186972527064796, "tps": 85272, "wall": 13653.2} {"step": 17765, "train_loss": 3.344294309616089, "lr": 0.000181851002268633, "tps": 85247, "wall": 13658.1} {"step": 17766, "train_loss": 3.319516658782959, "lr": 0.000181832279698772, "tps": 85221, "wall": 13663.0} {"step": 17767, "train_loss": 3.357154607772827, "lr": 0.00018181355756127695, "tps": 85194, "wall": 13668.0} {"step": 17768, "train_loss": 3.3082265853881836, "lr": 0.00018179483585635997, "tps": 85168, "wall": 13673.1} {"step": 17769, "train_loss": 3.2994322776794434, "lr": 0.0001817761145842332, "tps": 85141, "wall": 13678.1} {"step": 17770, "train_loss": 3.2572743892669678, "lr": 0.0001817573937451087, "tps": 85115, "wall": 13683.0} {"step": 17771, "train_loss": 3.4562313556671143, "lr": 0.00018173867333919844, "tps": 85090, "wall": 13687.9} {"step": 17772, "train_loss": 3.244354248046875, "lr": 0.00018171995336671462, "tps": 85064, "wall": 13692.7} {"step": 17773, "train_loss": 3.2321598529815674, "lr": 0.00018170123382786924, "tps": 85039, "wall": 13697.7} {"step": 17774, "train_loss": 3.2594730854034424, "lr": 0.00018168251472287428, "tps": 85013, "wall": 13702.6} {"step": 17775, "train_loss": 3.2416329383850098, "lr": 0.00018166379605194193, "tps": 84987, "wall": 13707.5} {"step": 17776, "train_loss": 3.255079984664917, "lr": 0.00018164507781528414, "tps": 84962, "wall": 13712.4} {"step": 17777, "train_loss": 3.348426342010498, "lr": 0.00018162636001311304, "tps": 84936, "wall": 13717.3} {"step": 17778, "train_loss": 3.3543145656585693, "lr": 0.00018160764264564053, "tps": 84911, "wall": 13722.1} {"step": 17779, "train_loss": 3.34433650970459, "lr": 0.00018158892571307873, "tps": 84885, "wall": 13727.1} {"step": 17780, "train_loss": 3.225966691970825, "lr": 0.00018157020921563972, "tps": 84860, "wall": 13731.9} {"step": 17781, "train_loss": 3.3626840114593506, "lr": 0.0001815514931535354, "tps": 84834, "wall": 13736.8} {"step": 17782, "train_loss": 3.3849680423736572, "lr": 0.0001815327775269779, "tps": 84809, "wall": 13741.7} {"step": 17783, "train_loss": 3.1979291439056396, "lr": 0.0001815140623361792, "tps": 84784, "wall": 13746.6} {"step": 17784, "train_loss": 3.3902626037597656, "lr": 0.00018149534758135123, "tps": 84758, "wall": 13751.5} {"step": 17785, "train_loss": 3.3707053661346436, "lr": 0.00018147663326270608, "tps": 84733, "wall": 13756.3} {"step": 17786, "train_loss": 3.453359603881836, "lr": 0.00018145791938045566, "tps": 84708, "wall": 13761.2} {"step": 17787, "train_loss": 3.2746517658233643, "lr": 0.00018143920593481205, "tps": 84683, "wall": 13766.1} {"step": 17788, "train_loss": 3.422842502593994, "lr": 0.0001814204929259872, "tps": 84657, "wall": 13770.9} {"step": 17789, "train_loss": 3.373246669769287, "lr": 0.00018140178035419305, "tps": 84632, "wall": 13775.9} {"step": 17790, "train_loss": 3.227787494659424, "lr": 0.00018138306821964165, "tps": 84607, "wall": 13780.7} {"step": 17791, "train_loss": 3.190833806991577, "lr": 0.00018136435652254496, "tps": 84582, "wall": 13785.6} {"step": 17792, "train_loss": 3.3702893257141113, "lr": 0.0001813456452631149, "tps": 84556, "wall": 13790.6} {"step": 17793, "train_loss": 3.380765438079834, "lr": 0.00018132693444156348, "tps": 84531, "wall": 13795.5} {"step": 17794, "train_loss": 3.332961082458496, "lr": 0.0001813082240581026, "tps": 84506, "wall": 13800.3} {"step": 17795, "train_loss": 3.286165714263916, "lr": 0.0001812895141129443, "tps": 84480, "wall": 13805.2} {"step": 17796, "train_loss": 3.3113245964050293, "lr": 0.00018127080460630048, "tps": 84455, "wall": 13810.1} {"step": 17797, "train_loss": 3.251687526702881, "lr": 0.00018125209553838305, "tps": 84430, "wall": 13815.0} {"step": 17798, "train_loss": 3.2555336952209473, "lr": 0.000181233386909404, "tps": 84405, "wall": 13819.9} {"step": 17799, "train_loss": 3.3220653533935547, "lr": 0.00018121467871957522, "tps": 84380, "wall": 13824.8} {"step": 17800, "train_loss": 3.328526496887207, "lr": 0.00018119597096910868, "tps": 84355, "wall": 13829.7} {"step": 17801, "train_loss": 3.2858119010925293, "lr": 0.00018117726365821625, "tps": 84330, "wall": 13834.6} {"step": 17802, "train_loss": 3.273695230484009, "lr": 0.0001811585567871099, "tps": 84304, "wall": 13839.5} {"step": 17803, "train_loss": 3.2386693954467773, "lr": 0.00018113985035600152, "tps": 84280, "wall": 13844.4} {"step": 17804, "train_loss": 3.2850639820098877, "lr": 0.00018112114436510298, "tps": 84254, "wall": 13849.3} {"step": 17805, "train_loss": 3.426363468170166, "lr": 0.0001811024388146263, "tps": 84229, "wall": 13854.2} {"step": 17806, "train_loss": 3.213888645172119, "lr": 0.00018108373370478328, "tps": 84204, "wall": 13859.1} {"step": 17807, "train_loss": 3.358333110809326, "lr": 0.00018106502903578577, "tps": 84179, "wall": 13864.0} {"step": 17808, "train_loss": 3.1895174980163574, "lr": 0.00018104632480784574, "tps": 84154, "wall": 13868.8} {"step": 17809, "train_loss": 3.3659415245056152, "lr": 0.00018102762102117508, "tps": 84129, "wall": 13873.7} {"step": 17810, "train_loss": 3.3523778915405273, "lr": 0.00018100891767598557, "tps": 84105, "wall": 13878.6} {"step": 17811, "train_loss": 3.2932486534118652, "lr": 0.0001809902147724892, "tps": 84080, "wall": 13883.5} {"step": 17812, "train_loss": 3.312103748321533, "lr": 0.00018097151231089785, "tps": 84055, "wall": 13888.4} {"step": 17813, "train_loss": 3.384322166442871, "lr": 0.00018095281029142322, "tps": 84030, "wall": 13893.3} {"step": 17814, "train_loss": 3.4377009868621826, "lr": 0.0001809341087142773, "tps": 84005, "wall": 13898.2} {"step": 17815, "train_loss": 3.230583429336548, "lr": 0.00018091540757967192, "tps": 83980, "wall": 13903.1} {"step": 17816, "train_loss": 3.351585865020752, "lr": 0.0001808967068878189, "tps": 83955, "wall": 13908.1} {"step": 17817, "train_loss": 3.268169641494751, "lr": 0.00018087800663893009, "tps": 83930, "wall": 13913.0} {"step": 17818, "train_loss": 3.3390915393829346, "lr": 0.0001808593068332174, "tps": 83905, "wall": 13917.9} {"step": 17819, "train_loss": 3.3401544094085693, "lr": 0.00018084060747089255, "tps": 83880, "wall": 13922.8} {"step": 17820, "train_loss": 3.2977635860443115, "lr": 0.0001808219085521674, "tps": 83855, "wall": 13927.7} {"step": 17821, "train_loss": 3.4428582191467285, "lr": 0.0001808032100772538, "tps": 83830, "wall": 13932.6} {"step": 17822, "train_loss": 3.342831611633301, "lr": 0.00018078451204636358, "tps": 83806, "wall": 13937.5} {"step": 17823, "train_loss": 3.361668109893799, "lr": 0.0001807658144597085, "tps": 83781, "wall": 13942.4} {"step": 17824, "train_loss": 3.2878689765930176, "lr": 0.00018074711731750042, "tps": 83756, "wall": 13947.3} {"step": 17825, "train_loss": 3.2277979850769043, "lr": 0.0001807284206199511, "tps": 83731, "wall": 13952.2} {"step": 17826, "train_loss": 3.335829257965088, "lr": 0.00018070972436727242, "tps": 83707, "wall": 13957.1} {"step": 17827, "train_loss": 3.3197860717773438, "lr": 0.000180691028559676, "tps": 83682, "wall": 13962.0} {"step": 17828, "train_loss": 3.287202835083008, "lr": 0.00018067233319737377, "tps": 83657, "wall": 13967.0} {"step": 17829, "train_loss": 3.384096145629883, "lr": 0.00018065363828057755, "tps": 83632, "wall": 13971.9} {"step": 17830, "train_loss": 3.3168342113494873, "lr": 0.00018063494380949897, "tps": 83608, "wall": 13976.8} {"step": 17831, "train_loss": 3.3458023071289062, "lr": 0.0001806162497843499, "tps": 83583, "wall": 13981.7} {"step": 17832, "train_loss": 3.349278450012207, "lr": 0.0001805975562053421, "tps": 83559, "wall": 13986.5} {"step": 17833, "train_loss": 3.2429416179656982, "lr": 0.00018057886307268727, "tps": 83534, "wall": 13991.5} {"step": 17834, "train_loss": 3.351734161376953, "lr": 0.00018056017038659724, "tps": 83508, "wall": 13996.6} {"step": 17835, "train_loss": 3.3878989219665527, "lr": 0.00018054147814728375, "tps": 83484, "wall": 14001.5} {"step": 17836, "train_loss": 3.4179234504699707, "lr": 0.00018052278635495852, "tps": 83459, "wall": 14006.4} {"step": 17837, "train_loss": 3.3058347702026367, "lr": 0.00018050409500983326, "tps": 83434, "wall": 14011.3} {"step": 17838, "train_loss": 3.3188881874084473, "lr": 0.00018048540411211978, "tps": 83409, "wall": 14016.3} {"step": 17839, "train_loss": 3.3376944065093994, "lr": 0.0001804667136620298, "tps": 83384, "wall": 14021.3} {"step": 17840, "train_loss": 3.3285810947418213, "lr": 0.00018044802365977503, "tps": 83359, "wall": 14026.3} {"step": 17841, "train_loss": 3.2838544845581055, "lr": 0.00018042933410556712, "tps": 83335, "wall": 14031.2} {"step": 17842, "train_loss": 3.478041648864746, "lr": 0.00018041064499961794, "tps": 83310, "wall": 14036.2} {"step": 17843, "train_loss": 3.2580742835998535, "lr": 0.00018039195634213907, "tps": 83285, "wall": 14041.2} {"step": 17844, "train_loss": 3.3043150901794434, "lr": 0.00018037326813334222, "tps": 83260, "wall": 14046.2} {"step": 17845, "train_loss": 3.2915704250335693, "lr": 0.00018035458037343922, "tps": 83235, "wall": 14051.2} {"step": 17846, "train_loss": 3.3333842754364014, "lr": 0.00018033589306264163, "tps": 83211, "wall": 14056.1} {"step": 17847, "train_loss": 3.331547737121582, "lr": 0.0001803172062011612, "tps": 83185, "wall": 14061.1} {"step": 17848, "train_loss": 3.3277909755706787, "lr": 0.00018029851978920957, "tps": 83160, "wall": 14066.1} {"step": 17849, "train_loss": 3.3634121417999268, "lr": 0.0001802798338269985, "tps": 83136, "wall": 14071.1} {"step": 17850, "train_loss": 3.2803525924682617, "lr": 0.00018026114831473967, "tps": 83111, "wall": 14076.1} {"step": 17851, "train_loss": 3.317807674407959, "lr": 0.00018024246325264458, "tps": 83087, "wall": 14081.0} {"step": 17852, "train_loss": 3.318629026412964, "lr": 0.0001802237786409251, "tps": 83062, "wall": 14085.9} {"step": 17853, "train_loss": 3.302114486694336, "lr": 0.0001802050944797928, "tps": 83038, "wall": 14090.9} {"step": 17854, "train_loss": 3.306939125061035, "lr": 0.0001801864107694593, "tps": 83013, "wall": 14095.9} {"step": 17855, "train_loss": 3.29032826423645, "lr": 0.0001801677275101363, "tps": 82988, "wall": 14100.8} {"step": 17856, "train_loss": 3.3023133277893066, "lr": 0.00018014904470203548, "tps": 82963, "wall": 14105.9} {"step": 17857, "train_loss": 3.287562370300293, "lr": 0.00018013036234536842, "tps": 82938, "wall": 14111.0} {"step": 17858, "train_loss": 3.287977695465088, "lr": 0.00018011168044034675, "tps": 82913, "wall": 14115.9} {"step": 17859, "train_loss": 3.287797451019287, "lr": 0.0001800929989871822, "tps": 82889, "wall": 14120.9} {"step": 17860, "train_loss": 3.2802681922912598, "lr": 0.0001800743179860862, "tps": 82864, "wall": 14125.9} {"step": 17861, "train_loss": 3.355025291442871, "lr": 0.00018005563743727057, "tps": 82839, "wall": 14131.0} {"step": 17862, "train_loss": 3.3712925910949707, "lr": 0.0001800369573409468, "tps": 82815, "wall": 14135.9} {"step": 17863, "train_loss": 3.2282471656799316, "lr": 0.00018001827769732653, "tps": 82791, "wall": 14140.8} {"step": 17864, "train_loss": 3.3285489082336426, "lr": 0.0001799995985066214, "tps": 82766, "wall": 14145.9} {"step": 17865, "train_loss": 3.2828054428100586, "lr": 0.00017998091976904296, "tps": 82741, "wall": 14150.9} {"step": 17866, "train_loss": 3.29996919631958, "lr": 0.00017996224148480287, "tps": 82716, "wall": 14155.9} {"step": 17867, "train_loss": 3.3634815216064453, "lr": 0.00017994356365411265, "tps": 82692, "wall": 14160.8} {"step": 17868, "train_loss": 3.386781692504883, "lr": 0.0001799248862771839, "tps": 82668, "wall": 14165.8} {"step": 17869, "train_loss": 3.262270450592041, "lr": 0.00017990620935422823, "tps": 82644, "wall": 14170.7} {"step": 17870, "train_loss": 3.274503231048584, "lr": 0.00017988753288545714, "tps": 82620, "wall": 14175.6} {"step": 17871, "train_loss": 3.291318655014038, "lr": 0.00017986885687108227, "tps": 82596, "wall": 14180.5} {"step": 17872, "train_loss": 3.4056060314178467, "lr": 0.0001798501813113152, "tps": 82572, "wall": 14185.5} {"step": 17873, "train_loss": 3.2945761680603027, "lr": 0.00017983150620636738, "tps": 82547, "wall": 14190.4} {"step": 17874, "train_loss": 3.3486075401306152, "lr": 0.0001798128315564505, "tps": 82523, "wall": 14195.5} {"step": 17875, "train_loss": 3.3068807125091553, "lr": 0.00017979415736177597, "tps": 82499, "wall": 14200.4} {"step": 17876, "train_loss": 3.260573387145996, "lr": 0.00017977548362255546, "tps": 82474, "wall": 14205.4} {"step": 17877, "train_loss": 3.2603816986083984, "lr": 0.00017975681033900043, "tps": 82450, "wall": 14210.4} {"step": 17878, "train_loss": 3.325204372406006, "lr": 0.00017973813751132238, "tps": 82426, "wall": 14215.3} {"step": 17879, "train_loss": 3.406965732574463, "lr": 0.00017971946513973297, "tps": 82402, "wall": 14220.2} {"step": 17880, "train_loss": 3.2699904441833496, "lr": 0.00017970079322444363, "tps": 82378, "wall": 14225.2} {"step": 17881, "train_loss": 3.319444179534912, "lr": 0.00017968212176566582, "tps": 82354, "wall": 14230.1} {"step": 17882, "train_loss": 3.470282793045044, "lr": 0.0001796634507636111, "tps": 82331, "wall": 14234.9} {"step": 17883, "train_loss": 3.355616569519043, "lr": 0.00017964478021849107, "tps": 82307, "wall": 14239.8} {"step": 17884, "train_loss": 3.363924503326416, "lr": 0.00017962611013051712, "tps": 82284, "wall": 14244.7} {"step": 17885, "train_loss": 3.327415943145752, "lr": 0.00017960744049990077, "tps": 82260, "wall": 14249.6} {"step": 17886, "train_loss": 3.296895742416382, "lr": 0.00017958877132685355, "tps": 82237, "wall": 14254.4} {"step": 17887, "train_loss": 3.3072946071624756, "lr": 0.0001795701026115869, "tps": 82213, "wall": 14259.3} {"step": 17888, "train_loss": 3.336068868637085, "lr": 0.00017955143435431227, "tps": 82189, "wall": 14264.2} {"step": 17889, "train_loss": 3.3581008911132812, "lr": 0.00017953276655524128, "tps": 82165, "wall": 14269.2} {"step": 17890, "train_loss": 3.256627082824707, "lr": 0.00017951409921458523, "tps": 82142, "wall": 14274.1} {"step": 17891, "train_loss": 3.2808985710144043, "lr": 0.00017949543233255564, "tps": 82118, "wall": 14279.0} {"step": 17892, "train_loss": 3.385734796524048, "lr": 0.000179476765909364, "tps": 82094, "wall": 14283.9} {"step": 17893, "train_loss": 3.3732941150665283, "lr": 0.0001794580999452218, "tps": 82071, "wall": 14288.8} {"step": 17894, "train_loss": 3.3357901573181152, "lr": 0.00017943943444034032, "tps": 82047, "wall": 14293.7} {"step": 17895, "train_loss": 3.2449684143066406, "lr": 0.0001794207693949312, "tps": 82024, "wall": 14298.6} {"step": 17896, "train_loss": 3.2877166271209717, "lr": 0.00017940210480920583, "tps": 82000, "wall": 14303.5} {"step": 17897, "train_loss": 3.329103946685791, "lr": 0.00017938344068337556, "tps": 81976, "wall": 14308.5} {"step": 17898, "train_loss": 3.3656492233276367, "lr": 0.0001793647770176519, "tps": 81953, "wall": 14313.4} {"step": 17899, "train_loss": 3.2926104068756104, "lr": 0.0001793461138122462, "tps": 81929, "wall": 14318.3} {"step": 17900, "train_loss": 3.3933205604553223, "lr": 0.00017932745106736996, "tps": 81905, "wall": 14323.3} {"step": 17901, "train_loss": 3.325582504272461, "lr": 0.0001793087887832346, "tps": 81882, "wall": 14328.2} {"step": 17902, "train_loss": 3.354387044906616, "lr": 0.00017929012696005136, "tps": 81858, "wall": 14333.2} {"step": 17903, "train_loss": 3.316340446472168, "lr": 0.00017927146559803186, "tps": 81834, "wall": 14338.2} {"step": 17904, "train_loss": 3.357548952102661, "lr": 0.00017925280469738736, "tps": 81810, "wall": 14343.2} {"step": 17905, "train_loss": 3.2968645095825195, "lr": 0.0001792341442583293, "tps": 81786, "wall": 14348.2} {"step": 17906, "train_loss": 3.2634530067443848, "lr": 0.00017921548428106912, "tps": 81762, "wall": 14353.2} {"step": 17907, "train_loss": 3.359647274017334, "lr": 0.00017919682476581804, "tps": 81738, "wall": 14358.1} {"step": 17908, "train_loss": 3.312685489654541, "lr": 0.0001791781657127876, "tps": 81714, "wall": 14363.2} {"step": 17909, "train_loss": 3.1953444480895996, "lr": 0.00017915950712218907, "tps": 81690, "wall": 14368.2} {"step": 17910, "train_loss": 3.405277729034424, "lr": 0.00017914084899423393, "tps": 81667, "wall": 14373.2} {"step": 17911, "train_loss": 3.2433769702911377, "lr": 0.0001791221913291334, "tps": 81643, "wall": 14378.1} {"step": 17912, "train_loss": 3.2844276428222656, "lr": 0.00017910353412709887, "tps": 81619, "wall": 14383.2} {"step": 17913, "train_loss": 3.479302406311035, "lr": 0.00017908487738834178, "tps": 81595, "wall": 14388.2} {"step": 17914, "train_loss": 3.2835397720336914, "lr": 0.00017906622111307335, "tps": 81571, "wall": 14393.2} {"step": 17915, "train_loss": 3.2785322666168213, "lr": 0.00017904756530150504, "tps": 81548, "wall": 14398.1} {"step": 17916, "train_loss": 3.284095287322998, "lr": 0.00017902890995384816, "tps": 81524, "wall": 14403.1} {"step": 17917, "train_loss": 3.357332468032837, "lr": 0.0001790102550703139, "tps": 81501, "wall": 14408.0} {"step": 17918, "train_loss": 3.333519458770752, "lr": 0.00017899160065111373, "tps": 81477, "wall": 14413.0} {"step": 17919, "train_loss": 3.252472400665283, "lr": 0.00017897294669645892, "tps": 81454, "wall": 14418.0} {"step": 17920, "train_loss": 3.3035645484924316, "lr": 0.00017895429320656083, "tps": 81430, "wall": 14423.0} {"step": 17921, "train_loss": 3.2118301391601562, "lr": 0.00017893564018163068, "tps": 81406, "wall": 14428.0} {"step": 17922, "train_loss": 3.4082131385803223, "lr": 0.00017891698762187983, "tps": 81382, "wall": 14433.0} {"step": 17923, "train_loss": 3.314072608947754, "lr": 0.0001788983355275196, "tps": 81357, "wall": 14438.3} {"step": 17924, "train_loss": 3.357382297515869, "lr": 0.00017887968389876125, "tps": 81333, "wall": 14443.4} {"step": 17925, "train_loss": 3.2177858352661133, "lr": 0.000178861032735816, "tps": 81309, "wall": 14448.5} {"step": 17926, "train_loss": 3.3582382202148438, "lr": 0.00017884238203889528, "tps": 81285, "wall": 14453.6} {"step": 17927, "train_loss": 3.3269481658935547, "lr": 0.00017882373180821021, "tps": 81261, "wall": 14458.7} {"step": 17928, "train_loss": 3.327378988265991, "lr": 0.00017880508204397213, "tps": 81237, "wall": 14463.8} {"step": 17929, "train_loss": 3.4111974239349365, "lr": 0.00017878643274639236, "tps": 81213, "wall": 14468.9} {"step": 17930, "train_loss": 3.342728614807129, "lr": 0.0001787677839156821, "tps": 81189, "wall": 14473.9} {"step": 17931, "train_loss": 3.3309290409088135, "lr": 0.00017874913555205262, "tps": 81165, "wall": 14479.0} {"step": 17932, "train_loss": 3.306778907775879, "lr": 0.00017873048765571512, "tps": 81141, "wall": 14484.0} {"step": 17933, "train_loss": 3.356330156326294, "lr": 0.00017871184022688095, "tps": 81117, "wall": 14489.1} {"step": 17934, "train_loss": 3.331493616104126, "lr": 0.00017869319326576126, "tps": 81093, "wall": 14494.2} {"step": 17935, "train_loss": 3.243015766143799, "lr": 0.00017867454677256728, "tps": 81069, "wall": 14499.2} {"step": 17936, "train_loss": 3.2691359519958496, "lr": 0.00017865590074751027, "tps": 81045, "wall": 14504.4} {"step": 17937, "train_loss": 3.295889377593994, "lr": 0.0001786372551908015, "tps": 81020, "wall": 14509.7} {"step": 17938, "train_loss": 3.302553415298462, "lr": 0.00017861861010265212, "tps": 80996, "wall": 14514.8} {"step": 17939, "train_loss": 3.304875135421753, "lr": 0.00017859996548327337, "tps": 80972, "wall": 14519.9} {"step": 17940, "train_loss": 3.3485419750213623, "lr": 0.00017858132133287646, "tps": 80948, "wall": 14525.0} {"step": 17941, "train_loss": 3.302725076675415, "lr": 0.00017856267765167254, "tps": 80924, "wall": 14530.1} {"step": 17942, "train_loss": 3.301528215408325, "lr": 0.00017854403443987287, "tps": 80900, "wall": 14535.3} {"step": 17943, "train_loss": 3.271444320678711, "lr": 0.00017852539169768865, "tps": 80876, "wall": 14540.4} {"step": 17944, "train_loss": 3.3675856590270996, "lr": 0.000178506749425331, "tps": 80852, "wall": 14545.5} {"step": 17945, "train_loss": 3.2948453426361084, "lr": 0.00017848810762301115, "tps": 80828, "wall": 14550.7} {"step": 17946, "train_loss": 3.3950588703155518, "lr": 0.00017846946629094027, "tps": 80804, "wall": 14555.8} {"step": 17947, "train_loss": 3.316248893737793, "lr": 0.00017845082542932952, "tps": 80780, "wall": 14560.9} {"step": 17948, "train_loss": 3.229104995727539, "lr": 0.00017843218503839006, "tps": 80757, "wall": 14566.0} {"step": 17949, "train_loss": 3.333510160446167, "lr": 0.00017841354511833303, "tps": 80732, "wall": 14571.2} {"step": 17950, "train_loss": 3.323476552963257, "lr": 0.00017839490566936967, "tps": 80709, "wall": 14576.3} {"step": 17951, "train_loss": 3.3072290420532227, "lr": 0.00017837626669171103, "tps": 80685, "wall": 14581.3} {"step": 17952, "train_loss": 3.332879066467285, "lr": 0.00017835762818556837, "tps": 80662, "wall": 14586.4} {"step": 17953, "train_loss": 3.345458507537842, "lr": 0.0001783389901511527, "tps": 80638, "wall": 14591.5} {"step": 17954, "train_loss": 3.350379467010498, "lr": 0.00017832035258867515, "tps": 80615, "wall": 14596.5} {"step": 17955, "train_loss": 3.272325038909912, "lr": 0.00017830171549834697, "tps": 80591, "wall": 14601.6} {"step": 17956, "train_loss": 3.296978235244751, "lr": 0.00017828307888037917, "tps": 80568, "wall": 14606.6} {"step": 17957, "train_loss": 3.2569518089294434, "lr": 0.00017826444273498292, "tps": 80544, "wall": 14611.7} {"step": 17958, "train_loss": 3.305870532989502, "lr": 0.00017824580706236933, "tps": 80521, "wall": 14616.7} {"step": 17959, "train_loss": 3.378573417663574, "lr": 0.00017822717186274947, "tps": 80498, "wall": 14621.7} {"step": 17960, "train_loss": 3.3583924770355225, "lr": 0.0001782085371363345, "tps": 80473, "wall": 14627.1} {"step": 17961, "train_loss": 3.4382164478302, "lr": 0.00017818990288333546, "tps": 80449, "wall": 14632.2} {"step": 17962, "train_loss": 3.3247714042663574, "lr": 0.00017817126910396348, "tps": 80426, "wall": 14637.3} {"step": 17963, "train_loss": 3.2694711685180664, "lr": 0.0001781526357984296, "tps": 80402, "wall": 14642.4} {"step": 17964, "train_loss": 3.359928607940674, "lr": 0.00017813400296694493, "tps": 80379, "wall": 14647.5} {"step": 17965, "train_loss": 3.3318188190460205, "lr": 0.00017811537060972058, "tps": 80355, "wall": 14652.6} {"step": 17966, "train_loss": 3.3059558868408203, "lr": 0.00017809673872696755, "tps": 80331, "wall": 14657.8} {"step": 17967, "train_loss": 3.272449016571045, "lr": 0.0001780781073188969, "tps": 80306, "wall": 14663.1} {"step": 17968, "train_loss": 3.3268980979919434, "lr": 0.00017805947638571977, "tps": 80283, "wall": 14668.2} {"step": 17969, "train_loss": 3.2277016639709473, "lr": 0.00017804084592764713, "tps": 80261, "wall": 14673.2} {"step": 17970, "train_loss": 3.335867166519165, "lr": 0.00017802221594489005, "tps": 80238, "wall": 14678.1} {"step": 17971, "train_loss": 3.3260598182678223, "lr": 0.0001780035864376596, "tps": 80215, "wall": 14683.0} {"step": 17972, "train_loss": 3.4638547897338867, "lr": 0.0001779849574061668, "tps": 80193, "wall": 14688.0} {"step": 17973, "train_loss": 3.2047529220581055, "lr": 0.00017796632885062262, "tps": 80170, "wall": 14693.0} {"step": 17974, "train_loss": 3.304051399230957, "lr": 0.00017794770077123818, "tps": 80147, "wall": 14698.1} {"step": 17975, "train_loss": 3.4406955242156982, "lr": 0.0001779290731682245, "tps": 80125, "wall": 14703.0} {"step": 17976, "train_loss": 3.269289970397949, "lr": 0.0001779104460417925, "tps": 80102, "wall": 14707.8} {"step": 17977, "train_loss": 3.354506015777588, "lr": 0.00017789181939215326, "tps": 80080, "wall": 14712.8} {"step": 17978, "train_loss": 3.2761621475219727, "lr": 0.0001778731932195178, "tps": 80058, "wall": 14717.7} {"step": 17979, "train_loss": 3.219346046447754, "lr": 0.00017785456752409705, "tps": 80035, "wall": 14722.6} {"step": 17980, "train_loss": 3.3261613845825195, "lr": 0.00017783594230610207, "tps": 80012, "wall": 14727.7} {"step": 17981, "train_loss": 3.397906541824341, "lr": 0.00017781731756574373, "tps": 79990, "wall": 14732.7} {"step": 17982, "train_loss": 3.3867053985595703, "lr": 0.00017779869330323322, "tps": 79967, "wall": 14737.7} {"step": 17983, "train_loss": 3.2960562705993652, "lr": 0.00017778006951878132, "tps": 79943, "wall": 14742.8} {"step": 17984, "train_loss": 3.3073558807373047, "lr": 0.00017776144621259906, "tps": 79920, "wall": 14748.0} {"step": 17985, "train_loss": 3.2970995903015137, "lr": 0.0001777428233848975, "tps": 79897, "wall": 14753.1} {"step": 17986, "train_loss": 3.4160079956054688, "lr": 0.00017772420103588746, "tps": 79873, "wall": 14758.2} {"step": 17987, "train_loss": 3.322699546813965, "lr": 0.00017770557916577996, "tps": 79850, "wall": 14763.3} {"step": 17988, "train_loss": 3.3408823013305664, "lr": 0.00017768695777478595, "tps": 79827, "wall": 14768.4} {"step": 17989, "train_loss": 3.323561429977417, "lr": 0.00017766833686311642, "tps": 79804, "wall": 14773.5} {"step": 17990, "train_loss": 3.301438331604004, "lr": 0.00017764971643098224, "tps": 79781, "wall": 14778.7} {"step": 17991, "train_loss": 3.353452682495117, "lr": 0.00017763109647859433, "tps": 79757, "wall": 14783.8} {"step": 17992, "train_loss": 3.390976905822754, "lr": 0.00017761247700616371, "tps": 79734, "wall": 14788.9} {"step": 17993, "train_loss": 3.372107982635498, "lr": 0.0001775938580139012, "tps": 79711, "wall": 14794.0} {"step": 17994, "train_loss": 3.278911590576172, "lr": 0.00017757523950201774, "tps": 79688, "wall": 14799.1} {"step": 17995, "train_loss": 3.3036882877349854, "lr": 0.00017755662147072432, "tps": 79665, "wall": 14804.3} {"step": 17996, "train_loss": 3.253645420074463, "lr": 0.0001775380039202317, "tps": 79641, "wall": 14809.5} {"step": 17997, "train_loss": 3.2270665168762207, "lr": 0.00017751938685075093, "tps": 79618, "wall": 14814.6} {"step": 17998, "train_loss": 3.244455575942993, "lr": 0.00017750077026249284, "tps": 79595, "wall": 14819.8} {"step": 17999, "train_loss": 3.311178207397461, "lr": 0.00017748215415566834, "tps": 79572, "wall": 14824.9} {"step": 18000, "train_loss": 3.350543975830078, "lr": 0.00017746353853048826, "tps": 79548, "wall": 14830.1, "val_loss_monitor": 3.378465178557038} {"step": 18001, "train_loss": 3.321077585220337, "lr": 0.00017744492338716352, "tps": 79267, "wall": 14883.5} {"step": 18002, "train_loss": 3.308014392852783, "lr": 0.00017742630872590503, "tps": 79245, "wall": 14888.5} {"step": 18001, "train_loss": 3.226193904876709, "lr": 0.00017744492338716352, "tps": 246411395, "wall": 4.8} {"step": 18002, "train_loss": 3.248103618621826, "lr": 0.00017742630872590503, "tps": 131032419, "wall": 9.0} {"step": 18003, "train_loss": 3.230915069580078, "lr": 0.00017740769454692359, "tps": 88047056, "wall": 13.4} {"step": 18004, "train_loss": 3.3177685737609863, "lr": 0.00017738908085043008, "tps": 66078497, "wall": 17.9} {"step": 18005, "train_loss": 3.190268039703369, "lr": 0.0001773704676366354, "tps": 52646102, "wall": 22.4} {"step": 18006, "train_loss": 3.224151372909546, "lr": 0.00017735185490575038, "tps": 43693036, "wall": 27.0} {"step": 18007, "train_loss": 3.19891619682312, "lr": 0.0001773332426579858, "tps": 37286544, "wall": 31.7} {"step": 18008, "train_loss": 3.308614730834961, "lr": 0.00017731463089355255, "tps": 32498748, "wall": 36.3} {"step": 18009, "train_loss": 3.287865161895752, "lr": 0.00017729601961266153, "tps": 28828728, "wall": 40.9} {"step": 18010, "train_loss": 3.305459499359131, "lr": 0.00017727740881552347, "tps": 25861051, "wall": 45.6} {"step": 18011, "train_loss": 3.2003445625305176, "lr": 0.00017725879850234922, "tps": 23498842, "wall": 50.2} {"step": 18012, "train_loss": 3.292206287384033, "lr": 0.00017724018867334968, "tps": 21513015, "wall": 54.9} {"step": 18013, "train_loss": 3.1638782024383545, "lr": 0.00017722157932873557, "tps": 19836598, "wall": 59.5} {"step": 18014, "train_loss": 3.1987648010253906, "lr": 0.0001772029704687177, "tps": 18402641, "wall": 64.2} {"step": 18015, "train_loss": 3.379470109939575, "lr": 0.0001771843620935069, "tps": 17164832, "wall": 68.8} {"step": 18016, "train_loss": 3.272494316101074, "lr": 0.00017716575420331397, "tps": 16071313, "wall": 73.5} {"step": 18017, "train_loss": 3.190858840942383, "lr": 0.00017714714679834966, "tps": 15103024, "wall": 78.2} {"step": 18018, "train_loss": 3.311927318572998, "lr": 0.0001771285398788248, "tps": 14253690, "wall": 82.8} {"step": 18019, "train_loss": 3.2840776443481445, "lr": 0.00017710993344495024, "tps": 13492736, "wall": 87.5} {"step": 18020, "train_loss": 3.2735724449157715, "lr": 0.00017709132749693657, "tps": 12808882, "wall": 92.2} {"step": 18021, "train_loss": 3.3358681201934814, "lr": 0.00017707272203499472, "tps": 12186745, "wall": 96.9} {"step": 18022, "train_loss": 3.328828811645508, "lr": 0.0001770541170593354, "tps": 11615115, "wall": 101.7} {"step": 18023, "train_loss": 3.2310051918029785, "lr": 0.0001770355125701693, "tps": 11088859, "wall": 106.5} {"step": 18024, "train_loss": 3.1767568588256836, "lr": 0.00017701690856770732, "tps": 10606349, "wall": 111.4} {"step": 18025, "train_loss": 3.2351696491241455, "lr": 0.00017699830505216006, "tps": 10169927, "wall": 116.2} {"step": 18026, "train_loss": 3.1140756607055664, "lr": 0.0001769797020237384, "tps": 9770887, "wall": 120.9} {"step": 18027, "train_loss": 3.231722831726074, "lr": 0.00017696109948265294, "tps": 9403835, "wall": 125.6} {"step": 18028, "train_loss": 3.3193087577819824, "lr": 0.0001769424974291145, "tps": 9050773, "wall": 130.5} {"step": 18029, "train_loss": 3.233288049697876, "lr": 0.00017692389586333377, "tps": 8732741, "wall": 135.3} {"step": 18030, "train_loss": 3.273737668991089, "lr": 0.00017690529478552147, "tps": 8429053, "wall": 140.2} {"step": 18031, "train_loss": 3.227482318878174, "lr": 0.00017688669419588834, "tps": 8154451, "wall": 144.9} {"step": 18032, "train_loss": 3.2787911891937256, "lr": 0.00017686809409464508, "tps": 7891922, "wall": 149.7} {"step": 18033, "train_loss": 3.2579076290130615, "lr": 0.00017684949448200236, "tps": 7649665, "wall": 154.5} {"step": 18034, "train_loss": 3.1159515380859375, "lr": 0.0001768308953581709, "tps": 7422186, "wall": 159.2} {"step": 18035, "train_loss": 3.2801461219787598, "lr": 0.00017681229672336136, "tps": 7208564, "wall": 164.0} {"step": 18036, "train_loss": 3.233121156692505, "lr": 0.00017679369857778453, "tps": 7000433, "wall": 168.9} {"step": 18037, "train_loss": 3.277627944946289, "lr": 0.000176775100921651, "tps": 6808644, "wall": 173.6} {"step": 18038, "train_loss": 3.2340188026428223, "lr": 0.00017675650375517145, "tps": 6627894, "wall": 178.4} {"step": 18039, "train_loss": 3.198317766189575, "lr": 0.0001767379070785566, "tps": 6454455, "wall": 183.2} {"step": 18040, "train_loss": 3.220193862915039, "lr": 0.00017671931089201706, "tps": 6291332, "wall": 187.9} {"step": 18041, "train_loss": 3.211756944656372, "lr": 0.00017670071519576346, "tps": 6137561, "wall": 192.6} {"step": 18042, "train_loss": 3.3157334327697754, "lr": 0.0001766821199900065, "tps": 5991439, "wall": 197.4} {"step": 18043, "train_loss": 3.1270813941955566, "lr": 0.00017666352527495688, "tps": 5852124, "wall": 202.1} {"step": 18044, "train_loss": 3.304043769836426, "lr": 0.00017664493105082517, "tps": 5717529, "wall": 206.8} {"step": 18045, "train_loss": 3.1382832527160645, "lr": 0.00017662633731782204, "tps": 5589724, "wall": 211.6} {"step": 18046, "train_loss": 3.3338069915771484, "lr": 0.00017660774407615812, "tps": 5465792, "wall": 216.4} {"step": 18047, "train_loss": 3.093179702758789, "lr": 0.00017658915132604398, "tps": 5349068, "wall": 221.1} {"step": 18048, "train_loss": 3.2823328971862793, "lr": 0.0001765705590676903, "tps": 5235188, "wall": 225.9} {"step": 18049, "train_loss": 3.327353000640869, "lr": 0.0001765519673013077, "tps": 5128203, "wall": 230.7} {"step": 18050, "train_loss": 3.2409956455230713, "lr": 0.00017653337602710676, "tps": 5024658, "wall": 235.4} {"step": 18051, "train_loss": 3.139037847518921, "lr": 0.00017651478524529805, "tps": 4926003, "wall": 240.2} {"step": 18052, "train_loss": 3.2572624683380127, "lr": 0.00017649619495609223, "tps": 4830548, "wall": 244.9} {"step": 18053, "train_loss": 3.3022425174713135, "lr": 0.0001764776051596999, "tps": 4738433, "wall": 249.7} {"step": 18054, "train_loss": 3.2460029125213623, "lr": 0.00017645901585633156, "tps": 4649943, "wall": 254.5} {"step": 18055, "train_loss": 3.2185416221618652, "lr": 0.00017644042704619784, "tps": 4564238, "wall": 259.3} {"step": 18056, "train_loss": 3.1776504516601562, "lr": 0.00017642183872950939, "tps": 4481761, "wall": 264.0} {"step": 18057, "train_loss": 3.280336856842041, "lr": 0.00017640325090647666, "tps": 4402356, "wall": 268.8} {"step": 18058, "train_loss": 3.262389898300171, "lr": 0.00017638466357731023, "tps": 4325596, "wall": 273.6} {"step": 18059, "train_loss": 3.245455741882324, "lr": 0.00017636607674222074, "tps": 4251472, "wall": 278.4} {"step": 18060, "train_loss": 3.3629093170166016, "lr": 0.00017634749040141868, "tps": 4180281, "wall": 283.1} {"step": 18061, "train_loss": 3.2794992923736572, "lr": 0.0001763289045551146, "tps": 4110905, "wall": 287.9} {"step": 18062, "train_loss": 3.2420992851257324, "lr": 0.00017631031920351906, "tps": 4043976, "wall": 292.7} {"step": 18063, "train_loss": 3.301725149154663, "lr": 0.0001762917343468426, "tps": 3979435, "wall": 297.5} {"step": 18064, "train_loss": 3.2269787788391113, "lr": 0.0001762731499852957, "tps": 3916734, "wall": 302.3} {"step": 18065, "train_loss": 3.251997232437134, "lr": 0.00017625456611908895, "tps": 3855886, "wall": 307.1} {"step": 18066, "train_loss": 3.31038498878479, "lr": 0.00017623598274843288, "tps": 3796769, "wall": 311.9} {"step": 18067, "train_loss": 3.335564613342285, "lr": 0.00017621739987353787, "tps": 3739483, "wall": 316.6} {"step": 18068, "train_loss": 3.205066204071045, "lr": 0.0001761988174946146, "tps": 3683587, "wall": 321.5} {"step": 18069, "train_loss": 3.1530568599700928, "lr": 0.00017618023561187345, "tps": 3630034, "wall": 326.2} {"step": 18070, "train_loss": 3.3442153930664062, "lr": 0.00017616165422552503, "tps": 3577487, "wall": 331.0} {"step": 18071, "train_loss": 3.2616994380950928, "lr": 0.00017614307333577967, "tps": 3526587, "wall": 335.8} {"step": 18072, "train_loss": 3.2207674980163574, "lr": 0.00017612449294284797, "tps": 3477220, "wall": 340.6} {"step": 18073, "train_loss": 3.261913537979126, "lr": 0.00017610591304694046, "tps": 3428368, "wall": 345.5} {"step": 18074, "train_loss": 3.1842429637908936, "lr": 0.00017608733364826747, "tps": 3381903, "wall": 350.3} {"step": 18075, "train_loss": 3.2541122436523438, "lr": 0.00017606875474703956, "tps": 3336490, "wall": 355.1} {"step": 18076, "train_loss": 3.300276279449463, "lr": 0.00017605017634346722, "tps": 3292056, "wall": 359.9} {"step": 18077, "train_loss": 3.269888401031494, "lr": 0.00017603159843776077, "tps": 3248140, "wall": 364.8} {"step": 18078, "train_loss": 3.2714662551879883, "lr": 0.00017601302103013077, "tps": 3206243, "wall": 369.5} {"step": 18079, "train_loss": 3.3700037002563477, "lr": 0.00017599444412078768, "tps": 3165381, "wall": 374.3} {"step": 18080, "train_loss": 3.202807664871216, "lr": 0.00017597586770994194, "tps": 3125547, "wall": 379.1} {"step": 18081, "train_loss": 3.268446683883667, "lr": 0.00017595729179780388, "tps": 3086632, "wall": 383.9} {"step": 18082, "train_loss": 3.2286791801452637, "lr": 0.00017593871638458403, "tps": 3048078, "wall": 388.8} {"step": 18083, "train_loss": 3.2236523628234863, "lr": 0.00017592014147049283, "tps": 3010241, "wall": 393.7} {"step": 18084, "train_loss": 3.2216663360595703, "lr": 0.0001759015670557406, "tps": 2970746, "wall": 399.0} {"step": 18085, "train_loss": 3.3076934814453125, "lr": 0.00017588299314053783, "tps": 2932932, "wall": 404.1} {"step": 18086, "train_loss": 3.250147819519043, "lr": 0.0001758644197250949, "tps": 2897537, "wall": 409.1} {"step": 18087, "train_loss": 3.23276948928833, "lr": 0.0001758458468096222, "tps": 2864180, "wall": 413.9} {"step": 18088, "train_loss": 3.259207248687744, "lr": 0.0001758272743943301, "tps": 2831414, "wall": 418.7} {"step": 18089, "train_loss": 3.258439302444458, "lr": 0.00017580870247942905, "tps": 2799163, "wall": 423.5} {"step": 18090, "train_loss": 3.226104259490967, "lr": 0.00017579013106512945, "tps": 2767553, "wall": 428.4} {"step": 18091, "train_loss": 3.174069404602051, "lr": 0.0001757715601516416, "tps": 2736781, "wall": 433.2} {"step": 18092, "train_loss": 3.2950727939605713, "lr": 0.00017575298973917586, "tps": 2706695, "wall": 438.1} {"step": 18093, "train_loss": 3.2632932662963867, "lr": 0.00017573441982794274, "tps": 2677009, "wall": 443.0} {"step": 18094, "train_loss": 3.285956859588623, "lr": 0.00017571585041815246, "tps": 2648184, "wall": 447.8} {"step": 18095, "train_loss": 3.1846745014190674, "lr": 0.00017569728151001543, "tps": 2619762, "wall": 452.7} {"step": 18096, "train_loss": 3.240764856338501, "lr": 0.00017567871310374198, "tps": 2591899, "wall": 457.6} {"step": 18097, "train_loss": 3.238079309463501, "lr": 0.0001756601451995425, "tps": 2564650, "wall": 462.5} {"step": 18098, "train_loss": 3.299024820327759, "lr": 0.00017564157779762724, "tps": 2537471, "wall": 467.4} {"step": 18099, "train_loss": 3.311668872833252, "lr": 0.0001756230108982066, "tps": 2510382, "wall": 472.5} {"step": 18100, "train_loss": 3.2413668632507324, "lr": 0.00017560444450149095, "tps": 2482562, "wall": 477.8} {"step": 18101, "train_loss": 3.1271579265594482, "lr": 0.0001755858786076905, "tps": 2457055, "wall": 482.8} {"step": 18102, "train_loss": 3.1864049434661865, "lr": 0.00017556731321701565, "tps": 2432453, "wall": 487.7} {"step": 18103, "train_loss": 3.1852517127990723, "lr": 0.00017554874832967666, "tps": 2407141, "wall": 492.9} {"step": 18104, "train_loss": 3.156827926635742, "lr": 0.00017553018394588388, "tps": 2383541, "wall": 497.8} {"step": 18105, "train_loss": 3.2036194801330566, "lr": 0.00017551162006584754, "tps": 2359627, "wall": 502.9} {"step": 18106, "train_loss": 3.2877798080444336, "lr": 0.000175493056689778, "tps": 2336280, "wall": 507.9} {"step": 18107, "train_loss": 3.17112398147583, "lr": 0.00017547449381788552, "tps": 2312238, "wall": 513.2} {"step": 18108, "train_loss": 3.328244686126709, "lr": 0.00017545593145038035, "tps": 2289320, "wall": 518.4} {"step": 18109, "train_loss": 3.2202110290527344, "lr": 0.00017543736958747284, "tps": 2267403, "wall": 523.4} {"step": 18110, "train_loss": 3.2193589210510254, "lr": 0.00017541880822937323, "tps": 2245828, "wall": 528.5} {"step": 18111, "train_loss": 3.183169364929199, "lr": 0.00017540024737629171, "tps": 2224907, "wall": 533.5} {"step": 18112, "train_loss": 3.228195905685425, "lr": 0.00017538168702843865, "tps": 2204328, "wall": 538.5} {"step": 18113, "train_loss": 3.2428436279296875, "lr": 0.00017536312718602427, "tps": 2183838, "wall": 543.6} {"step": 18114, "train_loss": 3.2165753841400146, "lr": 0.00017534456784925876, "tps": 2162835, "wall": 548.9} {"step": 18115, "train_loss": 3.2339844703674316, "lr": 0.0001753260090183524, "tps": 2143090, "wall": 554.0} {"step": 18116, "train_loss": 3.2418551445007324, "lr": 0.00017530745069351542, "tps": 2123663, "wall": 559.1} {"step": 18117, "train_loss": 3.2455601692199707, "lr": 0.00017528889287495814, "tps": 2103450, "wall": 564.5} {"step": 18118, "train_loss": 3.1806674003601074, "lr": 0.0001752703355628906, "tps": 2084661, "wall": 569.6} {"step": 18119, "train_loss": 3.296125650405884, "lr": 0.00017525177875752314, "tps": 2066476, "wall": 574.7} {"step": 18120, "train_loss": 3.311326503753662, "lr": 0.00017523322245906604, "tps": 2048936, "wall": 579.6} {"step": 18121, "train_loss": 3.2263245582580566, "lr": 0.00017521466666772933, "tps": 2031477, "wall": 584.6} {"step": 18122, "train_loss": 3.2801966667175293, "lr": 0.0001751961113837233, "tps": 2014429, "wall": 589.6} {"step": 18123, "train_loss": 3.236416816711426, "lr": 0.00017517755660725816, "tps": 1997590, "wall": 594.6} {"step": 18124, "train_loss": 3.224801778793335, "lr": 0.0001751590023385441, "tps": 1981339, "wall": 599.5} {"step": 18125, "train_loss": 3.221731662750244, "lr": 0.0001751404485777913, "tps": 1965322, "wall": 604.4} {"step": 18126, "train_loss": 3.1754114627838135, "lr": 0.00017512189532520984, "tps": 1949548, "wall": 609.4} {"step": 18127, "train_loss": 3.2849137783050537, "lr": 0.00017510334258101008, "tps": 1934045, "wall": 614.3} {"step": 18128, "train_loss": 3.2618024349212646, "lr": 0.000175084790345402, "tps": 1918703, "wall": 619.2} {"step": 18129, "train_loss": 3.234792947769165, "lr": 0.0001750662386185959, "tps": 1903718, "wall": 624.1} {"step": 18130, "train_loss": 3.261876106262207, "lr": 0.00017504768740080184, "tps": 1888922, "wall": 629.1} {"step": 18131, "train_loss": 3.230888605117798, "lr": 0.00017502913669223, "tps": 1874389, "wall": 634.0} {"step": 18132, "train_loss": 3.335928440093994, "lr": 0.0001750105864930906, "tps": 1860032, "wall": 638.9} {"step": 18133, "train_loss": 3.1292190551757812, "lr": 0.00017499203680359363, "tps": 1845951, "wall": 643.8} {"step": 18134, "train_loss": 3.135402202606201, "lr": 0.00017497348762394936, "tps": 1831922, "wall": 648.8} {"step": 18135, "train_loss": 3.115161657333374, "lr": 0.00017495493895436788, "tps": 1818208, "wall": 653.7} {"step": 18136, "train_loss": 3.3779659271240234, "lr": 0.00017493639079505923, "tps": 1804795, "wall": 658.6} {"step": 18137, "train_loss": 3.2581143379211426, "lr": 0.0001749178431462336, "tps": 1791477, "wall": 663.5} {"step": 18138, "train_loss": 3.1528749465942383, "lr": 0.00017489929600810112, "tps": 1778384, "wall": 668.4} {"step": 18139, "train_loss": 3.3669040203094482, "lr": 0.0001748807493808718, "tps": 1765530, "wall": 673.4} {"step": 18140, "train_loss": 3.1472229957580566, "lr": 0.00017486220326475577, "tps": 1752863, "wall": 678.3} {"step": 18141, "train_loss": 3.26188063621521, "lr": 0.0001748436576599632, "tps": 1740370, "wall": 683.2} {"step": 18142, "train_loss": 3.2083890438079834, "lr": 0.00017482511256670412, "tps": 1728090, "wall": 688.1} {"step": 18143, "train_loss": 3.3009326457977295, "lr": 0.0001748065679851886, "tps": 1715933, "wall": 693.0} {"step": 18144, "train_loss": 3.3664278984069824, "lr": 0.00017478802391562666, "tps": 1703925, "wall": 697.9} {"step": 18145, "train_loss": 3.2606992721557617, "lr": 0.00017476948035822853, "tps": 1692194, "wall": 702.8} {"step": 18146, "train_loss": 3.1559877395629883, "lr": 0.0001747509373132041, "tps": 1680482, "wall": 707.7} {"step": 18147, "train_loss": 3.2206268310546875, "lr": 0.00017473239478076353, "tps": 1669038, "wall": 712.6} {"step": 18148, "train_loss": 3.2607808113098145, "lr": 0.00017471385276111683, "tps": 1657748, "wall": 717.5} {"step": 18149, "train_loss": 3.2488937377929688, "lr": 0.00017469531125447407, "tps": 1646632, "wall": 722.4} {"step": 18150, "train_loss": 3.0979716777801514, "lr": 0.0001746767702610453, "tps": 1635280, "wall": 727.4} {"step": 18151, "train_loss": 3.210510730743408, "lr": 0.0001746582297810405, "tps": 1624341, "wall": 732.4} {"step": 18152, "train_loss": 3.252601146697998, "lr": 0.0001746396898146697, "tps": 1613462, "wall": 737.3} {"step": 18153, "train_loss": 3.3013579845428467, "lr": 0.00017462115036214298, "tps": 1602685, "wall": 742.3} {"step": 18154, "train_loss": 3.238525390625, "lr": 0.00017460261142367029, "tps": 1592032, "wall": 747.4} {"step": 18155, "train_loss": 3.1576528549194336, "lr": 0.00017458407299946176, "tps": 1581685, "wall": 752.3} {"step": 18156, "train_loss": 3.22760272026062, "lr": 0.00017456553508972723, "tps": 1571352, "wall": 757.3} {"step": 18157, "train_loss": 3.208169460296631, "lr": 0.0001745469976946768, "tps": 1561151, "wall": 762.3} {"step": 18158, "train_loss": 3.276970148086548, "lr": 0.00017452846081452038, "tps": 1551122, "wall": 767.2} {"step": 18159, "train_loss": 3.178212881088257, "lr": 0.0001745099244494681, "tps": 1541216, "wall": 772.2} {"step": 18160, "train_loss": 3.2560245990753174, "lr": 0.00017449138859972982, "tps": 1531331, "wall": 777.2} {"step": 18161, "train_loss": 3.3647165298461914, "lr": 0.00017447285326551554, "tps": 1521671, "wall": 782.2} {"step": 18162, "train_loss": 3.151738405227661, "lr": 0.0001744543184470353, "tps": 1512186, "wall": 787.2} {"step": 18163, "train_loss": 3.249903678894043, "lr": 0.00017443578414449897, "tps": 1502913, "wall": 792.1} {"step": 18164, "train_loss": 3.175119400024414, "lr": 0.00017441725035811652, "tps": 1493774, "wall": 796.9} {"step": 18165, "train_loss": 3.224215507507324, "lr": 0.00017439871708809797, "tps": 1484730, "wall": 801.8} {"step": 18166, "train_loss": 3.3570189476013184, "lr": 0.00017438018433465317, "tps": 1475656, "wall": 806.8} {"step": 18167, "train_loss": 3.119875431060791, "lr": 0.00017436165209799208, "tps": 1466826, "wall": 811.7} {"step": 18168, "train_loss": 3.139374256134033, "lr": 0.00017434312037832475, "tps": 1458137, "wall": 816.6} {"step": 18169, "train_loss": 3.172328472137451, "lr": 0.00017432458917586102, "tps": 1449542, "wall": 821.5} {"step": 18170, "train_loss": 3.2552177906036377, "lr": 0.0001743060584908107, "tps": 1440683, "wall": 826.6} {"step": 18171, "train_loss": 3.2594847679138184, "lr": 0.00017428752832338392, "tps": 1432090, "wall": 831.6} {"step": 18172, "train_loss": 3.3096425533294678, "lr": 0.00017426899867379052, "tps": 1423499, "wall": 836.7} {"step": 18173, "train_loss": 3.1219019889831543, "lr": 0.0001742504695422403, "tps": 1415089, "wall": 841.7} {"step": 18174, "train_loss": 3.2408814430236816, "lr": 0.00017423194092894327, "tps": 1406770, "wall": 846.7} {"step": 18175, "train_loss": 3.349378824234009, "lr": 0.0001742134128341093, "tps": 1398571, "wall": 851.7} {"step": 18176, "train_loss": 3.2233476638793945, "lr": 0.0001741948852579483, "tps": 1390489, "wall": 856.7} {"step": 18177, "train_loss": 3.242119789123535, "lr": 0.00017417635820067, "tps": 1382502, "wall": 861.7} {"step": 18178, "train_loss": 3.2273001670837402, "lr": 0.00017415783166248446, "tps": 1374584, "wall": 866.7} {"step": 18179, "train_loss": 3.211221694946289, "lr": 0.00017413930564360154, "tps": 1366722, "wall": 871.8} {"step": 18180, "train_loss": 3.14673113822937, "lr": 0.00017412078014423097, "tps": 1358980, "wall": 876.8} {"step": 18181, "train_loss": 3.321333646774292, "lr": 0.0001741022551645827, "tps": 1351525, "wall": 881.7} {"step": 18182, "train_loss": 3.1635138988494873, "lr": 0.0001740837307048666, "tps": 1344006, "wall": 886.6} {"step": 18183, "train_loss": 3.29274845123291, "lr": 0.00017406520676529246, "tps": 1336667, "wall": 891.6} {"step": 18184, "train_loss": 3.2372870445251465, "lr": 0.00017404668334607015, "tps": 1329411, "wall": 896.5} {"step": 18185, "train_loss": 3.272202491760254, "lr": 0.00017402816044740944, "tps": 1322256, "wall": 901.4} {"step": 18186, "train_loss": 3.3189477920532227, "lr": 0.0001740096380695203, "tps": 1315186, "wall": 906.3} {"step": 18187, "train_loss": 3.273149013519287, "lr": 0.0001739911162126124, "tps": 1308158, "wall": 911.2} {"step": 18188, "train_loss": 3.296431303024292, "lr": 0.00017397259487689568, "tps": 1301223, "wall": 916.1} {"step": 18189, "train_loss": 3.2432861328125, "lr": 0.0001739540740625799, "tps": 1294154, "wall": 921.1} {"step": 18190, "train_loss": 3.1025586128234863, "lr": 0.0001739355537698748, "tps": 1287161, "wall": 926.2} {"step": 18191, "train_loss": 3.356226921081543, "lr": 0.00017391703399899028, "tps": 1280210, "wall": 931.3} {"step": 18192, "train_loss": 3.148719310760498, "lr": 0.0001738985147501361, "tps": 1273563, "wall": 936.2} {"step": 18193, "train_loss": 3.1098384857177734, "lr": 0.000173879996023522, "tps": 1266984, "wall": 941.1} {"step": 18194, "train_loss": 3.22369647026062, "lr": 0.00017386147781935782, "tps": 1260327, "wall": 946.1} {"step": 18195, "train_loss": 3.2120063304901123, "lr": 0.0001738429601378533, "tps": 1253937, "wall": 951.0} {"step": 18196, "train_loss": 3.2625160217285156, "lr": 0.00017382444297921827, "tps": 1247585, "wall": 955.9} {"step": 18197, "train_loss": 3.140575885772705, "lr": 0.0001738059263436624, "tps": 1241308, "wall": 960.8} {"step": 18198, "train_loss": 3.2148027420043945, "lr": 0.0001737874102313955, "tps": 1235078, "wall": 965.7} {"step": 18199, "train_loss": 3.2882325649261475, "lr": 0.00017376889464262738, "tps": 1228840, "wall": 970.6} {"step": 18200, "train_loss": 3.2825233936309814, "lr": 0.00017375037957756764, "tps": 1222738, "wall": 975.5} {"step": 18201, "train_loss": 3.29616641998291, "lr": 0.00017373186503642614, "tps": 1216584, "wall": 980.5} {"step": 18202, "train_loss": 3.235563278198242, "lr": 0.00017371335101941257, "tps": 1210339, "wall": 985.6} {"step": 18203, "train_loss": 3.243328332901001, "lr": 0.00017369483752673666, "tps": 1204157, "wall": 990.7} {"step": 18204, "train_loss": 3.1558353900909424, "lr": 0.00017367632455860812, "tps": 1198189, "wall": 995.7} {"step": 18205, "train_loss": 3.189730167388916, "lr": 0.0001736578121152367, "tps": 1192328, "wall": 1000.7} {"step": 18206, "train_loss": 3.2532196044921875, "lr": 0.0001736393001968321, "tps": 1186431, "wall": 1005.7} {"step": 18207, "train_loss": 3.192728042602539, "lr": 0.000173620788803604, "tps": 1180712, "wall": 1010.6} {"step": 18208, "train_loss": 3.130415439605713, "lr": 0.00017360227793576213, "tps": 1174993, "wall": 1015.6} {"step": 18209, "train_loss": 3.242400646209717, "lr": 0.00017358376759351617, "tps": 1169336, "wall": 1020.6} {"step": 18210, "train_loss": 3.1441166400909424, "lr": 0.0001735652577770758, "tps": 1163754, "wall": 1025.5} {"step": 18211, "train_loss": 3.1761527061462402, "lr": 0.00017354674848665068, "tps": 1158257, "wall": 1030.5} {"step": 18212, "train_loss": 3.149238109588623, "lr": 0.00017352823972245052, "tps": 1152814, "wall": 1035.4} {"step": 18213, "train_loss": 3.2425472736358643, "lr": 0.00017350973148468497, "tps": 1147403, "wall": 1040.3} {"step": 18214, "train_loss": 3.2133212089538574, "lr": 0.0001734912237735637, "tps": 1142076, "wall": 1045.2} {"step": 18215, "train_loss": 3.2787556648254395, "lr": 0.00017347271658929635, "tps": 1136763, "wall": 1050.2} {"step": 18216, "train_loss": 3.258481740951538, "lr": 0.00017345420993209265, "tps": 1131556, "wall": 1055.1} {"step": 18217, "train_loss": 3.2097229957580566, "lr": 0.0001734357038021621, "tps": 1126415, "wall": 1059.9} {"step": 18218, "train_loss": 3.213740348815918, "lr": 0.00017341719819971444, "tps": 1121316, "wall": 1064.8} {"step": 18219, "train_loss": 3.1902570724487305, "lr": 0.0001733986931249593, "tps": 1116184, "wall": 1069.8} {"step": 18220, "train_loss": 3.2835464477539062, "lr": 0.00017338018857810625, "tps": 1111167, "wall": 1074.7} {"step": 18221, "train_loss": 3.235687255859375, "lr": 0.00017336168455936495, "tps": 1106192, "wall": 1079.6} {"step": 18222, "train_loss": 3.3017382621765137, "lr": 0.00017334318106894503, "tps": 1101143, "wall": 1084.6} {"step": 18223, "train_loss": 3.22882080078125, "lr": 0.00017332467810705606, "tps": 1096227, "wall": 1089.5} {"step": 18224, "train_loss": 3.259021759033203, "lr": 0.0001733061756739077, "tps": 1091383, "wall": 1094.4} {"step": 18225, "train_loss": 3.319220542907715, "lr": 0.00017328767376970948, "tps": 1086599, "wall": 1099.3} {"step": 18226, "train_loss": 3.2242348194122314, "lr": 0.00017326917239467103, "tps": 1081818, "wall": 1104.2} {"step": 18227, "train_loss": 3.117523431777954, "lr": 0.00017325067154900188, "tps": 1077071, "wall": 1109.1} {"step": 18228, "train_loss": 3.2616896629333496, "lr": 0.0001732321712329117, "tps": 1072382, "wall": 1114.0} {"step": 18229, "train_loss": 3.2908596992492676, "lr": 0.00017321367144660998, "tps": 1067718, "wall": 1118.9} {"step": 18230, "train_loss": 3.157846450805664, "lr": 0.00017319517219030638, "tps": 1063139, "wall": 1123.8} {"step": 18231, "train_loss": 3.2021288871765137, "lr": 0.00017317667346421033, "tps": 1058499, "wall": 1128.8} {"step": 18232, "train_loss": 3.162757158279419, "lr": 0.00017315817526853148, "tps": 1053987, "wall": 1133.7} {"step": 18233, "train_loss": 3.220045566558838, "lr": 0.0001731396776034794, "tps": 1049524, "wall": 1138.6} {"step": 18234, "train_loss": 3.3237054347991943, "lr": 0.0001731211804692635, "tps": 1045104, "wall": 1143.5} {"step": 18235, "train_loss": 3.193063497543335, "lr": 0.00017310268386609346, "tps": 1040619, "wall": 1148.5} {"step": 18236, "train_loss": 3.2083077430725098, "lr": 0.00017308418779417875, "tps": 1036234, "wall": 1153.4} {"step": 18237, "train_loss": 3.2906274795532227, "lr": 0.00017306569225372892, "tps": 1031875, "wall": 1158.3} {"step": 18238, "train_loss": 3.2973132133483887, "lr": 0.0001730471972449534, "tps": 1027525, "wall": 1163.3} {"step": 18239, "train_loss": 3.179342031478882, "lr": 0.0001730287027680618, "tps": 1023252, "wall": 1168.2} {"step": 18240, "train_loss": 3.267298698425293, "lr": 0.00017301020882326364, "tps": 1019014, "wall": 1173.1} {"step": 18241, "train_loss": 3.1936938762664795, "lr": 0.0001729917154107683, "tps": 1014794, "wall": 1178.1} {"step": 18242, "train_loss": 3.2100934982299805, "lr": 0.0001729732225307854, "tps": 1010572, "wall": 1183.1} {"step": 18243, "train_loss": 3.2521142959594727, "lr": 0.00017295473018352441, "tps": 1006307, "wall": 1188.1} {"step": 18244, "train_loss": 3.2099225521087646, "lr": 0.00017293623836919472, "tps": 1002124, "wall": 1193.2} {"step": 18245, "train_loss": 3.269568920135498, "lr": 0.0001729177470880059, "tps": 998026, "wall": 1198.1} {"step": 18246, "train_loss": 3.2314393520355225, "lr": 0.00017289925634016742, "tps": 993962, "wall": 1203.1} {"step": 18247, "train_loss": 3.2791757583618164, "lr": 0.00017288076612588865, "tps": 989961, "wall": 1208.0} {"step": 18248, "train_loss": 3.1916344165802, "lr": 0.00017286227644537915, "tps": 986008, "wall": 1212.9} {"step": 18249, "train_loss": 3.293100595474243, "lr": 0.0001728437872988483, "tps": 982024, "wall": 1217.9} {"step": 18250, "train_loss": 3.2641873359680176, "lr": 0.00017282529868650558, "tps": 978076, "wall": 1222.9} {"step": 18251, "train_loss": 3.168034076690674, "lr": 0.00017280681060856048, "tps": 974148, "wall": 1227.9} {"step": 18252, "train_loss": 3.1399452686309814, "lr": 0.00017278832306522233, "tps": 970248, "wall": 1232.9} {"step": 18253, "train_loss": 3.2223119735717773, "lr": 0.00017276983605670068, "tps": 966414, "wall": 1237.9} {"step": 18254, "train_loss": 3.2789745330810547, "lr": 0.0001727513495832048, "tps": 962623, "wall": 1242.8} {"step": 18255, "train_loss": 3.2763214111328125, "lr": 0.00017273286364494417, "tps": 958690, "wall": 1248.0} {"step": 18256, "train_loss": 3.2961044311523438, "lr": 0.0001727143782421283, "tps": 954860, "wall": 1253.1} {"step": 18257, "train_loss": 3.176208972930908, "lr": 0.0001726958933749665, "tps": 951150, "wall": 1258.0} {"step": 18258, "train_loss": 3.2361276149749756, "lr": 0.00017267740904366812, "tps": 947462, "wall": 1263.0} {"step": 18259, "train_loss": 3.287655830383301, "lr": 0.00017265892524844265, "tps": 943779, "wall": 1268.0} {"step": 18260, "train_loss": 3.0901882648468018, "lr": 0.00017264044198949944, "tps": 940147, "wall": 1272.9} {"step": 18261, "train_loss": 3.184576988220215, "lr": 0.00017262195926704785, "tps": 936573, "wall": 1277.9} {"step": 18262, "train_loss": 3.2566323280334473, "lr": 0.0001726034770812973, "tps": 932966, "wall": 1282.9} {"step": 18263, "train_loss": 3.3349900245666504, "lr": 0.00017258499543245712, "tps": 929365, "wall": 1287.9} {"step": 18264, "train_loss": 3.2616026401519775, "lr": 0.00017256651432073664, "tps": 925886, "wall": 1292.8} {"step": 18265, "train_loss": 3.09470796585083, "lr": 0.00017254803374634525, "tps": 922447, "wall": 1297.7} {"step": 18266, "train_loss": 3.1394824981689453, "lr": 0.00017252955370949233, "tps": 919007, "wall": 1302.7} {"step": 18267, "train_loss": 3.211658000946045, "lr": 0.00017251107421038716, "tps": 915570, "wall": 1307.6} {"step": 18268, "train_loss": 3.2718422412872314, "lr": 0.00017249259524923914, "tps": 912200, "wall": 1312.5} {"step": 18269, "train_loss": 3.1930465698242188, "lr": 0.0001724741168262576, "tps": 908734, "wall": 1317.6} {"step": 18270, "train_loss": 3.234043598175049, "lr": 0.0001724556389416518, "tps": 905218, "wall": 1322.8} {"step": 18271, "train_loss": 3.2184174060821533, "lr": 0.0001724371615956311, "tps": 901610, "wall": 1328.1} {"step": 18272, "train_loss": 3.2602365016937256, "lr": 0.0001724186847884048, "tps": 898022, "wall": 1333.5} {"step": 18273, "train_loss": 3.1861650943756104, "lr": 0.0001724002085201822, "tps": 894465, "wall": 1338.9} {"step": 18274, "train_loss": 3.333404064178467, "lr": 0.00017238173279117262, "tps": 890935, "wall": 1344.3} {"step": 18275, "train_loss": 3.206122875213623, "lr": 0.00017236325760158536, "tps": 887369, "wall": 1349.8} {"step": 18276, "train_loss": 3.216935634613037, "lr": 0.0001723447829516297, "tps": 883862, "wall": 1355.2} {"step": 18277, "train_loss": 3.240205764770508, "lr": 0.00017232630884151493, "tps": 880422, "wall": 1360.6} {"step": 18278, "train_loss": 3.2574801445007324, "lr": 0.00017230783527145027, "tps": 876986, "wall": 1366.0} {"step": 18279, "train_loss": 3.2611865997314453, "lr": 0.00017228936224164505, "tps": 873599, "wall": 1371.3} {"step": 18280, "train_loss": 3.3218765258789062, "lr": 0.00017227088975230856, "tps": 870283, "wall": 1376.6} {"step": 18281, "train_loss": 3.196014881134033, "lr": 0.00017225241780364993, "tps": 867090, "wall": 1381.8} {"step": 18282, "train_loss": 3.223456382751465, "lr": 0.00017223394639587856, "tps": 863888, "wall": 1387.0} {"step": 18283, "train_loss": 3.1709346771240234, "lr": 0.00017221547552920358, "tps": 860794, "wall": 1392.0} {"step": 18284, "train_loss": 3.264650821685791, "lr": 0.00017219700520383432, "tps": 857677, "wall": 1397.2} {"step": 18285, "train_loss": 3.2402701377868652, "lr": 0.00017217853541997994, "tps": 854603, "wall": 1402.3} {"step": 18286, "train_loss": 3.2759344577789307, "lr": 0.0001721600661778497, "tps": 851550, "wall": 1407.4} {"step": 18287, "train_loss": 3.223137855529785, "lr": 0.0001721415974776529, "tps": 848511, "wall": 1412.5} {"step": 18288, "train_loss": 3.239370346069336, "lr": 0.00017212312931959853, "tps": 845520, "wall": 1417.6} {"step": 18289, "train_loss": 3.1537106037139893, "lr": 0.00017210466170389612, "tps": 842524, "wall": 1422.7} {"step": 18290, "train_loss": 3.2574453353881836, "lr": 0.00017208619463075455, "tps": 839485, "wall": 1427.9} {"step": 18291, "train_loss": 3.334625720977783, "lr": 0.0001720677281003832, "tps": 836513, "wall": 1433.1} {"step": 18292, "train_loss": 3.1959071159362793, "lr": 0.00017204926211299122, "tps": 833560, "wall": 1438.2} {"step": 18293, "train_loss": 3.247406005859375, "lr": 0.0001720307966687878, "tps": 830606, "wall": 1443.4} {"step": 18294, "train_loss": 3.251192092895508, "lr": 0.00017201233176798207, "tps": 827711, "wall": 1448.5} {"step": 18295, "train_loss": 3.2179672718048096, "lr": 0.00017199386741078332, "tps": 824839, "wall": 1453.7} {"step": 18296, "train_loss": 3.2237000465393066, "lr": 0.00017197540359740056, "tps": 821933, "wall": 1458.9} {"step": 18297, "train_loss": 3.2558822631835938, "lr": 0.00017195694032804304, "tps": 819100, "wall": 1464.0} {"step": 18298, "train_loss": 3.3103880882263184, "lr": 0.0001719384776029199, "tps": 816271, "wall": 1469.2} {"step": 18299, "train_loss": 3.298400402069092, "lr": 0.00017192001542224036, "tps": 813346, "wall": 1474.5} {"step": 18300, "train_loss": 3.1345252990722656, "lr": 0.00017190155378621339, "tps": 810413, "wall": 1480.0} {"step": 18301, "train_loss": 3.296762228012085, "lr": 0.00017188309269504829, "tps": 807480, "wall": 1485.4} {"step": 18302, "train_loss": 3.2342076301574707, "lr": 0.0001718646321489541, "tps": 804605, "wall": 1490.8} {"step": 18303, "train_loss": 3.218108892440796, "lr": 0.00017184617214813992, "tps": 801748, "wall": 1496.2} {"step": 18304, "train_loss": 3.181920051574707, "lr": 0.0001718277126928149, "tps": 799019, "wall": 1501.4} {"step": 18305, "train_loss": 3.1885128021240234, "lr": 0.0001718092537831882, "tps": 796321, "wall": 1506.6} {"step": 18306, "train_loss": 3.203770637512207, "lr": 0.0001717907954194689, "tps": 793641, "wall": 1511.7} {"step": 18307, "train_loss": 3.187790870666504, "lr": 0.00017177233760186603, "tps": 790969, "wall": 1516.9} {"step": 18308, "train_loss": 3.2091915607452393, "lr": 0.00017175388033058875, "tps": 788321, "wall": 1522.1} {"step": 18309, "train_loss": 3.1886353492736816, "lr": 0.0001717354236058461, "tps": 785702, "wall": 1527.2} {"step": 18310, "train_loss": 3.127234697341919, "lr": 0.00017171696742784723, "tps": 783111, "wall": 1532.4} {"step": 18311, "train_loss": 3.2287392616271973, "lr": 0.00017169851179680111, "tps": 780511, "wall": 1537.6} {"step": 18312, "train_loss": 3.2673518657684326, "lr": 0.00017168005671291692, "tps": 777938, "wall": 1542.7} {"step": 18313, "train_loss": 3.295553207397461, "lr": 0.0001716616021764036, "tps": 775360, "wall": 1548.0} {"step": 18314, "train_loss": 3.316927433013916, "lr": 0.0001716431481874703, "tps": 772828, "wall": 1553.1} {"step": 18315, "train_loss": 3.241177797317505, "lr": 0.00017162469474632608, "tps": 770327, "wall": 1558.2} {"step": 18316, "train_loss": 3.1693286895751953, "lr": 0.00017160624185317985, "tps": 767826, "wall": 1563.4} {"step": 18317, "train_loss": 3.2201476097106934, "lr": 0.00017158778950824078, "tps": 765355, "wall": 1568.5} {"step": 18318, "train_loss": 3.173144817352295, "lr": 0.0001715693377117178, "tps": 762880, "wall": 1573.7} {"step": 18319, "train_loss": 3.224165678024292, "lr": 0.00017155088646382004, "tps": 760442, "wall": 1578.8} {"step": 18320, "train_loss": 3.155482053756714, "lr": 0.00017153243576475643, "tps": 758003, "wall": 1584.0} {"step": 18321, "train_loss": 3.2964107990264893, "lr": 0.00017151398561473605, "tps": 755578, "wall": 1589.2} {"step": 18322, "train_loss": 3.2340919971466064, "lr": 0.00017149553601396783, "tps": 753182, "wall": 1594.3} {"step": 18323, "train_loss": 3.1833701133728027, "lr": 0.00017147708696266077, "tps": 750801, "wall": 1599.5} {"step": 18324, "train_loss": 3.1267638206481934, "lr": 0.00017145863846102392, "tps": 748454, "wall": 1604.6} {"step": 18325, "train_loss": 3.1990725994110107, "lr": 0.00017144019050926624, "tps": 746087, "wall": 1609.7} {"step": 18326, "train_loss": 3.2723658084869385, "lr": 0.00017142174310759675, "tps": 743750, "wall": 1614.9} {"step": 18327, "train_loss": 3.3403003215789795, "lr": 0.00017140329625622434, "tps": 741440, "wall": 1620.0} {"step": 18328, "train_loss": 3.212458372116089, "lr": 0.000171384849955358, "tps": 739147, "wall": 1625.1} {"step": 18329, "train_loss": 3.1583385467529297, "lr": 0.00017136640420520677, "tps": 736849, "wall": 1630.3} {"step": 18330, "train_loss": 3.1722917556762695, "lr": 0.0001713479590059795, "tps": 734569, "wall": 1635.4} {"step": 18331, "train_loss": 3.3069465160369873, "lr": 0.0001713295143578852, "tps": 732311, "wall": 1640.6} {"step": 18332, "train_loss": 3.165250301361084, "lr": 0.00017131107026113277, "tps": 730083, "wall": 1645.7} {"step": 18333, "train_loss": 3.1976754665374756, "lr": 0.0001712926267159312, "tps": 727859, "wall": 1650.8} {"step": 18334, "train_loss": 3.1482951641082764, "lr": 0.00017127418372248938, "tps": 725650, "wall": 1655.9} {"step": 18335, "train_loss": 3.318577766418457, "lr": 0.0001712557412810162, "tps": 723444, "wall": 1661.0} {"step": 18336, "train_loss": 3.2187938690185547, "lr": 0.0001712372993917207, "tps": 721216, "wall": 1666.3} {"step": 18337, "train_loss": 3.2615089416503906, "lr": 0.00017121885805481166, "tps": 719001, "wall": 1671.5} {"step": 18338, "train_loss": 3.2753283977508545, "lr": 0.00017120041727049804, "tps": 716769, "wall": 1676.8} {"step": 18339, "train_loss": 3.1708273887634277, "lr": 0.00017118197703898876, "tps": 714613, "wall": 1681.9} {"step": 18340, "train_loss": 3.182368278503418, "lr": 0.00017116353736049264, "tps": 712453, "wall": 1687.1} {"step": 18341, "train_loss": 3.1944217681884766, "lr": 0.0001711450982352186, "tps": 710345, "wall": 1692.2} {"step": 18342, "train_loss": 3.470670700073242, "lr": 0.0001711266596633756, "tps": 708246, "wall": 1697.3} {"step": 18343, "train_loss": 3.232440948486328, "lr": 0.00017110822164517243, "tps": 706173, "wall": 1702.4} {"step": 18344, "train_loss": 3.225621223449707, "lr": 0.00017108978418081794, "tps": 704098, "wall": 1707.5} {"step": 18345, "train_loss": 3.1975648403167725, "lr": 0.00017107134727052098, "tps": 702030, "wall": 1712.6} {"step": 18346, "train_loss": 3.21946382522583, "lr": 0.00017105291091449053, "tps": 699990, "wall": 1717.7} {"step": 18347, "train_loss": 3.2650113105773926, "lr": 0.0001710344751129353, "tps": 697948, "wall": 1722.8} {"step": 18348, "train_loss": 3.169952630996704, "lr": 0.00017101603986606422, "tps": 695899, "wall": 1728.0} {"step": 18349, "train_loss": 3.239302158355713, "lr": 0.00017099760517408607, "tps": 693902, "wall": 1733.1} {"step": 18350, "train_loss": 3.1554207801818848, "lr": 0.00017097917103720968, "tps": 691920, "wall": 1738.1} {"step": 18351, "train_loss": 3.3122024536132812, "lr": 0.00017096073745564394, "tps": 689942, "wall": 1743.2} {"step": 18352, "train_loss": 3.1892635822296143, "lr": 0.0001709423044295976, "tps": 687977, "wall": 1748.3} {"step": 18353, "train_loss": 3.2907466888427734, "lr": 0.00017092387195927948, "tps": 686009, "wall": 1753.4} {"step": 18354, "train_loss": 3.2504844665527344, "lr": 0.0001709054400448984, "tps": 684062, "wall": 1758.5} {"step": 18355, "train_loss": 3.295999526977539, "lr": 0.0001708870086866631, "tps": 682131, "wall": 1763.6} {"step": 18356, "train_loss": 3.1745591163635254, "lr": 0.0001708685778847825, "tps": 680213, "wall": 1768.6} {"step": 18357, "train_loss": 3.2053415775299072, "lr": 0.00017085014763946527, "tps": 678307, "wall": 1773.7} {"step": 18358, "train_loss": 3.2322328090667725, "lr": 0.00017083171795092024, "tps": 676410, "wall": 1778.8} {"step": 18359, "train_loss": 3.1955971717834473, "lr": 0.0001708132888193562, "tps": 674524, "wall": 1783.8} {"step": 18360, "train_loss": 3.2043256759643555, "lr": 0.00017079486024498182, "tps": 672626, "wall": 1789.0} {"step": 18361, "train_loss": 3.1848063468933105, "lr": 0.00017077643222800597, "tps": 670759, "wall": 1794.0} {"step": 18362, "train_loss": 3.280949115753174, "lr": 0.00017075800476863733, "tps": 668884, "wall": 1799.2} {"step": 18363, "train_loss": 3.139390230178833, "lr": 0.0001707395778670847, "tps": 667035, "wall": 1804.3} {"step": 18364, "train_loss": 3.1737775802612305, "lr": 0.00017072115152355676, "tps": 665202, "wall": 1809.3} {"step": 18365, "train_loss": 3.2525475025177, "lr": 0.0001707027257382623, "tps": 663373, "wall": 1814.4} {"step": 18366, "train_loss": 3.1748528480529785, "lr": 0.00017068430051141005, "tps": 661541, "wall": 1819.5} {"step": 18367, "train_loss": 3.338329792022705, "lr": 0.0001706658758432087, "tps": 659742, "wall": 1824.6} {"step": 18368, "train_loss": 3.051088809967041, "lr": 0.00017064745173386693, "tps": 657927, "wall": 1829.7} {"step": 18369, "train_loss": 3.1437883377075195, "lr": 0.0001706290281835936, "tps": 656068, "wall": 1835.0} {"step": 18370, "train_loss": 3.100114107131958, "lr": 0.00017061060519259723, "tps": 654284, "wall": 1840.1} {"step": 18371, "train_loss": 3.189081907272339, "lr": 0.00017059218276108663, "tps": 652482, "wall": 1845.3} {"step": 18372, "train_loss": 3.0994462966918945, "lr": 0.00017057376088927044, "tps": 650709, "wall": 1850.4} {"step": 18373, "train_loss": 3.2430944442749023, "lr": 0.00017055533957735736, "tps": 648948, "wall": 1855.6} {"step": 18374, "train_loss": 3.114865779876709, "lr": 0.00017053691882555608, "tps": 647203, "wall": 1860.7} {"step": 18375, "train_loss": 3.131443500518799, "lr": 0.00017051849863407523, "tps": 645453, "wall": 1865.8} {"step": 18376, "train_loss": 3.2778005599975586, "lr": 0.00017050007900312357, "tps": 643718, "wall": 1870.9} {"step": 18377, "train_loss": 3.2539525032043457, "lr": 0.00017048165993290964, "tps": 642000, "wall": 1876.0} {"step": 18378, "train_loss": 3.3021559715270996, "lr": 0.00017046324142364213, "tps": 640296, "wall": 1881.1} {"step": 18379, "train_loss": 3.2409896850585938, "lr": 0.00017044482347552972, "tps": 638602, "wall": 1886.2} {"step": 18380, "train_loss": 3.325817584991455, "lr": 0.00017042640608878106, "tps": 636909, "wall": 1891.3} {"step": 18381, "train_loss": 3.121093988418579, "lr": 0.0001704079892636047, "tps": 635230, "wall": 1896.5} {"step": 18382, "train_loss": 3.2199931144714355, "lr": 0.00017038957300020933, "tps": 633550, "wall": 1901.6} {"step": 18383, "train_loss": 3.2549686431884766, "lr": 0.00017037115729880365, "tps": 631862, "wall": 1906.8} {"step": 18384, "train_loss": 3.2549402713775635, "lr": 0.00017035274215959607, "tps": 630210, "wall": 1911.9} {"step": 18385, "train_loss": 3.1388020515441895, "lr": 0.00017033432758279538, "tps": 628571, "wall": 1917.0} {"step": 18386, "train_loss": 3.219696044921875, "lr": 0.0001703159135686101, "tps": 626943, "wall": 1922.0} {"step": 18387, "train_loss": 3.2069320678710938, "lr": 0.00017029750011724883, "tps": 625324, "wall": 1927.1} {"step": 18388, "train_loss": 3.2278034687042236, "lr": 0.00017027908722892017, "tps": 623699, "wall": 1932.2} {"step": 18389, "train_loss": 3.157360076904297, "lr": 0.00017026067490383268, "tps": 622072, "wall": 1937.4} {"step": 18390, "train_loss": 3.293698787689209, "lr": 0.000170242263142195, "tps": 620453, "wall": 1942.6} {"step": 18391, "train_loss": 3.304533004760742, "lr": 0.00017022385194421559, "tps": 618863, "wall": 1947.7} {"step": 18392, "train_loss": 3.2567880153656006, "lr": 0.0001702054413101031, "tps": 617274, "wall": 1952.8} {"step": 18393, "train_loss": 3.160767078399658, "lr": 0.00017018703124006615, "tps": 615698, "wall": 1957.9} {"step": 18394, "train_loss": 3.2170939445495605, "lr": 0.00017016862173431312, "tps": 614126, "wall": 1963.0} {"step": 18395, "train_loss": 3.2900567054748535, "lr": 0.00017015021279305264, "tps": 612544, "wall": 1968.2} {"step": 18396, "train_loss": 3.1937851905822754, "lr": 0.00017013180441649328, "tps": 610995, "wall": 1973.3} {"step": 18397, "train_loss": 3.251776695251465, "lr": 0.0001701133966048435, "tps": 609445, "wall": 1978.4} {"step": 18398, "train_loss": 3.2445924282073975, "lr": 0.00017009498935831188, "tps": 607904, "wall": 1983.5} {"step": 18399, "train_loss": 3.2558979988098145, "lr": 0.0001700765826771069, "tps": 606382, "wall": 1988.6} {"step": 18400, "train_loss": 3.1503515243530273, "lr": 0.00017005817656143716, "tps": 604858, "wall": 1993.7} {"step": 18401, "train_loss": 3.2074875831604004, "lr": 0.00017003977101151104, "tps": 603345, "wall": 1998.8} {"step": 18402, "train_loss": 3.2269861698150635, "lr": 0.0001700213660275371, "tps": 601829, "wall": 2004.0} {"step": 18403, "train_loss": 3.269557476043701, "lr": 0.00017000296160972383, "tps": 600335, "wall": 2009.1} {"step": 18404, "train_loss": 3.296844005584717, "lr": 0.00016998455775827975, "tps": 598858, "wall": 2014.1} {"step": 18405, "train_loss": 3.2129645347595215, "lr": 0.00016996615447341327, "tps": 597382, "wall": 2019.2} {"step": 18406, "train_loss": 3.2985758781433105, "lr": 0.00016994775175533292, "tps": 595913, "wall": 2024.3} {"step": 18407, "train_loss": 3.181575298309326, "lr": 0.00016992934960424711, "tps": 594420, "wall": 2029.5} {"step": 18408, "train_loss": 3.2482309341430664, "lr": 0.00016991094802036436, "tps": 592983, "wall": 2034.5} {"step": 18409, "train_loss": 3.2674989700317383, "lr": 0.0001698925470038931, "tps": 591526, "wall": 2039.7} {"step": 18410, "train_loss": 3.2083816528320312, "lr": 0.0001698741465550418, "tps": 590053, "wall": 2044.9} {"step": 18411, "train_loss": 3.1996231079101562, "lr": 0.00016985574667401884, "tps": 588615, "wall": 2050.0} {"step": 18412, "train_loss": 3.132753610610962, "lr": 0.00016983734736103273, "tps": 587177, "wall": 2055.1} {"step": 18413, "train_loss": 3.1874537467956543, "lr": 0.00016981894861629187, "tps": 585749, "wall": 2060.2} {"step": 18414, "train_loss": 3.204791784286499, "lr": 0.00016980055044000465, "tps": 584340, "wall": 2065.3} {"step": 18415, "train_loss": 3.3427157402038574, "lr": 0.00016978215283237948, "tps": 582848, "wall": 2070.7} {"step": 18416, "train_loss": 3.276455879211426, "lr": 0.00016976375579362484, "tps": 581386, "wall": 2076.0} {"step": 18417, "train_loss": 3.1508076190948486, "lr": 0.00016974535932394908, "tps": 579975, "wall": 2081.2} {"step": 18418, "train_loss": 3.133213996887207, "lr": 0.00016972696342356064, "tps": 578557, "wall": 2086.4} {"step": 18419, "train_loss": 3.2737350463867188, "lr": 0.00016970856809266782, "tps": 577145, "wall": 2091.6} {"step": 18420, "train_loss": 3.1705374717712402, "lr": 0.00016969017333147912, "tps": 575734, "wall": 2096.9} {"step": 18421, "train_loss": 3.2093887329101562, "lr": 0.0001696717791402028, "tps": 574327, "wall": 2102.1} {"step": 18422, "train_loss": 3.2267963886260986, "lr": 0.00016965338551904732, "tps": 572910, "wall": 2107.4} {"step": 18423, "train_loss": 3.2088541984558105, "lr": 0.00016963499246822105, "tps": 571500, "wall": 2112.7} {"step": 18424, "train_loss": 3.2686767578125, "lr": 0.00016961659998793226, "tps": 570090, "wall": 2118.1} {"step": 18425, "train_loss": 3.1097214221954346, "lr": 0.00016959820807838934, "tps": 568705, "wall": 2123.4} {"step": 18426, "train_loss": 3.226952075958252, "lr": 0.00016957981673980065, "tps": 567417, "wall": 2128.3} {"step": 18427, "train_loss": 3.3114938735961914, "lr": 0.00016956142597237457, "tps": 566131, "wall": 2133.2} {"step": 18428, "train_loss": 3.2821102142333984, "lr": 0.00016954303577631933, "tps": 564852, "wall": 2138.2} {"step": 18429, "train_loss": 3.256753921508789, "lr": 0.00016952464615184335, "tps": 563577, "wall": 2143.1} {"step": 18430, "train_loss": 3.255443811416626, "lr": 0.00016950625709915494, "tps": 562301, "wall": 2148.1} {"step": 18431, "train_loss": 3.2121214866638184, "lr": 0.0001694878686184623, "tps": 561044, "wall": 2153.1} {"step": 18432, "train_loss": 3.19439435005188, "lr": 0.00016946948070997383, "tps": 559774, "wall": 2158.1} {"step": 18433, "train_loss": 3.2602603435516357, "lr": 0.00016945109337389788, "tps": 558519, "wall": 2163.0} {"step": 18434, "train_loss": 3.3236777782440186, "lr": 0.00016943270661044264, "tps": 557277, "wall": 2168.0} {"step": 18435, "train_loss": 3.3102078437805176, "lr": 0.0001694143204198164, "tps": 555963, "wall": 2173.2} {"step": 18436, "train_loss": 3.246483564376831, "lr": 0.00016939593480222752, "tps": 554657, "wall": 2178.4} {"step": 18437, "train_loss": 3.2648987770080566, "lr": 0.00016937754975788422, "tps": 553273, "wall": 2184.0} {"step": 18438, "train_loss": 3.2585668563842773, "lr": 0.00016935916528699476, "tps": 551948, "wall": 2189.4} {"step": 18439, "train_loss": 3.2076778411865234, "lr": 0.00016934078138976743, "tps": 550659, "wall": 2194.6} {"step": 18440, "train_loss": 3.1629996299743652, "lr": 0.00016932239806641047, "tps": 549356, "wall": 2199.9} {"step": 18441, "train_loss": 3.2485013008117676, "lr": 0.00016930401531713214, "tps": 548048, "wall": 2205.3} {"step": 18442, "train_loss": 3.1286377906799316, "lr": 0.00016928563314214063, "tps": 546798, "wall": 2210.5} {"step": 18443, "train_loss": 3.229853391647339, "lr": 0.0001692672515416442, "tps": 545543, "wall": 2215.7} {"step": 18444, "train_loss": 3.2454776763916016, "lr": 0.00016924887051585118, "tps": 544293, "wall": 2220.9} {"step": 18445, "train_loss": 3.177663803100586, "lr": 0.00016923049006496962, "tps": 543112, "wall": 2225.8} {"step": 18446, "train_loss": 3.228705644607544, "lr": 0.00016921211018920782, "tps": 541927, "wall": 2230.8} {"step": 18447, "train_loss": 3.2375283241271973, "lr": 0.00016919373088877405, "tps": 540752, "wall": 2235.8} {"step": 18448, "train_loss": 3.2956161499023438, "lr": 0.00016917535216387635, "tps": 539591, "wall": 2240.7} {"step": 18449, "train_loss": 3.2742724418640137, "lr": 0.00016915697401472305, "tps": 538433, "wall": 2245.7} {"step": 18450, "train_loss": 3.1950483322143555, "lr": 0.00016913859644152236, "tps": 537278, "wall": 2250.6} {"step": 18451, "train_loss": 3.3327090740203857, "lr": 0.00016912021944448231, "tps": 536122, "wall": 2255.6} {"step": 18452, "train_loss": 3.2860066890716553, "lr": 0.00016910184302381117, "tps": 534974, "wall": 2260.5} {"step": 18453, "train_loss": 3.244230031967163, "lr": 0.00016908346717971716, "tps": 533804, "wall": 2265.6} {"step": 18454, "train_loss": 3.257692813873291, "lr": 0.00016906509191240838, "tps": 532665, "wall": 2270.6} {"step": 18455, "train_loss": 3.357895851135254, "lr": 0.00016904671722209295, "tps": 531533, "wall": 2275.6} {"step": 18456, "train_loss": 3.244044065475464, "lr": 0.0001690283431089791, "tps": 530404, "wall": 2280.5} {"step": 18457, "train_loss": 3.243483066558838, "lr": 0.00016900996957327496, "tps": 529297, "wall": 2285.4} {"step": 18458, "train_loss": 3.1672611236572266, "lr": 0.00016899159661518863, "tps": 528185, "wall": 2290.4} {"step": 18459, "train_loss": 3.165412425994873, "lr": 0.00016897322423492828, "tps": 527078, "wall": 2295.3} {"step": 18460, "train_loss": 3.1646952629089355, "lr": 0.00016895485243270195, "tps": 525968, "wall": 2300.3} {"step": 18461, "train_loss": 3.184471845626831, "lr": 0.0001689364812087178, "tps": 524870, "wall": 2305.2} {"step": 18462, "train_loss": 3.1584768295288086, "lr": 0.00016891811056318404, "tps": 523781, "wall": 2310.1} {"step": 18463, "train_loss": 3.1832776069641113, "lr": 0.00016889974049630858, "tps": 522689, "wall": 2315.1} {"step": 18464, "train_loss": 3.122893810272217, "lr": 0.00016888137100829967, "tps": 521604, "wall": 2320.0} {"step": 18465, "train_loss": 3.2233526706695557, "lr": 0.00016886300209936539, "tps": 520527, "wall": 2324.9} {"step": 18466, "train_loss": 3.2357728481292725, "lr": 0.00016884463376971374, "tps": 519444, "wall": 2329.9} {"step": 18467, "train_loss": 3.189242124557495, "lr": 0.00016882626601955283, "tps": 518367, "wall": 2334.9} {"step": 18468, "train_loss": 3.267361879348755, "lr": 0.0001688078988490908, "tps": 517307, "wall": 2339.8} {"step": 18469, "train_loss": 3.2142081260681152, "lr": 0.00016878953225853564, "tps": 516251, "wall": 2344.7} {"step": 18470, "train_loss": 3.2242915630340576, "lr": 0.00016877116624809544, "tps": 515194, "wall": 2349.6} {"step": 18471, "train_loss": 3.1771769523620605, "lr": 0.00016875280081797821, "tps": 514145, "wall": 2354.5} {"step": 18472, "train_loss": 3.2913851737976074, "lr": 0.00016873443596839206, "tps": 513095, "wall": 2359.5} {"step": 18473, "train_loss": 3.22678804397583, "lr": 0.00016871607169954497, "tps": 512054, "wall": 2364.4} {"step": 18474, "train_loss": 3.2152042388916016, "lr": 0.00016869770801164496, "tps": 511016, "wall": 2369.3} {"step": 18475, "train_loss": 3.2012059688568115, "lr": 0.0001686793449049002, "tps": 509989, "wall": 2374.2} {"step": 18476, "train_loss": 3.277143955230713, "lr": 0.00016866098237951847, "tps": 508964, "wall": 2379.2} {"step": 18477, "train_loss": 3.2658181190490723, "lr": 0.00016864262043570798, "tps": 507935, "wall": 2384.1} {"step": 18478, "train_loss": 3.174588441848755, "lr": 0.00016862425907367663, "tps": 506892, "wall": 2389.1} {"step": 18479, "train_loss": 3.2767999172210693, "lr": 0.0001686058982936325, "tps": 505883, "wall": 2394.0} {"step": 18480, "train_loss": 3.2164053916931152, "lr": 0.0001685875380957835, "tps": 504877, "wall": 2398.9} {"step": 18481, "train_loss": 3.1918869018554688, "lr": 0.00016856917848033764, "tps": 503875, "wall": 2403.8} {"step": 18482, "train_loss": 3.155505418777466, "lr": 0.00016855081944750294, "tps": 502869, "wall": 2408.8} {"step": 18483, "train_loss": 3.3298494815826416, "lr": 0.0001685324609974873, "tps": 501869, "wall": 2413.7} {"step": 18484, "train_loss": 3.188271999359131, "lr": 0.00016851410313049872, "tps": 500868, "wall": 2418.7} {"step": 18485, "train_loss": 3.1113381385803223, "lr": 0.00016849574584674518, "tps": 499857, "wall": 2423.7} {"step": 18486, "train_loss": 3.2110648155212402, "lr": 0.00016847738914643471, "tps": 498841, "wall": 2428.8} {"step": 18487, "train_loss": 3.258962869644165, "lr": 0.00016845903302977505, "tps": 497834, "wall": 2433.8} {"step": 18488, "train_loss": 3.287733793258667, "lr": 0.00016844067749697427, "tps": 496833, "wall": 2438.8} {"step": 18489, "train_loss": 3.3035902976989746, "lr": 0.00016842232254824036, "tps": 495825, "wall": 2443.9} {"step": 18490, "train_loss": 3.2134175300598145, "lr": 0.0001684039681837811, "tps": 494814, "wall": 2449.0} {"step": 18491, "train_loss": 3.2643322944641113, "lr": 0.00016838561440380448, "tps": 493821, "wall": 2454.1} {"step": 18492, "train_loss": 3.2181413173675537, "lr": 0.00016836726120851843, "tps": 492828, "wall": 2459.2} {"step": 18493, "train_loss": 3.212127923965454, "lr": 0.00016834890859813086, "tps": 491847, "wall": 2464.2} {"step": 18494, "train_loss": 3.2764158248901367, "lr": 0.00016833055657284959, "tps": 490866, "wall": 2469.3} {"step": 18495, "train_loss": 3.212951421737671, "lr": 0.00016831220513288263, "tps": 489889, "wall": 2474.3} {"step": 18496, "train_loss": 3.252415895462036, "lr": 0.00016829385427843775, "tps": 488921, "wall": 2479.4} {"step": 18497, "train_loss": 3.236875295639038, "lr": 0.00016827550400972294, "tps": 487956, "wall": 2484.4} {"step": 18498, "train_loss": 3.174379825592041, "lr": 0.00016825715432694594, "tps": 486995, "wall": 2489.4} {"step": 18499, "train_loss": 3.2257981300354004, "lr": 0.00016823880523031482, "tps": 486038, "wall": 2494.5} {"step": 18500, "train_loss": 3.2331104278564453, "lr": 0.0001682204567200372, "tps": 485083, "wall": 2499.5} {"step": 18501, "train_loss": 3.29966139793396, "lr": 0.00016820210879632107, "tps": 484093, "wall": 2504.8} {"step": 18502, "train_loss": 3.1936118602752686, "lr": 0.00016818376145937434, "tps": 483134, "wall": 2509.9} {"step": 18503, "train_loss": 3.117913007736206, "lr": 0.0001681654147094047, "tps": 482191, "wall": 2514.9} {"step": 18504, "train_loss": 3.2168922424316406, "lr": 0.00016814706854662, "tps": 481246, "wall": 2520.0} {"step": 18505, "train_loss": 3.265695095062256, "lr": 0.00016812872297122816, "tps": 480308, "wall": 2525.1} {"step": 18506, "train_loss": 3.155660629272461, "lr": 0.000168110377983437, "tps": 479371, "wall": 2530.1} {"step": 18507, "train_loss": 3.135171890258789, "lr": 0.0001680920335834542, "tps": 478440, "wall": 2535.2} {"step": 18508, "train_loss": 3.0297110080718994, "lr": 0.00016807368977148768, "tps": 477508, "wall": 2540.3} {"step": 18509, "train_loss": 3.2558069229125977, "lr": 0.00016805534654774524, "tps": 476579, "wall": 2545.4} {"step": 18510, "train_loss": 3.256498336791992, "lr": 0.0001680370039124346, "tps": 475652, "wall": 2550.5} {"step": 18511, "train_loss": 3.145932197570801, "lr": 0.0001680186618657636, "tps": 474739, "wall": 2555.5} {"step": 18512, "train_loss": 3.1850061416625977, "lr": 0.00016800032040794003, "tps": 473830, "wall": 2560.6} {"step": 18513, "train_loss": 3.3606717586517334, "lr": 0.00016798197953917163, "tps": 472910, "wall": 2565.7} {"step": 18514, "train_loss": 3.2095260620117188, "lr": 0.00016796363925966618, "tps": 472013, "wall": 2570.7} {"step": 18515, "train_loss": 3.2277779579162598, "lr": 0.00016794529956963146, "tps": 471090, "wall": 2575.9} {"step": 18516, "train_loss": 3.344259262084961, "lr": 0.0001679269604692752, "tps": 470197, "wall": 2580.9} {"step": 18517, "train_loss": 3.2199368476867676, "lr": 0.00016790862195880513, "tps": 469294, "wall": 2586.0} {"step": 18518, "train_loss": 3.257404088973999, "lr": 0.000167890284038429, "tps": 468407, "wall": 2591.0} {"step": 18519, "train_loss": 3.2253355979919434, "lr": 0.00016787194670835463, "tps": 467525, "wall": 2596.1} {"step": 18520, "train_loss": 3.1764748096466064, "lr": 0.00016785360996878957, "tps": 466647, "wall": 2601.1} {"step": 18521, "train_loss": 3.2277278900146484, "lr": 0.00016783527381994165, "tps": 465772, "wall": 2606.1} {"step": 18522, "train_loss": 3.1945345401763916, "lr": 0.00016781693826201858, "tps": 464896, "wall": 2611.2} {"step": 18523, "train_loss": 3.266494035720825, "lr": 0.00016779860329522813, "tps": 464026, "wall": 2616.2} {"step": 18524, "train_loss": 3.2380568981170654, "lr": 0.00016778026891977783, "tps": 463119, "wall": 2621.5} {"step": 18525, "train_loss": 3.1657309532165527, "lr": 0.0001677619351358755, "tps": 462227, "wall": 2626.7} {"step": 18526, "train_loss": 3.134671926498413, "lr": 0.0001677436019437288, "tps": 461318, "wall": 2632.0} {"step": 18527, "train_loss": 3.2429299354553223, "lr": 0.00016772526934354543, "tps": 460393, "wall": 2637.4} {"step": 18528, "train_loss": 3.1137499809265137, "lr": 0.00016770693733553297, "tps": 459475, "wall": 2642.8} {"step": 18529, "train_loss": 3.129747152328491, "lr": 0.00016768860591989925, "tps": 458564, "wall": 2648.2} {"step": 18530, "train_loss": 3.2600181102752686, "lr": 0.00016767027509685174, "tps": 457651, "wall": 2653.7} {"step": 18531, "train_loss": 3.203432559967041, "lr": 0.00016765194486659826, "tps": 456740, "wall": 2659.1} {"step": 18532, "train_loss": 3.2231554985046387, "lr": 0.0001676336152293463, "tps": 455833, "wall": 2664.5} {"step": 18533, "train_loss": 3.2910280227661133, "lr": 0.00016761528618530367, "tps": 454939, "wall": 2669.9} {"step": 18534, "train_loss": 3.195300579071045, "lr": 0.00016759695773467783, "tps": 454050, "wall": 2675.3} {"step": 18535, "train_loss": 3.2615959644317627, "lr": 0.00016757862987767648, "tps": 453170, "wall": 2680.6} {"step": 18536, "train_loss": 3.2279796600341797, "lr": 0.00016756030261450735, "tps": 452295, "wall": 2685.9} {"step": 18537, "train_loss": 3.279646635055542, "lr": 0.00016754197594537787, "tps": 451456, "wall": 2691.1} {"step": 18538, "train_loss": 3.1489288806915283, "lr": 0.0001675236498704957, "tps": 450620, "wall": 2696.2} {"step": 18539, "train_loss": 3.270307779312134, "lr": 0.00016750532439006852, "tps": 449783, "wall": 2701.4} {"step": 18540, "train_loss": 3.3104586601257324, "lr": 0.0001674869995043039, "tps": 448944, "wall": 2706.6} {"step": 18541, "train_loss": 3.1356077194213867, "lr": 0.00016746867521340926, "tps": 448068, "wall": 2712.0} {"step": 18542, "train_loss": 3.1778154373168945, "lr": 0.00016745035151759238, "tps": 447207, "wall": 2717.4} {"step": 18543, "train_loss": 3.2737197875976562, "lr": 0.00016743202841706082, "tps": 446348, "wall": 2722.8} {"step": 18544, "train_loss": 3.1890833377838135, "lr": 0.00016741370591202202, "tps": 445498, "wall": 2728.1} {"step": 18545, "train_loss": 3.261857509613037, "lr": 0.0001673953840026836, "tps": 444690, "wall": 2733.2} {"step": 18546, "train_loss": 3.30635404586792, "lr": 0.0001673770626892532, "tps": 443879, "wall": 2738.3} {"step": 18547, "train_loss": 3.233701229095459, "lr": 0.0001673587419719382, "tps": 443074, "wall": 2743.5} {"step": 18548, "train_loss": 3.2067787647247314, "lr": 0.00016734042185094622, "tps": 442256, "wall": 2748.7} {"step": 18549, "train_loss": 3.132453441619873, "lr": 0.00016732210232648476, "tps": 441457, "wall": 2753.8} {"step": 18550, "train_loss": 3.17025089263916, "lr": 0.00016730378339876144, "tps": 440656, "wall": 2759.0} {"step": 18551, "train_loss": 3.179672956466675, "lr": 0.00016728546506798373, "tps": 439860, "wall": 2764.1} {"step": 18552, "train_loss": 3.2624058723449707, "lr": 0.00016726714733435904, "tps": 439065, "wall": 2769.3} {"step": 18553, "train_loss": 3.215121269226074, "lr": 0.00016724883019809505, "tps": 438275, "wall": 2774.4} {"step": 18554, "train_loss": 3.1663293838500977, "lr": 0.0001672305136593991, "tps": 437487, "wall": 2779.6} {"step": 18555, "train_loss": 3.213437557220459, "lr": 0.00016721219771847877, "tps": 436704, "wall": 2784.7} {"step": 18556, "train_loss": 3.2655062675476074, "lr": 0.0001671938823755415, "tps": 435919, "wall": 2789.9} {"step": 18557, "train_loss": 3.1278598308563232, "lr": 0.0001671755676307948, "tps": 435142, "wall": 2795.0} {"step": 18558, "train_loss": 3.0842368602752686, "lr": 0.0001671572534844461, "tps": 434357, "wall": 2800.2} {"step": 18559, "train_loss": 3.240194320678711, "lr": 0.00016713893993670293, "tps": 433611, "wall": 2805.2} {"step": 18560, "train_loss": 3.1273202896118164, "lr": 0.00016712062698777272, "tps": 432869, "wall": 2810.1} {"step": 18561, "train_loss": 3.2305099964141846, "lr": 0.00016710231463786288, "tps": 432138, "wall": 2815.0} {"step": 18562, "train_loss": 3.194938898086548, "lr": 0.00016708400288718088, "tps": 431410, "wall": 2819.9} {"step": 18563, "train_loss": 3.1648242473602295, "lr": 0.0001670656917359342, "tps": 430685, "wall": 2824.8} {"step": 18564, "train_loss": 3.256624698638916, "lr": 0.0001670473811843302, "tps": 429963, "wall": 2829.7} {"step": 18565, "train_loss": 3.2027385234832764, "lr": 0.0001670290712325763, "tps": 429231, "wall": 2834.7} {"step": 18566, "train_loss": 3.1212379932403564, "lr": 0.00016701076188087996, "tps": 428503, "wall": 2839.7} {"step": 18567, "train_loss": 3.097809314727783, "lr": 0.00016699245312944863, "tps": 427781, "wall": 2844.6} {"step": 18568, "train_loss": 3.3236632347106934, "lr": 0.00016697414497848957, "tps": 427057, "wall": 2849.6} {"step": 18569, "train_loss": 3.1421117782592773, "lr": 0.00016695583742821032, "tps": 426341, "wall": 2854.5} {"step": 18570, "train_loss": 3.2985448837280273, "lr": 0.00016693753047881824, "tps": 425631, "wall": 2859.4} {"step": 18571, "train_loss": 3.0960073471069336, "lr": 0.00016691922413052064, "tps": 424918, "wall": 2864.4} {"step": 18572, "train_loss": 3.126760959625244, "lr": 0.00016690091838352493, "tps": 424207, "wall": 2869.3} {"step": 18573, "train_loss": 3.0851287841796875, "lr": 0.00016688261323803856, "tps": 423500, "wall": 2874.3} {"step": 18574, "train_loss": 3.311190128326416, "lr": 0.00016686430869426874, "tps": 422797, "wall": 2879.2} {"step": 18575, "train_loss": 3.2182130813598633, "lr": 0.0001668460047524229, "tps": 422094, "wall": 2884.2} {"step": 18576, "train_loss": 3.19521427154541, "lr": 0.0001668277014127084, "tps": 421392, "wall": 2889.1} {"step": 18577, "train_loss": 3.2722091674804688, "lr": 0.00016680939867533265, "tps": 420683, "wall": 2894.2} {"step": 18578, "train_loss": 3.1310410499572754, "lr": 0.00016679109654050284, "tps": 419973, "wall": 2899.2} {"step": 18579, "train_loss": 3.2100110054016113, "lr": 0.0001667727950084264, "tps": 419259, "wall": 2904.3} {"step": 18580, "train_loss": 3.2641701698303223, "lr": 0.00016675449407931066, "tps": 418552, "wall": 2909.4} {"step": 18581, "train_loss": 3.240091323852539, "lr": 0.0001667361937533628, "tps": 417857, "wall": 2914.4} {"step": 18582, "train_loss": 3.338698387145996, "lr": 0.00016671789403079025, "tps": 417161, "wall": 2919.4} {"step": 18583, "train_loss": 3.200185775756836, "lr": 0.00016669959491180035, "tps": 416464, "wall": 2924.4} {"step": 18584, "train_loss": 3.30855131149292, "lr": 0.0001666812963966002, "tps": 415782, "wall": 2929.4} {"step": 18585, "train_loss": 3.1754891872406006, "lr": 0.00016666299848539727, "tps": 415095, "wall": 2934.4} {"step": 18586, "train_loss": 3.177640676498413, "lr": 0.0001666447011783988, "tps": 414421, "wall": 2939.3} {"step": 18587, "train_loss": 3.2665865421295166, "lr": 0.00016662640447581204, "tps": 413748, "wall": 2944.3} {"step": 18588, "train_loss": 3.098228931427002, "lr": 0.00016660810837784422, "tps": 413074, "wall": 2949.2} {"step": 18589, "train_loss": 3.1874337196350098, "lr": 0.00016658981288470264, "tps": 412406, "wall": 2954.2} {"step": 18590, "train_loss": 3.1981043815612793, "lr": 0.00016657151799659458, "tps": 411743, "wall": 2959.1} {"step": 18591, "train_loss": 3.1004135608673096, "lr": 0.00016655322371372723, "tps": 411073, "wall": 2964.1} {"step": 18592, "train_loss": 3.2102017402648926, "lr": 0.00016653493003630784, "tps": 410413, "wall": 2969.0} {"step": 18593, "train_loss": 3.12143611907959, "lr": 0.00016651663696454368, "tps": 409750, "wall": 2974.0} {"step": 18594, "train_loss": 3.3284149169921875, "lr": 0.00016649834449864197, "tps": 409060, "wall": 2979.1} {"step": 18595, "train_loss": 3.238476037979126, "lr": 0.00016648005263880986, "tps": 408388, "wall": 2984.2} {"step": 18596, "train_loss": 3.2013723850250244, "lr": 0.00016646176138525464, "tps": 407708, "wall": 2989.3} {"step": 18597, "train_loss": 3.1248621940612793, "lr": 0.0001664434707381835, "tps": 407042, "wall": 2994.4} {"step": 18598, "train_loss": 3.2549219131469727, "lr": 0.00016642518069780358, "tps": 406367, "wall": 2999.5} {"step": 18599, "train_loss": 3.2968833446502686, "lr": 0.0001664068912643221, "tps": 405697, "wall": 3004.6} {"step": 18600, "train_loss": 3.1160011291503906, "lr": 0.00016638860243794632, "tps": 405047, "wall": 3009.6} {"step": 18601, "train_loss": 3.3232345581054688, "lr": 0.00016637031421888333, "tps": 404399, "wall": 3014.6} {"step": 18602, "train_loss": 3.2444164752960205, "lr": 0.00016635202660734026, "tps": 403760, "wall": 3019.5} {"step": 18603, "train_loss": 3.2808475494384766, "lr": 0.00016633373960352437, "tps": 403120, "wall": 3024.5} {"step": 18604, "train_loss": 3.117004871368408, "lr": 0.00016631545320764282, "tps": 402484, "wall": 3029.4} {"step": 18605, "train_loss": 3.2021970748901367, "lr": 0.0001662971674199027, "tps": 401840, "wall": 3034.4} {"step": 18606, "train_loss": 3.224606990814209, "lr": 0.00016627888224051112, "tps": 401198, "wall": 3039.5} {"step": 18607, "train_loss": 3.2097816467285156, "lr": 0.00016626059766967533, "tps": 400569, "wall": 3044.4} {"step": 18608, "train_loss": 3.1633193492889404, "lr": 0.0001662423137076024, "tps": 399931, "wall": 3049.4} {"step": 18609, "train_loss": 3.311816692352295, "lr": 0.00016622403035449943, "tps": 399306, "wall": 3054.4} {"step": 18610, "train_loss": 3.0614497661590576, "lr": 0.00016620574761057357, "tps": 398686, "wall": 3059.3} {"step": 18611, "train_loss": 3.1618409156799316, "lr": 0.00016618746547603186, "tps": 398063, "wall": 3064.2} {"step": 18612, "train_loss": 3.190789222717285, "lr": 0.0001661691839510815, "tps": 397429, "wall": 3069.3} {"step": 18613, "train_loss": 3.226046562194824, "lr": 0.00016615090303592948, "tps": 396798, "wall": 3074.3} {"step": 18614, "train_loss": 3.2749686241149902, "lr": 0.00016613262273078302, "tps": 396166, "wall": 3079.4} {"step": 18615, "train_loss": 3.180992841720581, "lr": 0.0001661143430358491, "tps": 395536, "wall": 3084.5} {"step": 18616, "train_loss": 3.301764488220215, "lr": 0.00016609606395133478, "tps": 394911, "wall": 3089.5} {"step": 18617, "train_loss": 3.2515501976013184, "lr": 0.00016607778547744726, "tps": 394289, "wall": 3094.5} {"step": 18618, "train_loss": 3.213583469390869, "lr": 0.00016605950761439337, "tps": 393666, "wall": 3099.6} {"step": 18619, "train_loss": 3.232848644256592, "lr": 0.00016604123036238034, "tps": 393046, "wall": 3104.7} {"step": 18620, "train_loss": 3.233715057373047, "lr": 0.00016602295372161524, "tps": 392424, "wall": 3109.8} {"step": 18621, "train_loss": 3.280196189880371, "lr": 0.000166004677692305, "tps": 391810, "wall": 3114.8} {"step": 18622, "train_loss": 3.2430050373077393, "lr": 0.00016598640227465667, "tps": 391199, "wall": 3119.8} {"step": 18623, "train_loss": 3.1764564514160156, "lr": 0.0001659681274688773, "tps": 390588, "wall": 3124.9} {"step": 18624, "train_loss": 3.1708903312683105, "lr": 0.00016594985327517394, "tps": 389978, "wall": 3129.9} {"step": 18625, "train_loss": 3.1966934204101562, "lr": 0.0001659315796937535, "tps": 389373, "wall": 3135.0} {"step": 18626, "train_loss": 3.253657579421997, "lr": 0.00016591330672482317, "tps": 388771, "wall": 3140.0} {"step": 18627, "train_loss": 3.134037971496582, "lr": 0.00016589503436858976, "tps": 388161, "wall": 3145.1} {"step": 18628, "train_loss": 3.301363945007324, "lr": 0.00016587676262526027, "tps": 387551, "wall": 3150.2} {"step": 18629, "train_loss": 3.2027244567871094, "lr": 0.00016585849149504183, "tps": 386938, "wall": 3155.4} {"step": 18630, "train_loss": 3.2436325550079346, "lr": 0.0001658402209781413, "tps": 386333, "wall": 3160.5} {"step": 18631, "train_loss": 3.2770168781280518, "lr": 0.00016582195107476565, "tps": 385716, "wall": 3165.7} {"step": 18632, "train_loss": 3.2194814682006836, "lr": 0.00016580368178512194, "tps": 385116, "wall": 3170.8} {"step": 18633, "train_loss": 3.162499189376831, "lr": 0.00016578541310941693, "tps": 384514, "wall": 3175.9} {"step": 18634, "train_loss": 3.1854166984558105, "lr": 0.00016576714504785777, "tps": 383918, "wall": 3181.1} {"step": 18635, "train_loss": 3.2050137519836426, "lr": 0.00016574887760065137, "tps": 383318, "wall": 3186.2} {"step": 18636, "train_loss": 3.298200845718384, "lr": 0.0001657306107680045, "tps": 382717, "wall": 3191.4} {"step": 18637, "train_loss": 3.2255020141601562, "lr": 0.00016571234455012426, "tps": 382119, "wall": 3196.5} {"step": 18638, "train_loss": 3.246384382247925, "lr": 0.00016569407894721753, "tps": 381525, "wall": 3201.7} {"step": 18639, "train_loss": 3.1682257652282715, "lr": 0.00016567581395949125, "tps": 380937, "wall": 3206.8} {"step": 18640, "train_loss": 3.360175132751465, "lr": 0.00016565754958715223, "tps": 380353, "wall": 3211.9} {"step": 18641, "train_loss": 3.137700080871582, "lr": 0.00016563928583040744, "tps": 379766, "wall": 3217.0} {"step": 18642, "train_loss": 3.0923080444335938, "lr": 0.0001656210226894638, "tps": 379178, "wall": 3222.2} {"step": 18643, "train_loss": 3.239614963531494, "lr": 0.0001656027601645281, "tps": 378585, "wall": 3227.4} {"step": 18644, "train_loss": 3.2566471099853516, "lr": 0.00016558449825580728, "tps": 378001, "wall": 3232.6} {"step": 18645, "train_loss": 3.1947295665740967, "lr": 0.00016556623696350827, "tps": 377417, "wall": 3237.8} {"step": 18646, "train_loss": 3.2118618488311768, "lr": 0.00016554797628783784, "tps": 376833, "wall": 3242.9} {"step": 18647, "train_loss": 3.174499034881592, "lr": 0.00016552971622900287, "tps": 376260, "wall": 3248.1} {"step": 18648, "train_loss": 3.294996738433838, "lr": 0.0001655114567872102, "tps": 375685, "wall": 3253.2} {"step": 18649, "train_loss": 3.2337703704833984, "lr": 0.00016549319796266672, "tps": 375116, "wall": 3258.3} {"step": 18650, "train_loss": 3.1330366134643555, "lr": 0.00016547493975557927, "tps": 374552, "wall": 3263.4} {"step": 18651, "train_loss": 3.2522850036621094, "lr": 0.0001654566821661546, "tps": 373979, "wall": 3268.6} {"step": 18652, "train_loss": 3.218860149383545, "lr": 0.0001654384251945996, "tps": 373414, "wall": 3273.7} {"step": 18653, "train_loss": 3.2604756355285645, "lr": 0.00016542016884112107, "tps": 372842, "wall": 3278.9} {"step": 18654, "train_loss": 3.2880988121032715, "lr": 0.0001654019131059258, "tps": 372280, "wall": 3284.0} {"step": 18655, "train_loss": 3.2587804794311523, "lr": 0.00016538365798922068, "tps": 371712, "wall": 3289.2} {"step": 18656, "train_loss": 3.2740297317504883, "lr": 0.0001653654034912124, "tps": 371157, "wall": 3294.3} {"step": 18657, "train_loss": 3.2602810859680176, "lr": 0.00016534714961210776, "tps": 370605, "wall": 3299.4} {"step": 18658, "train_loss": 3.1533350944519043, "lr": 0.0001653288963521136, "tps": 370053, "wall": 3304.5} {"step": 18659, "train_loss": 3.236123561859131, "lr": 0.00016531064371143667, "tps": 369504, "wall": 3309.6} {"step": 18660, "train_loss": 3.1460018157958984, "lr": 0.00016529239169028368, "tps": 368954, "wall": 3314.7} {"step": 18661, "train_loss": 3.178659200668335, "lr": 0.00016527414028886148, "tps": 368400, "wall": 3319.8} {"step": 18662, "train_loss": 3.2088799476623535, "lr": 0.0001652558895073768, "tps": 367839, "wall": 3325.1} {"step": 18663, "train_loss": 3.1725709438323975, "lr": 0.00016523763934603628, "tps": 367266, "wall": 3330.5} {"step": 18664, "train_loss": 3.209371328353882, "lr": 0.00016521938980504678, "tps": 366721, "wall": 3335.6} {"step": 18665, "train_loss": 3.196645498275757, "lr": 0.00016520114088461503, "tps": 366176, "wall": 3340.7} {"step": 18666, "train_loss": 3.1828346252441406, "lr": 0.00016518289258494773, "tps": 365625, "wall": 3345.9} {"step": 18667, "train_loss": 3.2639551162719727, "lr": 0.0001651646449062515, "tps": 365086, "wall": 3351.1} {"step": 18668, "train_loss": 3.3056554794311523, "lr": 0.00016514639784873323, "tps": 364552, "wall": 3356.1} {"step": 18669, "train_loss": 3.1789698600769043, "lr": 0.0001651281514125995, "tps": 364022, "wall": 3361.2} {"step": 18670, "train_loss": 3.150164842605591, "lr": 0.00016510990559805703, "tps": 363484, "wall": 3366.4} {"step": 18671, "train_loss": 3.239001512527466, "lr": 0.00016509166040531254, "tps": 362956, "wall": 3371.4} {"step": 18672, "train_loss": 3.2001376152038574, "lr": 0.00016507341583457262, "tps": 362427, "wall": 3376.5} {"step": 18673, "train_loss": 3.1785640716552734, "lr": 0.0001650551718860441, "tps": 361895, "wall": 3381.7} {"step": 18674, "train_loss": 3.253276824951172, "lr": 0.00016503692855993353, "tps": 361371, "wall": 3386.8} {"step": 18675, "train_loss": 3.20330548286438, "lr": 0.00016501868585644763, "tps": 360846, "wall": 3391.9} {"step": 18676, "train_loss": 3.197370767593384, "lr": 0.00016500044377579305, "tps": 360317, "wall": 3397.0} {"step": 18677, "train_loss": 3.141035318374634, "lr": 0.00016498220231817636, "tps": 359787, "wall": 3402.2} {"step": 18678, "train_loss": 3.1863512992858887, "lr": 0.00016496396148380423, "tps": 359254, "wall": 3407.5} {"step": 18679, "train_loss": 3.2773709297180176, "lr": 0.0001649457212728834, "tps": 358729, "wall": 3412.6} {"step": 18680, "train_loss": 3.202155828475952, "lr": 0.00016492748168562041, "tps": 358209, "wall": 3417.8} {"step": 18681, "train_loss": 3.330984592437744, "lr": 0.00016490924272222185, "tps": 357689, "wall": 3422.9} {"step": 18682, "train_loss": 3.269608974456787, "lr": 0.0001648910043828944, "tps": 357174, "wall": 3428.0} {"step": 18683, "train_loss": 3.1421751976013184, "lr": 0.00016487276666784468, "tps": 356652, "wall": 3433.2} {"step": 18684, "train_loss": 3.1138792037963867, "lr": 0.00016485452957727917, "tps": 356113, "wall": 3438.6} {"step": 18685, "train_loss": 3.219214916229248, "lr": 0.00016483629311140452, "tps": 355563, "wall": 3444.1} {"step": 18686, "train_loss": 3.253371238708496, "lr": 0.0001648180572704274, "tps": 355056, "wall": 3449.2} {"step": 18687, "train_loss": 3.2825145721435547, "lr": 0.0001647998220545542, "tps": 354551, "wall": 3454.3} {"step": 18688, "train_loss": 3.25343656539917, "lr": 0.00016478158746399167, "tps": 354035, "wall": 3459.6} {"step": 18689, "train_loss": 3.1427154541015625, "lr": 0.00016476335349894635, "tps": 353512, "wall": 3464.8} {"step": 18690, "train_loss": 3.235978841781616, "lr": 0.00016474512015962468, "tps": 352988, "wall": 3470.2} {"step": 18691, "train_loss": 3.125157356262207, "lr": 0.00016472688744623327, "tps": 352468, "wall": 3475.5} {"step": 18692, "train_loss": 3.264341354370117, "lr": 0.00016470865535897868, "tps": 351958, "wall": 3480.7} {"step": 18693, "train_loss": 3.196444034576416, "lr": 0.0001646904238980675, "tps": 351442, "wall": 3486.0} {"step": 18694, "train_loss": 3.219820976257324, "lr": 0.00016467219306370612, "tps": 350929, "wall": 3491.3} {"step": 18695, "train_loss": 3.198115110397339, "lr": 0.00016465396285610115, "tps": 350439, "wall": 3496.4} {"step": 18696, "train_loss": 3.261605739593506, "lr": 0.00016463573327545912, "tps": 349939, "wall": 3501.5} {"step": 18697, "train_loss": 3.176708936691284, "lr": 0.00016461750432198645, "tps": 349426, "wall": 3506.9} {"step": 18698, "train_loss": 3.1300530433654785, "lr": 0.0001645992759958897, "tps": 348929, "wall": 3512.1} {"step": 18699, "train_loss": 3.249258041381836, "lr": 0.0001645810482973753, "tps": 348450, "wall": 3517.1} {"step": 18700, "train_loss": 3.2454521656036377, "lr": 0.0001645628212266499, "tps": 347970, "wall": 3522.1} {"step": 18701, "train_loss": 3.24505615234375, "lr": 0.0001645445947839198, "tps": 347473, "wall": 3527.3} {"step": 18702, "train_loss": 3.2373876571655273, "lr": 0.0001645263689693915, "tps": 346974, "wall": 3532.6} {"step": 18703, "train_loss": 3.2765512466430664, "lr": 0.00016450814378327153, "tps": 346506, "wall": 3537.6} {"step": 18704, "train_loss": 3.183556318283081, "lr": 0.00016448991922576628, "tps": 346036, "wall": 3542.5} {"step": 18705, "train_loss": 3.201997995376587, "lr": 0.00016447169529708222, "tps": 345566, "wall": 3547.6} {"step": 18706, "train_loss": 3.310127019882202, "lr": 0.00016445347199742588, "tps": 345104, "wall": 3552.5} {"step": 18707, "train_loss": 3.1808247566223145, "lr": 0.0001644352493270035, "tps": 344633, "wall": 3557.5} {"step": 18708, "train_loss": 3.2606589794158936, "lr": 0.0001644170272860217, "tps": 344174, "wall": 3562.5} {"step": 18709, "train_loss": 3.1093106269836426, "lr": 0.00016439880587468676, "tps": 343714, "wall": 3567.4} {"step": 18710, "train_loss": 3.238856315612793, "lr": 0.00016438058509320524, "tps": 343258, "wall": 3572.4} {"step": 18711, "train_loss": 3.2357325553894043, "lr": 0.0001643623649417834, "tps": 342801, "wall": 3577.3} {"step": 18712, "train_loss": 3.2411234378814697, "lr": 0.00016434414542062774, "tps": 342341, "wall": 3582.3} {"step": 18713, "train_loss": 3.1563382148742676, "lr": 0.00016432592652994461, "tps": 341883, "wall": 3587.3} {"step": 18714, "train_loss": 3.2225160598754883, "lr": 0.00016430770826994038, "tps": 341420, "wall": 3592.4} {"step": 18715, "train_loss": 3.3066844940185547, "lr": 0.0001642894906408214, "tps": 340959, "wall": 3597.4} {"step": 18716, "train_loss": 3.288944959640503, "lr": 0.00016427127364279412, "tps": 340503, "wall": 3602.4} {"step": 18717, "train_loss": 3.164687156677246, "lr": 0.00016425305727606491, "tps": 340053, "wall": 3607.4} {"step": 18718, "train_loss": 3.241823673248291, "lr": 0.00016423484154084, "tps": 339604, "wall": 3612.3} {"step": 18719, "train_loss": 3.1523776054382324, "lr": 0.00016421662643732586, "tps": 339160, "wall": 3617.3} {"step": 18720, "train_loss": 3.215252637863159, "lr": 0.00016419841196572884, "tps": 338717, "wall": 3622.2} {"step": 18721, "train_loss": 3.2526168823242188, "lr": 0.00016418019812625514, "tps": 338275, "wall": 3627.1} {"step": 18722, "train_loss": 3.2350478172302246, "lr": 0.00016416198491911126, "tps": 337830, "wall": 3632.1} {"step": 18723, "train_loss": 3.2006871700286865, "lr": 0.0001641437723445034, "tps": 337392, "wall": 3637.0} {"step": 18724, "train_loss": 3.258021831512451, "lr": 0.0001641255604026379, "tps": 336942, "wall": 3642.0} {"step": 18725, "train_loss": 3.1983423233032227, "lr": 0.00016410734909372106, "tps": 336499, "wall": 3647.0} {"step": 18726, "train_loss": 3.2608752250671387, "lr": 0.00016408913841795922, "tps": 336051, "wall": 3652.1} {"step": 18727, "train_loss": 3.244786262512207, "lr": 0.00016407092837555863, "tps": 335613, "wall": 3657.1} {"step": 18728, "train_loss": 3.2068819999694824, "lr": 0.00016405271896672563, "tps": 335178, "wall": 3662.0} {"step": 18729, "train_loss": 3.258103847503662, "lr": 0.0001640345101916664, "tps": 334745, "wall": 3666.9} {"step": 18730, "train_loss": 3.2129998207092285, "lr": 0.0001640163020505873, "tps": 334313, "wall": 3671.9} {"step": 18731, "train_loss": 3.1495296955108643, "lr": 0.00016399809454369457, "tps": 333860, "wall": 3677.0} {"step": 18732, "train_loss": 3.2258405685424805, "lr": 0.00016397988767119439, "tps": 333399, "wall": 3682.3} {"step": 18733, "train_loss": 3.1664297580718994, "lr": 0.00016396168143329316, "tps": 332956, "wall": 3687.4} {"step": 18734, "train_loss": 3.2262625694274902, "lr": 0.00016394347583019697, "tps": 332511, "wall": 3692.6} {"step": 18735, "train_loss": 3.240783452987671, "lr": 0.00016392527086211213, "tps": 332078, "wall": 3697.6} {"step": 18736, "train_loss": 3.2854743003845215, "lr": 0.00016390706652924487, "tps": 331631, "wall": 3702.8} {"step": 18737, "train_loss": 3.2159745693206787, "lr": 0.00016388886283180142, "tps": 331174, "wall": 3708.1} {"step": 18738, "train_loss": 3.1814961433410645, "lr": 0.0001638706597699879, "tps": 330739, "wall": 3713.1} {"step": 18739, "train_loss": 3.2171356678009033, "lr": 0.00016385245734401065, "tps": 330307, "wall": 3718.2} {"step": 18740, "train_loss": 3.2573671340942383, "lr": 0.00016383425555407578, "tps": 329876, "wall": 3723.2} {"step": 18741, "train_loss": 3.070925235748291, "lr": 0.00016381605440038944, "tps": 329445, "wall": 3728.3} {"step": 18742, "train_loss": 3.192434072494507, "lr": 0.00016379785388315792, "tps": 329011, "wall": 3733.4} {"step": 18743, "train_loss": 3.2442240715026855, "lr": 0.0001637796540025874, "tps": 328589, "wall": 3738.4} {"step": 18744, "train_loss": 3.2018637657165527, "lr": 0.00016376145475888393, "tps": 328161, "wall": 3743.5} {"step": 18745, "train_loss": 3.297017812728882, "lr": 0.00016374325615225378, "tps": 327737, "wall": 3748.5} {"step": 18746, "train_loss": 3.111323833465576, "lr": 0.00016372505818290306, "tps": 327313, "wall": 3753.6} {"step": 18747, "train_loss": 3.2201595306396484, "lr": 0.00016370686085103792, "tps": 326893, "wall": 3758.6} {"step": 18748, "train_loss": 3.353745222091675, "lr": 0.0001636886641568645, "tps": 326474, "wall": 3763.6} {"step": 18749, "train_loss": 3.214190721511841, "lr": 0.00016367046810058895, "tps": 326052, "wall": 3768.7} {"step": 18750, "train_loss": 3.1884517669677734, "lr": 0.00016365227268241742, "tps": 325637, "wall": 3773.7} {"step": 18751, "train_loss": 3.2547531127929688, "lr": 0.00016363407790255595, "tps": 325219, "wall": 3778.8} {"step": 18752, "train_loss": 3.1336119174957275, "lr": 0.00016361588376121068, "tps": 324802, "wall": 3783.8} {"step": 18753, "train_loss": 3.1573967933654785, "lr": 0.00016359769025858775, "tps": 324392, "wall": 3788.8} {"step": 18754, "train_loss": 3.167726993560791, "lr": 0.0001635794973948933, "tps": 323983, "wall": 3793.8} {"step": 18755, "train_loss": 3.0999932289123535, "lr": 0.00016356130517033326, "tps": 323576, "wall": 3798.8} {"step": 18756, "train_loss": 3.332409381866455, "lr": 0.00016354311358511385, "tps": 323171, "wall": 3803.7} {"step": 18757, "train_loss": 3.1903672218322754, "lr": 0.00016352492263944107, "tps": 322768, "wall": 3808.7} {"step": 18758, "train_loss": 3.1844615936279297, "lr": 0.00016350673233352108, "tps": 322366, "wall": 3813.6} {"step": 18759, "train_loss": 3.255976676940918, "lr": 0.00016348854266755983, "tps": 321962, "wall": 3818.6} {"step": 18760, "train_loss": 3.186549663543701, "lr": 0.00016347035364176347, "tps": 321560, "wall": 3823.6} {"step": 18761, "train_loss": 3.2170002460479736, "lr": 0.00016345216525633799, "tps": 321159, "wall": 3828.6} {"step": 18762, "train_loss": 3.269423484802246, "lr": 0.0001634339775114894, "tps": 320760, "wall": 3833.6} {"step": 18763, "train_loss": 3.2589478492736816, "lr": 0.0001634157904074238, "tps": 320357, "wall": 3838.6} {"step": 18764, "train_loss": 3.1007189750671387, "lr": 0.00016339760394434716, "tps": 319964, "wall": 3843.5} {"step": 18765, "train_loss": 3.1555140018463135, "lr": 0.0001633794181224656, "tps": 319569, "wall": 3848.5} {"step": 18766, "train_loss": 3.22273325920105, "lr": 0.000163361232941985, "tps": 319178, "wall": 3853.4} {"step": 18767, "train_loss": 3.2055840492248535, "lr": 0.00016334304840311142, "tps": 318759, "wall": 3858.6} {"step": 18768, "train_loss": 3.188178062438965, "lr": 0.00016332486450605088, "tps": 318354, "wall": 3863.8} {"step": 18769, "train_loss": 3.2503857612609863, "lr": 0.0001633066812510093, "tps": 317956, "wall": 3868.8} {"step": 18770, "train_loss": 3.1565539836883545, "lr": 0.00016328849863819276, "tps": 317554, "wall": 3873.9} {"step": 18771, "train_loss": 3.203619956970215, "lr": 0.00016327031666780713, "tps": 317165, "wall": 3878.9} {"step": 18772, "train_loss": 3.253633737564087, "lr": 0.0001632521353400584, "tps": 316774, "wall": 3883.9} {"step": 18773, "train_loss": 3.1994359493255615, "lr": 0.00016323395465515255, "tps": 316376, "wall": 3889.0} {"step": 18774, "train_loss": 3.1404616832733154, "lr": 0.00016321577461329563, "tps": 315981, "wall": 3894.0} {"step": 18775, "train_loss": 3.2560057640075684, "lr": 0.00016319759521469339, "tps": 315590, "wall": 3899.0} {"step": 18776, "train_loss": 3.3059258460998535, "lr": 0.00016317941645955188, "tps": 315199, "wall": 3904.1} {"step": 18777, "train_loss": 3.2554988861083984, "lr": 0.00016316123834807705, "tps": 314814, "wall": 3909.1} {"step": 18778, "train_loss": 3.29103946685791, "lr": 0.00016314306088047474, "tps": 314431, "wall": 3914.0} {"step": 18779, "train_loss": 3.15209698677063, "lr": 0.00016312488405695094, "tps": 314051, "wall": 3919.0} {"step": 18780, "train_loss": 3.122377634048462, "lr": 0.00016310670787771155, "tps": 313665, "wall": 3924.0} {"step": 18781, "train_loss": 3.174044370651245, "lr": 0.00016308853234296242, "tps": 313282, "wall": 3929.0} {"step": 18782, "train_loss": 3.2384612560272217, "lr": 0.00016307035745290947, "tps": 312903, "wall": 3934.0} {"step": 18783, "train_loss": 3.1342215538024902, "lr": 0.0001630521832077586, "tps": 312523, "wall": 3939.0} {"step": 18784, "train_loss": 3.264561176300049, "lr": 0.0001630340096077157, "tps": 312143, "wall": 3944.0} {"step": 18785, "train_loss": 3.1607439517974854, "lr": 0.00016301583665298658, "tps": 311759, "wall": 3949.1} {"step": 18786, "train_loss": 3.3768749237060547, "lr": 0.00016299766434377716, "tps": 311381, "wall": 3954.1} {"step": 18787, "train_loss": 3.1933937072753906, "lr": 0.00016297949268029334, "tps": 311007, "wall": 3959.0} {"step": 18788, "train_loss": 3.2974696159362793, "lr": 0.00016296132166274086, "tps": 310634, "wall": 3964.0} {"step": 18789, "train_loss": 3.252896785736084, "lr": 0.00016294315129132558, "tps": 310261, "wall": 3969.0} {"step": 18790, "train_loss": 3.238722801208496, "lr": 0.0001629249815662534, "tps": 309888, "wall": 3974.0} {"step": 18791, "train_loss": 3.269820213317871, "lr": 0.00016290681248773016, "tps": 309516, "wall": 3979.0} {"step": 18792, "train_loss": 3.253228187561035, "lr": 0.00016288864405596161, "tps": 309147, "wall": 3983.9} {"step": 18793, "train_loss": 3.208204746246338, "lr": 0.00016287047627115358, "tps": 308779, "wall": 3988.9} {"step": 18794, "train_loss": 3.2536325454711914, "lr": 0.00016285230913351187, "tps": 308407, "wall": 3993.9} {"step": 18795, "train_loss": 3.266725540161133, "lr": 0.0001628341426432424, "tps": 308037, "wall": 3998.9} {"step": 18796, "train_loss": 3.1588478088378906, "lr": 0.00016281597680055073, "tps": 307664, "wall": 4004.0} {"step": 18797, "train_loss": 3.3231496810913086, "lr": 0.00016279781160564278, "tps": 307289, "wall": 4009.1} {"step": 18798, "train_loss": 3.1857128143310547, "lr": 0.00016277964705872436, "tps": 306922, "wall": 4014.1} {"step": 18799, "train_loss": 3.2704687118530273, "lr": 0.0001627614831600012, "tps": 306553, "wall": 4019.1} {"step": 18800, "train_loss": 3.1243276596069336, "lr": 0.000162743319909679, "tps": 306191, "wall": 4024.1} {"step": 18801, "train_loss": 3.269747018814087, "lr": 0.0001627251573079636, "tps": 305830, "wall": 4029.1} {"step": 18802, "train_loss": 3.2114248275756836, "lr": 0.0001627069953550607, "tps": 305473, "wall": 4034.0} {"step": 18803, "train_loss": 3.278486490249634, "lr": 0.00016268883405117608, "tps": 305117, "wall": 4038.9} {"step": 18804, "train_loss": 3.2711946964263916, "lr": 0.0001626706733965154, "tps": 304763, "wall": 4043.8} {"step": 18805, "train_loss": 3.2052183151245117, "lr": 0.00016265251339128448, "tps": 304410, "wall": 4048.7} {"step": 18806, "train_loss": 3.26198410987854, "lr": 0.00016263435403568902, "tps": 304057, "wall": 4053.6} {"step": 18807, "train_loss": 3.16243839263916, "lr": 0.00016261619532993463, "tps": 303700, "wall": 4058.6} {"step": 18808, "train_loss": 3.1947948932647705, "lr": 0.0001625980372742271, "tps": 303341, "wall": 4063.6} {"step": 18809, "train_loss": 3.217838764190674, "lr": 0.00016257987986877215, "tps": 302983, "wall": 4068.6} {"step": 18810, "train_loss": 3.2601513862609863, "lr": 0.0001625617231137754, "tps": 302631, "wall": 4073.6} {"step": 18811, "train_loss": 3.1799604892730713, "lr": 0.00016254356700944254, "tps": 302280, "wall": 4078.5} {"step": 18812, "train_loss": 3.1347920894622803, "lr": 0.00016252541155597933, "tps": 301929, "wall": 4083.5} {"step": 18813, "train_loss": 3.0974302291870117, "lr": 0.00016250725675359128, "tps": 301581, "wall": 4088.4} {"step": 18814, "train_loss": 3.1840429306030273, "lr": 0.0001624891026024842, "tps": 301234, "wall": 4093.4} {"step": 18815, "train_loss": 3.238529682159424, "lr": 0.0001624709491028636, "tps": 300883, "wall": 4098.4} {"step": 18816, "train_loss": 3.2053332328796387, "lr": 0.00016245279625493527, "tps": 300521, "wall": 4103.5} {"step": 18817, "train_loss": 3.2310070991516113, "lr": 0.00016243464405890477, "tps": 300166, "wall": 4108.6} {"step": 18818, "train_loss": 3.2012248039245605, "lr": 0.00016241649251497772, "tps": 299798, "wall": 4113.8} {"step": 18819, "train_loss": 3.269043445587158, "lr": 0.0001623983416233598, "tps": 299448, "wall": 4118.9} {"step": 18820, "train_loss": 3.219167709350586, "lr": 0.0001623801913842565, "tps": 299091, "wall": 4124.0} {"step": 18821, "train_loss": 3.26711106300354, "lr": 0.00016236204179787355, "tps": 298737, "wall": 4129.1} {"step": 18822, "train_loss": 3.2914962768554688, "lr": 0.00016234389286441653, "tps": 298394, "wall": 4134.1} {"step": 18823, "train_loss": 3.252410411834717, "lr": 0.00016232574458409103, "tps": 298052, "wall": 4139.0} {"step": 18824, "train_loss": 3.3664634227752686, "lr": 0.00016230759695710253, "tps": 297712, "wall": 4144.0} {"step": 18825, "train_loss": 3.257460594177246, "lr": 0.00016228944998365673, "tps": 297374, "wall": 4148.9} {"step": 18826, "train_loss": 3.123443365097046, "lr": 0.0001622713036639592, "tps": 297037, "wall": 4153.8} {"step": 18827, "train_loss": 3.1333260536193848, "lr": 0.00016225315799821543, "tps": 296699, "wall": 4158.8} {"step": 18828, "train_loss": 3.246983051300049, "lr": 0.00016223501298663102, "tps": 296364, "wall": 4163.7} {"step": 18829, "train_loss": 3.329892158508301, "lr": 0.00016221686862941153, "tps": 296029, "wall": 4168.6} {"step": 18830, "train_loss": 3.252906560897827, "lr": 0.00016219872492676248, "tps": 295696, "wall": 4173.6} {"step": 18831, "train_loss": 3.262890338897705, "lr": 0.00016218058187888933, "tps": 295363, "wall": 4178.5} {"step": 18832, "train_loss": 3.153700351715088, "lr": 0.0001621624394859977, "tps": 295027, "wall": 4183.5} {"step": 18833, "train_loss": 3.2020797729492188, "lr": 0.00016214429774829317, "tps": 294695, "wall": 4188.4} {"step": 18834, "train_loss": 3.29994535446167, "lr": 0.0001621261566659811, "tps": 294364, "wall": 4193.3} {"step": 18835, "train_loss": 3.2044124603271484, "lr": 0.000162108016239267, "tps": 294034, "wall": 4198.3} {"step": 18836, "train_loss": 3.219830274581909, "lr": 0.00016208987646835655, "tps": 293706, "wall": 4203.2} {"step": 18837, "train_loss": 3.1854209899902344, "lr": 0.000162071737353455, "tps": 293377, "wall": 4208.1} {"step": 18838, "train_loss": 3.2083804607391357, "lr": 0.000162053598894768, "tps": 293049, "wall": 4213.1} {"step": 18839, "train_loss": 3.3660154342651367, "lr": 0.000162035461092501, "tps": 292720, "wall": 4218.0} {"step": 18840, "train_loss": 3.245582103729248, "lr": 0.00016201732394685939, "tps": 292393, "wall": 4222.9} {"step": 18841, "train_loss": 3.274447441101074, "lr": 0.00016199918745804864, "tps": 292068, "wall": 4227.9} {"step": 18842, "train_loss": 3.136084794998169, "lr": 0.00016198105162627425, "tps": 291738, "wall": 4232.9} {"step": 18843, "train_loss": 3.115279197692871, "lr": 0.00016196291645174168, "tps": 291409, "wall": 4237.9} {"step": 18844, "train_loss": 3.1954782009124756, "lr": 0.0001619447819346563, "tps": 291084, "wall": 4242.8} {"step": 18845, "train_loss": 3.1513161659240723, "lr": 0.0001619266480752236, "tps": 290754, "wall": 4247.9} {"step": 18846, "train_loss": 3.1691155433654785, "lr": 0.00016190851487364895, "tps": 290431, "wall": 4252.8} {"step": 18847, "train_loss": 3.2525973320007324, "lr": 0.00016189038233013777, "tps": 290110, "wall": 4257.8} {"step": 18848, "train_loss": 3.250307321548462, "lr": 0.0001618722504448955, "tps": 289789, "wall": 4262.7} {"step": 18849, "train_loss": 3.2190794944763184, "lr": 0.00016185411921812754, "tps": 289469, "wall": 4267.7} {"step": 18850, "train_loss": 3.237694501876831, "lr": 0.00016183598865003926, "tps": 289149, "wall": 4272.6} {"step": 18851, "train_loss": 3.1396138668060303, "lr": 0.000161817858740836, "tps": 288830, "wall": 4277.5} {"step": 18852, "train_loss": 3.2215664386749268, "lr": 0.00016179972949072324, "tps": 288511, "wall": 4282.5} {"step": 18853, "train_loss": 3.300110101699829, "lr": 0.00016178160089990628, "tps": 288192, "wall": 4287.5} {"step": 18854, "train_loss": 3.3139240741729736, "lr": 0.0001617634729685905, "tps": 287875, "wall": 4292.4} {"step": 18855, "train_loss": 3.227632522583008, "lr": 0.00016174534569698122, "tps": 287559, "wall": 4297.4} {"step": 18856, "train_loss": 3.2236344814300537, "lr": 0.00016172721908528384, "tps": 287244, "wall": 4302.3} {"step": 18857, "train_loss": 3.3153045177459717, "lr": 0.00016170909313370366, "tps": 286923, "wall": 4307.3} {"step": 18858, "train_loss": 3.2753796577453613, "lr": 0.000161690967842446, "tps": 286607, "wall": 4312.3} {"step": 18859, "train_loss": 3.2909457683563232, "lr": 0.00016167284321171624, "tps": 286295, "wall": 4317.3} {"step": 18860, "train_loss": 3.263331890106201, "lr": 0.0001616547192417197, "tps": 285982, "wall": 4322.2} {"step": 18861, "train_loss": 3.2109475135803223, "lr": 0.0001616365959326616, "tps": 285670, "wall": 4327.2} {"step": 18862, "train_loss": 3.156780481338501, "lr": 0.00016161847328474734, "tps": 285354, "wall": 4332.2} {"step": 18863, "train_loss": 3.2415175437927246, "lr": 0.00016160035129818217, "tps": 285041, "wall": 4337.2} {"step": 18864, "train_loss": 3.2870359420776367, "lr": 0.00016158222997317138, "tps": 284728, "wall": 4342.2} {"step": 18865, "train_loss": 3.1919188499450684, "lr": 0.00016156410930992022, "tps": 284416, "wall": 4347.2} {"step": 18866, "train_loss": 3.3241958618164062, "lr": 0.00016154598930863404, "tps": 284104, "wall": 4352.2} {"step": 18867, "train_loss": 3.168476104736328, "lr": 0.00016152786996951802, "tps": 283793, "wall": 4357.2} {"step": 18868, "train_loss": 3.2361862659454346, "lr": 0.00016150975129277742, "tps": 283483, "wall": 4362.2} {"step": 18869, "train_loss": 3.2379071712493896, "lr": 0.00016149163327861755, "tps": 283168, "wall": 4367.2} {"step": 18870, "train_loss": 3.20632266998291, "lr": 0.00016147351592724367, "tps": 282860, "wall": 4372.2} {"step": 18871, "train_loss": 3.212897300720215, "lr": 0.0001614553992388609, "tps": 282550, "wall": 4377.2} {"step": 18872, "train_loss": 3.214235782623291, "lr": 0.00016143728321367458, "tps": 282243, "wall": 4382.2} {"step": 18873, "train_loss": 3.1779837608337402, "lr": 0.00016141916785188988, "tps": 281929, "wall": 4387.4} {"step": 18874, "train_loss": 3.3009533882141113, "lr": 0.00016140105315371202, "tps": 281624, "wall": 4392.3} {"step": 18875, "train_loss": 3.2055304050445557, "lr": 0.00016138293911934618, "tps": 281315, "wall": 4397.4} {"step": 18876, "train_loss": 3.261903762817383, "lr": 0.0001613648257489976, "tps": 281011, "wall": 4402.4} {"step": 18877, "train_loss": 3.192735195159912, "lr": 0.00016134671304287142, "tps": 280707, "wall": 4407.4} {"step": 18878, "train_loss": 3.2260403633117676, "lr": 0.00016132860100117284, "tps": 280397, "wall": 4412.5} {"step": 18879, "train_loss": 3.1003432273864746, "lr": 0.00016131048962410703, "tps": 280087, "wall": 4417.6} {"step": 18880, "train_loss": 3.164961814880371, "lr": 0.0001612923789118792, "tps": 279777, "wall": 4422.7} {"step": 18881, "train_loss": 3.2372264862060547, "lr": 0.00016127426886469447, "tps": 279463, "wall": 4428.0} {"step": 18882, "train_loss": 3.1227996349334717, "lr": 0.000161256159482758, "tps": 279151, "wall": 4433.1} {"step": 18883, "train_loss": 3.2792534828186035, "lr": 0.00016123805076627496, "tps": 278845, "wall": 4438.2} {"step": 18884, "train_loss": 3.249234437942505, "lr": 0.00016121994271545042, "tps": 278539, "wall": 4443.3} {"step": 18885, "train_loss": 3.2488558292388916, "lr": 0.00016120183533048957, "tps": 278233, "wall": 4448.5} {"step": 18886, "train_loss": 3.190122127532959, "lr": 0.0001611837286115975, "tps": 277927, "wall": 4453.6} {"step": 18887, "train_loss": 3.255979061126709, "lr": 0.00016116562255897936, "tps": 277622, "wall": 4458.7} {"step": 18888, "train_loss": 3.1567299365997314, "lr": 0.0001611475171728402, "tps": 277313, "wall": 4463.9} {"step": 18889, "train_loss": 3.1386842727661133, "lr": 0.00016112941245338512, "tps": 277010, "wall": 4469.1} {"step": 18890, "train_loss": 3.2176401615142822, "lr": 0.00016111130840081928, "tps": 276708, "wall": 4474.2} {"step": 18891, "train_loss": 3.4112024307250977, "lr": 0.00016109320501534775, "tps": 276405, "wall": 4479.3} {"step": 18892, "train_loss": 3.147789239883423, "lr": 0.00016107510229717553, "tps": 276102, "wall": 4484.5} {"step": 18893, "train_loss": 3.173384666442871, "lr": 0.0001610570002465078, "tps": 275797, "wall": 4489.7} {"step": 18894, "train_loss": 3.2521986961364746, "lr": 0.00016103889886354952, "tps": 275492, "wall": 4494.9} {"step": 18895, "train_loss": 3.1712584495544434, "lr": 0.00016102079814850576, "tps": 275189, "wall": 4500.1} {"step": 18896, "train_loss": 3.311678409576416, "lr": 0.00016100269810158163, "tps": 274886, "wall": 4505.3} {"step": 18897, "train_loss": 3.3343584537506104, "lr": 0.0001609845987229821, "tps": 274583, "wall": 4510.5} {"step": 18898, "train_loss": 3.2095589637756348, "lr": 0.00016096650001291228, "tps": 274281, "wall": 4515.7} {"step": 18899, "train_loss": 3.2259674072265625, "lr": 0.00016094840197157707, "tps": 273982, "wall": 4520.8} {"step": 18900, "train_loss": 3.246372938156128, "lr": 0.0001609303045991816, "tps": 273681, "wall": 4526.0} {"step": 18901, "train_loss": 3.2388076782226562, "lr": 0.0001609122078959308, "tps": 273382, "wall": 4531.2} {"step": 18902, "train_loss": 3.282797336578369, "lr": 0.00016089411186202975, "tps": 273084, "wall": 4536.4} {"step": 18903, "train_loss": 3.276393413543701, "lr": 0.00016087601649768338, "tps": 272785, "wall": 4541.6} {"step": 18904, "train_loss": 3.279265880584717, "lr": 0.0001608579218030967, "tps": 272483, "wall": 4546.9} {"step": 18905, "train_loss": 3.240539073944092, "lr": 0.00016083982777847467, "tps": 272186, "wall": 4552.1} {"step": 18906, "train_loss": 3.1943440437316895, "lr": 0.00016082173442402223, "tps": 271889, "wall": 4557.3} {"step": 18907, "train_loss": 3.1539015769958496, "lr": 0.00016080364173994447, "tps": 271594, "wall": 4562.5} {"step": 18908, "train_loss": 3.1873011589050293, "lr": 0.00016078554972644623, "tps": 271297, "wall": 4567.8} {"step": 18909, "train_loss": 3.2181546688079834, "lr": 0.00016076745838373245, "tps": 271004, "wall": 4572.9} {"step": 18910, "train_loss": 3.204749345779419, "lr": 0.00016074936771200818, "tps": 270710, "wall": 4578.1} {"step": 18911, "train_loss": 3.1656274795532227, "lr": 0.00016073127771147817, "tps": 270417, "wall": 4583.3} {"step": 18912, "train_loss": 3.1958930492401123, "lr": 0.00016071318838234753, "tps": 270126, "wall": 4588.5} {"step": 18913, "train_loss": 3.243664264678955, "lr": 0.00016069509972482107, "tps": 269832, "wall": 4593.8} {"step": 18914, "train_loss": 3.2508106231689453, "lr": 0.00016067701173910374, "tps": 269542, "wall": 4599.0} {"step": 18915, "train_loss": 3.194397449493408, "lr": 0.00016065892442540048, "tps": 269246, "wall": 4604.3} {"step": 18916, "train_loss": 3.21034574508667, "lr": 0.000160640837783916, "tps": 268950, "wall": 4609.6} {"step": 18917, "train_loss": 3.1969945430755615, "lr": 0.00016062275181485548, "tps": 268657, "wall": 4614.8} {"step": 18918, "train_loss": 3.2904741764068604, "lr": 0.00016060466651842355, "tps": 268366, "wall": 4620.1} {"step": 18919, "train_loss": 3.134617328643799, "lr": 0.00016058658189482515, "tps": 268074, "wall": 4625.4} {"step": 18920, "train_loss": 3.1907057762145996, "lr": 0.00016056849794426526, "tps": 267785, "wall": 4630.6} {"step": 18921, "train_loss": 3.203084945678711, "lr": 0.00016055041466694854, "tps": 267485, "wall": 4636.0} {"step": 18922, "train_loss": 3.1589715480804443, "lr": 0.00016053233206307996, "tps": 267198, "wall": 4641.3} {"step": 18923, "train_loss": 3.181334972381592, "lr": 0.00016051425013286435, "tps": 266901, "wall": 4646.7} {"step": 18924, "train_loss": 3.254195213317871, "lr": 0.00016049616887650657, "tps": 266615, "wall": 4651.9} {"step": 18925, "train_loss": 3.2879700660705566, "lr": 0.0001604780882942114, "tps": 266331, "wall": 4657.1} {"step": 18926, "train_loss": 3.2071609497070312, "lr": 0.0001604600083861836, "tps": 266048, "wall": 4662.3} {"step": 18927, "train_loss": 3.2974441051483154, "lr": 0.0001604419291526281, "tps": 265761, "wall": 4667.6} {"step": 18928, "train_loss": 3.1037330627441406, "lr": 0.00016042385059374966, "tps": 265480, "wall": 4672.8} {"step": 18929, "train_loss": 3.233140468597412, "lr": 0.00016040577270975303, "tps": 265195, "wall": 4678.0} {"step": 18930, "train_loss": 3.2231531143188477, "lr": 0.00016038769550084307, "tps": 264913, "wall": 4683.3} {"step": 18931, "train_loss": 3.170924663543701, "lr": 0.00016036961896722448, "tps": 264630, "wall": 4688.5} {"step": 18932, "train_loss": 3.2027883529663086, "lr": 0.00016035154310910205, "tps": 264341, "wall": 4693.9} {"step": 18933, "train_loss": 3.238187551498413, "lr": 0.00016033346792668064, "tps": 264050, "wall": 4699.3} {"step": 18934, "train_loss": 3.1902663707733154, "lr": 0.0001603153934201649, "tps": 263771, "wall": 4704.6} {"step": 18935, "train_loss": 3.1410794258117676, "lr": 0.0001602973195897596, "tps": 263488, "wall": 4709.8} {"step": 18936, "train_loss": 3.280715227127075, "lr": 0.0001602792464356695, "tps": 263207, "wall": 4715.1} {"step": 18937, "train_loss": 3.291881799697876, "lr": 0.00016026117395809934, "tps": 262929, "wall": 4720.4} {"step": 18938, "train_loss": 3.1426262855529785, "lr": 0.0001602431021572538, "tps": 262647, "wall": 4725.7} {"step": 18939, "train_loss": 3.3687381744384766, "lr": 0.00016022503103333766, "tps": 262382, "wall": 4730.7} {"step": 18940, "train_loss": 3.252866744995117, "lr": 0.0001602069605865556, "tps": 262116, "wall": 4735.7} {"step": 18941, "train_loss": 3.179286241531372, "lr": 0.00016018889081711234, "tps": 261825, "wall": 4741.3} {"step": 18942, "train_loss": 3.2040140628814697, "lr": 0.0001601708217252125, "tps": 261552, "wall": 4746.5} {"step": 18943, "train_loss": 3.190093517303467, "lr": 0.00016015275331106085, "tps": 261274, "wall": 4751.8} {"step": 18944, "train_loss": 3.2463839054107666, "lr": 0.00016013468557486213, "tps": 261011, "wall": 4756.8} {"step": 18945, "train_loss": 3.2752108573913574, "lr": 0.00016011661851682085, "tps": 260750, "wall": 4761.8} {"step": 18946, "train_loss": 3.2599246501922607, "lr": 0.0001600985521371418, "tps": 260488, "wall": 4766.9} {"step": 18947, "train_loss": 3.1827664375305176, "lr": 0.00016008048643602956, "tps": 260228, "wall": 4771.9} {"step": 18948, "train_loss": 3.3451037406921387, "lr": 0.00016006242141368882, "tps": 259966, "wall": 4776.9} {"step": 18949, "train_loss": 3.2349953651428223, "lr": 0.00016004435707032418, "tps": 259702, "wall": 4782.0} {"step": 18950, "train_loss": 3.2346715927124023, "lr": 0.00016002629340614033, "tps": 259436, "wall": 4787.2} {"step": 18951, "train_loss": 3.2599596977233887, "lr": 0.0001600082304213419, "tps": 259173, "wall": 4792.3} {"step": 18952, "train_loss": 3.1648144721984863, "lr": 0.00015999016811613345, "tps": 258911, "wall": 4797.4} {"step": 18953, "train_loss": 3.2338242530822754, "lr": 0.00015997210649071962, "tps": 258650, "wall": 4802.5} {"step": 18954, "train_loss": 3.2334542274475098, "lr": 0.00015995404554530507, "tps": 258387, "wall": 4807.6} {"step": 18955, "train_loss": 3.1350181102752686, "lr": 0.00015993598528009427, "tps": 258125, "wall": 4812.8} {"step": 18956, "train_loss": 3.140904426574707, "lr": 0.00015991792569529188, "tps": 257864, "wall": 4817.9} {"step": 18957, "train_loss": 3.15860652923584, "lr": 0.00015989986679110257, "tps": 257604, "wall": 4823.0} {"step": 18958, "train_loss": 3.282909870147705, "lr": 0.0001598818085677307, "tps": 257345, "wall": 4828.1} {"step": 18959, "train_loss": 3.13313627243042, "lr": 0.00015986375102538102, "tps": 257091, "wall": 4833.2} {"step": 18960, "train_loss": 3.1784439086914062, "lr": 0.00015984569416425802, "tps": 256836, "wall": 4838.2} {"step": 18961, "train_loss": 3.1037638187408447, "lr": 0.00015982763798456624, "tps": 256580, "wall": 4843.3} {"step": 18962, "train_loss": 3.137359142303467, "lr": 0.00015980958248651024, "tps": 256324, "wall": 4848.4} {"step": 18963, "train_loss": 3.1934547424316406, "lr": 0.0001597915276702945, "tps": 256070, "wall": 4853.5} {"step": 18964, "train_loss": 3.1408066749572754, "lr": 0.00015977347353612374, "tps": 255815, "wall": 4858.6} {"step": 18965, "train_loss": 3.230217218399048, "lr": 0.00015975542008420218, "tps": 255556, "wall": 4863.7} {"step": 18966, "train_loss": 3.222574234008789, "lr": 0.00015973736731473456, "tps": 255299, "wall": 4868.9} {"step": 18967, "train_loss": 3.2269797325134277, "lr": 0.00015971931522792526, "tps": 255040, "wall": 4874.1} {"step": 18968, "train_loss": 3.210980176925659, "lr": 0.0001597012638239788, "tps": 254782, "wall": 4879.3} {"step": 18969, "train_loss": 3.2333691120147705, "lr": 0.00015968321310309976, "tps": 254525, "wall": 4884.5} {"step": 18970, "train_loss": 3.1744136810302734, "lr": 0.00015966516306549245, "tps": 254271, "wall": 4889.6} {"step": 18971, "train_loss": 3.2702598571777344, "lr": 0.0001596471137113615, "tps": 254014, "wall": 4894.8} {"step": 18972, "train_loss": 3.136093854904175, "lr": 0.0001596290650409113, "tps": 253759, "wall": 4900.0} {"step": 18973, "train_loss": 3.2456612586975098, "lr": 0.00015961101705434628, "tps": 253503, "wall": 4905.2} {"step": 18974, "train_loss": 3.204662322998047, "lr": 0.00015959296975187094, "tps": 253246, "wall": 4910.4} {"step": 18975, "train_loss": 3.1944544315338135, "lr": 0.00015957492313368974, "tps": 252990, "wall": 4915.6} {"step": 18976, "train_loss": 3.1813597679138184, "lr": 0.00015955687720000706, "tps": 252736, "wall": 4920.8} {"step": 18977, "train_loss": 3.260594367980957, "lr": 0.00015953883195102736, "tps": 252481, "wall": 4926.1} {"step": 18978, "train_loss": 3.1537013053894043, "lr": 0.000159520787386955, "tps": 252227, "wall": 4931.3} {"step": 18979, "train_loss": 3.2380034923553467, "lr": 0.0001595027435079945, "tps": 251968, "wall": 4936.6} {"step": 18980, "train_loss": 3.1756591796875, "lr": 0.00015948470031435018, "tps": 251713, "wall": 4941.9} {"step": 18981, "train_loss": 3.2328009605407715, "lr": 0.00015946665780622635, "tps": 251459, "wall": 4947.1} {"step": 18982, "train_loss": 3.1273438930511475, "lr": 0.00015944861598382758, "tps": 251205, "wall": 4952.4} {"step": 18983, "train_loss": 3.2163515090942383, "lr": 0.00015943057484735823, "tps": 250953, "wall": 4957.6} {"step": 18984, "train_loss": 3.2493414878845215, "lr": 0.00015941253439702248, "tps": 250702, "wall": 4962.9} {"step": 18985, "train_loss": 3.2241463661193848, "lr": 0.00015939449463302485, "tps": 250445, "wall": 4968.2} {"step": 18986, "train_loss": 3.1178698539733887, "lr": 0.00015937645555556972, "tps": 250193, "wall": 4973.5} {"step": 18987, "train_loss": 3.0725042819976807, "lr": 0.00015935841716486132, "tps": 249940, "wall": 4978.8} {"step": 18988, "train_loss": 3.2155117988586426, "lr": 0.0001593403794611041, "tps": 249690, "wall": 4984.0} {"step": 18989, "train_loss": 3.288203239440918, "lr": 0.00015932234244450227, "tps": 249440, "wall": 4989.3} {"step": 18990, "train_loss": 3.2009174823760986, "lr": 0.0001593043061152603, "tps": 249189, "wall": 4994.6} {"step": 18991, "train_loss": 3.2120184898376465, "lr": 0.00015928627047358238, "tps": 248939, "wall": 4999.9} {"step": 18992, "train_loss": 3.2430124282836914, "lr": 0.0001592682355196729, "tps": 248680, "wall": 5005.3} {"step": 18993, "train_loss": 3.2295708656311035, "lr": 0.00015925020125373616, "tps": 248427, "wall": 5010.7} {"step": 18994, "train_loss": 3.2264974117279053, "lr": 0.00015923216767597638, "tps": 248173, "wall": 5016.1} {"step": 18995, "train_loss": 3.207690715789795, "lr": 0.0001592141347865979, "tps": 247927, "wall": 5021.3} {"step": 18996, "train_loss": 3.156282901763916, "lr": 0.00015919610258580504, "tps": 247673, "wall": 5026.7} {"step": 18997, "train_loss": 3.2122082710266113, "lr": 0.00015917807107380195, "tps": 247428, "wall": 5032.0} {"step": 18998, "train_loss": 3.125825881958008, "lr": 0.00015916004025079297, "tps": 247186, "wall": 5037.2} {"step": 18999, "train_loss": 3.141915798187256, "lr": 0.0001591420101169824, "tps": 246943, "wall": 5042.4} {"step": 19000, "train_loss": 3.2072885036468506, "lr": 0.0001591239806725744, "tps": 246699, "wall": 5047.6, "val_loss_monitor": 3.383429572428505} {"step": 19001, "train_loss": 3.160752296447754, "lr": 0.00015910595191777325, "tps": 244082, "wall": 5102.0} {"step": 19002, "train_loss": 3.2724575996398926, "lr": 0.00015908792385278315, "tps": 243855, "wall": 5107.1} {"step": 19003, "train_loss": 3.203174114227295, "lr": 0.00015906989647780835, "tps": 243624, "wall": 5112.2} {"step": 19004, "train_loss": 3.201399564743042, "lr": 0.00015905186979305307, "tps": 243396, "wall": 5117.2} {"step": 19005, "train_loss": 3.0484516620635986, "lr": 0.00015903384379872145, "tps": 243163, "wall": 5122.4} {"step": 19006, "train_loss": 3.193265438079834, "lr": 0.00015901581849501786, "tps": 242911, "wall": 5128.0} {"step": 19007, "train_loss": 3.2593493461608887, "lr": 0.0001589977938821463, "tps": 242679, "wall": 5133.2} {"step": 19008, "train_loss": 3.356161594390869, "lr": 0.00015897976996031104, "tps": 242449, "wall": 5138.3} {"step": 19009, "train_loss": 3.1645216941833496, "lr": 0.00015896174672971625, "tps": 242226, "wall": 5143.3} {"step": 19010, "train_loss": 3.214663028717041, "lr": 0.00015894372419056612, "tps": 241999, "wall": 5148.4} {"step": 19011, "train_loss": 3.2980804443359375, "lr": 0.00015892570234306473, "tps": 241764, "wall": 5153.7} {"step": 19012, "train_loss": 3.2208261489868164, "lr": 0.0001589076811874163, "tps": 241542, "wall": 5158.7} {"step": 19013, "train_loss": 3.160428285598755, "lr": 0.000158889660723825, "tps": 241316, "wall": 5163.8} {"step": 19014, "train_loss": 3.2440454959869385, "lr": 0.0001588716409524949, "tps": 241093, "wall": 5168.8} {"step": 19015, "train_loss": 3.27866530418396, "lr": 0.0001588536218736302, "tps": 240872, "wall": 5173.8} {"step": 19016, "train_loss": 3.2367634773254395, "lr": 0.00015883560348743493, "tps": 240647, "wall": 5178.9} {"step": 19017, "train_loss": 3.2582898139953613, "lr": 0.0001588175857941133, "tps": 240427, "wall": 5184.0} {"step": 19018, "train_loss": 3.1860060691833496, "lr": 0.0001587995687938693, "tps": 240204, "wall": 5189.0} {"step": 19019, "train_loss": 3.2094380855560303, "lr": 0.00015878155248690715, "tps": 239980, "wall": 5194.1} {"step": 19020, "train_loss": 3.2489471435546875, "lr": 0.00015876353687343086, "tps": 239757, "wall": 5199.3} {"step": 19021, "train_loss": 3.268490791320801, "lr": 0.00015874552195364454, "tps": 239529, "wall": 5204.5} {"step": 19022, "train_loss": 3.2997689247131348, "lr": 0.00015872750772775226, "tps": 239303, "wall": 5209.7} {"step": 19023, "train_loss": 3.140005588531494, "lr": 0.0001587094941959581, "tps": 239081, "wall": 5214.8} {"step": 19024, "train_loss": 3.29316782951355, "lr": 0.0001586914813584661, "tps": 238855, "wall": 5220.0} {"step": 19025, "train_loss": 3.086707830429077, "lr": 0.00015867346921548032, "tps": 238632, "wall": 5225.1} {"step": 19026, "train_loss": 3.2347207069396973, "lr": 0.00015865545776720484, "tps": 238411, "wall": 5230.3} {"step": 19027, "train_loss": 3.2132444381713867, "lr": 0.0001586374470138436, "tps": 238188, "wall": 5235.4} {"step": 19028, "train_loss": 3.2230005264282227, "lr": 0.00015861943695560067, "tps": 237969, "wall": 5240.5} {"step": 19029, "train_loss": 3.2486510276794434, "lr": 0.00015860142759268006, "tps": 237747, "wall": 5245.7} {"step": 19030, "train_loss": 3.32328462600708, "lr": 0.0001585834189252859, "tps": 237526, "wall": 5250.8} {"step": 19031, "train_loss": 3.2000956535339355, "lr": 0.00015856541095362201, "tps": 237307, "wall": 5256.0} {"step": 19032, "train_loss": 3.2259650230407715, "lr": 0.00015854740367789245, "tps": 237091, "wall": 5261.0} {"step": 19033, "train_loss": 3.3087096214294434, "lr": 0.00015852939709830132, "tps": 236866, "wall": 5266.3} {"step": 19034, "train_loss": 3.1638236045837402, "lr": 0.00015851139121505242, "tps": 236643, "wall": 5271.6} {"step": 19035, "train_loss": 3.256898880004883, "lr": 0.00015849338602834983, "tps": 236421, "wall": 5276.8} {"step": 19036, "train_loss": 3.273411273956299, "lr": 0.00015847538153839752, "tps": 236199, "wall": 5282.0} {"step": 19037, "train_loss": 3.2435336112976074, "lr": 0.0001584573777453994, "tps": 235975, "wall": 5287.3} {"step": 19038, "train_loss": 3.273984909057617, "lr": 0.00015843937464955941, "tps": 235755, "wall": 5292.5} {"step": 19039, "train_loss": 3.1898295879364014, "lr": 0.00015842137225108153, "tps": 235534, "wall": 5297.8} {"step": 19040, "train_loss": 3.155311107635498, "lr": 0.0001584033705501697, "tps": 235314, "wall": 5303.0} {"step": 19041, "train_loss": 3.1933083534240723, "lr": 0.00015838536954702778, "tps": 235096, "wall": 5308.2} {"step": 19042, "train_loss": 3.1175806522369385, "lr": 0.00015836736924185974, "tps": 234877, "wall": 5313.4} {"step": 19043, "train_loss": 3.2419962882995605, "lr": 0.00015834936963486952, "tps": 234655, "wall": 5318.7} {"step": 19044, "train_loss": 3.1434102058410645, "lr": 0.0001583313707262609, "tps": 234437, "wall": 5324.0} {"step": 19045, "train_loss": 3.196408748626709, "lr": 0.00015831337251623787, "tps": 234216, "wall": 5329.2} {"step": 19046, "train_loss": 3.0862808227539062, "lr": 0.0001582953750050043, "tps": 233998, "wall": 5334.5} {"step": 19047, "train_loss": 3.2441585063934326, "lr": 0.0001582773781927641, "tps": 233782, "wall": 5339.7} {"step": 19048, "train_loss": 3.185424327850342, "lr": 0.00015825938207972103, "tps": 233567, "wall": 5344.9} {"step": 19049, "train_loss": 3.1981041431427, "lr": 0.00015824138666607906, "tps": 233351, "wall": 5350.1} {"step": 19050, "train_loss": 3.2190351486206055, "lr": 0.00015822339195204204, "tps": 233134, "wall": 5355.4} {"step": 19051, "train_loss": 3.237471103668213, "lr": 0.00015820539793781372, "tps": 232919, "wall": 5360.6} {"step": 19052, "train_loss": 3.2052364349365234, "lr": 0.000158187404623598, "tps": 232705, "wall": 5365.8} {"step": 19053, "train_loss": 3.2752041816711426, "lr": 0.00015816941200959877, "tps": 232492, "wall": 5371.0} {"step": 19054, "train_loss": 3.3032541275024414, "lr": 0.00015815142009601972, "tps": 232274, "wall": 5376.3} {"step": 19055, "train_loss": 3.184960126876831, "lr": 0.00015813342888306475, "tps": 232062, "wall": 5381.6} {"step": 19056, "train_loss": 3.248709201812744, "lr": 0.0001581154383709376, "tps": 231845, "wall": 5386.9} {"step": 19057, "train_loss": 3.216005802154541, "lr": 0.00015809744855984218, "tps": 231631, "wall": 5392.1} {"step": 19058, "train_loss": 3.2685446739196777, "lr": 0.0001580794594499822, "tps": 231416, "wall": 5397.4} {"step": 19059, "train_loss": 3.2350802421569824, "lr": 0.00015806147104156136, "tps": 231199, "wall": 5402.8} {"step": 19060, "train_loss": 3.193593978881836, "lr": 0.00015804348333478365, "tps": 230987, "wall": 5408.0} {"step": 19061, "train_loss": 3.1297004222869873, "lr": 0.00015802549632985263, "tps": 230774, "wall": 5413.3} {"step": 19062, "train_loss": 3.2121450901031494, "lr": 0.00015800751002697217, "tps": 230562, "wall": 5418.5} {"step": 19063, "train_loss": 3.0948164463043213, "lr": 0.00015798952442634603, "tps": 230352, "wall": 5423.8} {"step": 19064, "train_loss": 3.161168098449707, "lr": 0.00015797153952817788, "tps": 230143, "wall": 5429.0} {"step": 19065, "train_loss": 3.2240004539489746, "lr": 0.00015795355533267146, "tps": 229932, "wall": 5434.2} {"step": 19066, "train_loss": 3.1958987712860107, "lr": 0.0001579355718400305, "tps": 229723, "wall": 5439.5} {"step": 19067, "train_loss": 3.169532537460327, "lr": 0.00015791758905045887, "tps": 229505, "wall": 5444.9} {"step": 19068, "train_loss": 3.2900242805480957, "lr": 0.00015789960696416003, "tps": 229282, "wall": 5450.5} {"step": 19069, "train_loss": 3.204965114593506, "lr": 0.00015788162558133783, "tps": 229074, "wall": 5455.7} {"step": 19070, "train_loss": 3.160449504852295, "lr": 0.00015786364490219597, "tps": 228869, "wall": 5460.9} {"step": 19071, "train_loss": 3.2074618339538574, "lr": 0.00015784566492693807, "tps": 228663, "wall": 5466.1} {"step": 19072, "train_loss": 3.193692207336426, "lr": 0.00015782768565576784, "tps": 228456, "wall": 5471.4} {"step": 19073, "train_loss": 3.172700881958008, "lr": 0.00015780970708888893, "tps": 228254, "wall": 5476.5} {"step": 19074, "train_loss": 3.200061321258545, "lr": 0.00015779172922650506, "tps": 228051, "wall": 5481.6} {"step": 19075, "train_loss": 3.21844482421875, "lr": 0.00015777375206881984, "tps": 227848, "wall": 5486.8} {"step": 19076, "train_loss": 3.177751064300537, "lr": 0.00015775577561603693, "tps": 227646, "wall": 5492.0} {"step": 19077, "train_loss": 3.2590742111206055, "lr": 0.0001577377998683599, "tps": 227443, "wall": 5497.2} {"step": 19078, "train_loss": 3.2376708984375, "lr": 0.0001577198248259925, "tps": 227242, "wall": 5502.3} {"step": 19079, "train_loss": 3.2123847007751465, "lr": 0.0001577018504891383, "tps": 227034, "wall": 5507.7} {"step": 19080, "train_loss": 3.1433701515197754, "lr": 0.0001576838768580009, "tps": 226834, "wall": 5512.8} {"step": 19081, "train_loss": 3.159217357635498, "lr": 0.0001576659039327839, "tps": 226633, "wall": 5518.0} {"step": 19082, "train_loss": 3.077436923980713, "lr": 0.00015764793171369092, "tps": 226433, "wall": 5523.1} {"step": 19083, "train_loss": 3.231559991836548, "lr": 0.00015762996020092556, "tps": 226233, "wall": 5528.3} {"step": 19084, "train_loss": 3.241999626159668, "lr": 0.00015761198939469133, "tps": 226032, "wall": 5533.5} {"step": 19085, "train_loss": 3.1534743309020996, "lr": 0.0001575940192951919, "tps": 225832, "wall": 5538.7} {"step": 19086, "train_loss": 3.2425379753112793, "lr": 0.00015757604990263078, "tps": 225633, "wall": 5543.9} {"step": 19087, "train_loss": 3.2858760356903076, "lr": 0.00015755808121721158, "tps": 225437, "wall": 5549.0} {"step": 19088, "train_loss": 3.1683900356292725, "lr": 0.00015754011323913778, "tps": 225245, "wall": 5554.0} {"step": 19089, "train_loss": 3.2125813961029053, "lr": 0.00015752214596861296, "tps": 225053, "wall": 5559.0} {"step": 19090, "train_loss": 3.3217291831970215, "lr": 0.00015750417940584068, "tps": 224862, "wall": 5564.1} {"step": 19091, "train_loss": 3.200684070587158, "lr": 0.0001574862135510244, "tps": 224667, "wall": 5569.2} {"step": 19092, "train_loss": 3.2832441329956055, "lr": 0.00015746824840436765, "tps": 224477, "wall": 5574.2} {"step": 19093, "train_loss": 3.207334041595459, "lr": 0.000157450283966074, "tps": 224284, "wall": 5579.3} {"step": 19094, "train_loss": 3.249661445617676, "lr": 0.00015743232023634693, "tps": 224095, "wall": 5584.3} {"step": 19095, "train_loss": 3.242112159729004, "lr": 0.00015741435721538993, "tps": 223906, "wall": 5589.3} {"step": 19096, "train_loss": 3.195868968963623, "lr": 0.00015739639490340644, "tps": 223714, "wall": 5594.4} {"step": 19097, "train_loss": 3.199418544769287, "lr": 0.0001573784333006, "tps": 223525, "wall": 5599.4} {"step": 19098, "train_loss": 3.305062770843506, "lr": 0.00015736047240717403, "tps": 223337, "wall": 5604.4} {"step": 19099, "train_loss": 3.2055411338806152, "lr": 0.00015734251222333204, "tps": 223149, "wall": 5609.4} {"step": 19100, "train_loss": 3.2498059272766113, "lr": 0.00015732455274927745, "tps": 222960, "wall": 5614.5} {"step": 19101, "train_loss": 3.2080605030059814, "lr": 0.00015730659398521373, "tps": 222771, "wall": 5619.5} {"step": 19102, "train_loss": 3.021635055541992, "lr": 0.00015728863593134432, "tps": 222584, "wall": 5624.5} {"step": 19103, "train_loss": 3.174800395965576, "lr": 0.0001572706785878726, "tps": 222393, "wall": 5629.7} {"step": 19104, "train_loss": 3.1835989952087402, "lr": 0.00015725272195500205, "tps": 222208, "wall": 5634.6} {"step": 19105, "train_loss": 3.221675395965576, "lr": 0.00015723476603293608, "tps": 222022, "wall": 5639.7} {"step": 19106, "train_loss": 3.153398275375366, "lr": 0.000157216810821878, "tps": 221836, "wall": 5644.7} {"step": 19107, "train_loss": 3.175851583480835, "lr": 0.00015719885632203132, "tps": 221649, "wall": 5649.7} {"step": 19108, "train_loss": 3.098214626312256, "lr": 0.00015718090253359943, "tps": 221464, "wall": 5654.8} {"step": 19109, "train_loss": 3.1144702434539795, "lr": 0.00015716294945678562, "tps": 221276, "wall": 5659.8} {"step": 19110, "train_loss": 3.1935524940490723, "lr": 0.00015714499709179337, "tps": 221090, "wall": 5664.9} {"step": 19111, "train_loss": 3.2138023376464844, "lr": 0.00015712704543882598, "tps": 220906, "wall": 5669.9} {"step": 19112, "train_loss": 3.1581549644470215, "lr": 0.00015710909449808677, "tps": 220722, "wall": 5674.9} {"step": 19113, "train_loss": 3.14493465423584, "lr": 0.00015709114426977916, "tps": 220539, "wall": 5680.0} {"step": 19114, "train_loss": 3.1628079414367676, "lr": 0.00015707319475410656, "tps": 220355, "wall": 5685.0} {"step": 19115, "train_loss": 3.2684781551361084, "lr": 0.0001570552459512721, "tps": 220169, "wall": 5690.1} {"step": 19116, "train_loss": 3.310657501220703, "lr": 0.00015703729786147928, "tps": 219987, "wall": 5695.1} {"step": 19117, "train_loss": 3.261248826980591, "lr": 0.00015701935048493138, "tps": 219795, "wall": 5700.4} {"step": 19118, "train_loss": 3.1875486373901367, "lr": 0.00015700140382183162, "tps": 219607, "wall": 5705.6} {"step": 19119, "train_loss": 3.143819808959961, "lr": 0.00015698345787238334, "tps": 219415, "wall": 5710.8} {"step": 19120, "train_loss": 3.153550863265991, "lr": 0.00015696551263678988, "tps": 219232, "wall": 5715.9} {"step": 19121, "train_loss": 3.270310401916504, "lr": 0.00015694756811525457, "tps": 219049, "wall": 5721.0} {"step": 19122, "train_loss": 3.2405643463134766, "lr": 0.00015692962430798063, "tps": 218866, "wall": 5726.1} {"step": 19123, "train_loss": 3.302093505859375, "lr": 0.0001569116812151712, "tps": 218686, "wall": 5731.1} {"step": 19124, "train_loss": 3.2422714233398438, "lr": 0.00015689373883702977, "tps": 218504, "wall": 5736.1} {"step": 19125, "train_loss": 3.309636116027832, "lr": 0.0001568757971737594, "tps": 218320, "wall": 5741.3} {"step": 19126, "train_loss": 3.290555000305176, "lr": 0.00015685785622556345, "tps": 218134, "wall": 5746.5} {"step": 19127, "train_loss": 3.2631521224975586, "lr": 0.0001568399159926451, "tps": 217952, "wall": 5751.6} {"step": 19128, "train_loss": 3.2268941402435303, "lr": 0.00015682197647520768, "tps": 217771, "wall": 5756.7} {"step": 19129, "train_loss": 3.1496798992156982, "lr": 0.00015680403767345425, "tps": 217588, "wall": 5761.8} {"step": 19130, "train_loss": 3.187504768371582, "lr": 0.0001567860995875881, "tps": 217411, "wall": 5766.8} {"step": 19131, "train_loss": 3.151993751525879, "lr": 0.0001567681622178125, "tps": 217233, "wall": 5771.8} {"step": 19132, "train_loss": 3.3803558349609375, "lr": 0.00015675022556433058, "tps": 217056, "wall": 5776.8} {"step": 19133, "train_loss": 3.2233591079711914, "lr": 0.00015673228962734544, "tps": 216879, "wall": 5781.9} {"step": 19134, "train_loss": 3.2227067947387695, "lr": 0.00015671435440706038, "tps": 216702, "wall": 5786.9} {"step": 19135, "train_loss": 3.3492255210876465, "lr": 0.00015669641990367854, "tps": 216524, "wall": 5791.9} {"step": 19136, "train_loss": 3.213557243347168, "lr": 0.0001566784861174031, "tps": 216347, "wall": 5797.0} {"step": 19137, "train_loss": 3.2351162433624268, "lr": 0.00015666055304843716, "tps": 216171, "wall": 5802.0} {"step": 19138, "train_loss": 3.2214322090148926, "lr": 0.00015664262069698393, "tps": 215992, "wall": 5807.1} {"step": 19139, "train_loss": 3.1211400032043457, "lr": 0.00015662468906324652, "tps": 215818, "wall": 5812.1} {"step": 19140, "train_loss": 3.199348211288452, "lr": 0.00015660675814742805, "tps": 215643, "wall": 5817.1} {"step": 19141, "train_loss": 3.187283515930176, "lr": 0.00015658882794973165, "tps": 215468, "wall": 5822.2} {"step": 19142, "train_loss": 3.2330236434936523, "lr": 0.00015657089847036045, "tps": 215293, "wall": 5827.2} {"step": 19143, "train_loss": 3.120915651321411, "lr": 0.00015655296970951756, "tps": 215119, "wall": 5832.2} {"step": 19144, "train_loss": 3.212920665740967, "lr": 0.00015653504166740598, "tps": 214945, "wall": 5837.2} {"step": 19145, "train_loss": 3.2963974475860596, "lr": 0.00015651711434422894, "tps": 214771, "wall": 5842.3} {"step": 19146, "train_loss": 3.2063775062561035, "lr": 0.0001564991877401895, "tps": 214597, "wall": 5847.3} {"step": 19147, "train_loss": 3.2115983963012695, "lr": 0.00015648126185549064, "tps": 214424, "wall": 5852.3} {"step": 19148, "train_loss": 3.210827589035034, "lr": 0.0001564633366903355, "tps": 214251, "wall": 5857.4} {"step": 19149, "train_loss": 3.306234836578369, "lr": 0.00015644541224492712, "tps": 214079, "wall": 5862.4} {"step": 19150, "train_loss": 3.164044141769409, "lr": 0.00015642748851946853, "tps": 213904, "wall": 5867.5} {"step": 19151, "train_loss": 3.2034859657287598, "lr": 0.00015640956551416283, "tps": 213732, "wall": 5872.5} {"step": 19152, "train_loss": 3.218623161315918, "lr": 0.00015639164322921295, "tps": 213560, "wall": 5877.5} {"step": 19153, "train_loss": 3.2452406883239746, "lr": 0.00015637372166482205, "tps": 213389, "wall": 5882.6} {"step": 19154, "train_loss": 3.241443157196045, "lr": 0.000156355800821193, "tps": 213218, "wall": 5887.6} {"step": 19155, "train_loss": 3.224553108215332, "lr": 0.0001563378806985289, "tps": 213047, "wall": 5892.6} {"step": 19156, "train_loss": 3.2279748916625977, "lr": 0.00015631996129703278, "tps": 212876, "wall": 5897.6} {"step": 19157, "train_loss": 3.2684192657470703, "lr": 0.00015630204261690754, "tps": 212706, "wall": 5902.7} {"step": 19158, "train_loss": 3.1986212730407715, "lr": 0.00015628412465835623, "tps": 212536, "wall": 5907.7} {"step": 19159, "train_loss": 3.1159677505493164, "lr": 0.0001562662074215818, "tps": 212366, "wall": 5912.8} {"step": 19160, "train_loss": 3.259958267211914, "lr": 0.00015624829090678718, "tps": 212196, "wall": 5917.8} {"step": 19161, "train_loss": 3.168100118637085, "lr": 0.0001562303751141754, "tps": 212027, "wall": 5922.8} {"step": 19162, "train_loss": 3.3011107444763184, "lr": 0.00015621246004394942, "tps": 211855, "wall": 5927.9} {"step": 19163, "train_loss": 3.205981731414795, "lr": 0.0001561945456963121, "tps": 211686, "wall": 5933.0} {"step": 19164, "train_loss": 3.226304292678833, "lr": 0.00015617663207146643, "tps": 211519, "wall": 5938.0} {"step": 19165, "train_loss": 3.210675001144409, "lr": 0.00015615871916961532, "tps": 211351, "wall": 5943.0} {"step": 19166, "train_loss": 3.1269423961639404, "lr": 0.0001561408069909617, "tps": 211183, "wall": 5948.0} {"step": 19167, "train_loss": 3.176568031311035, "lr": 0.0001561228955357085, "tps": 211016, "wall": 5953.1} {"step": 19168, "train_loss": 3.1292526721954346, "lr": 0.00015610498480405851, "tps": 210848, "wall": 5958.1} {"step": 19169, "train_loss": 3.1987099647521973, "lr": 0.00015608707479621473, "tps": 210682, "wall": 5963.1} {"step": 19170, "train_loss": 3.1011898517608643, "lr": 0.0001560691655123801, "tps": 210515, "wall": 5968.2} {"step": 19171, "train_loss": 3.2382824420928955, "lr": 0.00015605125695275737, "tps": 210348, "wall": 5973.2} {"step": 19172, "train_loss": 3.152097702026367, "lr": 0.00015603334911754946, "tps": 210183, "wall": 5978.2} {"step": 19173, "train_loss": 3.258760452270508, "lr": 0.00015601544200695923, "tps": 210016, "wall": 5983.3} {"step": 19174, "train_loss": 3.267796039581299, "lr": 0.00015599753562118952, "tps": 209848, "wall": 5988.4} {"step": 19175, "train_loss": 3.168231964111328, "lr": 0.00015597962996044323, "tps": 209683, "wall": 5993.4} {"step": 19176, "train_loss": 3.1989665031433105, "lr": 0.00015596172502492313, "tps": 209518, "wall": 5998.4} {"step": 19177, "train_loss": 3.189882516860962, "lr": 0.00015594382081483209, "tps": 209354, "wall": 6003.5} {"step": 19178, "train_loss": 3.2100648880004883, "lr": 0.00015592591733037289, "tps": 209188, "wall": 6008.5} {"step": 19179, "train_loss": 3.158540725708008, "lr": 0.00015590801457174836, "tps": 209024, "wall": 6013.6} {"step": 19180, "train_loss": 3.1158154010772705, "lr": 0.00015589011253916137, "tps": 208860, "wall": 6018.6} {"step": 19181, "train_loss": 3.2300570011138916, "lr": 0.0001558722112328146, "tps": 208696, "wall": 6023.6} {"step": 19182, "train_loss": 3.142167091369629, "lr": 0.0001558543106529109, "tps": 208533, "wall": 6028.7} {"step": 19183, "train_loss": 3.211838483810425, "lr": 0.00015583641079965305, "tps": 208368, "wall": 6033.7} {"step": 19184, "train_loss": 3.11098051071167, "lr": 0.0001558185116732438, "tps": 208204, "wall": 6038.8} {"step": 19185, "train_loss": 3.131094455718994, "lr": 0.00015580061327388588, "tps": 208039, "wall": 6043.9} {"step": 19186, "train_loss": 3.2850754261016846, "lr": 0.00015578271560178216, "tps": 207871, "wall": 6049.1} {"step": 19187, "train_loss": 3.1907193660736084, "lr": 0.0001557648186571353, "tps": 207707, "wall": 6054.2} {"step": 19188, "train_loss": 3.092535972595215, "lr": 0.00015574692244014798, "tps": 207546, "wall": 6059.2} {"step": 19189, "train_loss": 3.334477424621582, "lr": 0.00015572902695102308, "tps": 207382, "wall": 6064.3} {"step": 19190, "train_loss": 3.2749760150909424, "lr": 0.00015571113218996319, "tps": 207211, "wall": 6069.6} {"step": 19191, "train_loss": 3.1812336444854736, "lr": 0.00015569323815717108, "tps": 207041, "wall": 6074.9} {"step": 19192, "train_loss": 3.150078773498535, "lr": 0.00015567534485284946, "tps": 206877, "wall": 6080.1} {"step": 19193, "train_loss": 3.184670925140381, "lr": 0.00015565745227720106, "tps": 206714, "wall": 6085.2} {"step": 19194, "train_loss": 3.2270541191101074, "lr": 0.00015563956043042842, "tps": 206548, "wall": 6090.4} {"step": 19195, "train_loss": 3.218618869781494, "lr": 0.0001556216693127344, "tps": 206384, "wall": 6095.6} {"step": 19196, "train_loss": 3.247243881225586, "lr": 0.0001556037789243215, "tps": 206217, "wall": 6100.8} {"step": 19197, "train_loss": 3.2843940258026123, "lr": 0.00015558588926539263, "tps": 206047, "wall": 6106.2} {"step": 19198, "train_loss": 3.167386293411255, "lr": 0.00015556800033615016, "tps": 205884, "wall": 6111.3} {"step": 19199, "train_loss": 3.332395553588867, "lr": 0.0001555501121367969, "tps": 205720, "wall": 6116.5} {"step": 19200, "train_loss": 3.28155255317688, "lr": 0.00015553222466753547, "tps": 205555, "wall": 6121.7} {"step": 19201, "train_loss": 3.3090476989746094, "lr": 0.0001555143379285685, "tps": 205390, "wall": 6127.0} {"step": 19202, "train_loss": 3.192434310913086, "lr": 0.00015549645192009854, "tps": 205225, "wall": 6132.2} {"step": 19203, "train_loss": 3.248654842376709, "lr": 0.00015547856664232837, "tps": 205060, "wall": 6137.5} {"step": 19204, "train_loss": 3.27083158493042, "lr": 0.00015546068209546041, "tps": 204894, "wall": 6142.8} {"step": 19205, "train_loss": 3.271329879760742, "lr": 0.00015544279827969733, "tps": 204729, "wall": 6148.0} {"step": 19206, "train_loss": 3.229477643966675, "lr": 0.0001554249151952417, "tps": 204556, "wall": 6153.5} {"step": 19207, "train_loss": 3.186143636703491, "lr": 0.0001554070328422962, "tps": 204389, "wall": 6158.9} {"step": 19208, "train_loss": 3.2601757049560547, "lr": 0.00015538915122106329, "tps": 204221, "wall": 6164.3} {"step": 19209, "train_loss": 3.1840672492980957, "lr": 0.00015537127033174556, "tps": 204055, "wall": 6169.6} {"step": 19210, "train_loss": 3.140514373779297, "lr": 0.0001553533901745456, "tps": 203890, "wall": 6174.9} {"step": 19211, "train_loss": 3.196136474609375, "lr": 0.0001553355107496659, "tps": 203728, "wall": 6180.2} {"step": 19212, "train_loss": 3.1889309883117676, "lr": 0.00015531763205730906, "tps": 203563, "wall": 6185.5} {"step": 19213, "train_loss": 3.236732244491577, "lr": 0.00015529975409767758, "tps": 203400, "wall": 6190.8} {"step": 19214, "train_loss": 3.2585461139678955, "lr": 0.00015528187687097403, "tps": 203238, "wall": 6196.1} {"step": 19215, "train_loss": 3.212705135345459, "lr": 0.00015526400037740076, "tps": 203075, "wall": 6201.3} {"step": 19216, "train_loss": 3.2042055130004883, "lr": 0.0001552461246171605, "tps": 202912, "wall": 6206.6} {"step": 19217, "train_loss": 3.2463111877441406, "lr": 0.0001552282495904556, "tps": 202751, "wall": 6211.9} {"step": 19218, "train_loss": 3.258850574493408, "lr": 0.0001552103752974886, "tps": 202590, "wall": 6217.2} {"step": 19219, "train_loss": 3.1557979583740234, "lr": 0.000155192501738462, "tps": 202429, "wall": 6222.4} {"step": 19220, "train_loss": 3.1839842796325684, "lr": 0.0001551746289135782, "tps": 202265, "wall": 6227.8} {"step": 19221, "train_loss": 3.222482919692993, "lr": 0.00015515675682303975, "tps": 202105, "wall": 6233.0} {"step": 19222, "train_loss": 3.196194648742676, "lr": 0.00015513888546704903, "tps": 201946, "wall": 6238.3} {"step": 19223, "train_loss": 3.259625196456909, "lr": 0.0001551210148458085, "tps": 201786, "wall": 6243.5} {"step": 19224, "train_loss": 3.24033260345459, "lr": 0.00015510314495952073, "tps": 201628, "wall": 6248.8} {"step": 19225, "train_loss": 3.253288745880127, "lr": 0.00015508527580838797, "tps": 201467, "wall": 6254.1} {"step": 19226, "train_loss": 3.216348171234131, "lr": 0.00015506740739261275, "tps": 201307, "wall": 6259.4} {"step": 19227, "train_loss": 3.2252707481384277, "lr": 0.00015504953971239745, "tps": 201147, "wall": 6264.7} {"step": 19228, "train_loss": 3.427628993988037, "lr": 0.00015503167276794444, "tps": 200989, "wall": 6269.9} {"step": 19229, "train_loss": 3.159284830093384, "lr": 0.00015501380655945615, "tps": 200831, "wall": 6275.2} {"step": 19230, "train_loss": 3.2309389114379883, "lr": 0.00015499594108713503, "tps": 200675, "wall": 6280.4} {"step": 19231, "train_loss": 3.1535651683807373, "lr": 0.00015497807635118336, "tps": 200514, "wall": 6285.8} {"step": 19232, "train_loss": 3.2035956382751465, "lr": 0.00015496021235180362, "tps": 200361, "wall": 6290.9} {"step": 19233, "train_loss": 3.094303607940674, "lr": 0.00015494234908919801, "tps": 200206, "wall": 6296.1} {"step": 19234, "train_loss": 3.1886794567108154, "lr": 0.0001549244865635691, "tps": 200052, "wall": 6301.3} {"step": 19235, "train_loss": 3.2185914516448975, "lr": 0.00015490662477511905, "tps": 199898, "wall": 6306.4} {"step": 19236, "train_loss": 3.232215404510498, "lr": 0.00015488876372405028, "tps": 199744, "wall": 6311.7} {"step": 19237, "train_loss": 3.2582755088806152, "lr": 0.00015487090341056517, "tps": 199589, "wall": 6316.9} {"step": 19238, "train_loss": 3.2777833938598633, "lr": 0.00015485304383486596, "tps": 199437, "wall": 6322.0} {"step": 19239, "train_loss": 3.127882957458496, "lr": 0.000154835184997155, "tps": 199284, "wall": 6327.2} {"step": 19240, "train_loss": 3.205540657043457, "lr": 0.0001548173268976346, "tps": 199132, "wall": 6332.3} {"step": 19241, "train_loss": 3.198707342147827, "lr": 0.000154799469536507, "tps": 198980, "wall": 6337.5} {"step": 19242, "train_loss": 3.236715316772461, "lr": 0.00015478161291397453, "tps": 198828, "wall": 6342.7} {"step": 19243, "train_loss": 3.2219316959381104, "lr": 0.0001547637570302395, "tps": 198674, "wall": 6348.0} {"step": 19244, "train_loss": 3.2501273155212402, "lr": 0.0001547459018855042, "tps": 198523, "wall": 6353.1} {"step": 19245, "train_loss": 3.1948118209838867, "lr": 0.00015472804747997083, "tps": 198372, "wall": 6358.3} {"step": 19246, "train_loss": 3.3368566036224365, "lr": 0.00015471019381384165, "tps": 198220, "wall": 6363.5} {"step": 19247, "train_loss": 3.3450310230255127, "lr": 0.00015469234088731897, "tps": 198069, "wall": 6368.7} {"step": 19248, "train_loss": 3.3204073905944824, "lr": 0.00015467448870060496, "tps": 197919, "wall": 6373.8} {"step": 19249, "train_loss": 3.2621374130249023, "lr": 0.00015465663725390186, "tps": 197769, "wall": 6379.0} {"step": 19250, "train_loss": 3.178145170211792, "lr": 0.00015463878654741194, "tps": 197616, "wall": 6384.2} {"step": 19251, "train_loss": 3.285971164703369, "lr": 0.00015462093658133737, "tps": 197463, "wall": 6389.5} {"step": 19252, "train_loss": 3.2714600563049316, "lr": 0.00015460308735588033, "tps": 197311, "wall": 6394.8} {"step": 19253, "train_loss": 3.2392349243164062, "lr": 0.00015458523887124307, "tps": 197161, "wall": 6400.0} {"step": 19254, "train_loss": 3.1856493949890137, "lr": 0.0001545673911276278, "tps": 197010, "wall": 6405.2} {"step": 19255, "train_loss": 3.2085373401641846, "lr": 0.00015454954412523665, "tps": 196857, "wall": 6410.5} {"step": 19256, "train_loss": 3.160560131072998, "lr": 0.00015453169786427178, "tps": 196706, "wall": 6415.8} {"step": 19257, "train_loss": 3.201167583465576, "lr": 0.00015451385234493544, "tps": 196554, "wall": 6421.1} {"step": 19258, "train_loss": 3.1419289112091064, "lr": 0.00015449600756742963, "tps": 196404, "wall": 6426.3} {"step": 19259, "train_loss": 3.3088619709014893, "lr": 0.00015447816353195663, "tps": 196255, "wall": 6431.5} {"step": 19260, "train_loss": 3.2158613204956055, "lr": 0.00015446032023871853, "tps": 196106, "wall": 6436.7} {"step": 19261, "train_loss": 3.2324328422546387, "lr": 0.0001544424776879175, "tps": 195954, "wall": 6442.1} {"step": 19262, "train_loss": 3.245863199234009, "lr": 0.00015442463587975565, "tps": 195806, "wall": 6447.3} {"step": 19263, "train_loss": 3.147852659225464, "lr": 0.000154406794814435, "tps": 195658, "wall": 6452.5} {"step": 19264, "train_loss": 3.186396598815918, "lr": 0.00015438895449215777, "tps": 195508, "wall": 6457.8} {"step": 19265, "train_loss": 3.079713821411133, "lr": 0.00015437111491312604, "tps": 195359, "wall": 6463.0} {"step": 19266, "train_loss": 3.210721492767334, "lr": 0.00015435327607754177, "tps": 195207, "wall": 6468.4} {"step": 19267, "train_loss": 3.2024340629577637, "lr": 0.00015433543798560727, "tps": 195055, "wall": 6473.8} {"step": 19268, "train_loss": 3.078171730041504, "lr": 0.0001543176006375244, "tps": 194905, "wall": 6479.1} {"step": 19269, "train_loss": 3.1214792728424072, "lr": 0.00015429976403349532, "tps": 194755, "wall": 6484.4} {"step": 19270, "train_loss": 3.2914743423461914, "lr": 0.00015428192817372205, "tps": 194608, "wall": 6489.7} {"step": 19271, "train_loss": 3.149285316467285, "lr": 0.00015426409305840667, "tps": 194461, "wall": 6494.9} {"step": 19272, "train_loss": 3.213798761367798, "lr": 0.0001542462586877512, "tps": 194316, "wall": 6500.1} {"step": 19273, "train_loss": 3.2492589950561523, "lr": 0.00015422842506195768, "tps": 194170, "wall": 6505.3} {"step": 19274, "train_loss": 3.252044200897217, "lr": 0.0001542105921812281, "tps": 194021, "wall": 6510.7} {"step": 19275, "train_loss": 3.248948335647583, "lr": 0.00015419276004576452, "tps": 193875, "wall": 6515.9} {"step": 19276, "train_loss": 3.271406412124634, "lr": 0.00015417492865576885, "tps": 193729, "wall": 6521.2} {"step": 19277, "train_loss": 3.2314953804016113, "lr": 0.0001541570980114432, "tps": 193581, "wall": 6526.5} {"step": 19278, "train_loss": 3.278520107269287, "lr": 0.00015413926811298954, "tps": 193434, "wall": 6531.8} {"step": 19279, "train_loss": 3.169469118118286, "lr": 0.00015412143896060973, "tps": 193288, "wall": 6537.0} {"step": 19280, "train_loss": 3.3137834072113037, "lr": 0.00015410361055450585, "tps": 193144, "wall": 6542.2} {"step": 19281, "train_loss": 3.1499085426330566, "lr": 0.0001540857828948799, "tps": 193000, "wall": 6547.5} {"step": 19282, "train_loss": 3.1754708290100098, "lr": 0.0001540679559819337, "tps": 192856, "wall": 6552.7} {"step": 19283, "train_loss": 3.1644108295440674, "lr": 0.0001540501298158693, "tps": 192713, "wall": 6557.9} {"step": 19284, "train_loss": 3.238986015319824, "lr": 0.00015403230439688857, "tps": 192566, "wall": 6563.2} {"step": 19285, "train_loss": 3.152111053466797, "lr": 0.00015401447972519344, "tps": 192423, "wall": 6568.5} {"step": 19286, "train_loss": 3.247568130493164, "lr": 0.0001539966558009859, "tps": 192280, "wall": 6573.7} {"step": 19287, "train_loss": 3.195505142211914, "lr": 0.0001539788326244678, "tps": 192137, "wall": 6578.9} {"step": 19288, "train_loss": 3.185011863708496, "lr": 0.0001539610101958411, "tps": 191994, "wall": 6584.2} {"step": 19289, "train_loss": 3.242246627807617, "lr": 0.00015394318851530758, "tps": 191848, "wall": 6589.5} {"step": 19290, "train_loss": 3.246488571166992, "lr": 0.0001539253675830692, "tps": 191705, "wall": 6594.8} {"step": 19291, "train_loss": 3.1783528327941895, "lr": 0.00015390754739932785, "tps": 191559, "wall": 6600.1} {"step": 19292, "train_loss": 3.1559853553771973, "lr": 0.00015388972796428539, "tps": 191415, "wall": 6605.5} {"step": 19293, "train_loss": 3.2363128662109375, "lr": 0.00015387190927814364, "tps": 191272, "wall": 6610.7} {"step": 19294, "train_loss": 3.2132716178894043, "lr": 0.0001538540913411045, "tps": 191127, "wall": 6616.1} {"step": 19295, "train_loss": 3.1772964000701904, "lr": 0.0001538362741533698, "tps": 190986, "wall": 6621.3} {"step": 19296, "train_loss": 3.2017340660095215, "lr": 0.00015381845771514133, "tps": 190839, "wall": 6626.8} {"step": 19297, "train_loss": 3.2134170532226562, "lr": 0.00015380064202662097, "tps": 190699, "wall": 6632.0} {"step": 19298, "train_loss": 3.196398973464966, "lr": 0.00015378282708801053, "tps": 190555, "wall": 6637.3} {"step": 19299, "train_loss": 3.1519603729248047, "lr": 0.0001537650128995118, "tps": 190404, "wall": 6642.9} {"step": 19300, "train_loss": 3.2099151611328125, "lr": 0.00015374719946132656, "tps": 190254, "wall": 6648.5} {"step": 19301, "train_loss": 3.2752838134765625, "lr": 0.0001537293867736567, "tps": 190108, "wall": 6654.0} {"step": 19302, "train_loss": 3.0706677436828613, "lr": 0.0001537115748367039, "tps": 189960, "wall": 6659.5} {"step": 19303, "train_loss": 3.2064321041107178, "lr": 0.00015369376365066998, "tps": 189811, "wall": 6665.1} {"step": 19304, "train_loss": 3.310788631439209, "lr": 0.00015367595321575666, "tps": 189662, "wall": 6670.7} {"step": 19305, "train_loss": 3.1906418800354004, "lr": 0.0001536581435321657, "tps": 189515, "wall": 6676.2} {"step": 19306, "train_loss": 3.1503939628601074, "lr": 0.00015364033460009896, "tps": 189369, "wall": 6681.7} {"step": 19307, "train_loss": 3.276102304458618, "lr": 0.00015362252641975803, "tps": 189222, "wall": 6687.2} {"step": 19308, "train_loss": 3.2198562622070312, "lr": 0.0001536047189913447, "tps": 189075, "wall": 6692.7} {"step": 19309, "train_loss": 3.1955971717834473, "lr": 0.00015358691231506078, "tps": 188934, "wall": 6698.1} {"step": 19310, "train_loss": 3.2090322971343994, "lr": 0.00015356910639110786, "tps": 188794, "wall": 6703.4} {"step": 19311, "train_loss": 3.1334667205810547, "lr": 0.00015355130121968774, "tps": 188651, "wall": 6708.8} {"step": 19312, "train_loss": 3.2499918937683105, "lr": 0.000153533496801002, "tps": 188512, "wall": 6714.1} {"step": 19313, "train_loss": 3.169128179550171, "lr": 0.00015351569313525246, "tps": 188373, "wall": 6719.4} {"step": 19314, "train_loss": 3.2267723083496094, "lr": 0.00015349789022264072, "tps": 188234, "wall": 6724.8} {"step": 19315, "train_loss": 3.302513837814331, "lr": 0.00015348008806336847, "tps": 188095, "wall": 6730.0} {"step": 19316, "train_loss": 3.170356273651123, "lr": 0.00015346228665763745, "tps": 187957, "wall": 6735.3} {"step": 19317, "train_loss": 3.2974419593811035, "lr": 0.0001534444860056492, "tps": 187819, "wall": 6740.6} {"step": 19318, "train_loss": 3.2673532962799072, "lr": 0.00015342668610760537, "tps": 187681, "wall": 6745.9} {"step": 19319, "train_loss": 3.147429943084717, "lr": 0.00015340888696370773, "tps": 187542, "wall": 6751.3} {"step": 19320, "train_loss": 3.327136993408203, "lr": 0.00015339108857415776, "tps": 187403, "wall": 6756.6} {"step": 19321, "train_loss": 3.2365453243255615, "lr": 0.00015337329093915712, "tps": 187266, "wall": 6762.0} {"step": 19322, "train_loss": 3.2730813026428223, "lr": 0.00015335549405890748, "tps": 187125, "wall": 6767.4} {"step": 19323, "train_loss": 3.2767651081085205, "lr": 0.00015333769793361043, "tps": 186989, "wall": 6772.7} {"step": 19324, "train_loss": 3.1812381744384766, "lr": 0.0001533199025634675, "tps": 186855, "wall": 6777.9} {"step": 19325, "train_loss": 3.2382495403289795, "lr": 0.00015330210794868037, "tps": 186720, "wall": 6783.1} {"step": 19326, "train_loss": 3.290205955505371, "lr": 0.00015328431408945053, "tps": 186585, "wall": 6788.4} {"step": 19327, "train_loss": 3.1863365173339844, "lr": 0.0001532665209859796, "tps": 186452, "wall": 6793.6} {"step": 19328, "train_loss": 3.1962509155273438, "lr": 0.00015324872863846912, "tps": 186321, "wall": 6798.7} {"step": 19329, "train_loss": 3.3592424392700195, "lr": 0.00015323093704712064, "tps": 186189, "wall": 6803.9} {"step": 19330, "train_loss": 3.1823229789733887, "lr": 0.0001532131462121358, "tps": 186060, "wall": 6809.0} {"step": 19331, "train_loss": 3.3040223121643066, "lr": 0.00015319535613371595, "tps": 185930, "wall": 6814.1} {"step": 19332, "train_loss": 3.2710046768188477, "lr": 0.00015317756681206275, "tps": 185801, "wall": 6819.1} {"step": 19333, "train_loss": 3.201185941696167, "lr": 0.00015315977824737774, "tps": 185674, "wall": 6824.2} {"step": 19334, "train_loss": 3.154003143310547, "lr": 0.00015314199043986232, "tps": 185543, "wall": 6829.3} {"step": 19335, "train_loss": 3.143190860748291, "lr": 0.00015312420338971805, "tps": 185415, "wall": 6834.4} {"step": 19336, "train_loss": 3.1749534606933594, "lr": 0.00015310641709714647, "tps": 185286, "wall": 6839.5} {"step": 19337, "train_loss": 3.234919309616089, "lr": 0.00015308863156234898, "tps": 185159, "wall": 6844.6} {"step": 19338, "train_loss": 3.1884822845458984, "lr": 0.00015307084678552708, "tps": 185032, "wall": 6849.6} {"step": 19339, "train_loss": 3.2463479042053223, "lr": 0.00015305306276688224, "tps": 184905, "wall": 6854.7} {"step": 19340, "train_loss": 3.0782856941223145, "lr": 0.00015303527950661603, "tps": 184777, "wall": 6859.8} {"step": 19341, "train_loss": 3.198199987411499, "lr": 0.0001530174970049297, "tps": 184650, "wall": 6864.8} {"step": 19342, "train_loss": 3.313718795776367, "lr": 0.00015299971526202478, "tps": 184523, "wall": 6869.9} {"step": 19343, "train_loss": 3.3362250328063965, "lr": 0.00015298193427810278, "tps": 184398, "wall": 6875.0} {"step": 19344, "train_loss": 3.1542272567749023, "lr": 0.00015296415405336502, "tps": 184273, "wall": 6880.0} {"step": 19345, "train_loss": 3.1937105655670166, "lr": 0.00015294637458801292, "tps": 184145, "wall": 6885.1} {"step": 19346, "train_loss": 3.2130770683288574, "lr": 0.00015292859588224796, "tps": 184013, "wall": 6890.4} {"step": 19347, "train_loss": 3.2818360328674316, "lr": 0.00015291081793627145, "tps": 183882, "wall": 6895.6} {"step": 19348, "train_loss": 3.1725080013275146, "lr": 0.00015289304075028482, "tps": 183753, "wall": 6900.9} {"step": 19349, "train_loss": 3.2821013927459717, "lr": 0.0001528752643244895, "tps": 183623, "wall": 6906.1} {"step": 19350, "train_loss": 3.153083086013794, "lr": 0.00015285748865908683, "tps": 183492, "wall": 6911.4} {"step": 19351, "train_loss": 3.2971301078796387, "lr": 0.00015283971375427808, "tps": 183361, "wall": 6916.7} {"step": 19352, "train_loss": 3.2606265544891357, "lr": 0.00015282193961026476, "tps": 183230, "wall": 6922.0} {"step": 19353, "train_loss": 3.095656156539917, "lr": 0.00015280416622724815, "tps": 183100, "wall": 6927.3} {"step": 19354, "train_loss": 3.325695037841797, "lr": 0.0001527863936054295, "tps": 182970, "wall": 6932.5} {"step": 19355, "train_loss": 3.2391440868377686, "lr": 0.00015276862174501025, "tps": 182840, "wall": 6937.8} {"step": 19356, "train_loss": 3.1555423736572266, "lr": 0.0001527508506461917, "tps": 182710, "wall": 6943.1} {"step": 19357, "train_loss": 3.172238826751709, "lr": 0.0001527330803091752, "tps": 182579, "wall": 6948.5} {"step": 19358, "train_loss": 3.1555166244506836, "lr": 0.00015271531073416194, "tps": 182448, "wall": 6953.8} {"step": 19359, "train_loss": 3.2114782333374023, "lr": 0.0001526975419213533, "tps": 182320, "wall": 6959.1} {"step": 19360, "train_loss": 3.282046318054199, "lr": 0.00015267977387095058, "tps": 182191, "wall": 6964.3} {"step": 19361, "train_loss": 3.2319135665893555, "lr": 0.000152662006583155, "tps": 182064, "wall": 6969.6} {"step": 19362, "train_loss": 3.1932120323181152, "lr": 0.00015264424005816785, "tps": 181936, "wall": 6974.8} {"step": 19363, "train_loss": 3.2383933067321777, "lr": 0.0001526264742961904, "tps": 181809, "wall": 6980.0} {"step": 19364, "train_loss": 3.163043737411499, "lr": 0.00015260870929742387, "tps": 181682, "wall": 6985.3} {"step": 19365, "train_loss": 3.19980788230896, "lr": 0.0001525909450620695, "tps": 181546, "wall": 6990.9} {"step": 19366, "train_loss": 3.238389492034912, "lr": 0.00015257318159032858, "tps": 181419, "wall": 6996.1} {"step": 19367, "train_loss": 3.1892762184143066, "lr": 0.00015255541888240233, "tps": 181291, "wall": 7001.4} {"step": 19368, "train_loss": 3.275131940841675, "lr": 0.00015253765693849195, "tps": 181162, "wall": 7006.8} {"step": 19369, "train_loss": 3.26267147064209, "lr": 0.0001525198957587986, "tps": 181036, "wall": 7012.0} {"step": 19370, "train_loss": 3.1319339275360107, "lr": 0.00015250213534352355, "tps": 180911, "wall": 7017.2} {"step": 19371, "train_loss": 3.1602816581726074, "lr": 0.00015248437569286794, "tps": 180785, "wall": 7022.5} {"step": 19372, "train_loss": 3.160797595977783, "lr": 0.000152466616807033, "tps": 180660, "wall": 7027.7} {"step": 19373, "train_loss": 3.2277371883392334, "lr": 0.0001524488586862199, "tps": 180536, "wall": 7032.9} {"step": 19374, "train_loss": 3.2530136108398438, "lr": 0.00015243110133062975, "tps": 180411, "wall": 7038.1} {"step": 19375, "train_loss": 3.244450807571411, "lr": 0.00015241334474046375, "tps": 180286, "wall": 7043.4} {"step": 19376, "train_loss": 3.1671531200408936, "lr": 0.000152395588915923, "tps": 180161, "wall": 7048.6} {"step": 19377, "train_loss": 3.2032384872436523, "lr": 0.00015237783385720874, "tps": 180037, "wall": 7053.9} {"step": 19378, "train_loss": 3.240461587905884, "lr": 0.000152360079564522, "tps": 179912, "wall": 7059.1} {"step": 19379, "train_loss": 3.1833722591400146, "lr": 0.0001523423260380639, "tps": 179787, "wall": 7064.4} {"step": 19380, "train_loss": 3.2403745651245117, "lr": 0.00015232457327803565, "tps": 179660, "wall": 7069.8} {"step": 19381, "train_loss": 3.260838508605957, "lr": 0.00015230682128463828, "tps": 179533, "wall": 7075.1} {"step": 19382, "train_loss": 3.175252676010132, "lr": 0.0001522890700580729, "tps": 179406, "wall": 7080.5} {"step": 19383, "train_loss": 3.2271854877471924, "lr": 0.00015227131959854058, "tps": 179274, "wall": 7086.1} {"step": 19384, "train_loss": 3.1511528491973877, "lr": 0.00015225356990624243, "tps": 179149, "wall": 7091.4} {"step": 19385, "train_loss": 3.233330726623535, "lr": 0.0001522358209813795, "tps": 179023, "wall": 7096.7} {"step": 19386, "train_loss": 3.2692952156066895, "lr": 0.00015221807282415285, "tps": 178899, "wall": 7102.0} {"step": 19387, "train_loss": 3.3291616439819336, "lr": 0.00015220032543476357, "tps": 178774, "wall": 7107.3} {"step": 19388, "train_loss": 3.172969341278076, "lr": 0.00015218257881341267, "tps": 178642, "wall": 7113.0} {"step": 19389, "train_loss": 3.321005344390869, "lr": 0.00015216483296030115, "tps": 178516, "wall": 7118.4} {"step": 19390, "train_loss": 3.2162373065948486, "lr": 0.0001521470878756301, "tps": 178394, "wall": 7123.6} {"step": 19391, "train_loss": 3.2222208976745605, "lr": 0.00015212934355960048, "tps": 178275, "wall": 7128.7} {"step": 19392, "train_loss": 3.2179110050201416, "lr": 0.00015211160001241334, "tps": 178149, "wall": 7134.1} {"step": 19393, "train_loss": 3.1717946529388428, "lr": 0.00015209385723426966, "tps": 178029, "wall": 7139.3} {"step": 19394, "train_loss": 3.2194900512695312, "lr": 0.00015207611522537046, "tps": 177908, "wall": 7144.5} {"step": 19395, "train_loss": 3.241647243499756, "lr": 0.00015205837398591673, "tps": 177790, "wall": 7149.6} {"step": 19396, "train_loss": 3.2699081897735596, "lr": 0.0001520406335161093, "tps": 177673, "wall": 7154.7} {"step": 19001, "train_loss": 3.0706946849823, "lr": 0.00015910595191777325, "tps": 255072933, "wall": 4.9} {"step": 19002, "train_loss": 3.1071674823760986, "lr": 0.00015908792385278315, "tps": 135368603, "wall": 9.2} {"step": 19003, "train_loss": 3.1043334007263184, "lr": 0.00015906989647780835, "tps": 91784632, "wall": 13.6} {"step": 19004, "train_loss": 3.1804399490356445, "lr": 0.00015905186979305307, "tps": 68931315, "wall": 18.1} {"step": 19005, "train_loss": 3.045809030532837, "lr": 0.00015903384379872145, "tps": 55259235, "wall": 22.5} {"step": 19006, "train_loss": 3.0660691261291504, "lr": 0.00015901581849501786, "tps": 45890624, "wall": 27.1} {"step": 19007, "train_loss": 3.0662598609924316, "lr": 0.0001589977938821463, "tps": 39252728, "wall": 31.7} {"step": 19008, "train_loss": 3.168743133544922, "lr": 0.00015897976996031104, "tps": 34298282, "wall": 36.3} {"step": 19009, "train_loss": 3.128330707550049, "lr": 0.00015896174672971625, "tps": 30450811, "wall": 40.9} {"step": 19010, "train_loss": 3.1675024032592773, "lr": 0.00015894372419056612, "tps": 27399432, "wall": 45.5} {"step": 19011, "train_loss": 3.057451009750366, "lr": 0.00015892570234306473, "tps": 24897558, "wall": 50.0} {"step": 19012, "train_loss": 3.1303117275238037, "lr": 0.0001589076811874163, "tps": 22816404, "wall": 54.6} {"step": 19013, "train_loss": 3.033820629119873, "lr": 0.000158889660723825, "tps": 21049088, "wall": 59.2} {"step": 19014, "train_loss": 3.062486410140991, "lr": 0.0001588716409524949, "tps": 19532642, "wall": 63.8} {"step": 19015, "train_loss": 3.2360293865203857, "lr": 0.0001588536218736302, "tps": 18224039, "wall": 68.4} {"step": 19016, "train_loss": 3.128251075744629, "lr": 0.00015883560348743493, "tps": 17078136, "wall": 73.0} {"step": 19017, "train_loss": 3.032017707824707, "lr": 0.0001588175857941133, "tps": 16066463, "wall": 77.6} {"step": 19018, "train_loss": 3.170973300933838, "lr": 0.0001587995687938693, "tps": 15164161, "wall": 82.2} {"step": 19019, "train_loss": 3.127497673034668, "lr": 0.00015878155248690715, "tps": 14356327, "wall": 86.8} {"step": 19020, "train_loss": 3.130814552307129, "lr": 0.00015876353687343086, "tps": 13630700, "wall": 91.5} {"step": 19021, "train_loss": 3.178284168243408, "lr": 0.00015874552195364454, "tps": 12968676, "wall": 96.1} {"step": 19022, "train_loss": 3.186099052429199, "lr": 0.00015872750772775226, "tps": 12373737, "wall": 100.8} {"step": 19023, "train_loss": 3.0822062492370605, "lr": 0.0001587094941959581, "tps": 11830286, "wall": 105.4} {"step": 19024, "train_loss": 3.019446849822998, "lr": 0.0001586914813584661, "tps": 11333078, "wall": 110.0} {"step": 19025, "train_loss": 3.0846524238586426, "lr": 0.00015867346921548032, "tps": 10875418, "wall": 114.7} {"step": 19026, "train_loss": 2.9670372009277344, "lr": 0.00015865545776720484, "tps": 10453075, "wall": 119.3} {"step": 19027, "train_loss": 3.0792994499206543, "lr": 0.0001586374470138436, "tps": 10059996, "wall": 124.0} {"step": 19028, "train_loss": 3.1886754035949707, "lr": 0.00015861943695560067, "tps": 9698574, "wall": 128.6} {"step": 19029, "train_loss": 3.0833351612091064, "lr": 0.00015860142759268006, "tps": 9359887, "wall": 133.2} {"step": 19030, "train_loss": 3.121382713317871, "lr": 0.0001585834189252859, "tps": 9044594, "wall": 137.9} {"step": 19031, "train_loss": 3.086498260498047, "lr": 0.00015856541095362201, "tps": 8749636, "wall": 142.6} {"step": 19032, "train_loss": 3.1182498931884766, "lr": 0.00015854740367789245, "tps": 8473472, "wall": 147.2} {"step": 19033, "train_loss": 3.1152451038360596, "lr": 0.00015852939709830132, "tps": 8213886, "wall": 151.9} {"step": 19034, "train_loss": 2.9870643615722656, "lr": 0.00015851139121505242, "tps": 7966303, "wall": 156.6} {"step": 19035, "train_loss": 3.129141092300415, "lr": 0.00015849338602834983, "tps": 7736351, "wall": 161.3} {"step": 19036, "train_loss": 3.0886452198028564, "lr": 0.00015847538153839752, "tps": 7519085, "wall": 165.9} {"step": 19037, "train_loss": 3.1375513076782227, "lr": 0.0001584573777453994, "tps": 7313550, "wall": 170.6} {"step": 19038, "train_loss": 3.082655429840088, "lr": 0.00015843937464955941, "tps": 7118991, "wall": 175.3} {"step": 19039, "train_loss": 3.0552992820739746, "lr": 0.00015842137225108153, "tps": 6934410, "wall": 179.9} {"step": 19040, "train_loss": 3.071985960006714, "lr": 0.0001584033705501697, "tps": 6758906, "wall": 184.6} {"step": 19041, "train_loss": 3.067948818206787, "lr": 0.00015838536954702778, "tps": 6592483, "wall": 189.3} {"step": 19042, "train_loss": 3.166292905807495, "lr": 0.00015836736924185974, "tps": 6433881, "wall": 194.0} {"step": 19043, "train_loss": 2.987457275390625, "lr": 0.00015834936963486952, "tps": 6282512, "wall": 198.7} {"step": 19044, "train_loss": 3.1546366214752197, "lr": 0.0001583313707262609, "tps": 6137989, "wall": 203.3} {"step": 19045, "train_loss": 3.0013160705566406, "lr": 0.00015831337251623787, "tps": 6000064, "wall": 208.0} {"step": 19046, "train_loss": 3.1825594902038574, "lr": 0.0001582953750050043, "tps": 5868372, "wall": 212.7} {"step": 19047, "train_loss": 2.947909116744995, "lr": 0.0001582773781927641, "tps": 5741328, "wall": 217.4} {"step": 19048, "train_loss": 3.1182384490966797, "lr": 0.00015825938207972103, "tps": 5620073, "wall": 222.1} {"step": 19049, "train_loss": 3.1746952533721924, "lr": 0.00015824138666607906, "tps": 5504061, "wall": 226.8} {"step": 19050, "train_loss": 3.093379497528076, "lr": 0.00015822339195204204, "tps": 5392673, "wall": 231.5} {"step": 19051, "train_loss": 2.99422550201416, "lr": 0.00015820539793781372, "tps": 5285604, "wall": 236.2} {"step": 19052, "train_loss": 3.1108102798461914, "lr": 0.000158187404623598, "tps": 5183143, "wall": 240.9} {"step": 19053, "train_loss": 3.1402547359466553, "lr": 0.00015816941200959877, "tps": 5084184, "wall": 245.6} {"step": 19054, "train_loss": 3.0890042781829834, "lr": 0.00015815142009601972, "tps": 4988981, "wall": 250.3} {"step": 19055, "train_loss": 3.072633743286133, "lr": 0.00015813342888306475, "tps": 4897581, "wall": 255.0} {"step": 19056, "train_loss": 3.0220046043395996, "lr": 0.0001581154383709376, "tps": 4809428, "wall": 259.7} {"step": 19057, "train_loss": 3.1272549629211426, "lr": 0.00015809744855984218, "tps": 4723926, "wall": 264.4} {"step": 19058, "train_loss": 3.113945722579956, "lr": 0.0001580794594499822, "tps": 4641744, "wall": 269.1} {"step": 19059, "train_loss": 3.1039509773254395, "lr": 0.00015806147104156136, "tps": 4561249, "wall": 273.9} {"step": 19060, "train_loss": 3.2088444232940674, "lr": 0.00015804348333478365, "tps": 4484773, "wall": 278.5} {"step": 19061, "train_loss": 3.130064010620117, "lr": 0.00015802549632985263, "tps": 4410678, "wall": 283.2} {"step": 19062, "train_loss": 3.079723358154297, "lr": 0.00015800751002697217, "tps": 4338868, "wall": 287.9} {"step": 19063, "train_loss": 3.1466150283813477, "lr": 0.00015798952442634603, "tps": 4269250, "wall": 292.6} {"step": 19064, "train_loss": 3.081997871398926, "lr": 0.00015797153952817788, "tps": 4201594, "wall": 297.4} {"step": 19065, "train_loss": 3.1064038276672363, "lr": 0.00015795355533267146, "tps": 4136403, "wall": 302.1} {"step": 19066, "train_loss": 3.1378655433654785, "lr": 0.0001579355718400305, "tps": 4073066, "wall": 306.8} {"step": 19067, "train_loss": 3.1792409420013428, "lr": 0.00015791758905045887, "tps": 4011447, "wall": 311.5} {"step": 19068, "train_loss": 3.0733375549316406, "lr": 0.00015789960696416003, "tps": 3951724, "wall": 316.2} {"step": 19069, "train_loss": 3.0092084407806396, "lr": 0.00015788162558133783, "tps": 3893906, "wall": 321.0} {"step": 19070, "train_loss": 3.1872406005859375, "lr": 0.00015786364490219597, "tps": 3837554, "wall": 325.7} {"step": 19071, "train_loss": 3.1011064052581787, "lr": 0.00015784566492693807, "tps": 3782804, "wall": 330.4} {"step": 19072, "train_loss": 3.0735251903533936, "lr": 0.00015782768565576784, "tps": 3729219, "wall": 335.2} {"step": 19073, "train_loss": 3.1092400550842285, "lr": 0.00015780970708888893, "tps": 3677675, "wall": 339.9} {"step": 19074, "train_loss": 3.0240883827209473, "lr": 0.00015779172922650506, "tps": 3627499, "wall": 344.6} {"step": 19075, "train_loss": 3.0919384956359863, "lr": 0.00015777375206881984, "tps": 3578609, "wall": 349.3} {"step": 19076, "train_loss": 3.1450440883636475, "lr": 0.00015775577561603693, "tps": 3531009, "wall": 354.1} {"step": 19077, "train_loss": 3.1143834590911865, "lr": 0.0001577377998683599, "tps": 3484876, "wall": 358.8} {"step": 19078, "train_loss": 3.122126579284668, "lr": 0.0001577198248259925, "tps": 3439855, "wall": 363.5} {"step": 19079, "train_loss": 3.2084736824035645, "lr": 0.0001577018504891383, "tps": 3395738, "wall": 368.2} {"step": 19080, "train_loss": 3.058856725692749, "lr": 0.0001576838768580009, "tps": 3352940, "wall": 373.0} {"step": 19081, "train_loss": 3.1287505626678467, "lr": 0.0001576659039327839, "tps": 3311268, "wall": 377.7} {"step": 19082, "train_loss": 3.078193187713623, "lr": 0.00015764793171369092, "tps": 3270470, "wall": 382.4} {"step": 19083, "train_loss": 3.0593461990356445, "lr": 0.00015762996020092556, "tps": 3230656, "wall": 387.1} {"step": 19084, "train_loss": 3.0760838985443115, "lr": 0.00015761198939469133, "tps": 3191795, "wall": 391.9} {"step": 19085, "train_loss": 3.1558423042297363, "lr": 0.0001575940192951919, "tps": 3153450, "wall": 396.7} {"step": 19086, "train_loss": 3.1071155071258545, "lr": 0.00015757604990263078, "tps": 3116448, "wall": 401.4} {"step": 19087, "train_loss": 3.078728675842285, "lr": 0.00015755808121721158, "tps": 3080387, "wall": 406.1} {"step": 19088, "train_loss": 3.1125452518463135, "lr": 0.00015754011323913778, "tps": 3045112, "wall": 410.8} {"step": 19089, "train_loss": 3.095667839050293, "lr": 0.00015752214596861296, "tps": 3010614, "wall": 415.6} {"step": 19090, "train_loss": 3.0789952278137207, "lr": 0.00015750417940584068, "tps": 2976869, "wall": 420.3} {"step": 19091, "train_loss": 3.019423246383667, "lr": 0.0001574862135510244, "tps": 2943754, "wall": 425.0} {"step": 19092, "train_loss": 3.136615037918091, "lr": 0.00015746824840436765, "tps": 2911574, "wall": 429.8} {"step": 19093, "train_loss": 3.107646942138672, "lr": 0.000157450283966074, "tps": 2880022, "wall": 434.5} {"step": 19094, "train_loss": 3.1284918785095215, "lr": 0.00015743232023634693, "tps": 2849126, "wall": 439.2} {"step": 19095, "train_loss": 3.0480711460113525, "lr": 0.00015741435721538993, "tps": 2818863, "wall": 444.0} {"step": 19096, "train_loss": 3.0991926193237305, "lr": 0.00015739639490340644, "tps": 2789265, "wall": 448.7} {"step": 19097, "train_loss": 3.0846362113952637, "lr": 0.0001573784333006, "tps": 2760215, "wall": 453.4} {"step": 19098, "train_loss": 3.1489484310150146, "lr": 0.00015736047240717403, "tps": 2731528, "wall": 458.2} {"step": 19099, "train_loss": 3.1662399768829346, "lr": 0.00015734251222333204, "tps": 2703684, "wall": 463.0} {"step": 19100, "train_loss": 3.0945329666137695, "lr": 0.00015732455274927745, "tps": 2676365, "wall": 467.7} {"step": 19101, "train_loss": 2.9759864807128906, "lr": 0.00015730659398521373, "tps": 2649690, "wall": 472.5} {"step": 19102, "train_loss": 3.030405044555664, "lr": 0.00015728863593134432, "tps": 2623569, "wall": 477.2} {"step": 19103, "train_loss": 3.0397040843963623, "lr": 0.0001572706785878726, "tps": 2597933, "wall": 481.9} {"step": 19104, "train_loss": 3.001638412475586, "lr": 0.00015725272195500205, "tps": 2572766, "wall": 486.7} {"step": 19105, "train_loss": 3.0601112842559814, "lr": 0.00015723476603293608, "tps": 2548067, "wall": 491.4} {"step": 19106, "train_loss": 3.130016326904297, "lr": 0.000157216810821878, "tps": 2523781, "wall": 496.2} {"step": 19107, "train_loss": 3.0060019493103027, "lr": 0.00015719885632203132, "tps": 2500017, "wall": 500.9} {"step": 19108, "train_loss": 3.18855619430542, "lr": 0.00015718090253359943, "tps": 2476729, "wall": 505.6} {"step": 19109, "train_loss": 3.0758938789367676, "lr": 0.00015716294945678562, "tps": 2453865, "wall": 510.4} {"step": 19110, "train_loss": 3.052621364593506, "lr": 0.00015714499709179337, "tps": 2431216, "wall": 515.2} {"step": 19111, "train_loss": 3.0364370346069336, "lr": 0.00015712704543882598, "tps": 2409210, "wall": 519.9} {"step": 19112, "train_loss": 3.0691463947296143, "lr": 0.00015710909449808677, "tps": 2387549, "wall": 524.6} {"step": 19113, "train_loss": 3.0939245223999023, "lr": 0.00015709114426977916, "tps": 2366313, "wall": 529.4} {"step": 19114, "train_loss": 3.0692787170410156, "lr": 0.00015707319475410656, "tps": 2345385, "wall": 534.1} {"step": 19115, "train_loss": 3.0773510932922363, "lr": 0.0001570552459512721, "tps": 2324882, "wall": 538.9} {"step": 19116, "train_loss": 3.08632755279541, "lr": 0.00015703729786147928, "tps": 2304701, "wall": 543.6} {"step": 19117, "train_loss": 3.090428590774536, "lr": 0.00015701935048493138, "tps": 2284828, "wall": 548.4} {"step": 19118, "train_loss": 3.050579071044922, "lr": 0.00015700140382183162, "tps": 2265285, "wall": 553.1} {"step": 19119, "train_loss": 3.1579952239990234, "lr": 0.00015698345787238334, "tps": 2246138, "wall": 557.9} {"step": 19120, "train_loss": 3.1552064418792725, "lr": 0.00015696551263678988, "tps": 2227320, "wall": 562.6} {"step": 19121, "train_loss": 3.073580265045166, "lr": 0.00015694756811525457, "tps": 2208807, "wall": 567.4} {"step": 19122, "train_loss": 3.1273155212402344, "lr": 0.00015692962430798063, "tps": 2190551, "wall": 572.1} {"step": 19123, "train_loss": 3.0805556774139404, "lr": 0.0001569116812151712, "tps": 2172475, "wall": 576.9} {"step": 19124, "train_loss": 3.0562968254089355, "lr": 0.00015689373883702977, "tps": 2154886, "wall": 581.6} {"step": 19125, "train_loss": 3.079655170440674, "lr": 0.0001568757971737594, "tps": 2137587, "wall": 586.4} {"step": 19126, "train_loss": 3.027649164199829, "lr": 0.00015685785622556345, "tps": 2120493, "wall": 591.1} {"step": 19127, "train_loss": 3.133467197418213, "lr": 0.0001568399159926451, "tps": 2103756, "wall": 595.9} {"step": 19128, "train_loss": 3.112450122833252, "lr": 0.00015682197647520768, "tps": 2087286, "wall": 600.6} {"step": 19129, "train_loss": 3.081613063812256, "lr": 0.00015680403767345425, "tps": 2070980, "wall": 605.4} {"step": 19130, "train_loss": 3.1063380241394043, "lr": 0.0001567860995875881, "tps": 2054981, "wall": 610.1} {"step": 19131, "train_loss": 3.075507640838623, "lr": 0.0001567681622178125, "tps": 2039230, "wall": 614.9} {"step": 19132, "train_loss": 3.1710972785949707, "lr": 0.00015675022556433058, "tps": 2023764, "wall": 619.6} {"step": 19133, "train_loss": 2.984713315963745, "lr": 0.00015673228962734544, "tps": 2008497, "wall": 624.3} {"step": 19134, "train_loss": 2.9767191410064697, "lr": 0.00015671435440706038, "tps": 1993486, "wall": 629.1} {"step": 19135, "train_loss": 2.975878953933716, "lr": 0.00015669641990367854, "tps": 1978457, "wall": 633.9} {"step": 19136, "train_loss": 3.1992132663726807, "lr": 0.0001566784861174031, "tps": 1963931, "wall": 638.6} {"step": 19137, "train_loss": 3.1003427505493164, "lr": 0.00015666055304843716, "tps": 1949543, "wall": 643.3} {"step": 19138, "train_loss": 3.007031202316284, "lr": 0.00015664262069698393, "tps": 1935361, "wall": 648.1} {"step": 19139, "train_loss": 3.208031415939331, "lr": 0.00015662468906324652, "tps": 1921365, "wall": 652.8} {"step": 19140, "train_loss": 3.004828691482544, "lr": 0.00015660675814742805, "tps": 1907562, "wall": 657.6} {"step": 19141, "train_loss": 3.1193153858184814, "lr": 0.00015658882794973165, "tps": 1893976, "wall": 662.4} {"step": 19142, "train_loss": 3.061735153198242, "lr": 0.00015657089847036045, "tps": 1880610, "wall": 667.1} {"step": 19143, "train_loss": 3.1531128883361816, "lr": 0.00015655296970951756, "tps": 1867438, "wall": 671.8} {"step": 19144, "train_loss": 3.2034835815429688, "lr": 0.00015653504166740598, "tps": 1854447, "wall": 676.6} {"step": 19145, "train_loss": 3.1102960109710693, "lr": 0.00015651711434422894, "tps": 1841547, "wall": 681.4} {"step": 19146, "train_loss": 3.0058233737945557, "lr": 0.0001564991877401895, "tps": 1828890, "wall": 686.1} {"step": 19147, "train_loss": 3.0735812187194824, "lr": 0.00015648126185549064, "tps": 1816433, "wall": 690.9} {"step": 19148, "train_loss": 3.116065502166748, "lr": 0.0001564633366903355, "tps": 1803983, "wall": 695.7} {"step": 19149, "train_loss": 3.1055986881256104, "lr": 0.00015644541224492712, "tps": 1791829, "wall": 700.4} {"step": 19150, "train_loss": 2.9633240699768066, "lr": 0.00015642748851946853, "tps": 1779834, "wall": 705.2} {"step": 19151, "train_loss": 3.060943603515625, "lr": 0.00015640956551416283, "tps": 1768052, "wall": 709.9} {"step": 19152, "train_loss": 3.1001381874084473, "lr": 0.00015639164322921295, "tps": 1756413, "wall": 714.6} {"step": 19153, "train_loss": 3.151503086090088, "lr": 0.00015637372166482205, "tps": 1744871, "wall": 719.4} {"step": 19154, "train_loss": 3.064758777618408, "lr": 0.000156355800821193, "tps": 1733518, "wall": 724.2} {"step": 19155, "train_loss": 3.0196967124938965, "lr": 0.0001563378806985289, "tps": 1722311, "wall": 728.9} {"step": 19156, "train_loss": 3.065180778503418, "lr": 0.00015631996129703278, "tps": 1711258, "wall": 733.7} {"step": 19157, "train_loss": 3.046538829803467, "lr": 0.00015630204261690754, "tps": 1700355, "wall": 738.4} {"step": 19158, "train_loss": 3.1315083503723145, "lr": 0.00015628412465835623, "tps": 1689583, "wall": 743.1} {"step": 19159, "train_loss": 3.0273823738098145, "lr": 0.0001562662074215818, "tps": 1678940, "wall": 747.9} {"step": 19160, "train_loss": 3.1025350093841553, "lr": 0.00015624829090678718, "tps": 1668414, "wall": 752.7} {"step": 19161, "train_loss": 3.219710350036621, "lr": 0.0001562303751141754, "tps": 1657957, "wall": 757.4} {"step": 19162, "train_loss": 2.997100353240967, "lr": 0.00015621246004394942, "tps": 1647703, "wall": 762.2} {"step": 19163, "train_loss": 3.115201234817505, "lr": 0.0001561945456963121, "tps": 1637606, "wall": 766.9} {"step": 19164, "train_loss": 3.025214672088623, "lr": 0.00015617663207146643, "tps": 1627616, "wall": 771.7} {"step": 19165, "train_loss": 3.078592538833618, "lr": 0.00015615871916961532, "tps": 1617763, "wall": 776.4} {"step": 19166, "train_loss": 3.196460723876953, "lr": 0.0001561408069909617, "tps": 1608005, "wall": 781.2} {"step": 19167, "train_loss": 2.9811956882476807, "lr": 0.0001561228955357085, "tps": 1598345, "wall": 785.9} {"step": 19168, "train_loss": 2.9800009727478027, "lr": 0.00015610498480405851, "tps": 1588856, "wall": 790.7} {"step": 19169, "train_loss": 3.0073537826538086, "lr": 0.00015608707479621473, "tps": 1579478, "wall": 795.4} {"step": 19170, "train_loss": 3.0990688800811768, "lr": 0.0001560691655123801, "tps": 1570205, "wall": 800.1} {"step": 19171, "train_loss": 3.109588384628296, "lr": 0.00015605125695275737, "tps": 1561028, "wall": 804.9} {"step": 19172, "train_loss": 3.1540675163269043, "lr": 0.00015603334911754946, "tps": 1551866, "wall": 809.7} {"step": 19173, "train_loss": 2.9662978649139404, "lr": 0.00015601544200695923, "tps": 1542784, "wall": 814.5} {"step": 19174, "train_loss": 3.101087808609009, "lr": 0.00015599753562118952, "tps": 1533933, "wall": 819.2} {"step": 19175, "train_loss": 3.2061820030212402, "lr": 0.00015597962996044323, "tps": 1525152, "wall": 824.0} {"step": 19176, "train_loss": 3.0644960403442383, "lr": 0.00015596172502492313, "tps": 1516482, "wall": 828.7} {"step": 19177, "train_loss": 3.0981812477111816, "lr": 0.00015594382081483209, "tps": 1507828, "wall": 833.5} {"step": 19178, "train_loss": 3.077131509780884, "lr": 0.00015592591733037289, "tps": 1499354, "wall": 838.3} {"step": 19179, "train_loss": 3.063624620437622, "lr": 0.00015590801457174836, "tps": 1490977, "wall": 843.1} {"step": 19180, "train_loss": 3.0020968914031982, "lr": 0.00015589011253916137, "tps": 1482684, "wall": 847.8} {"step": 19181, "train_loss": 3.1711795330047607, "lr": 0.0001558722112328146, "tps": 1474490, "wall": 852.6} {"step": 19182, "train_loss": 2.995067596435547, "lr": 0.0001558543106529109, "tps": 1466389, "wall": 857.3} {"step": 19183, "train_loss": 3.1416826248168945, "lr": 0.00015583641079965305, "tps": 1458367, "wall": 862.1} {"step": 19184, "train_loss": 3.0876340866088867, "lr": 0.0001558185116732438, "tps": 1450415, "wall": 866.9} {"step": 19185, "train_loss": 3.116255283355713, "lr": 0.00015580061327388588, "tps": 1442589, "wall": 871.6} {"step": 19186, "train_loss": 3.1702394485473633, "lr": 0.00015578271560178216, "tps": 1434772, "wall": 876.4} {"step": 19187, "train_loss": 3.125716209411621, "lr": 0.0001557648186571353, "tps": 1427094, "wall": 881.2} {"step": 19188, "train_loss": 3.1422007083892822, "lr": 0.00015574692244014798, "tps": 1419515, "wall": 885.9} {"step": 19189, "train_loss": 3.0884203910827637, "lr": 0.00015572902695102308, "tps": 1412003, "wall": 890.7} {"step": 19190, "train_loss": 2.9577648639678955, "lr": 0.00015571113218996319, "tps": 1404583, "wall": 895.4} {"step": 19191, "train_loss": 3.1832828521728516, "lr": 0.00015569323815717108, "tps": 1397250, "wall": 900.2} {"step": 19192, "train_loss": 2.993954658508301, "lr": 0.00015567534485284946, "tps": 1389943, "wall": 905.0} {"step": 19193, "train_loss": 2.9564201831817627, "lr": 0.00015565745227720106, "tps": 1382792, "wall": 909.7} {"step": 19194, "train_loss": 3.07045316696167, "lr": 0.00015563956043042842, "tps": 1375663, "wall": 914.4} {"step": 19195, "train_loss": 3.066739082336426, "lr": 0.0001556216693127344, "tps": 1368595, "wall": 919.2} {"step": 19196, "train_loss": 3.125772714614868, "lr": 0.0001556037789243215, "tps": 1361627, "wall": 924.0} {"step": 19197, "train_loss": 3.000092029571533, "lr": 0.00015558588926539263, "tps": 1354754, "wall": 928.7} {"step": 19198, "train_loss": 3.054718017578125, "lr": 0.00015556800033615016, "tps": 1347891, "wall": 933.5} {"step": 19199, "train_loss": 3.1317343711853027, "lr": 0.0001555501121367969, "tps": 1341079, "wall": 938.3} {"step": 19200, "train_loss": 3.1367664337158203, "lr": 0.00015553222466753547, "tps": 1334403, "wall": 943.0} {"step": 19201, "train_loss": 3.141004800796509, "lr": 0.0001555143379285685, "tps": 1327788, "wall": 947.8} {"step": 19202, "train_loss": 3.08660626411438, "lr": 0.00015549645192009854, "tps": 1321227, "wall": 952.5} {"step": 19203, "train_loss": 3.0951931476593018, "lr": 0.00015547856664232837, "tps": 1314736, "wall": 957.3} {"step": 19204, "train_loss": 3.0189597606658936, "lr": 0.00015546068209546041, "tps": 1308299, "wall": 962.0} {"step": 19205, "train_loss": 3.041494131088257, "lr": 0.00015544279827969733, "tps": 1301918, "wall": 966.8} {"step": 19206, "train_loss": 3.1018707752227783, "lr": 0.0001554249151952417, "tps": 1295613, "wall": 971.5} {"step": 19207, "train_loss": 3.0376858711242676, "lr": 0.0001554070328422962, "tps": 1289372, "wall": 976.3} {"step": 19208, "train_loss": 2.9721179008483887, "lr": 0.00015538915122106329, "tps": 1283197, "wall": 981.1} {"step": 19209, "train_loss": 3.08760929107666, "lr": 0.00015537127033174556, "tps": 1277081, "wall": 985.8} {"step": 19210, "train_loss": 2.995530128479004, "lr": 0.0001553533901745456, "tps": 1271024, "wall": 990.5} {"step": 19211, "train_loss": 3.029423713684082, "lr": 0.0001553355107496659, "tps": 1264948, "wall": 995.4} {"step": 19212, "train_loss": 2.9963536262512207, "lr": 0.00015531763205730906, "tps": 1258955, "wall": 1000.1} {"step": 19213, "train_loss": 3.0826170444488525, "lr": 0.00015529975409767758, "tps": 1253080, "wall": 1004.9} {"step": 19214, "train_loss": 3.05163311958313, "lr": 0.00015528187687097403, "tps": 1247227, "wall": 1009.7} {"step": 19215, "train_loss": 3.1128475666046143, "lr": 0.00015526400037740076, "tps": 1241433, "wall": 1014.4} {"step": 19216, "train_loss": 3.114543914794922, "lr": 0.0001552461246171605, "tps": 1235697, "wall": 1019.2} {"step": 19217, "train_loss": 3.0482285022735596, "lr": 0.0001552282495904556, "tps": 1230026, "wall": 1023.9} {"step": 19218, "train_loss": 3.061798572540283, "lr": 0.0001552103752974886, "tps": 1224355, "wall": 1028.7} {"step": 19219, "train_loss": 3.03859806060791, "lr": 0.000155192501738462, "tps": 1218722, "wall": 1033.5} {"step": 19220, "train_loss": 3.1178059577941895, "lr": 0.0001551746289135782, "tps": 1213144, "wall": 1038.3} {"step": 19221, "train_loss": 3.0889551639556885, "lr": 0.00015515675682303975, "tps": 1207657, "wall": 1043.1} {"step": 19222, "train_loss": 3.139186382293701, "lr": 0.00015513888546704903, "tps": 1202233, "wall": 1047.9} {"step": 19223, "train_loss": 3.061336040496826, "lr": 0.0001551210148458085, "tps": 1196860, "wall": 1052.6} {"step": 19224, "train_loss": 3.08491849899292, "lr": 0.00015510314495952073, "tps": 1191499, "wall": 1057.4} {"step": 19225, "train_loss": 3.1633307933807373, "lr": 0.00015508527580838797, "tps": 1186221, "wall": 1062.2} {"step": 19226, "train_loss": 3.068085193634033, "lr": 0.00015506740739261275, "tps": 1180987, "wall": 1067.0} {"step": 19227, "train_loss": 2.9641976356506348, "lr": 0.00015504953971239745, "tps": 1175775, "wall": 1071.7} {"step": 19228, "train_loss": 3.1059718132019043, "lr": 0.00015503167276794444, "tps": 1170641, "wall": 1076.5} {"step": 19229, "train_loss": 3.1358156204223633, "lr": 0.00015501380655945615, "tps": 1165554, "wall": 1081.3} {"step": 19230, "train_loss": 3.0129098892211914, "lr": 0.00015499594108713503, "tps": 1160489, "wall": 1086.0} {"step": 19231, "train_loss": 3.056581735610962, "lr": 0.00015497807635118336, "tps": 1155506, "wall": 1090.8} {"step": 19232, "train_loss": 3.0230515003204346, "lr": 0.00015496021235180362, "tps": 1150543, "wall": 1095.5} {"step": 19233, "train_loss": 3.06787109375, "lr": 0.00015494234908919801, "tps": 1145591, "wall": 1100.3} {"step": 19234, "train_loss": 3.1646485328674316, "lr": 0.0001549244865635691, "tps": 1140721, "wall": 1105.1} {"step": 19235, "train_loss": 3.0486748218536377, "lr": 0.00015490662477511905, "tps": 1135910, "wall": 1109.8} {"step": 19236, "train_loss": 3.0342493057250977, "lr": 0.00015488876372405028, "tps": 1131044, "wall": 1114.6} {"step": 19237, "train_loss": 3.1260135173797607, "lr": 0.00015487090341056517, "tps": 1126300, "wall": 1119.4} {"step": 19238, "train_loss": 3.130927085876465, "lr": 0.00015485304383486596, "tps": 1121577, "wall": 1124.2} {"step": 19239, "train_loss": 3.0172109603881836, "lr": 0.000154835184997155, "tps": 1116914, "wall": 1128.9} {"step": 19240, "train_loss": 3.117680549621582, "lr": 0.0001548173268976346, "tps": 1112297, "wall": 1133.7} {"step": 19241, "train_loss": 3.0418925285339355, "lr": 0.000154799469536507, "tps": 1107704, "wall": 1138.4} {"step": 19242, "train_loss": 3.068427085876465, "lr": 0.00015478161291397453, "tps": 1103145, "wall": 1143.2} {"step": 19243, "train_loss": 3.0801563262939453, "lr": 0.0001547637570302395, "tps": 1098606, "wall": 1148.0} {"step": 19244, "train_loss": 3.0603959560394287, "lr": 0.0001547459018855042, "tps": 1094117, "wall": 1152.7} {"step": 19245, "train_loss": 3.1109702587127686, "lr": 0.00015472804747997083, "tps": 1089674, "wall": 1157.5} {"step": 19246, "train_loss": 3.0678248405456543, "lr": 0.00015471019381384165, "tps": 1085270, "wall": 1162.3} {"step": 19247, "train_loss": 3.1293320655822754, "lr": 0.00015469234088731897, "tps": 1080899, "wall": 1167.0} {"step": 19248, "train_loss": 3.0395755767822266, "lr": 0.00015467448870060496, "tps": 1076569, "wall": 1171.8} {"step": 19249, "train_loss": 3.140899658203125, "lr": 0.00015465663725390186, "tps": 1072236, "wall": 1176.6} {"step": 19250, "train_loss": 3.115032911300659, "lr": 0.00015463878654741194, "tps": 1067964, "wall": 1181.3} {"step": 19251, "train_loss": 3.025420904159546, "lr": 0.00015462093658133737, "tps": 1063753, "wall": 1186.1} {"step": 19252, "train_loss": 2.9945757389068604, "lr": 0.00015460308735588033, "tps": 1059566, "wall": 1190.8} {"step": 19253, "train_loss": 3.0589699745178223, "lr": 0.00015458523887124307, "tps": 1055403, "wall": 1195.6} {"step": 19254, "train_loss": 3.1232733726501465, "lr": 0.0001545673911276278, "tps": 1051270, "wall": 1200.4} {"step": 19255, "train_loss": 3.1172289848327637, "lr": 0.00015454954412523665, "tps": 1047178, "wall": 1205.1} {"step": 19256, "train_loss": 3.1514785289764404, "lr": 0.00015453169786427178, "tps": 1043114, "wall": 1209.9} {"step": 19257, "train_loss": 3.025906562805176, "lr": 0.00015451385234493544, "tps": 1039080, "wall": 1214.6} {"step": 19258, "train_loss": 3.0857362747192383, "lr": 0.00015449600756742963, "tps": 1035082, "wall": 1219.4} {"step": 19259, "train_loss": 3.138927936553955, "lr": 0.00015447816353195663, "tps": 1031116, "wall": 1224.1} {"step": 19260, "train_loss": 2.9408681392669678, "lr": 0.00015446032023871853, "tps": 1027181, "wall": 1228.9} {"step": 19261, "train_loss": 3.0378541946411133, "lr": 0.0001544424776879175, "tps": 1023227, "wall": 1233.7} {"step": 19262, "train_loss": 3.092017650604248, "lr": 0.00015442463587975565, "tps": 1019350, "wall": 1238.5} {"step": 19263, "train_loss": 3.1794142723083496, "lr": 0.000154406794814435, "tps": 1015496, "wall": 1243.2} {"step": 19264, "train_loss": 3.1071531772613525, "lr": 0.00015438895449215777, "tps": 1011678, "wall": 1248.0} {"step": 19265, "train_loss": 2.9323439598083496, "lr": 0.00015437111491312604, "tps": 1007890, "wall": 1252.7} {"step": 19266, "train_loss": 2.991469621658325, "lr": 0.00015435327607754177, "tps": 1004128, "wall": 1257.5} {"step": 19267, "train_loss": 3.06791353225708, "lr": 0.00015433543798560727, "tps": 1000403, "wall": 1262.2} {"step": 19268, "train_loss": 3.1213836669921875, "lr": 0.0001543176006375244, "tps": 996695, "wall": 1267.0} {"step": 19269, "train_loss": 3.0330209732055664, "lr": 0.00015429976403349532, "tps": 993032, "wall": 1271.7} {"step": 19270, "train_loss": 3.0868823528289795, "lr": 0.00015428192817372205, "tps": 989376, "wall": 1276.5} {"step": 19271, "train_loss": 3.0629255771636963, "lr": 0.00015426409305840667, "tps": 985749, "wall": 1281.3} {"step": 19272, "train_loss": 3.0915629863739014, "lr": 0.0001542462586877512, "tps": 982144, "wall": 1286.0} {"step": 19273, "train_loss": 3.0360755920410156, "lr": 0.00015422842506195768, "tps": 978571, "wall": 1290.8} {"step": 19274, "train_loss": 3.185624599456787, "lr": 0.0001542105921812281, "tps": 974986, "wall": 1295.6} {"step": 19275, "train_loss": 3.059725761413574, "lr": 0.00015419276004576452, "tps": 971464, "wall": 1300.4} {"step": 19276, "train_loss": 3.0640203952789307, "lr": 0.00015417492865576885, "tps": 967977, "wall": 1305.1} {"step": 19277, "train_loss": 3.090658664703369, "lr": 0.0001541570980114432, "tps": 964511, "wall": 1309.9} {"step": 19278, "train_loss": 3.0983729362487793, "lr": 0.00015413926811298954, "tps": 961076, "wall": 1314.6} {"step": 19279, "train_loss": 3.120544195175171, "lr": 0.00015412143896060973, "tps": 957666, "wall": 1319.4} {"step": 19280, "train_loss": 3.1618173122406006, "lr": 0.00015410361055450585, "tps": 954267, "wall": 1324.2} {"step": 19281, "train_loss": 3.0469274520874023, "lr": 0.0001540857828948799, "tps": 950888, "wall": 1328.9} {"step": 19282, "train_loss": 3.0736021995544434, "lr": 0.0001540679559819337, "tps": 947536, "wall": 1333.7} {"step": 19283, "train_loss": 3.031277656555176, "lr": 0.0001540501298158693, "tps": 944218, "wall": 1338.5} {"step": 19284, "train_loss": 3.1167197227478027, "lr": 0.00015403230439688857, "tps": 940920, "wall": 1343.2} {"step": 19285, "train_loss": 3.09108829498291, "lr": 0.00015401447972519344, "tps": 937643, "wall": 1348.0} {"step": 19286, "train_loss": 3.129539966583252, "lr": 0.0001539966558009859, "tps": 934386, "wall": 1352.8} {"step": 19287, "train_loss": 3.0752711296081543, "lr": 0.0001539788326244678, "tps": 931102, "wall": 1357.6} {"step": 19288, "train_loss": 3.0884151458740234, "lr": 0.0001539610101958411, "tps": 927892, "wall": 1362.4} {"step": 19289, "train_loss": 3.0168066024780273, "lr": 0.00015394318851530758, "tps": 924713, "wall": 1367.1} {"step": 19290, "train_loss": 3.108668327331543, "lr": 0.0001539253675830692, "tps": 921548, "wall": 1371.9} {"step": 19291, "train_loss": 3.186051368713379, "lr": 0.00015390754739932785, "tps": 918417, "wall": 1376.6} {"step": 19292, "train_loss": 3.0424301624298096, "lr": 0.00015388972796428539, "tps": 915293, "wall": 1381.4} {"step": 19293, "train_loss": 3.092165231704712, "lr": 0.00015387190927814364, "tps": 912189, "wall": 1386.2} {"step": 19294, "train_loss": 3.082374095916748, "lr": 0.0001538540913411045, "tps": 909124, "wall": 1390.9} {"step": 19295, "train_loss": 3.0780348777770996, "lr": 0.0001538362741533698, "tps": 906069, "wall": 1395.7} {"step": 19296, "train_loss": 3.090616226196289, "lr": 0.00015381845771514133, "tps": 903043, "wall": 1400.4} {"step": 19297, "train_loss": 3.110755443572998, "lr": 0.00015380064202662097, "tps": 900027, "wall": 1405.2} {"step": 19298, "train_loss": 3.1610710620880127, "lr": 0.00015378282708801053, "tps": 897035, "wall": 1410.0} {"step": 19299, "train_loss": 3.1400809288024902, "lr": 0.0001537650128995118, "tps": 894027, "wall": 1414.8} {"step": 19300, "train_loss": 2.9842517375946045, "lr": 0.00015374719946132656, "tps": 891088, "wall": 1419.5} {"step": 19301, "train_loss": 3.148379325866699, "lr": 0.0001537293867736567, "tps": 888164, "wall": 1424.3} {"step": 19302, "train_loss": 3.0794644355773926, "lr": 0.0001537115748367039, "tps": 885261, "wall": 1429.0} {"step": 19303, "train_loss": 3.0708534717559814, "lr": 0.00015369376365066998, "tps": 882372, "wall": 1433.8} {"step": 19304, "train_loss": 3.0323660373687744, "lr": 0.00015367595321575666, "tps": 879502, "wall": 1438.5} {"step": 19305, "train_loss": 3.0484161376953125, "lr": 0.0001536581435321657, "tps": 876641, "wall": 1443.3} {"step": 19306, "train_loss": 3.0529165267944336, "lr": 0.00015364033460009896, "tps": 873797, "wall": 1448.1} {"step": 19307, "train_loss": 3.0432143211364746, "lr": 0.00015362252641975803, "tps": 870983, "wall": 1452.8} {"step": 19308, "train_loss": 3.056391716003418, "lr": 0.0001536047189913447, "tps": 868187, "wall": 1457.6} {"step": 19309, "train_loss": 3.0344438552856445, "lr": 0.00015358691231506078, "tps": 865412, "wall": 1462.3} {"step": 19310, "train_loss": 2.98526668548584, "lr": 0.00015356910639110786, "tps": 862655, "wall": 1467.1} {"step": 19311, "train_loss": 3.0827481746673584, "lr": 0.00015355130121968774, "tps": 859913, "wall": 1471.8} {"step": 19312, "train_loss": 3.1059679985046387, "lr": 0.000153533496801002, "tps": 857150, "wall": 1476.6} {"step": 19313, "train_loss": 3.1514992713928223, "lr": 0.00015351569313525246, "tps": 854451, "wall": 1481.4} {"step": 19314, "train_loss": 3.149385452270508, "lr": 0.00015349789022264072, "tps": 851760, "wall": 1486.1} {"step": 19315, "train_loss": 3.096709966659546, "lr": 0.00015348008806336847, "tps": 849086, "wall": 1490.9} {"step": 19316, "train_loss": 3.014857769012451, "lr": 0.00015346228665763745, "tps": 846436, "wall": 1495.6} {"step": 19317, "train_loss": 3.0761559009552, "lr": 0.0001534444860056492, "tps": 843797, "wall": 1500.4} {"step": 19318, "train_loss": 3.021873950958252, "lr": 0.00015342668610760537, "tps": 841177, "wall": 1505.1} {"step": 19319, "train_loss": 3.0685696601867676, "lr": 0.00015340888696370773, "tps": 838573, "wall": 1509.9} {"step": 19320, "train_loss": 2.9996745586395264, "lr": 0.00015339108857415776, "tps": 835984, "wall": 1514.6} {"step": 19321, "train_loss": 3.1431987285614014, "lr": 0.00015337329093915712, "tps": 833410, "wall": 1519.4} {"step": 19322, "train_loss": 3.085951328277588, "lr": 0.00015335549405890748, "tps": 830846, "wall": 1524.2} {"step": 19323, "train_loss": 3.045020341873169, "lr": 0.00015333769793361043, "tps": 828309, "wall": 1528.9} {"step": 19324, "train_loss": 2.9832277297973633, "lr": 0.0001533199025634675, "tps": 825754, "wall": 1533.7} {"step": 19325, "train_loss": 3.0473239421844482, "lr": 0.00015330210794868037, "tps": 823246, "wall": 1538.5} {"step": 19326, "train_loss": 3.1166086196899414, "lr": 0.00015328431408945053, "tps": 820757, "wall": 1543.2} {"step": 19327, "train_loss": 3.195525646209717, "lr": 0.0001532665209859796, "tps": 818280, "wall": 1548.0} {"step": 19328, "train_loss": 3.0658833980560303, "lr": 0.00015324872863846912, "tps": 815821, "wall": 1552.7} {"step": 19329, "train_loss": 3.0034990310668945, "lr": 0.00015323093704712064, "tps": 813368, "wall": 1557.5} {"step": 19330, "train_loss": 3.0243544578552246, "lr": 0.0001532131462121358, "tps": 810928, "wall": 1562.3} {"step": 19331, "train_loss": 3.1604785919189453, "lr": 0.00015319535613371595, "tps": 808499, "wall": 1567.0} {"step": 19332, "train_loss": 3.0097227096557617, "lr": 0.00015317756681206275, "tps": 806096, "wall": 1571.8} {"step": 19333, "train_loss": 3.0593771934509277, "lr": 0.00015315977824737774, "tps": 803704, "wall": 1576.5} {"step": 19334, "train_loss": 3.006241798400879, "lr": 0.00015314199043986232, "tps": 801331, "wall": 1581.3} {"step": 19335, "train_loss": 3.162973642349243, "lr": 0.00015312420338971805, "tps": 798973, "wall": 1586.0} {"step": 19336, "train_loss": 3.0635478496551514, "lr": 0.00015310641709714647, "tps": 796633, "wall": 1590.8} {"step": 19337, "train_loss": 3.104566812515259, "lr": 0.00015308863156234898, "tps": 794269, "wall": 1595.6} {"step": 19338, "train_loss": 3.121882438659668, "lr": 0.00015307084678552708, "tps": 791949, "wall": 1600.4} {"step": 19339, "train_loss": 3.0219485759735107, "lr": 0.00015305306276688224, "tps": 789648, "wall": 1605.1} {"step": 19340, "train_loss": 3.0388619899749756, "lr": 0.00015303527950661603, "tps": 787362, "wall": 1609.8} {"step": 19341, "train_loss": 3.0464117527008057, "lr": 0.0001530174970049297, "tps": 785083, "wall": 1614.6} {"step": 19342, "train_loss": 3.3224620819091797, "lr": 0.00015299971526202478, "tps": 782811, "wall": 1619.4} {"step": 19343, "train_loss": 3.076033592224121, "lr": 0.00015298193427810278, "tps": 780557, "wall": 1624.1} {"step": 19344, "train_loss": 3.078115940093994, "lr": 0.00015296415405336502, "tps": 778314, "wall": 1628.9} {"step": 19345, "train_loss": 3.0451228618621826, "lr": 0.00015294637458801292, "tps": 776091, "wall": 1633.6} {"step": 19346, "train_loss": 3.0647432804107666, "lr": 0.00015292859588224796, "tps": 773877, "wall": 1638.4} {"step": 19347, "train_loss": 3.1225197315216064, "lr": 0.00015291081793627145, "tps": 771652, "wall": 1643.2} {"step": 19348, "train_loss": 3.0241684913635254, "lr": 0.00015289304075028482, "tps": 769460, "wall": 1648.0} {"step": 19349, "train_loss": 3.0932302474975586, "lr": 0.0001528752643244895, "tps": 767279, "wall": 1652.8} {"step": 19350, "train_loss": 3.007716655731201, "lr": 0.00015285748865908683, "tps": 765083, "wall": 1657.6} {"step": 19351, "train_loss": 3.1675941944122314, "lr": 0.00015283971375427808, "tps": 762930, "wall": 1662.3} {"step": 19352, "train_loss": 3.054435968399048, "lr": 0.00015282193961026476, "tps": 760800, "wall": 1667.1} {"step": 19353, "train_loss": 3.1373658180236816, "lr": 0.00015280416622724815, "tps": 758676, "wall": 1671.8} {"step": 19354, "train_loss": 3.097175121307373, "lr": 0.0001527863936054295, "tps": 756561, "wall": 1676.6} {"step": 19355, "train_loss": 3.1496920585632324, "lr": 0.00015276862174501025, "tps": 754463, "wall": 1681.3} {"step": 19356, "train_loss": 3.0243022441864014, "lr": 0.0001527508506461917, "tps": 752361, "wall": 1686.1} {"step": 19357, "train_loss": 3.059535503387451, "lr": 0.0001527330803091752, "tps": 750280, "wall": 1690.9} {"step": 19358, "train_loss": 3.0856411457061768, "lr": 0.00015271531073416194, "tps": 748218, "wall": 1695.6} {"step": 19359, "train_loss": 3.0521750450134277, "lr": 0.0001526975419213533, "tps": 746164, "wall": 1700.4} {"step": 19360, "train_loss": 3.0687403678894043, "lr": 0.00015267977387095058, "tps": 744120, "wall": 1705.2} {"step": 19361, "train_loss": 3.038536787033081, "lr": 0.000152662006583155, "tps": 742090, "wall": 1709.9} {"step": 19362, "train_loss": 3.1232357025146484, "lr": 0.00015264424005816785, "tps": 740035, "wall": 1714.7} {"step": 19363, "train_loss": 2.9923343658447266, "lr": 0.0001526264742961904, "tps": 738030, "wall": 1719.5} {"step": 19364, "train_loss": 3.0351412296295166, "lr": 0.00015260870929742387, "tps": 736029, "wall": 1724.3} {"step": 19365, "train_loss": 3.1129817962646484, "lr": 0.0001525909450620695, "tps": 734039, "wall": 1729.0} {"step": 19366, "train_loss": 3.028008222579956, "lr": 0.00015257318159032858, "tps": 732044, "wall": 1733.8} {"step": 19367, "train_loss": 3.188481330871582, "lr": 0.00015255541888240233, "tps": 730075, "wall": 1738.6} {"step": 19368, "train_loss": 2.9056901931762695, "lr": 0.00015253765693849195, "tps": 728119, "wall": 1743.4} {"step": 19369, "train_loss": 2.9990410804748535, "lr": 0.0001525198957587986, "tps": 726174, "wall": 1748.1} {"step": 19370, "train_loss": 2.9452171325683594, "lr": 0.00015250213534352355, "tps": 724245, "wall": 1752.9} {"step": 19371, "train_loss": 3.0425164699554443, "lr": 0.00015248437569286794, "tps": 722321, "wall": 1757.6} {"step": 19372, "train_loss": 2.9551305770874023, "lr": 0.000152466616807033, "tps": 720407, "wall": 1762.4} {"step": 19373, "train_loss": 3.0913615226745605, "lr": 0.0001524488586862199, "tps": 718508, "wall": 1767.1} {"step": 19374, "train_loss": 2.9678497314453125, "lr": 0.00015243110133062975, "tps": 716619, "wall": 1771.9} {"step": 19375, "train_loss": 2.9890499114990234, "lr": 0.00015241334474046375, "tps": 714706, "wall": 1776.7} {"step": 19376, "train_loss": 3.144117593765259, "lr": 0.000152395588915923, "tps": 712833, "wall": 1781.5} {"step": 19377, "train_loss": 3.114931106567383, "lr": 0.00015237783385720874, "tps": 710970, "wall": 1786.2} {"step": 19378, "train_loss": 3.1624178886413574, "lr": 0.000152360079564522, "tps": 709122, "wall": 1791.0} {"step": 19379, "train_loss": 3.078845739364624, "lr": 0.0001523423260380639, "tps": 707282, "wall": 1795.7} {"step": 19380, "train_loss": 3.1839680671691895, "lr": 0.00015232457327803565, "tps": 705452, "wall": 1800.5} {"step": 19381, "train_loss": 2.973594903945923, "lr": 0.00015230682128463828, "tps": 703624, "wall": 1805.2} {"step": 19382, "train_loss": 3.0795798301696777, "lr": 0.0001522890700580729, "tps": 701812, "wall": 1810.0} {"step": 19383, "train_loss": 3.097287654876709, "lr": 0.00015227131959854058, "tps": 700011, "wall": 1814.8} {"step": 19384, "train_loss": 3.10255765914917, "lr": 0.00015225356990624243, "tps": 698223, "wall": 1819.5} {"step": 19385, "train_loss": 3.004234790802002, "lr": 0.0001522358209813795, "tps": 696436, "wall": 1824.3} {"step": 19386, "train_loss": 3.0749778747558594, "lr": 0.00015221807282415285, "tps": 694656, "wall": 1829.0} {"step": 19387, "train_loss": 3.0585575103759766, "lr": 0.00015220032543476357, "tps": 692867, "wall": 1833.8} {"step": 19388, "train_loss": 3.0708138942718506, "lr": 0.00015218257881341267, "tps": 691118, "wall": 1838.6} {"step": 19389, "train_loss": 3.005500316619873, "lr": 0.00015216483296030115, "tps": 689371, "wall": 1843.3} {"step": 19390, "train_loss": 3.1419925689697266, "lr": 0.0001521470878756301, "tps": 687637, "wall": 1848.1} {"step": 19391, "train_loss": 3.1605515480041504, "lr": 0.00015212934355960048, "tps": 685903, "wall": 1852.8} {"step": 19392, "train_loss": 3.102515697479248, "lr": 0.00015211160001241334, "tps": 684187, "wall": 1857.6} {"step": 19393, "train_loss": 3.0128977298736572, "lr": 0.00015209385723426966, "tps": 682478, "wall": 1862.3} {"step": 19394, "train_loss": 3.064511775970459, "lr": 0.00015207611522537046, "tps": 680768, "wall": 1867.1} {"step": 19395, "train_loss": 3.138122081756592, "lr": 0.00015205837398591673, "tps": 679078, "wall": 1871.9} {"step": 19396, "train_loss": 3.0422048568725586, "lr": 0.0001520406335161093, "tps": 677389, "wall": 1876.6} {"step": 19397, "train_loss": 3.1096692085266113, "lr": 0.00015202289381614938, "tps": 675713, "wall": 1881.4} {"step": 19398, "train_loss": 3.1022372245788574, "lr": 0.00015200515488623774, "tps": 674043, "wall": 1886.1} {"step": 19399, "train_loss": 3.1028079986572266, "lr": 0.0001519874167265754, "tps": 672383, "wall": 1890.9} {"step": 19400, "train_loss": 3.003641366958618, "lr": 0.00015196967933736328, "tps": 670716, "wall": 1895.7} {"step": 19401, "train_loss": 3.058175563812256, "lr": 0.00015195194271880232, "tps": 669079, "wall": 1900.4} {"step": 19402, "train_loss": 3.0848593711853027, "lr": 0.0001519342068710934, "tps": 667446, "wall": 1905.2} {"step": 19403, "train_loss": 3.118931293487549, "lr": 0.00015191647179443746, "tps": 665819, "wall": 1909.9} {"step": 19404, "train_loss": 3.141887664794922, "lr": 0.00015189873748903545, "tps": 664199, "wall": 1914.7} {"step": 19405, "train_loss": 3.0567786693573, "lr": 0.0001518810039550882, "tps": 662584, "wall": 1919.4} {"step": 19406, "train_loss": 3.1575045585632324, "lr": 0.00015186327119279662, "tps": 660980, "wall": 1924.2} {"step": 19407, "train_loss": 3.022277355194092, "lr": 0.00015184553920236161, "tps": 659387, "wall": 1928.9} {"step": 19408, "train_loss": 3.094045639038086, "lr": 0.00015182780798398405, "tps": 657796, "wall": 1933.7} {"step": 19409, "train_loss": 3.1157047748565674, "lr": 0.00015181007753786472, "tps": 656213, "wall": 1938.5} {"step": 19410, "train_loss": 3.06990122795105, "lr": 0.00015179234786420452, "tps": 654635, "wall": 1943.2} {"step": 19411, "train_loss": 3.0457186698913574, "lr": 0.00015177461896320434, "tps": 653067, "wall": 1948.0} {"step": 19412, "train_loss": 2.996187210083008, "lr": 0.00015175689083506494, "tps": 651505, "wall": 1952.8} {"step": 19413, "train_loss": 3.04569935798645, "lr": 0.00015173916347998713, "tps": 649938, "wall": 1957.6} {"step": 19414, "train_loss": 3.057103157043457, "lr": 0.0001517214368981718, "tps": 648384, "wall": 1962.4} {"step": 19415, "train_loss": 3.19773530960083, "lr": 0.00015170371108981975, "tps": 646849, "wall": 1967.1} {"step": 19416, "train_loss": 3.1282918453216553, "lr": 0.00015168598605513176, "tps": 645323, "wall": 1971.9} {"step": 19417, "train_loss": 3.0053610801696777, "lr": 0.0001516682617943086, "tps": 643803, "wall": 1976.7} {"step": 19418, "train_loss": 2.988119125366211, "lr": 0.00015165053830755104, "tps": 642287, "wall": 1981.4} {"step": 19419, "train_loss": 3.1240651607513428, "lr": 0.00015163281559505987, "tps": 640781, "wall": 1986.2} {"step": 19420, "train_loss": 3.0388693809509277, "lr": 0.00015161509365703587, "tps": 639277, "wall": 1991.0} {"step": 19421, "train_loss": 3.0622522830963135, "lr": 0.0001515973724936799, "tps": 637788, "wall": 1995.7} {"step": 19422, "train_loss": 3.0864572525024414, "lr": 0.00015157965210519248, "tps": 636308, "wall": 2000.5} {"step": 19423, "train_loss": 3.0582661628723145, "lr": 0.00015156193249177445, "tps": 634830, "wall": 2005.2} {"step": 19424, "train_loss": 3.13249135017395, "lr": 0.00015154421365362662, "tps": 633359, "wall": 2010.0} {"step": 19425, "train_loss": 2.966813564300537, "lr": 0.00015152649559094963, "tps": 631862, "wall": 2014.8} {"step": 19426, "train_loss": 3.071089267730713, "lr": 0.00015150877830394417, "tps": 630410, "wall": 2019.6} {"step": 19427, "train_loss": 3.1639671325683594, "lr": 0.000151491061792811, "tps": 628962, "wall": 2024.3} {"step": 19428, "train_loss": 3.1379075050354004, "lr": 0.0001514733460577508, "tps": 627519, "wall": 2029.1} {"step": 19429, "train_loss": 3.10811185836792, "lr": 0.00015145563109896418, "tps": 626078, "wall": 2033.9} {"step": 19430, "train_loss": 3.112027168273926, "lr": 0.0001514379169166519, "tps": 624650, "wall": 2038.6} {"step": 19431, "train_loss": 3.060018539428711, "lr": 0.00015142020351101464, "tps": 623228, "wall": 2043.4} {"step": 19432, "train_loss": 3.0501492023468018, "lr": 0.00015140249088225303, "tps": 621815, "wall": 2048.1} {"step": 19433, "train_loss": 3.1097564697265625, "lr": 0.00015138477903056766, "tps": 620408, "wall": 2052.9} {"step": 19434, "train_loss": 3.171339511871338, "lr": 0.00015136706795615927, "tps": 619008, "wall": 2057.6} {"step": 19435, "train_loss": 3.168745994567871, "lr": 0.00015134935765922846, "tps": 617614, "wall": 2062.4} {"step": 19436, "train_loss": 3.1085383892059326, "lr": 0.0001513316481399758, "tps": 616223, "wall": 2067.1} {"step": 19437, "train_loss": 3.1325221061706543, "lr": 0.00015131393939860194, "tps": 614837, "wall": 2071.9} {"step": 19438, "train_loss": 3.1255664825439453, "lr": 0.00015129623143530756, "tps": 613441, "wall": 2076.7} {"step": 19439, "train_loss": 3.0640337467193604, "lr": 0.00015127852425029313, "tps": 612073, "wall": 2081.5} {"step": 19440, "train_loss": 3.0230555534362793, "lr": 0.0001512608178437593, "tps": 610704, "wall": 2086.3} {"step": 19441, "train_loss": 3.0898358821868896, "lr": 0.00015124311221590667, "tps": 609345, "wall": 2091.0} {"step": 19442, "train_loss": 2.9822630882263184, "lr": 0.00015122540736693573, "tps": 607991, "wall": 2095.8} {"step": 19443, "train_loss": 3.0889954566955566, "lr": 0.00015120770329704714, "tps": 606644, "wall": 2100.5} {"step": 19444, "train_loss": 3.0939078330993652, "lr": 0.0001511900000064414, "tps": 605303, "wall": 2105.3} {"step": 19445, "train_loss": 3.0399608612060547, "lr": 0.00015117229749531905, "tps": 603965, "wall": 2110.1} {"step": 19446, "train_loss": 3.082411527633667, "lr": 0.00015115459576388064, "tps": 602638, "wall": 2114.8} {"step": 19447, "train_loss": 3.0967535972595215, "lr": 0.0001511368948123267, "tps": 601315, "wall": 2119.6} {"step": 19448, "train_loss": 3.147273540496826, "lr": 0.00015111919464085775, "tps": 600001, "wall": 2124.3} {"step": 19449, "train_loss": 3.110231876373291, "lr": 0.00015110149524967428, "tps": 598693, "wall": 2129.1} {"step": 19450, "train_loss": 3.0560965538024902, "lr": 0.00015108379663897678, "tps": 597365, "wall": 2133.9} {"step": 19451, "train_loss": 3.1860713958740234, "lr": 0.00015106609880896583, "tps": 596068, "wall": 2138.7} {"step": 19452, "train_loss": 3.1354215145111084, "lr": 0.0001510484017598418, "tps": 594774, "wall": 2143.5} {"step": 19453, "train_loss": 3.104299545288086, "lr": 0.00015103070549180516, "tps": 593486, "wall": 2148.2} {"step": 19454, "train_loss": 3.1113085746765137, "lr": 0.0001510130100050565, "tps": 592203, "wall": 2153.0} {"step": 19455, "train_loss": 3.210094928741455, "lr": 0.00015099531529979613, "tps": 590925, "wall": 2157.7} {"step": 19456, "train_loss": 3.1080384254455566, "lr": 0.00015097762137622456, "tps": 589652, "wall": 2162.5} {"step": 19457, "train_loss": 3.0955023765563965, "lr": 0.00015095992823454228, "tps": 588382, "wall": 2167.3} {"step": 19458, "train_loss": 3.0313806533813477, "lr": 0.00015094223587494966, "tps": 587127, "wall": 2172.0} {"step": 19459, "train_loss": 3.0265421867370605, "lr": 0.00015092454429764705, "tps": 585873, "wall": 2176.8} {"step": 19460, "train_loss": 3.022542953491211, "lr": 0.00015090685350283503, "tps": 584624, "wall": 2181.6} {"step": 19461, "train_loss": 3.0235581398010254, "lr": 0.0001508891634907139, "tps": 583379, "wall": 2186.3} {"step": 19462, "train_loss": 3.010587215423584, "lr": 0.00015087147426148402, "tps": 582142, "wall": 2191.1} {"step": 19463, "train_loss": 3.0364198684692383, "lr": 0.00015085378581534587, "tps": 580889, "wall": 2195.9} {"step": 19464, "train_loss": 2.9655473232269287, "lr": 0.0001508360981524997, "tps": 579669, "wall": 2200.7} {"step": 19465, "train_loss": 3.0758554935455322, "lr": 0.000150818411273146, "tps": 578448, "wall": 2205.4} {"step": 19466, "train_loss": 3.0941672325134277, "lr": 0.0001508007251774851, "tps": 577230, "wall": 2210.2} {"step": 19467, "train_loss": 3.0424373149871826, "lr": 0.0001507830398657173, "tps": 576016, "wall": 2215.0} {"step": 19468, "train_loss": 3.1140573024749756, "lr": 0.000150765355338043, "tps": 574809, "wall": 2219.7} {"step": 19469, "train_loss": 3.056342124938965, "lr": 0.00015074767159466246, "tps": 573608, "wall": 2224.5} {"step": 19470, "train_loss": 3.0601389408111572, "lr": 0.0001507299886357761, "tps": 572409, "wall": 2229.3} {"step": 19471, "train_loss": 3.0352888107299805, "lr": 0.00015071230646158417, "tps": 571217, "wall": 2234.0} {"step": 19472, "train_loss": 3.1400351524353027, "lr": 0.00015069462507228694, "tps": 570032, "wall": 2238.8} {"step": 19473, "train_loss": 3.0742249488830566, "lr": 0.00015067694446808475, "tps": 568850, "wall": 2243.6} {"step": 19474, "train_loss": 3.0713050365448, "lr": 0.00015065926464917788, "tps": 567674, "wall": 2248.3} {"step": 19475, "train_loss": 3.0671277046203613, "lr": 0.00015064158561576662, "tps": 566502, "wall": 2253.1} {"step": 19476, "train_loss": 3.131523609161377, "lr": 0.00015062390736805123, "tps": 565323, "wall": 2257.9} {"step": 19477, "train_loss": 3.1182377338409424, "lr": 0.00015060622990623198, "tps": 564163, "wall": 2262.7} {"step": 19478, "train_loss": 3.0248663425445557, "lr": 0.0001505885532305091, "tps": 563006, "wall": 2267.4} {"step": 19479, "train_loss": 3.1363296508789062, "lr": 0.00015057087734108286, "tps": 561852, "wall": 2272.2} {"step": 19480, "train_loss": 3.0732059478759766, "lr": 0.00015055320223815346, "tps": 560705, "wall": 2277.0} {"step": 19481, "train_loss": 3.0481016635894775, "lr": 0.0001505355279219211, "tps": 559559, "wall": 2281.7} {"step": 19482, "train_loss": 3.011791944503784, "lr": 0.00015051785439258608, "tps": 558426, "wall": 2286.5} {"step": 19483, "train_loss": 3.184246301651001, "lr": 0.00015050018165034862, "tps": 557296, "wall": 2291.2} {"step": 19484, "train_loss": 3.111185312271118, "lr": 0.00015048250969540878, "tps": 556171, "wall": 2296.0} {"step": 19485, "train_loss": 2.9552712440490723, "lr": 0.00015046483852796687, "tps": 555052, "wall": 2300.7} {"step": 19486, "train_loss": 3.0608081817626953, "lr": 0.00015044716814822305, "tps": 553938, "wall": 2305.5} {"step": 19487, "train_loss": 3.1035079956054688, "lr": 0.0001504294985563774, "tps": 552828, "wall": 2310.2} {"step": 19488, "train_loss": 3.135531425476074, "lr": 0.0001504118297526302, "tps": 551704, "wall": 2315.1} {"step": 19489, "train_loss": 3.1400210857391357, "lr": 0.00015039416173718157, "tps": 550603, "wall": 2319.8} {"step": 19490, "train_loss": 3.0767297744750977, "lr": 0.00015037649451023164, "tps": 549505, "wall": 2324.6} {"step": 19491, "train_loss": 3.122429370880127, "lr": 0.0001503588280719805, "tps": 548411, "wall": 2329.3} {"step": 19492, "train_loss": 3.067244052886963, "lr": 0.00015034116242262834, "tps": 547323, "wall": 2334.1} {"step": 19493, "train_loss": 3.0589494705200195, "lr": 0.00015032349756237534, "tps": 546239, "wall": 2338.8} {"step": 19494, "train_loss": 3.1319806575775146, "lr": 0.00015030583349142144, "tps": 545156, "wall": 2343.6} {"step": 19495, "train_loss": 3.069902181625366, "lr": 0.00015028817020996686, "tps": 544076, "wall": 2348.4} {"step": 19496, "train_loss": 3.111450672149658, "lr": 0.00015027050771821164, "tps": 543005, "wall": 2353.1} {"step": 19497, "train_loss": 3.0838725566864014, "lr": 0.00015025284601635593, "tps": 541939, "wall": 2357.9} {"step": 19498, "train_loss": 3.02565336227417, "lr": 0.00015023518510459967, "tps": 540876, "wall": 2362.6} {"step": 19499, "train_loss": 3.076615810394287, "lr": 0.00015021752498314305, "tps": 539817, "wall": 2367.4} {"step": 19500, "train_loss": 3.084418773651123, "lr": 0.00015019986565218614, "tps": 538764, "wall": 2372.1} {"step": 19501, "train_loss": 3.1504878997802734, "lr": 0.00015018220711192885, "tps": 537665, "wall": 2377.1} {"step": 19502, "train_loss": 3.0539300441741943, "lr": 0.00015016454936257132, "tps": 536619, "wall": 2381.9} {"step": 19503, "train_loss": 2.9787516593933105, "lr": 0.00015014689240431354, "tps": 535574, "wall": 2386.6} {"step": 19504, "train_loss": 3.0720348358154297, "lr": 0.0001501292362373556, "tps": 534536, "wall": 2391.4} {"step": 19505, "train_loss": 3.111494779586792, "lr": 0.00015011158086189737, "tps": 533503, "wall": 2396.1} {"step": 19506, "train_loss": 3.009167194366455, "lr": 0.00015009392627813898, "tps": 532472, "wall": 2400.9} {"step": 19507, "train_loss": 2.9887099266052246, "lr": 0.0001500762724862804, "tps": 531448, "wall": 2405.6} {"step": 19508, "train_loss": 2.8869199752807617, "lr": 0.00015005861948652155, "tps": 530426, "wall": 2410.4} {"step": 19509, "train_loss": 3.107851266860962, "lr": 0.0001500409672790624, "tps": 529408, "wall": 2415.2} {"step": 19510, "train_loss": 3.0999653339385986, "lr": 0.00015002331586410304, "tps": 528388, "wall": 2419.9} {"step": 19511, "train_loss": 3.0017242431640625, "lr": 0.00015000566524184326, "tps": 527381, "wall": 2424.7} {"step": 19512, "train_loss": 3.0376977920532227, "lr": 0.00014998801541248318, "tps": 526374, "wall": 2429.5} {"step": 19513, "train_loss": 3.209136486053467, "lr": 0.0001499703663762226, "tps": 525355, "wall": 2434.3} {"step": 19514, "train_loss": 3.055915355682373, "lr": 0.00014995271813326148, "tps": 524362, "wall": 2439.0} {"step": 19515, "train_loss": 3.078617572784424, "lr": 0.00014993507068379976, "tps": 523363, "wall": 2443.8} {"step": 19516, "train_loss": 3.1980061531066895, "lr": 0.00014991742402803738, "tps": 522375, "wall": 2448.6} {"step": 19517, "train_loss": 3.0797863006591797, "lr": 0.0001498997781661742, "tps": 521391, "wall": 2453.3} {"step": 19518, "train_loss": 3.1128733158111572, "lr": 0.00014988213309841014, "tps": 520409, "wall": 2458.1} {"step": 19519, "train_loss": 3.0749220848083496, "lr": 0.00014986448882494505, "tps": 519431, "wall": 2462.8} {"step": 19520, "train_loss": 3.0418200492858887, "lr": 0.00014984684534597887, "tps": 518452, "wall": 2467.6} {"step": 19521, "train_loss": 3.084869146347046, "lr": 0.00014982920266171137, "tps": 517485, "wall": 2472.3} {"step": 19522, "train_loss": 3.058450698852539, "lr": 0.00014981156077234248, "tps": 516518, "wall": 2477.1} {"step": 19523, "train_loss": 3.1274027824401855, "lr": 0.00014979391967807204, "tps": 515555, "wall": 2481.8} {"step": 19524, "train_loss": 3.0963125228881836, "lr": 0.00014977627937909986, "tps": 514595, "wall": 2486.6} {"step": 19525, "train_loss": 3.018059253692627, "lr": 0.00014975863987562576, "tps": 513640, "wall": 2491.3} {"step": 19526, "train_loss": 2.986736297607422, "lr": 0.0001497410011678496, "tps": 512674, "wall": 2496.2} {"step": 19527, "train_loss": 3.1025948524475098, "lr": 0.0001497233632559712, "tps": 511724, "wall": 2500.9} {"step": 19528, "train_loss": 2.9818711280822754, "lr": 0.00014970572614019033, "tps": 510779, "wall": 2505.7} {"step": 19529, "train_loss": 2.984518527984619, "lr": 0.0001496880898207068, "tps": 509832, "wall": 2510.5} {"step": 19530, "train_loss": 3.1250314712524414, "lr": 0.0001496704542977204, "tps": 508893, "wall": 2515.2} {"step": 19531, "train_loss": 3.0437324047088623, "lr": 0.00014965281957143089, "tps": 507959, "wall": 2520.0} {"step": 19532, "train_loss": 3.0779190063476562, "lr": 0.00014963518564203802, "tps": 507030, "wall": 2524.7} {"step": 19533, "train_loss": 3.1464157104492188, "lr": 0.00014961755250974163, "tps": 506103, "wall": 2529.5} {"step": 19534, "train_loss": 3.0487821102142334, "lr": 0.00014959992017474138, "tps": 505179, "wall": 2534.2} {"step": 19535, "train_loss": 3.1021299362182617, "lr": 0.00014958228863723701, "tps": 504260, "wall": 2539.0} {"step": 19536, "train_loss": 3.09167218208313, "lr": 0.00014956465789742836, "tps": 503345, "wall": 2543.7} {"step": 19537, "train_loss": 3.130932331085205, "lr": 0.00014954702795551503, "tps": 502432, "wall": 2548.5} {"step": 19538, "train_loss": 2.997767686843872, "lr": 0.00014952939881169677, "tps": 501522, "wall": 2553.2} {"step": 19539, "train_loss": 3.134941816329956, "lr": 0.0001495117704661733, "tps": 500604, "wall": 2558.1} {"step": 19540, "train_loss": 3.1525115966796875, "lr": 0.00014949414291914436, "tps": 499702, "wall": 2562.8} {"step": 19541, "train_loss": 2.9758875370025635, "lr": 0.00014947651617080952, "tps": 498803, "wall": 2567.6} {"step": 19542, "train_loss": 3.042649984359741, "lr": 0.0001494588902213685, "tps": 497904, "wall": 2572.3} {"step": 19543, "train_loss": 3.1264233589172363, "lr": 0.00014944126507102104, "tps": 497011, "wall": 2577.1} {"step": 19544, "train_loss": 3.0487635135650635, "lr": 0.00014942364071996673, "tps": 496119, "wall": 2581.8} {"step": 19545, "train_loss": 3.119907855987549, "lr": 0.00014940601716840522, "tps": 495233, "wall": 2586.6} {"step": 19546, "train_loss": 3.161702871322632, "lr": 0.0001493883944165362, "tps": 494351, "wall": 2591.3} {"step": 19547, "train_loss": 3.0918352603912354, "lr": 0.00014937077246455927, "tps": 493469, "wall": 2596.1} {"step": 19548, "train_loss": 3.0662457942962646, "lr": 0.00014935315131267402, "tps": 492586, "wall": 2600.9} {"step": 19549, "train_loss": 2.9865305423736572, "lr": 0.0001493355309610801, "tps": 491712, "wall": 2605.6} {"step": 19550, "train_loss": 3.0174355506896973, "lr": 0.00014931791140997716, "tps": 490843, "wall": 2610.4} {"step": 19551, "train_loss": 3.044678211212158, "lr": 0.00014930029265956466, "tps": 489966, "wall": 2615.2} {"step": 19552, "train_loss": 3.1207475662231445, "lr": 0.0001492826747100423, "tps": 489102, "wall": 2620.0} {"step": 19553, "train_loss": 3.078648328781128, "lr": 0.0001492650575616096, "tps": 488241, "wall": 2624.7} {"step": 19554, "train_loss": 3.0223031044006348, "lr": 0.00014924744121446625, "tps": 487383, "wall": 2629.5} {"step": 19555, "train_loss": 3.0723493099212646, "lr": 0.0001492298256688116, "tps": 486519, "wall": 2634.3} {"step": 19556, "train_loss": 3.1302199363708496, "lr": 0.00014921221092484537, "tps": 485665, "wall": 2639.0} {"step": 19557, "train_loss": 2.9954512119293213, "lr": 0.0001491945969827671, "tps": 484815, "wall": 2643.8} {"step": 19558, "train_loss": 2.9449992179870605, "lr": 0.0001491769838427762, "tps": 483962, "wall": 2648.6} {"step": 19559, "train_loss": 3.0924594402313232, "lr": 0.00014915937150507223, "tps": 483119, "wall": 2653.3} {"step": 19560, "train_loss": 2.9733619689941406, "lr": 0.0001491417599698548, "tps": 482280, "wall": 2658.1} {"step": 19561, "train_loss": 3.0935637950897217, "lr": 0.0001491241492373233, "tps": 481444, "wall": 2662.9} {"step": 19562, "train_loss": 3.0524373054504395, "lr": 0.0001491065393076773, "tps": 480610, "wall": 2667.6} {"step": 19563, "train_loss": 3.034027338027954, "lr": 0.0001490889301811162, "tps": 479779, "wall": 2672.4} {"step": 19564, "train_loss": 3.0988235473632812, "lr": 0.00014907132185783958, "tps": 478937, "wall": 2677.2} {"step": 19565, "train_loss": 3.0640199184417725, "lr": 0.00014905371433804687, "tps": 478114, "wall": 2681.9} {"step": 19566, "train_loss": 2.97687029838562, "lr": 0.0001490361076219375, "tps": 477293, "wall": 2686.7} {"step": 19567, "train_loss": 2.952219247817993, "lr": 0.000149018501709711, "tps": 476475, "wall": 2691.4} {"step": 19568, "train_loss": 3.176145076751709, "lr": 0.00014900089660156672, "tps": 475659, "wall": 2696.2} {"step": 19569, "train_loss": 3.006211280822754, "lr": 0.0001489832922977041, "tps": 474845, "wall": 2701.0} {"step": 19570, "train_loss": 3.157139778137207, "lr": 0.00014896568879832253, "tps": 474038, "wall": 2705.7} {"step": 19571, "train_loss": 2.9552009105682373, "lr": 0.0001489480861036216, "tps": 473229, "wall": 2710.5} {"step": 19572, "train_loss": 2.9929635524749756, "lr": 0.00014893048421380054, "tps": 472423, "wall": 2715.2} {"step": 19573, "train_loss": 2.9443180561065674, "lr": 0.00014891288312905875, "tps": 471618, "wall": 2720.0} {"step": 19574, "train_loss": 3.1628036499023438, "lr": 0.00014889528284959579, "tps": 470818, "wall": 2724.8} {"step": 19575, "train_loss": 3.0626375675201416, "lr": 0.00014887768337561082, "tps": 470020, "wall": 2729.5} {"step": 19576, "train_loss": 3.0607712268829346, "lr": 0.0001488600847073033, "tps": 469213, "wall": 2734.4} {"step": 19577, "train_loss": 3.1303019523620605, "lr": 0.00014884248684487265, "tps": 468423, "wall": 2739.1} {"step": 19578, "train_loss": 2.9928746223449707, "lr": 0.0001488248897885181, "tps": 467635, "wall": 2743.9} {"step": 19579, "train_loss": 3.06158447265625, "lr": 0.00014880729353843907, "tps": 466849, "wall": 2748.6} {"step": 19580, "train_loss": 3.119753360748291, "lr": 0.00014878969809483484, "tps": 466066, "wall": 2753.4} {"step": 19581, "train_loss": 3.101597547531128, "lr": 0.00014877210345790482, "tps": 465286, "wall": 2758.1} {"step": 19582, "train_loss": 3.1981897354125977, "lr": 0.00014875450962784824, "tps": 464509, "wall": 2762.9} {"step": 19583, "train_loss": 3.0593132972717285, "lr": 0.0001487369166048644, "tps": 463735, "wall": 2767.6} {"step": 19584, "train_loss": 3.158015012741089, "lr": 0.0001487193243891527, "tps": 462963, "wall": 2772.4} {"step": 19585, "train_loss": 3.026341438293457, "lr": 0.00014870173298091226, "tps": 462195, "wall": 2777.2} {"step": 19586, "train_loss": 3.03312087059021, "lr": 0.00014868414238034246, "tps": 461429, "wall": 2781.9} {"step": 19587, "train_loss": 3.1183817386627197, "lr": 0.00014866655258764263, "tps": 460665, "wall": 2786.7} {"step": 19588, "train_loss": 2.9600133895874023, "lr": 0.0001486489636030119, "tps": 459905, "wall": 2791.4} {"step": 19589, "train_loss": 3.051070213317871, "lr": 0.00014863137542664955, "tps": 459132, "wall": 2796.2} {"step": 19590, "train_loss": 3.052346706390381, "lr": 0.00014861378805875486, "tps": 458378, "wall": 2801.0} {"step": 19591, "train_loss": 2.956545829772949, "lr": 0.00014859620149952702, "tps": 457626, "wall": 2805.7} {"step": 19592, "train_loss": 3.061006546020508, "lr": 0.00014857861574916532, "tps": 456873, "wall": 2810.5} {"step": 19593, "train_loss": 2.9612886905670166, "lr": 0.00014856103080786889, "tps": 456124, "wall": 2815.3} {"step": 19594, "train_loss": 3.1837844848632812, "lr": 0.000148543446675837, "tps": 455379, "wall": 2820.0} {"step": 19595, "train_loss": 3.092357873916626, "lr": 0.00014852586335326878, "tps": 454636, "wall": 2824.8} {"step": 19596, "train_loss": 3.0638036727905273, "lr": 0.00014850828084036347, "tps": 453893, "wall": 2829.5} {"step": 19597, "train_loss": 2.986832857131958, "lr": 0.00014849069913732015, "tps": 453154, "wall": 2834.3} {"step": 19598, "train_loss": 3.113190174102783, "lr": 0.00014847311824433814, "tps": 452418, "wall": 2839.1} {"step": 19599, "train_loss": 3.148085117340088, "lr": 0.00014845553816161648, "tps": 451683, "wall": 2843.8} {"step": 19600, "train_loss": 2.958317756652832, "lr": 0.00014843795888935438, "tps": 450952, "wall": 2848.6} {"step": 19601, "train_loss": 3.175987720489502, "lr": 0.00014842038042775095, "tps": 450223, "wall": 2853.3} {"step": 19602, "train_loss": 3.107961654663086, "lr": 0.00014840280277700528, "tps": 449487, "wall": 2858.2} {"step": 19603, "train_loss": 3.1349735260009766, "lr": 0.00014838522593731658, "tps": 448762, "wall": 2862.9} {"step": 19604, "train_loss": 2.9762701988220215, "lr": 0.00014836764990888392, "tps": 448041, "wall": 2867.7} {"step": 19605, "train_loss": 3.0557327270507812, "lr": 0.0001483500746919064, "tps": 447321, "wall": 2872.4} {"step": 19606, "train_loss": 3.074859619140625, "lr": 0.00014833250028658306, "tps": 446602, "wall": 2877.2} {"step": 19607, "train_loss": 3.063608169555664, "lr": 0.000148314926693113, "tps": 445888, "wall": 2882.0} {"step": 19608, "train_loss": 3.0265674591064453, "lr": 0.00014829735391169545, "tps": 445177, "wall": 2886.7} {"step": 19609, "train_loss": 3.177250385284424, "lr": 0.00014827978194252928, "tps": 444467, "wall": 2891.5} {"step": 19610, "train_loss": 2.9241020679473877, "lr": 0.00014826221078581363, "tps": 443760, "wall": 2896.2} {"step": 19611, "train_loss": 3.0021328926086426, "lr": 0.00014824464044174755, "tps": 443055, "wall": 2901.0} {"step": 19612, "train_loss": 3.036313056945801, "lr": 0.00014822707091053004, "tps": 442353, "wall": 2905.7} {"step": 19613, "train_loss": 3.08512544631958, "lr": 0.00014820950219236018, "tps": 441651, "wall": 2910.5} {"step": 19614, "train_loss": 3.130675792694092, "lr": 0.00014819193428743698, "tps": 440945, "wall": 2915.3} {"step": 19615, "train_loss": 3.044494867324829, "lr": 0.00014817436719595937, "tps": 440249, "wall": 2920.1} {"step": 19616, "train_loss": 3.1623454093933105, "lr": 0.00014815680091812645, "tps": 439551, "wall": 2924.8} {"step": 19617, "train_loss": 3.1004459857940674, "lr": 0.00014813923545413716, "tps": 438859, "wall": 2929.6} {"step": 19618, "train_loss": 3.067885398864746, "lr": 0.00014812167080419054, "tps": 438171, "wall": 2934.4} {"step": 19619, "train_loss": 3.0997684001922607, "lr": 0.0001481041069684855, "tps": 437484, "wall": 2939.1} {"step": 19620, "train_loss": 3.1005282402038574, "lr": 0.000148086543947221, "tps": 436799, "wall": 2943.9} {"step": 19621, "train_loss": 3.12721586227417, "lr": 0.00014806898174059608, "tps": 436113, "wall": 2948.7} {"step": 19622, "train_loss": 3.098487615585327, "lr": 0.00014805142034880956, "tps": 435434, "wall": 2953.4} {"step": 19623, "train_loss": 3.040074348449707, "lr": 0.00014803385977206048, "tps": 434757, "wall": 2958.2} {"step": 19624, "train_loss": 3.0216569900512695, "lr": 0.0001480163000105477, "tps": 434082, "wall": 2962.9} {"step": 19625, "train_loss": 3.045552968978882, "lr": 0.00014799874106447022, "tps": 433409, "wall": 2967.7} {"step": 19626, "train_loss": 3.122314929962158, "lr": 0.00014798118293402683, "tps": 432738, "wall": 2972.4} {"step": 19627, "train_loss": 2.9834036827087402, "lr": 0.00014796362561941652, "tps": 432059, "wall": 2977.2} {"step": 19628, "train_loss": 3.1567866802215576, "lr": 0.0001479460691208382, "tps": 431391, "wall": 2982.0} {"step": 19629, "train_loss": 3.0510382652282715, "lr": 0.00014792851343849067, "tps": 430728, "wall": 2986.7} {"step": 19630, "train_loss": 3.1012778282165527, "lr": 0.0001479109585725728, "tps": 430066, "wall": 2991.5} {"step": 19631, "train_loss": 3.116921901702881, "lr": 0.0001478934045232836, "tps": 429406, "wall": 2996.2} {"step": 19632, "train_loss": 3.084625720977783, "lr": 0.00014787585129082172, "tps": 428747, "wall": 3001.0} {"step": 19633, "train_loss": 3.028101921081543, "lr": 0.00014785829887538614, "tps": 428092, "wall": 3005.7} {"step": 19634, "train_loss": 3.0453853607177734, "lr": 0.00014784074727717557, "tps": 427435, "wall": 3010.5} {"step": 19635, "train_loss": 3.0605082511901855, "lr": 0.00014782319649638904, "tps": 426781, "wall": 3015.3} {"step": 19636, "train_loss": 3.1606531143188477, "lr": 0.0001478056465332252, "tps": 426129, "wall": 3020.0} {"step": 19637, "train_loss": 3.095951557159424, "lr": 0.00014778809738788288, "tps": 425478, "wall": 3024.8} {"step": 19638, "train_loss": 3.105276346206665, "lr": 0.000147770549060561, "tps": 424831, "wall": 3029.6} {"step": 19639, "train_loss": 3.0378074645996094, "lr": 0.00014775300155145816, "tps": 424175, "wall": 3034.4} {"step": 19640, "train_loss": 3.2198486328125, "lr": 0.00014773545486077323, "tps": 423533, "wall": 3039.2} {"step": 19641, "train_loss": 2.993530511856079, "lr": 0.00014771790898870495, "tps": 422891, "wall": 3043.9} {"step": 19642, "train_loss": 2.9513816833496094, "lr": 0.00014770036393545213, "tps": 422253, "wall": 3048.7} {"step": 19643, "train_loss": 3.090789794921875, "lr": 0.00014768281970121354, "tps": 421616, "wall": 3053.5} {"step": 19644, "train_loss": 3.1097211837768555, "lr": 0.00014766527628618778, "tps": 420983, "wall": 3058.2} {"step": 19645, "train_loss": 3.0556366443634033, "lr": 0.00014764773369057375, "tps": 420352, "wall": 3063.0} {"step": 19646, "train_loss": 3.062190532684326, "lr": 0.0001476301919145701, "tps": 419722, "wall": 3067.7} {"step": 19647, "train_loss": 3.0434978008270264, "lr": 0.0001476126509583756, "tps": 419091, "wall": 3072.5} {"step": 19648, "train_loss": 3.1545376777648926, "lr": 0.0001475951108221888, "tps": 418464, "wall": 3077.2} {"step": 19649, "train_loss": 3.090697765350342, "lr": 0.00014757757150620857, "tps": 417840, "wall": 3082.0} {"step": 19650, "train_loss": 2.9873528480529785, "lr": 0.00014756003301063356, "tps": 417217, "wall": 3086.8} {"step": 19651, "train_loss": 3.1029043197631836, "lr": 0.00014754249533566234, "tps": 416596, "wall": 3091.5} {"step": 19652, "train_loss": 3.0771918296813965, "lr": 0.00014752495848149367, "tps": 415970, "wall": 3096.3} {"step": 19653, "train_loss": 3.1178767681121826, "lr": 0.00014750742244832625, "tps": 415353, "wall": 3101.1} {"step": 19654, "train_loss": 3.1480791568756104, "lr": 0.00014748988723635862, "tps": 414739, "wall": 3105.8} {"step": 19655, "train_loss": 3.109990119934082, "lr": 0.00014747235284578948, "tps": 414125, "wall": 3110.6} {"step": 19656, "train_loss": 3.126826047897339, "lr": 0.0001474548192768175, "tps": 413515, "wall": 3115.3} {"step": 19657, "train_loss": 3.115548610687256, "lr": 0.00014743728652964118, "tps": 412905, "wall": 3120.1} {"step": 19658, "train_loss": 3.011075019836426, "lr": 0.0001474197546044592, "tps": 412299, "wall": 3124.8} {"step": 19659, "train_loss": 3.1056971549987793, "lr": 0.00014740222350147016, "tps": 411692, "wall": 3129.6} {"step": 19660, "train_loss": 2.99825119972229, "lr": 0.0001473846932208727, "tps": 411089, "wall": 3134.4} {"step": 19661, "train_loss": 3.0457382202148438, "lr": 0.00014736716376286538, "tps": 410487, "wall": 3139.1} {"step": 19662, "train_loss": 3.0708413124084473, "lr": 0.0001473496351276467, "tps": 409889, "wall": 3143.9} {"step": 19663, "train_loss": 3.030060291290283, "lr": 0.0001473321073154154, "tps": 409291, "wall": 3148.6} {"step": 19664, "train_loss": 3.06610369682312, "lr": 0.0001473145803263698, "tps": 408695, "wall": 3153.4} {"step": 19665, "train_loss": 3.06199312210083, "lr": 0.00014729705416070856, "tps": 408091, "wall": 3158.2} {"step": 19666, "train_loss": 3.0476512908935547, "lr": 0.0001472795288186303, "tps": 407499, "wall": 3162.9} {"step": 19667, "train_loss": 3.1159045696258545, "lr": 0.00014726200430033345, "tps": 406907, "wall": 3167.7} {"step": 19668, "train_loss": 3.169273614883423, "lr": 0.00014724448060601653, "tps": 406315, "wall": 3172.5} {"step": 19669, "train_loss": 3.042069435119629, "lr": 0.00014722695773587802, "tps": 405727, "wall": 3177.2} {"step": 19670, "train_loss": 3.007498264312744, "lr": 0.0001472094356901166, "tps": 405138, "wall": 3182.0} {"step": 19671, "train_loss": 3.093148708343506, "lr": 0.00014719191446893053, "tps": 404554, "wall": 3186.8} {"step": 19672, "train_loss": 3.0596535205841064, "lr": 0.0001471743940725184, "tps": 403972, "wall": 3191.5} {"step": 19673, "train_loss": 3.036868095397949, "lr": 0.00014715687450107874, "tps": 403390, "wall": 3196.3} {"step": 19674, "train_loss": 3.1179003715515137, "lr": 0.00014713935575480988, "tps": 402809, "wall": 3201.1} {"step": 19675, "train_loss": 3.0697624683380127, "lr": 0.00014712183783391035, "tps": 402233, "wall": 3205.8} {"step": 19676, "train_loss": 3.057340621948242, "lr": 0.00014710432073857858, "tps": 401657, "wall": 3210.6} {"step": 19677, "train_loss": 3.0070531368255615, "lr": 0.00014708680446901307, "tps": 401078, "wall": 3215.4} {"step": 19678, "train_loss": 3.045536756515503, "lr": 0.00014706928902541208, "tps": 400506, "wall": 3220.1} {"step": 19679, "train_loss": 3.1343986988067627, "lr": 0.0001470517744079742, "tps": 399937, "wall": 3224.9} {"step": 19680, "train_loss": 3.0548288822174072, "lr": 0.0001470342606168978, "tps": 399369, "wall": 3229.6} {"step": 19681, "train_loss": 3.192142963409424, "lr": 0.00014701674765238117, "tps": 398800, "wall": 3234.4} {"step": 19682, "train_loss": 3.1281251907348633, "lr": 0.00014699923551462276, "tps": 398235, "wall": 3239.2} {"step": 19683, "train_loss": 3.0023815631866455, "lr": 0.00014698172420382104, "tps": 397669, "wall": 3243.9} {"step": 19684, "train_loss": 2.9796013832092285, "lr": 0.00014696421372017423, "tps": 397103, "wall": 3248.7} {"step": 19685, "train_loss": 3.0808911323547363, "lr": 0.00014694670406388072, "tps": 396545, "wall": 3253.5} {"step": 19686, "train_loss": 3.115570306777954, "lr": 0.000146929195235139, "tps": 395986, "wall": 3258.2} {"step": 19687, "train_loss": 3.1407387256622314, "lr": 0.0001469116872341473, "tps": 395430, "wall": 3263.0} {"step": 19688, "train_loss": 3.117920160293579, "lr": 0.0001468941800611039, "tps": 394875, "wall": 3267.7} {"step": 19689, "train_loss": 2.9870638847351074, "lr": 0.0001468766737162072, "tps": 394321, "wall": 3272.5} {"step": 19690, "train_loss": 3.102288246154785, "lr": 0.00014685916819965554, "tps": 393761, "wall": 3277.3} {"step": 19691, "train_loss": 2.9751665592193604, "lr": 0.00014684166351164714, "tps": 393211, "wall": 3282.0} {"step": 19692, "train_loss": 3.1330883502960205, "lr": 0.00014682415965238033, "tps": 392661, "wall": 3286.8} {"step": 19693, "train_loss": 3.054439067840576, "lr": 0.00014680665662205345, "tps": 392114, "wall": 3291.6} {"step": 19694, "train_loss": 3.075082778930664, "lr": 0.00014678915442086464, "tps": 391568, "wall": 3296.3} {"step": 19695, "train_loss": 3.062175989151001, "lr": 0.00014677165304901227, "tps": 391023, "wall": 3301.1} {"step": 19696, "train_loss": 3.106635808944702, "lr": 0.0001467541525066946, "tps": 390482, "wall": 3305.8} {"step": 19697, "train_loss": 3.033801794052124, "lr": 0.0001467366527941099, "tps": 389939, "wall": 3310.6} {"step": 19698, "train_loss": 2.9965178966522217, "lr": 0.0001467191539114563, "tps": 389399, "wall": 3315.3} {"step": 19699, "train_loss": 3.1177334785461426, "lr": 0.00014670165585893208, "tps": 388858, "wall": 3320.1} {"step": 19700, "train_loss": 3.1013622283935547, "lr": 0.00014668415863673554, "tps": 388318, "wall": 3324.9} {"step": 19701, "train_loss": 3.1050643920898438, "lr": 0.00014666666224506472, "tps": 387783, "wall": 3329.7} {"step": 19702, "train_loss": 3.10184907913208, "lr": 0.00014664916668411798, "tps": 387240, "wall": 3334.5} {"step": 19703, "train_loss": 3.138974666595459, "lr": 0.0001466316719540934, "tps": 386712, "wall": 3339.2} {"step": 19704, "train_loss": 3.046143054962158, "lr": 0.00014661417805518923, "tps": 386182, "wall": 3344.0} {"step": 19705, "train_loss": 3.0647010803222656, "lr": 0.00014659668498760367, "tps": 385654, "wall": 3348.7} {"step": 19706, "train_loss": 3.1663308143615723, "lr": 0.00014657919275153477, "tps": 385127, "wall": 3353.5} {"step": 19707, "train_loss": 3.0421652793884277, "lr": 0.00014656170134718082, "tps": 384603, "wall": 3358.2} {"step": 19708, "train_loss": 3.1145856380462646, "lr": 0.0001465442107747398, "tps": 384079, "wall": 3363.0} {"step": 19709, "train_loss": 2.9678738117218018, "lr": 0.00014652672103440998, "tps": 383557, "wall": 3367.7} {"step": 19710, "train_loss": 3.0925300121307373, "lr": 0.00014650923212638944, "tps": 383034, "wall": 3372.5} {"step": 19711, "train_loss": 3.0967111587524414, "lr": 0.00014649174405087625, "tps": 382513, "wall": 3377.3} {"step": 19712, "train_loss": 3.0947964191436768, "lr": 0.00014647425680806863, "tps": 381994, "wall": 3382.0} {"step": 19713, "train_loss": 3.015291929244995, "lr": 0.00014645677039816456, "tps": 381478, "wall": 3386.8} {"step": 19714, "train_loss": 3.0867819786071777, "lr": 0.0001464392848213622, "tps": 380961, "wall": 3391.5} {"step": 19715, "train_loss": 3.1751701831817627, "lr": 0.0001464218000778596, "tps": 380438, "wall": 3396.4} {"step": 19716, "train_loss": 3.1444482803344727, "lr": 0.00014640431616785483, "tps": 379925, "wall": 3401.1} {"step": 19717, "train_loss": 3.0108420848846436, "lr": 0.00014638683309154592, "tps": 379414, "wall": 3405.9} {"step": 19718, "train_loss": 3.101884603500366, "lr": 0.00014636935084913098, "tps": 378905, "wall": 3410.6} {"step": 19719, "train_loss": 3.0119245052337646, "lr": 0.00014635186944080797, "tps": 378398, "wall": 3415.4} {"step": 19720, "train_loss": 3.0730361938476562, "lr": 0.00014633438886677507, "tps": 377890, "wall": 3420.1} {"step": 19721, "train_loss": 3.1055784225463867, "lr": 0.0001463169091272301, "tps": 377384, "wall": 3424.9} {"step": 19722, "train_loss": 3.0958991050720215, "lr": 0.00014629943022237115, "tps": 376876, "wall": 3429.7} {"step": 19723, "train_loss": 3.0708181858062744, "lr": 0.0001462819521523963, "tps": 376376, "wall": 3434.4} {"step": 19724, "train_loss": 3.1177046298980713, "lr": 0.0001462644749175035, "tps": 375875, "wall": 3439.2} {"step": 19725, "train_loss": 3.0542683601379395, "lr": 0.00014624699851789065, "tps": 375375, "wall": 3443.9} {"step": 19726, "train_loss": 3.1169893741607666, "lr": 0.00014622952295375585, "tps": 374878, "wall": 3448.7} {"step": 19727, "train_loss": 3.1065759658813477, "lr": 0.00014621204822529702, "tps": 374382, "wall": 3453.4} {"step": 19728, "train_loss": 3.0675065517425537, "lr": 0.00014619457433271205, "tps": 373878, "wall": 3458.2} {"step": 19729, "train_loss": 3.1220650672912598, "lr": 0.0001461771012761989, "tps": 373383, "wall": 3463.0} {"step": 19730, "train_loss": 3.0849499702453613, "lr": 0.0001461596290559556, "tps": 372890, "wall": 3467.8} {"step": 19731, "train_loss": 3.012293577194214, "lr": 0.00014614215767218, "tps": 372397, "wall": 3472.5} {"step": 19732, "train_loss": 3.072678565979004, "lr": 0.00014612468712507006, "tps": 371905, "wall": 3477.3} {"step": 19733, "train_loss": 3.028163433074951, "lr": 0.00014610721741482364, "tps": 371414, "wall": 3482.1} {"step": 19734, "train_loss": 3.0905723571777344, "lr": 0.00014608974854163868, "tps": 370926, "wall": 3486.8} {"step": 19735, "train_loss": 3.107560157775879, "lr": 0.000146072280505713, "tps": 370439, "wall": 3491.6} {"step": 19736, "train_loss": 3.1443264484405518, "lr": 0.00014605481330724458, "tps": 369954, "wall": 3496.3} {"step": 19737, "train_loss": 3.079491138458252, "lr": 0.0001460373469464312, "tps": 369469, "wall": 3501.1} {"step": 19738, "train_loss": 3.047139883041382, "lr": 0.00014601988142347078, "tps": 368988, "wall": 3505.8} {"step": 19739, "train_loss": 3.074857234954834, "lr": 0.0001460024167385611, "tps": 368508, "wall": 3510.6} {"step": 19740, "train_loss": 3.122924566268921, "lr": 0.0001459849528919001, "tps": 368023, "wall": 3515.4} {"step": 19741, "train_loss": 2.935072660446167, "lr": 0.00014596748988368553, "tps": 367544, "wall": 3520.2} {"step": 19742, "train_loss": 3.0493762493133545, "lr": 0.0001459500277141152, "tps": 367067, "wall": 3524.9} {"step": 19743, "train_loss": 3.106293201446533, "lr": 0.00014593256638338703, "tps": 366588, "wall": 3529.7} {"step": 19744, "train_loss": 3.065931797027588, "lr": 0.00014591510589169872, "tps": 366111, "wall": 3534.5} {"step": 19745, "train_loss": 3.1555604934692383, "lr": 0.0001458976462392481, "tps": 365636, "wall": 3539.2} {"step": 19746, "train_loss": 2.970608711242676, "lr": 0.00014588018742623296, "tps": 365163, "wall": 3544.0} {"step": 19747, "train_loss": 3.080859422683716, "lr": 0.0001458627294528511, "tps": 364691, "wall": 3548.8} {"step": 19748, "train_loss": 3.208669662475586, "lr": 0.00014584527231930022, "tps": 364219, "wall": 3553.5} {"step": 19749, "train_loss": 3.0863821506500244, "lr": 0.00014582781602577808, "tps": 363750, "wall": 3558.3} {"step": 19750, "train_loss": 3.048612594604492, "lr": 0.00014581036057248245, "tps": 363281, "wall": 3563.1} {"step": 19751, "train_loss": 3.115642547607422, "lr": 0.00014579290595961113, "tps": 362815, "wall": 3567.8} {"step": 19752, "train_loss": 2.9995131492614746, "lr": 0.00014577545218736178, "tps": 362350, "wall": 3572.6} {"step": 19753, "train_loss": 3.0147769451141357, "lr": 0.00014575799925593206, "tps": 361881, "wall": 3577.4} {"step": 19754, "train_loss": 3.0309641361236572, "lr": 0.00014574054716551976, "tps": 361419, "wall": 3582.2} {"step": 19755, "train_loss": 2.945855140686035, "lr": 0.00014572309591632257, "tps": 360958, "wall": 3586.9} {"step": 19756, "train_loss": 3.192599296569824, "lr": 0.0001457056455085382, "tps": 360498, "wall": 3591.7} {"step": 19757, "train_loss": 3.0431339740753174, "lr": 0.00014568819594236424, "tps": 360039, "wall": 3596.4} {"step": 19758, "train_loss": 3.0457684993743896, "lr": 0.00014567074721799847, "tps": 359581, "wall": 3601.2} {"step": 19759, "train_loss": 3.122781276702881, "lr": 0.00014565329933563848, "tps": 359126, "wall": 3605.9} {"step": 19760, "train_loss": 3.0355916023254395, "lr": 0.00014563585229548194, "tps": 358670, "wall": 3610.7} {"step": 19761, "train_loss": 3.0706372261047363, "lr": 0.00014561840609772646, "tps": 358216, "wall": 3615.5} {"step": 19762, "train_loss": 3.1363441944122314, "lr": 0.00014560096074256972, "tps": 357763, "wall": 3620.2} {"step": 19763, "train_loss": 3.1194815635681152, "lr": 0.00014558351623020931, "tps": 357311, "wall": 3625.0} {"step": 19764, "train_loss": 2.9606237411499023, "lr": 0.00014556607256084288, "tps": 356861, "wall": 3629.8} {"step": 19765, "train_loss": 3.006558418273926, "lr": 0.00014554862973466799, "tps": 356403, "wall": 3634.6} {"step": 19766, "train_loss": 3.086573600769043, "lr": 0.00014553118775188225, "tps": 355958, "wall": 3639.3} {"step": 19767, "train_loss": 3.0661654472351074, "lr": 0.00014551374661268325, "tps": 355511, "wall": 3644.1} {"step": 19768, "train_loss": 3.0480034351348877, "lr": 0.00014549630631726857, "tps": 355068, "wall": 3648.8} {"step": 19769, "train_loss": 3.1183762550354004, "lr": 0.00014547886686583575, "tps": 354623, "wall": 3653.6} {"step": 19770, "train_loss": 3.0238523483276367, "lr": 0.00014546142825858232, "tps": 354181, "wall": 3658.3} {"step": 19771, "train_loss": 3.074462890625, "lr": 0.00014544399049570595, "tps": 353738, "wall": 3663.1} {"step": 19772, "train_loss": 3.11978816986084, "lr": 0.00014542655357740398, "tps": 353298, "wall": 3667.8} {"step": 19773, "train_loss": 3.068882465362549, "lr": 0.00014540911750387408, "tps": 352858, "wall": 3672.6} {"step": 19774, "train_loss": 3.01031231880188, "lr": 0.0001453916822753138, "tps": 352418, "wall": 3677.4} {"step": 19775, "train_loss": 3.1197094917297363, "lr": 0.00014537424789192054, "tps": 351981, "wall": 3682.1} {"step": 19776, "train_loss": 3.1668949127197266, "lr": 0.00014535681435389182, "tps": 351543, "wall": 3686.9} {"step": 19777, "train_loss": 3.113966941833496, "lr": 0.00014533938166142512, "tps": 351108, "wall": 3691.6} {"step": 19778, "train_loss": 3.1410775184631348, "lr": 0.00014532194981471802, "tps": 350670, "wall": 3696.5} {"step": 19779, "train_loss": 3.0129213333129883, "lr": 0.00014530451881396785, "tps": 350236, "wall": 3701.2} {"step": 19780, "train_loss": 2.981677770614624, "lr": 0.00014528708865937215, "tps": 349804, "wall": 3706.0} {"step": 19781, "train_loss": 3.0410423278808594, "lr": 0.00014526965935112836, "tps": 349375, "wall": 3710.7} {"step": 19782, "train_loss": 3.0998167991638184, "lr": 0.0001452522308894339, "tps": 348946, "wall": 3715.5} {"step": 19783, "train_loss": 2.9912524223327637, "lr": 0.00014523480327448623, "tps": 348518, "wall": 3720.2} {"step": 19784, "train_loss": 3.1054763793945312, "lr": 0.00014521737650648273, "tps": 348090, "wall": 3725.0} {"step": 19785, "train_loss": 3.016909599304199, "lr": 0.00014519995058562087, "tps": 347662, "wall": 3729.8} {"step": 19786, "train_loss": 3.2296061515808105, "lr": 0.000145182525512098, "tps": 347239, "wall": 3734.5} {"step": 19787, "train_loss": 3.0430588722229004, "lr": 0.0001451651012861115, "tps": 346815, "wall": 3739.2} {"step": 19788, "train_loss": 3.1583914756774902, "lr": 0.0001451476779078588, "tps": 346393, "wall": 3744.0} {"step": 19789, "train_loss": 3.1167099475860596, "lr": 0.00014513025537753725, "tps": 345971, "wall": 3748.7} {"step": 19790, "train_loss": 3.101472854614258, "lr": 0.00014511283369534423, "tps": 345551, "wall": 3753.5} {"step": 19791, "train_loss": 3.1411571502685547, "lr": 0.00014509541286147708, "tps": 345124, "wall": 3758.3} {"step": 19792, "train_loss": 3.1188106536865234, "lr": 0.00014507799287613314, "tps": 344706, "wall": 3763.1} {"step": 19793, "train_loss": 3.0777854919433594, "lr": 0.00014506057373950978, "tps": 344286, "wall": 3767.8} {"step": 19794, "train_loss": 3.12180233001709, "lr": 0.00014504315545180423, "tps": 343867, "wall": 3772.6} {"step": 19795, "train_loss": 3.1226842403411865, "lr": 0.0001450257380132139, "tps": 343451, "wall": 3777.4} {"step": 19796, "train_loss": 3.028170585632324, "lr": 0.00014500832142393612, "tps": 343036, "wall": 3782.1} {"step": 19797, "train_loss": 3.187502145767212, "lr": 0.00014499090568416802, "tps": 342623, "wall": 3786.9} {"step": 19798, "train_loss": 3.0515167713165283, "lr": 0.0001449734907941071, "tps": 342211, "wall": 3791.7} {"step": 19799, "train_loss": 3.137082576751709, "lr": 0.00014495607675395043, "tps": 341801, "wall": 3796.4} {"step": 19800, "train_loss": 2.9814586639404297, "lr": 0.00014493866356389548, "tps": 341391, "wall": 3801.1} {"step": 19801, "train_loss": 3.1291563510894775, "lr": 0.0001449212512241394, "tps": 340982, "wall": 3805.9} {"step": 19802, "train_loss": 3.074409008026123, "lr": 0.0001449038397348794, "tps": 340573, "wall": 3810.7} {"step": 19803, "train_loss": 3.1421027183532715, "lr": 0.00014488642909631284, "tps": 340161, "wall": 3815.5} {"step": 19804, "train_loss": 3.135464668273926, "lr": 0.00014486901930863683, "tps": 339754, "wall": 3820.2} {"step": 19805, "train_loss": 3.0585341453552246, "lr": 0.00014485161037204857, "tps": 339350, "wall": 3825.0} {"step": 19806, "train_loss": 3.104926109313965, "lr": 0.00014483420228674545, "tps": 338946, "wall": 3829.7} {"step": 19807, "train_loss": 3.0276739597320557, "lr": 0.0001448167950529245, "tps": 338542, "wall": 3834.5} {"step": 19808, "train_loss": 3.0555152893066406, "lr": 0.00014479938867078298, "tps": 338139, "wall": 3839.3} {"step": 19809, "train_loss": 3.077425479888916, "lr": 0.00014478198314051807, "tps": 337738, "wall": 3844.0} {"step": 19810, "train_loss": 3.1194686889648438, "lr": 0.00014476457846232684, "tps": 337339, "wall": 3848.7} {"step": 19811, "train_loss": 3.051516056060791, "lr": 0.0001447471746364066, "tps": 336939, "wall": 3853.5} {"step": 19812, "train_loss": 3.0032176971435547, "lr": 0.00014472977166295444, "tps": 336540, "wall": 3858.3} {"step": 19813, "train_loss": 2.9708428382873535, "lr": 0.0001447123695421674, "tps": 336142, "wall": 3863.0} {"step": 19814, "train_loss": 3.0514328479766846, "lr": 0.00014469496827424286, "tps": 335746, "wall": 3867.8} {"step": 19815, "train_loss": 3.0892210006713867, "lr": 0.00014467756785937775, "tps": 335350, "wall": 3872.5} {"step": 19816, "train_loss": 3.067704677581787, "lr": 0.00014466016829776913, "tps": 334949, "wall": 3877.4} {"step": 19817, "train_loss": 3.094029664993286, "lr": 0.0001446427695896143, "tps": 334553, "wall": 3882.2} {"step": 19818, "train_loss": 3.0595955848693848, "lr": 0.00014462537173511023, "tps": 334160, "wall": 3886.9} {"step": 19819, "train_loss": 3.1266393661499023, "lr": 0.00014460797473445398, "tps": 333769, "wall": 3891.7} {"step": 19820, "train_loss": 3.071225881576538, "lr": 0.00014459057858784275, "tps": 333379, "wall": 3896.4} {"step": 19821, "train_loss": 3.13077449798584, "lr": 0.0001445731832954735, "tps": 332990, "wall": 3901.2} {"step": 19822, "train_loss": 3.143637180328369, "lr": 0.00014455578885754324, "tps": 332601, "wall": 3905.9} {"step": 19823, "train_loss": 3.1185619831085205, "lr": 0.00014453839527424917, "tps": 332212, "wall": 3910.7} {"step": 19824, "train_loss": 3.215238332748413, "lr": 0.00014452100254578815, "tps": 331825, "wall": 3915.5} {"step": 19825, "train_loss": 3.1293225288391113, "lr": 0.0001445036106723574, "tps": 331439, "wall": 3920.2} {"step": 19826, "train_loss": 2.987574577331543, "lr": 0.00014448621965415382, "tps": 331054, "wall": 3925.0} {"step": 19827, "train_loss": 2.995490074157715, "lr": 0.00014446882949137435, "tps": 330671, "wall": 3929.7} {"step": 19828, "train_loss": 3.1020302772521973, "lr": 0.00014445144018421612, "tps": 330282, "wall": 3934.6} {"step": 19829, "train_loss": 3.1945056915283203, "lr": 0.00014443405173287607, "tps": 329902, "wall": 3939.3} {"step": 19830, "train_loss": 3.113037109375, "lr": 0.0001444166641375511, "tps": 329521, "wall": 3944.0} {"step": 19831, "train_loss": 3.1309452056884766, "lr": 0.00014439927739843834, "tps": 329141, "wall": 3948.8} {"step": 19832, "train_loss": 3.014993906021118, "lr": 0.00014438189151573467, "tps": 328761, "wall": 3953.6} {"step": 19833, "train_loss": 3.072174310684204, "lr": 0.00014436450648963692, "tps": 328381, "wall": 3958.3} {"step": 19834, "train_loss": 3.1530158519744873, "lr": 0.00014434712232034222, "tps": 328005, "wall": 3963.1} {"step": 19835, "train_loss": 3.0673489570617676, "lr": 0.00014432973900804742, "tps": 327629, "wall": 3967.8} {"step": 19836, "train_loss": 3.0798139572143555, "lr": 0.0001443123565529493, "tps": 327253, "wall": 3972.6} {"step": 19837, "train_loss": 3.0462779998779297, "lr": 0.00014429497495524503, "tps": 326878, "wall": 3977.3} {"step": 19838, "train_loss": 3.078211784362793, "lr": 0.00014427759421513137, "tps": 326503, "wall": 3982.1} {"step": 19839, "train_loss": 3.2301197052001953, "lr": 0.00014426021433280512, "tps": 326129, "wall": 3986.9} {"step": 19840, "train_loss": 3.110084295272827, "lr": 0.00014424283530846337, "tps": 325757, "wall": 3991.6} {"step": 19841, "train_loss": 3.141071081161499, "lr": 0.00014422545714230277, "tps": 325380, "wall": 3996.4} {"step": 19842, "train_loss": 2.9969654083251953, "lr": 0.0001442080798345204, "tps": 325009, "wall": 4001.2} {"step": 19843, "train_loss": 2.9822049140930176, "lr": 0.00014419070338531298, "tps": 324639, "wall": 4006.0} {"step": 19844, "train_loss": 3.0690348148345947, "lr": 0.0001441733277948773, "tps": 324271, "wall": 4010.7} {"step": 19845, "train_loss": 3.0210399627685547, "lr": 0.00014415595306341031, "tps": 323905, "wall": 4015.5} {"step": 19846, "train_loss": 3.034121513366699, "lr": 0.00014413857919110882, "tps": 323538, "wall": 4020.2} {"step": 19847, "train_loss": 3.112945795059204, "lr": 0.00014412120617816955, "tps": 323172, "wall": 4025.0} {"step": 19848, "train_loss": 3.106905460357666, "lr": 0.00014410383402478942, "tps": 322807, "wall": 4029.7} {"step": 19849, "train_loss": 3.082484722137451, "lr": 0.00014408646273116516, "tps": 322441, "wall": 4034.5} {"step": 19850, "train_loss": 3.1080710887908936, "lr": 0.00014406909229749352, "tps": 322078, "wall": 4039.2} {"step": 19851, "train_loss": 3.007131814956665, "lr": 0.00014405172272397132, "tps": 321715, "wall": 4044.0} {"step": 19852, "train_loss": 3.081766128540039, "lr": 0.00014403435401079534, "tps": 321353, "wall": 4048.8} {"step": 19853, "train_loss": 3.159497022628784, "lr": 0.00014401698615816225, "tps": 320992, "wall": 4053.5} {"step": 19854, "train_loss": 3.1732635498046875, "lr": 0.00014399961916626892, "tps": 320628, "wall": 4058.3} {"step": 19855, "train_loss": 3.09317946434021, "lr": 0.00014398225303531201, "tps": 320267, "wall": 4063.1} {"step": 19856, "train_loss": 3.0717673301696777, "lr": 0.0001439648877654882, "tps": 319909, "wall": 4067.9} {"step": 19857, "train_loss": 3.1725306510925293, "lr": 0.00014394752335699428, "tps": 319551, "wall": 4072.6} {"step": 19858, "train_loss": 3.1416749954223633, "lr": 0.00014393015981002688, "tps": 319194, "wall": 4077.4} {"step": 19859, "train_loss": 3.1551671028137207, "lr": 0.0001439127971247828, "tps": 318840, "wall": 4082.1} {"step": 19860, "train_loss": 3.1350440979003906, "lr": 0.00014389543530145867, "tps": 318485, "wall": 4086.9} {"step": 19861, "train_loss": 3.079934597015381, "lr": 0.0001438780743402511, "tps": 318131, "wall": 4091.6} {"step": 19862, "train_loss": 3.0220468044281006, "lr": 0.00014386071424135697, "tps": 317777, "wall": 4096.4} {"step": 19863, "train_loss": 3.114119052886963, "lr": 0.0001438433550049727, "tps": 317424, "wall": 4101.2} {"step": 19864, "train_loss": 3.1442489624023438, "lr": 0.00014382599663129497, "tps": 317074, "wall": 4105.9} {"step": 19865, "train_loss": 3.054871082305908, "lr": 0.00014380863912052055, "tps": 316724, "wall": 4110.6} {"step": 19866, "train_loss": 3.189697265625, "lr": 0.00014379128247284597, "tps": 316370, "wall": 4115.4} {"step": 19867, "train_loss": 3.0314881801605225, "lr": 0.00014377392668846786, "tps": 316020, "wall": 4120.2} {"step": 19868, "train_loss": 3.088994026184082, "lr": 0.00014375657176758283, "tps": 315668, "wall": 4125.0} {"step": 19869, "train_loss": 3.1061325073242188, "lr": 0.00014373921771038747, "tps": 315320, "wall": 4129.8} {"step": 19870, "train_loss": 3.0808868408203125, "lr": 0.00014372186451707837, "tps": 314974, "wall": 4134.5} {"step": 19871, "train_loss": 3.080554485321045, "lr": 0.00014370451218785214, "tps": 314628, "wall": 4139.3} {"step": 19872, "train_loss": 3.078880786895752, "lr": 0.00014368716072290534, "tps": 314284, "wall": 4144.0} {"step": 19873, "train_loss": 3.052243709564209, "lr": 0.00014366981012243444, "tps": 313939, "wall": 4148.8} {"step": 19874, "train_loss": 3.1653311252593994, "lr": 0.00014365246038663612, "tps": 313594, "wall": 4153.5} {"step": 19875, "train_loss": 3.076148271560669, "lr": 0.0001436351115157069, "tps": 313253, "wall": 4158.3} {"step": 19876, "train_loss": 3.118743658065796, "lr": 0.00014361776350984315, "tps": 312911, "wall": 4163.0} {"step": 19877, "train_loss": 3.0358645915985107, "lr": 0.00014360041636924162, "tps": 312569, "wall": 4167.8} {"step": 19878, "train_loss": 3.092345714569092, "lr": 0.0001435830700940986, "tps": 312230, "wall": 4172.5} {"step": 19879, "train_loss": 2.9657483100891113, "lr": 0.0001435657246846108, "tps": 311886, "wall": 4177.3} {"step": 19880, "train_loss": 3.018279552459717, "lr": 0.00014354838014097457, "tps": 311545, "wall": 4182.1} {"step": 19881, "train_loss": 3.102722644805908, "lr": 0.00014353103646338634, "tps": 311207, "wall": 4186.9} {"step": 19882, "train_loss": 2.9949660301208496, "lr": 0.0001435136936520428, "tps": 310869, "wall": 4191.6} {"step": 19883, "train_loss": 3.1378555297851562, "lr": 0.00014349635170714026, "tps": 310531, "wall": 4196.4} {"step": 19884, "train_loss": 3.1125762462615967, "lr": 0.00014347901062887507, "tps": 310194, "wall": 4201.2} {"step": 19885, "train_loss": 3.107964038848877, "lr": 0.0001434616704174439, "tps": 309857, "wall": 4206.0} {"step": 19886, "train_loss": 3.0610361099243164, "lr": 0.00014344433107304306, "tps": 309520, "wall": 4210.8} {"step": 19887, "train_loss": 3.1339330673217773, "lr": 0.00014342699259586888, "tps": 309187, "wall": 4215.5} {"step": 19888, "train_loss": 3.0272281169891357, "lr": 0.00014340965498611796, "tps": 308855, "wall": 4220.2} {"step": 19889, "train_loss": 3.009366989135742, "lr": 0.0001433923182439866, "tps": 308524, "wall": 4225.0} {"step": 19890, "train_loss": 3.0909571647644043, "lr": 0.0001433749823696712, "tps": 308192, "wall": 4229.7} {"step": 19891, "train_loss": 3.2728185653686523, "lr": 0.00014335764736336811, "tps": 307856, "wall": 4234.6} {"step": 19892, "train_loss": 3.0278472900390625, "lr": 0.00014334031322527384, "tps": 307527, "wall": 4239.3} {"step": 19893, "train_loss": 3.041179656982422, "lr": 0.00014332297995558451, "tps": 307198, "wall": 4244.1} {"step": 19894, "train_loss": 3.1141862869262695, "lr": 0.00014330564755449672, "tps": 306871, "wall": 4248.8} {"step": 19895, "train_loss": 3.0379586219787598, "lr": 0.00014328831602220657, "tps": 306542, "wall": 4253.6} {"step": 19896, "train_loss": 3.1668758392333984, "lr": 0.00014327098535891065, "tps": 306215, "wall": 4258.3} {"step": 19897, "train_loss": 3.195542335510254, "lr": 0.00014325365556480514, "tps": 305887, "wall": 4263.1} {"step": 19898, "train_loss": 3.0677433013916016, "lr": 0.00014323632664008633, "tps": 305563, "wall": 4267.9} {"step": 19899, "train_loss": 3.0934977531433105, "lr": 0.00014321899858495062, "tps": 305237, "wall": 4272.6} {"step": 19900, "train_loss": 3.1053037643432617, "lr": 0.00014320167139959423, "tps": 304912, "wall": 4277.4} {"step": 19901, "train_loss": 3.1030266284942627, "lr": 0.0001431843450842134, "tps": 304588, "wall": 4282.2} {"step": 19902, "train_loss": 3.147890567779541, "lr": 0.00014316701963900457, "tps": 304267, "wall": 4286.9} {"step": 19903, "train_loss": 3.1475133895874023, "lr": 0.00014314969506416385, "tps": 303945, "wall": 4291.7} {"step": 19904, "train_loss": 3.1394293308258057, "lr": 0.0001431323713598875, "tps": 303619, "wall": 4296.5} {"step": 19905, "train_loss": 3.0901894569396973, "lr": 0.0001431150485263719, "tps": 303298, "wall": 4301.2} {"step": 19906, "train_loss": 3.063114643096924, "lr": 0.00014309772656381312, "tps": 302978, "wall": 4306.0} {"step": 19907, "train_loss": 3.003429412841797, "lr": 0.00014308040547240743, "tps": 302659, "wall": 4310.8} {"step": 19908, "train_loss": 3.0520477294921875, "lr": 0.00014306308525235113, "tps": 302342, "wall": 4315.5} {"step": 19909, "train_loss": 3.094132900238037, "lr": 0.00014304576590384036, "tps": 302024, "wall": 4320.2} {"step": 19910, "train_loss": 3.0575942993164062, "lr": 0.00014302844742707124, "tps": 301708, "wall": 4325.0} {"step": 19911, "train_loss": 3.021507501602173, "lr": 0.00014301112982224008, "tps": 301392, "wall": 4329.7} {"step": 19912, "train_loss": 3.0573208332061768, "lr": 0.00014299381308954297, "tps": 301077, "wall": 4334.5} {"step": 19913, "train_loss": 3.104428291320801, "lr": 0.0001429764972291762, "tps": 300761, "wall": 4339.3} {"step": 19914, "train_loss": 3.1155331134796143, "lr": 0.00014295918224133583, "tps": 300447, "wall": 4344.0} {"step": 19915, "train_loss": 3.0609560012817383, "lr": 0.00014294186812621788, "tps": 300133, "wall": 4348.8} {"step": 19916, "train_loss": 3.0715885162353516, "lr": 0.00014292455488401875, "tps": 299821, "wall": 4353.5} {"step": 19917, "train_loss": 3.0581626892089844, "lr": 0.00014290724251493438, "tps": 299505, "wall": 4358.3} {"step": 19918, "train_loss": 3.1494853496551514, "lr": 0.00014288993101916093, "tps": 299194, "wall": 4363.1} {"step": 19919, "train_loss": 3.0048739910125732, "lr": 0.00014287262039689455, "tps": 298884, "wall": 4367.8} {"step": 19920, "train_loss": 3.0524678230285645, "lr": 0.00014285531064833133, "tps": 298575, "wall": 4372.6} {"step": 19921, "train_loss": 3.065661907196045, "lr": 0.0001428380017736672, "tps": 298266, "wall": 4377.3} {"step": 19922, "train_loss": 3.0192337036132812, "lr": 0.00014282069377309842, "tps": 297958, "wall": 4382.1} {"step": 19923, "train_loss": 3.0404748916625977, "lr": 0.00014280338664682108, "tps": 297649, "wall": 4386.8} {"step": 19924, "train_loss": 3.118368148803711, "lr": 0.00014278608039503102, "tps": 297341, "wall": 4391.6} {"step": 19925, "train_loss": 3.1515908241271973, "lr": 0.00014276877501792452, "tps": 297034, "wall": 4396.4} {"step": 19926, "train_loss": 3.0722525119781494, "lr": 0.00014275147051569746, "tps": 296728, "wall": 4401.1} {"step": 19927, "train_loss": 3.1658639907836914, "lr": 0.0001427341668885459, "tps": 296422, "wall": 4405.9} {"step": 19928, "train_loss": 2.967118978500366, "lr": 0.00014271686413666593, "tps": 296117, "wall": 4410.6} {"step": 19929, "train_loss": 3.102062225341797, "lr": 0.0001426995622602535, "tps": 295808, "wall": 4415.5} {"step": 19930, "train_loss": 3.0971150398254395, "lr": 0.00014268226125950458, "tps": 295503, "wall": 4420.2} {"step": 19931, "train_loss": 3.0352141857147217, "lr": 0.00014266496113461523, "tps": 295200, "wall": 4425.0} {"step": 19932, "train_loss": 3.0628411769866943, "lr": 0.00014264766188578132, "tps": 294897, "wall": 4429.8} {"step": 19933, "train_loss": 3.091385841369629, "lr": 0.0001426303635131989, "tps": 294593, "wall": 4434.6} {"step": 19934, "train_loss": 3.0546069145202637, "lr": 0.00014261306601706398, "tps": 294291, "wall": 4439.3} {"step": 19935, "train_loss": 3.0051536560058594, "lr": 0.00014259576939757232, "tps": 293990, "wall": 4444.1} {"step": 19936, "train_loss": 3.1554455757141113, "lr": 0.00014257847365492008, "tps": 293692, "wall": 4448.8} {"step": 19937, "train_loss": 3.1591858863830566, "lr": 0.00014256117878930303, "tps": 293393, "wall": 4453.6} {"step": 19938, "train_loss": 3.012204170227051, "lr": 0.00014254388480091712, "tps": 293095, "wall": 4458.3} {"step": 19939, "train_loss": 3.2310118675231934, "lr": 0.0001425265916899583, "tps": 292798, "wall": 4463.1} {"step": 19940, "train_loss": 3.115532875061035, "lr": 0.00014250929945662248, "tps": 292502, "wall": 4467.8} {"step": 19941, "train_loss": 3.0600361824035645, "lr": 0.00014249200810110538, "tps": 292206, "wall": 4472.6} {"step": 19942, "train_loss": 3.063992500305176, "lr": 0.0001424747176236031, "tps": 291906, "wall": 4477.4} {"step": 19943, "train_loss": 3.0594606399536133, "lr": 0.00014245742802431144, "tps": 291611, "wall": 4482.2} {"step": 19944, "train_loss": 3.12270450592041, "lr": 0.00014244013930342616, "tps": 291317, "wall": 4486.9} {"step": 19945, "train_loss": 3.1421327590942383, "lr": 0.0001424228514611432, "tps": 291021, "wall": 4491.7} {"step": 19946, "train_loss": 3.129326820373535, "lr": 0.00014240556449765843, "tps": 290727, "wall": 4496.5} {"step": 19947, "train_loss": 3.0403056144714355, "lr": 0.0001423882784131675, "tps": 290435, "wall": 4501.2} {"step": 19948, "train_loss": 3.2030692100524902, "lr": 0.00014237099320786646, "tps": 290143, "wall": 4506.0} {"step": 19949, "train_loss": 3.093508243560791, "lr": 0.00014235370888195095, "tps": 289852, "wall": 4510.7} {"step": 19950, "train_loss": 3.1027121543884277, "lr": 0.00014233642543561684, "tps": 289562, "wall": 4515.5} {"step": 19951, "train_loss": 3.1327919960021973, "lr": 0.00014231914286905997, "tps": 289271, "wall": 4520.2} {"step": 19952, "train_loss": 3.039346694946289, "lr": 0.00014230186118247598, "tps": 288981, "wall": 4525.0} {"step": 19953, "train_loss": 3.0944700241088867, "lr": 0.00014228458037606072, "tps": 288692, "wall": 4529.7} {"step": 19954, "train_loss": 3.084719181060791, "lr": 0.00014226730045000996, "tps": 288399, "wall": 4534.6} {"step": 19955, "train_loss": 2.994905948638916, "lr": 0.00014225002140451934, "tps": 288112, "wall": 4539.3} {"step": 19956, "train_loss": 3.0155680179595947, "lr": 0.0001422327432397848, "tps": 287825, "wall": 4544.1} {"step": 19957, "train_loss": 3.024533748626709, "lr": 0.00014221546595600195, "tps": 287539, "wall": 4548.8} {"step": 19958, "train_loss": 3.151942253112793, "lr": 0.0001421981895533664, "tps": 287253, "wall": 4553.6} {"step": 19959, "train_loss": 3.001674175262451, "lr": 0.00014218091403207407, "tps": 286968, "wall": 4558.3} {"step": 19960, "train_loss": 3.045192241668701, "lr": 0.0001421636393923205, "tps": 286682, "wall": 4563.1} {"step": 19961, "train_loss": 2.9811062812805176, "lr": 0.00014214636563430143, "tps": 286397, "wall": 4567.9} {"step": 19962, "train_loss": 3.0067081451416016, "lr": 0.00014212909275821263, "tps": 286112, "wall": 4572.7} {"step": 19963, "train_loss": 3.0614147186279297, "lr": 0.0001421118207642496, "tps": 285829, "wall": 4577.4} {"step": 19964, "train_loss": 3.0146312713623047, "lr": 0.00014209454965260804, "tps": 285546, "wall": 4582.2} {"step": 19965, "train_loss": 3.106353759765625, "lr": 0.00014207727942348376, "tps": 285265, "wall": 4586.9} {"step": 19966, "train_loss": 3.0921058654785156, "lr": 0.00014206001007707216, "tps": 284984, "wall": 4591.7} {"step": 19967, "train_loss": 3.0953423976898193, "lr": 0.000142042741613569, "tps": 284698, "wall": 4596.5} {"step": 19968, "train_loss": 3.070249319076538, "lr": 0.00014202547403316995, "tps": 284419, "wall": 4601.3} {"step": 19969, "train_loss": 3.088815450668335, "lr": 0.00014200820733607046, "tps": 284140, "wall": 4606.0} {"step": 19970, "train_loss": 3.0412073135375977, "lr": 0.0001419909415224663, "tps": 283862, "wall": 4610.7} {"step": 19971, "train_loss": 3.134153366088867, "lr": 0.00014197367659255292, "tps": 283585, "wall": 4615.5} {"step": 19972, "train_loss": 3.0107619762420654, "lr": 0.00014195641254652593, "tps": 283307, "wall": 4620.2} {"step": 19973, "train_loss": 3.112795829772949, "lr": 0.000141939149384581, "tps": 283031, "wall": 4625.0} {"step": 19974, "train_loss": 3.072890281677246, "lr": 0.00014192188710691357, "tps": 282755, "wall": 4629.7} {"step": 19975, "train_loss": 3.0600924491882324, "lr": 0.0001419046257137192, "tps": 282478, "wall": 4634.5} {"step": 19976, "train_loss": 3.0323996543884277, "lr": 0.00014188736520519358, "tps": 282201, "wall": 4639.3} {"step": 19977, "train_loss": 3.1325790882110596, "lr": 0.00014187010558153196, "tps": 281927, "wall": 4644.0} {"step": 19978, "train_loss": 3.021399974822998, "lr": 0.0001418528468429301, "tps": 281653, "wall": 4648.8} {"step": 19979, "train_loss": 3.103438377380371, "lr": 0.0001418355889895834, "tps": 281380, "wall": 4653.5} {"step": 19980, "train_loss": 3.038283348083496, "lr": 0.00014181833202168731, "tps": 281103, "wall": 4658.3} {"step": 19981, "train_loss": 3.098548650741577, "lr": 0.00014180107593943743, "tps": 280830, "wall": 4663.1} {"step": 19982, "train_loss": 2.997373580932617, "lr": 0.00014178382074302924, "tps": 280558, "wall": 4667.8} {"step": 19983, "train_loss": 3.0739192962646484, "lr": 0.00014176656643265809, "tps": 280287, "wall": 4672.6} {"step": 19984, "train_loss": 3.1211838722229004, "lr": 0.00014174931300851954, "tps": 280016, "wall": 4677.4} {"step": 19985, "train_loss": 3.0851693153381348, "lr": 0.00014173206047080902, "tps": 279745, "wall": 4682.1} {"step": 19986, "train_loss": 2.9862115383148193, "lr": 0.0001417148088197219, "tps": 279476, "wall": 4686.9} {"step": 19987, "train_loss": 2.947746515274048, "lr": 0.00014169755805545372, "tps": 279205, "wall": 4691.6} {"step": 19988, "train_loss": 3.0888421535491943, "lr": 0.00014168030817819985, "tps": 278937, "wall": 4696.4} {"step": 19989, "train_loss": 3.1557846069335938, "lr": 0.00014166305918815559, "tps": 278669, "wall": 4701.1} {"step": 19990, "train_loss": 3.062145471572876, "lr": 0.00014164581108551652, "tps": 278400, "wall": 4705.9} {"step": 19991, "train_loss": 3.069459915161133, "lr": 0.00014162856387047782, "tps": 278132, "wall": 4710.7} {"step": 19992, "train_loss": 3.1160929203033447, "lr": 0.00014161131754323512, "tps": 277863, "wall": 4715.5} {"step": 19993, "train_loss": 3.100496530532837, "lr": 0.00014159407210398363, "tps": 277597, "wall": 4720.2} {"step": 19994, "train_loss": 3.0970985889434814, "lr": 0.0001415768275529187, "tps": 277333, "wall": 4725.0} {"step": 19995, "train_loss": 3.07938814163208, "lr": 0.00014155958389023573, "tps": 277068, "wall": 4729.7} {"step": 19996, "train_loss": 3.022282123565674, "lr": 0.00014154234111613006, "tps": 276804, "wall": 4734.5} {"step": 19997, "train_loss": 3.070558547973633, "lr": 0.0001415250992307969, "tps": 276540, "wall": 4739.2} {"step": 19998, "train_loss": 3.0052413940429688, "lr": 0.0001415078582344318, "tps": 276277, "wall": 4744.0} {"step": 19999, "train_loss": 3.0171761512756348, "lr": 0.00014149061812722988, "tps": 276014, "wall": 4748.7} {"step": 20000, "train_loss": 3.073108196258545, "lr": 0.0001414733789093864, "tps": 275751, "wall": 4753.5, "val_loss_monitor": 3.4275573795869136, "val_loss_full": 3.445671060348036} {"step": 20001, "train_loss": 3.199326515197754, "lr": 0.00014145614058109685, "tps": 266307, "wall": 4922.3} {"step": 20002, "train_loss": 3.3114395141601562, "lr": 0.00014143890314255634, "tps": 266063, "wall": 4927.1} {"step": 20003, "train_loss": 3.2406673431396484, "lr": 0.00014142166659396015, "tps": 265819, "wall": 4931.9} {"step": 20004, "train_loss": 3.239340305328369, "lr": 0.0001414044309355036, "tps": 265576, "wall": 4936.6} {"step": 20005, "train_loss": 3.0809998512268066, "lr": 0.0001413871961673819, "tps": 265334, "wall": 4941.4} {"step": 20006, "train_loss": 3.224431276321411, "lr": 0.0001413699622897903, "tps": 265093, "wall": 4946.1} {"step": 20007, "train_loss": 3.2888548374176025, "lr": 0.00014135272930292407, "tps": 264851, "wall": 4950.9} {"step": 20008, "train_loss": 3.399301528930664, "lr": 0.00014133549720697834, "tps": 264607, "wall": 4955.7} {"step": 20009, "train_loss": 3.1917667388916016, "lr": 0.0001413182660021483, "tps": 264367, "wall": 4960.4} {"step": 20010, "train_loss": 3.2318506240844727, "lr": 0.00014130103568862928, "tps": 264126, "wall": 4965.2} {"step": 20011, "train_loss": 3.3299779891967773, "lr": 0.0001412838062666163, "tps": 263886, "wall": 4970.0} {"step": 20012, "train_loss": 3.244643211364746, "lr": 0.0001412665777363047, "tps": 263647, "wall": 4974.7} {"step": 20013, "train_loss": 3.1826958656311035, "lr": 0.00014124935009788954, "tps": 263408, "wall": 4979.5} {"step": 20014, "train_loss": 3.271972179412842, "lr": 0.00014123212335156597, "tps": 263169, "wall": 4984.3} {"step": 20015, "train_loss": 3.312291383743286, "lr": 0.00014121489749752922, "tps": 262931, "wall": 4989.0} {"step": 20016, "train_loss": 3.264313220977783, "lr": 0.00014119767253597436, "tps": 262694, "wall": 4993.8} {"step": 20017, "train_loss": 3.2871763706207275, "lr": 0.0001411804484670965, "tps": 262457, "wall": 4998.5} {"step": 20018, "train_loss": 3.215226173400879, "lr": 0.00014116322529109083, "tps": 262220, "wall": 5003.3} {"step": 20019, "train_loss": 3.2341971397399902, "lr": 0.00014114600300815238, "tps": 261984, "wall": 5008.0} {"step": 20020, "train_loss": 3.27803373336792, "lr": 0.00014112878161847624, "tps": 261749, "wall": 5012.8} {"step": 20021, "train_loss": 3.288785696029663, "lr": 0.0001411115611222576, "tps": 261510, "wall": 5017.6} {"step": 20022, "train_loss": 3.330935478210449, "lr": 0.0001410943415196915, "tps": 261275, "wall": 5022.4} {"step": 20023, "train_loss": 3.166125535964966, "lr": 0.0001410771228109728, "tps": 261040, "wall": 5027.2} {"step": 20024, "train_loss": 3.326072931289673, "lr": 0.00014105990499629683, "tps": 260806, "wall": 5031.9} {"step": 20025, "train_loss": 3.105760335922241, "lr": 0.00014104268807585855, "tps": 260572, "wall": 5036.7} {"step": 20026, "train_loss": 3.2657177448272705, "lr": 0.0001410254720498529, "tps": 260339, "wall": 5041.4} {"step": 20027, "train_loss": 3.2389228343963623, "lr": 0.00014100825691847505, "tps": 260106, "wall": 5046.2} {"step": 20028, "train_loss": 3.248149871826172, "lr": 0.00014099104268191983, "tps": 259874, "wall": 5051.0} {"step": 20029, "train_loss": 3.2768001556396484, "lr": 0.00014097382934038247, "tps": 259643, "wall": 5055.7} {"step": 20030, "train_loss": 3.356790542602539, "lr": 0.00014095661689405783, "tps": 259412, "wall": 5060.5} {"step": 20031, "train_loss": 3.2327077388763428, "lr": 0.0001409394053431408, "tps": 259181, "wall": 5065.2} {"step": 20032, "train_loss": 3.2465434074401855, "lr": 0.00014092219468782663, "tps": 258950, "wall": 5070.0} {"step": 20033, "train_loss": 3.333836317062378, "lr": 0.00014090498492831004, "tps": 258716, "wall": 5074.8} {"step": 20034, "train_loss": 3.1898751258850098, "lr": 0.00014088777606478597, "tps": 258488, "wall": 5079.6} {"step": 20035, "train_loss": 3.278903007507324, "lr": 0.0001408705680974496, "tps": 258259, "wall": 5084.3} {"step": 20036, "train_loss": 3.3007616996765137, "lr": 0.00014085336102649567, "tps": 258030, "wall": 5089.1} {"step": 20037, "train_loss": 3.2716832160949707, "lr": 0.00014083615485211906, "tps": 257802, "wall": 5093.9} {"step": 20038, "train_loss": 3.2949838638305664, "lr": 0.00014081894957451488, "tps": 257573, "wall": 5098.6} {"step": 20039, "train_loss": 3.223390579223633, "lr": 0.0001408017451938779, "tps": 257346, "wall": 5103.4} {"step": 20040, "train_loss": 3.1798830032348633, "lr": 0.00014078454171040296, "tps": 257119, "wall": 5108.2} {"step": 20041, "train_loss": 3.214672088623047, "lr": 0.0001407673391242851, "tps": 256891, "wall": 5112.9} {"step": 20042, "train_loss": 3.152073860168457, "lr": 0.0001407501374357191, "tps": 256665, "wall": 5117.7} {"step": 20043, "train_loss": 3.26426362991333, "lr": 0.00014073293664489976, "tps": 256439, "wall": 5122.5} {"step": 20044, "train_loss": 3.164396047592163, "lr": 0.00014071573675202207, "tps": 256214, "wall": 5127.2} {"step": 20045, "train_loss": 3.22573184967041, "lr": 0.00014069853775728074, "tps": 255989, "wall": 5132.0} {"step": 20046, "train_loss": 3.1076254844665527, "lr": 0.00014068133966087075, "tps": 255762, "wall": 5136.8} {"step": 20047, "train_loss": 3.2751784324645996, "lr": 0.00014066414246298684, "tps": 255538, "wall": 5141.6} {"step": 20048, "train_loss": 3.2111897468566895, "lr": 0.0001406469461638237, "tps": 255314, "wall": 5146.3} {"step": 20049, "train_loss": 3.2238192558288574, "lr": 0.00014062975076357636, "tps": 255091, "wall": 5151.1} {"step": 20050, "train_loss": 3.2496891021728516, "lr": 0.0001406125562624395, "tps": 254868, "wall": 5155.8} {"step": 20051, "train_loss": 3.267252206802368, "lr": 0.0001405953626606078, "tps": 254646, "wall": 5160.6} {"step": 20052, "train_loss": 3.2252211570739746, "lr": 0.00014057816995827617, "tps": 254423, "wall": 5165.4} {"step": 20053, "train_loss": 3.298024892807007, "lr": 0.00014056097815563935, "tps": 254201, "wall": 5170.1} {"step": 20054, "train_loss": 3.332819700241089, "lr": 0.00014054378725289203, "tps": 253980, "wall": 5174.9} {"step": 20055, "train_loss": 3.2078354358673096, "lr": 0.00014052659725022907, "tps": 253760, "wall": 5179.7} {"step": 20056, "train_loss": 3.266993284225464, "lr": 0.0001405094081478451, "tps": 253539, "wall": 5184.4} {"step": 20057, "train_loss": 3.237792730331421, "lr": 0.00014049221994593474, "tps": 253319, "wall": 5189.2} {"step": 20058, "train_loss": 3.302931070327759, "lr": 0.0001404750326446929, "tps": 253097, "wall": 5194.0} {"step": 20059, "train_loss": 3.2595276832580566, "lr": 0.0001404578462443142, "tps": 252877, "wall": 5198.8} {"step": 20060, "train_loss": 3.2160186767578125, "lr": 0.00014044066074499326, "tps": 252658, "wall": 5203.5} {"step": 20061, "train_loss": 3.1496071815490723, "lr": 0.00014042347614692487, "tps": 252439, "wall": 5208.3} {"step": 20062, "train_loss": 3.2378933429718018, "lr": 0.0001404062924503037, "tps": 252222, "wall": 5213.1} {"step": 20063, "train_loss": 3.112274646759033, "lr": 0.00014038910965532422, "tps": 252004, "wall": 5217.8} {"step": 20064, "train_loss": 3.1830458641052246, "lr": 0.00014037192776218134, "tps": 251787, "wall": 5222.6} {"step": 20065, "train_loss": 3.241384983062744, "lr": 0.00014035474677106944, "tps": 251570, "wall": 5227.3} {"step": 20066, "train_loss": 3.2220191955566406, "lr": 0.0001403375666821834, "tps": 251351, "wall": 5232.2} {"step": 20067, "train_loss": 3.1870577335357666, "lr": 0.00014032038749571765, "tps": 251136, "wall": 5236.9} {"step": 20068, "train_loss": 3.3117146492004395, "lr": 0.00014030320921186684, "tps": 250920, "wall": 5241.7} {"step": 20069, "train_loss": 3.221151113510132, "lr": 0.00014028603183082567, "tps": 250705, "wall": 5246.4} {"step": 20070, "train_loss": 3.1852164268493652, "lr": 0.00014026885535278863, "tps": 250490, "wall": 5251.2} {"step": 20071, "train_loss": 3.2322492599487305, "lr": 0.00014025167977795025, "tps": 250273, "wall": 5256.0} {"step": 20072, "train_loss": 3.2171738147735596, "lr": 0.00014023450510650516, "tps": 250059, "wall": 5260.8} {"step": 20073, "train_loss": 3.190509796142578, "lr": 0.000140217331338648, "tps": 249845, "wall": 5265.5} {"step": 20074, "train_loss": 3.203660488128662, "lr": 0.00014020015847457308, "tps": 249632, "wall": 5270.3} {"step": 20075, "train_loss": 3.2412023544311523, "lr": 0.0001401829865144752, "tps": 249419, "wall": 5275.1} {"step": 20076, "train_loss": 3.1979875564575195, "lr": 0.00014016581545854873, "tps": 249206, "wall": 5279.8} {"step": 20077, "train_loss": 3.28645658493042, "lr": 0.0001401486453069882, "tps": 248993, "wall": 5284.6} {"step": 20078, "train_loss": 3.256610870361328, "lr": 0.0001401314760599882, "tps": 248782, "wall": 5289.4} {"step": 20079, "train_loss": 3.236800193786621, "lr": 0.00014011430771774315, "tps": 248570, "wall": 5294.1} {"step": 20080, "train_loss": 3.157106876373291, "lr": 0.00014009714028044744, "tps": 248360, "wall": 5298.9} {"step": 20081, "train_loss": 3.1769895553588867, "lr": 0.00014007997374829577, "tps": 248149, "wall": 5303.6} {"step": 20082, "train_loss": 3.0890095233917236, "lr": 0.00014006280812148237, "tps": 247939, "wall": 5308.4} {"step": 20083, "train_loss": 3.260110855102539, "lr": 0.0001400456434002019, "tps": 247729, "wall": 5313.1} {"step": 20084, "train_loss": 3.2616302967071533, "lr": 0.00014002847958464865, "tps": 247517, "wall": 5318.0} {"step": 20085, "train_loss": 3.1766533851623535, "lr": 0.00014001131667501713, "tps": 247308, "wall": 5322.7} {"step": 20086, "train_loss": 3.265820026397705, "lr": 0.00013999415467150176, "tps": 247099, "wall": 5327.5} {"step": 20087, "train_loss": 3.304600954055786, "lr": 0.00013997699357429694, "tps": 246888, "wall": 5332.3} {"step": 20088, "train_loss": 3.1910500526428223, "lr": 0.000139959833383597, "tps": 246681, "wall": 5337.1} {"step": 20089, "train_loss": 3.2411141395568848, "lr": 0.00013994267409959648, "tps": 246473, "wall": 5341.8} {"step": 20090, "train_loss": 3.3531103134155273, "lr": 0.00013992551572248964, "tps": 246266, "wall": 5346.6} {"step": 20091, "train_loss": 3.229034423828125, "lr": 0.00013990835825247085, "tps": 246059, "wall": 5351.4} {"step": 20092, "train_loss": 3.312211036682129, "lr": 0.00013989120168973458, "tps": 245852, "wall": 5356.1} {"step": 20093, "train_loss": 3.230971097946167, "lr": 0.0001398740460344751, "tps": 245646, "wall": 5360.9} {"step": 20094, "train_loss": 3.276858329772949, "lr": 0.0001398568912868867, "tps": 245440, "wall": 5365.7} {"step": 20095, "train_loss": 3.2676382064819336, "lr": 0.00013983973744716385, "tps": 245233, "wall": 5370.4} {"step": 20096, "train_loss": 3.2192604541778564, "lr": 0.00013982258451550076, "tps": 245024, "wall": 5375.3} {"step": 20097, "train_loss": 3.2157745361328125, "lr": 0.00013980543249209173, "tps": 244819, "wall": 5380.1} {"step": 20098, "train_loss": 3.330918788909912, "lr": 0.00013978828137713116, "tps": 244614, "wall": 5384.8} {"step": 20099, "train_loss": 3.221867322921753, "lr": 0.00013977113117081318, "tps": 244410, "wall": 5389.6} {"step": 20100, "train_loss": 3.2704622745513916, "lr": 0.00013975398187333232, "tps": 244206, "wall": 5394.4} {"step": 20101, "train_loss": 3.228421449661255, "lr": 0.0001397368334848826, "tps": 244002, "wall": 5399.1} {"step": 20102, "train_loss": 3.040325164794922, "lr": 0.00013971968600565835, "tps": 243799, "wall": 5403.9} {"step": 20103, "train_loss": 3.200536012649536, "lr": 0.0001397025394358539, "tps": 243597, "wall": 5408.7} {"step": 20104, "train_loss": 3.203113317489624, "lr": 0.00013968539377566343, "tps": 243393, "wall": 5413.5} {"step": 20105, "train_loss": 3.248549699783325, "lr": 0.00013966824902528107, "tps": 243192, "wall": 5418.2} {"step": 20106, "train_loss": 3.168543577194214, "lr": 0.00013965110518490123, "tps": 242991, "wall": 5423.0} {"step": 20107, "train_loss": 3.200345516204834, "lr": 0.00013963396225471803, "tps": 242790, "wall": 5427.7} {"step": 20108, "train_loss": 3.123354911804199, "lr": 0.00013961682023492554, "tps": 242589, "wall": 5432.5} {"step": 20109, "train_loss": 3.133057117462158, "lr": 0.00013959967912571816, "tps": 242385, "wall": 5437.3} {"step": 20110, "train_loss": 3.21640944480896, "lr": 0.00013958253892728997, "tps": 242185, "wall": 5442.1} {"step": 20111, "train_loss": 3.232999324798584, "lr": 0.00013956539963983503, "tps": 241985, "wall": 5446.9} {"step": 20112, "train_loss": 3.1710476875305176, "lr": 0.0001395482612635477, "tps": 241786, "wall": 5451.6} {"step": 20113, "train_loss": 3.1672863960266113, "lr": 0.00013953112379862202, "tps": 241586, "wall": 5456.4} {"step": 20114, "train_loss": 3.184748649597168, "lr": 0.000139513987245252, "tps": 241388, "wall": 5461.2} {"step": 20115, "train_loss": 3.293008804321289, "lr": 0.000139496851603632, "tps": 241189, "wall": 5465.9} {"step": 20116, "train_loss": 3.3348946571350098, "lr": 0.000139479716873956, "tps": 240991, "wall": 5470.7} {"step": 20117, "train_loss": 3.2887887954711914, "lr": 0.00013946258305641806, "tps": 240792, "wall": 5475.5} {"step": 20118, "train_loss": 3.20279598236084, "lr": 0.0001394454501512124, "tps": 240595, "wall": 5480.2} {"step": 20119, "train_loss": 3.1616382598876953, "lr": 0.000139428318158533, "tps": 240397, "wall": 5485.0} {"step": 20120, "train_loss": 3.168285369873047, "lr": 0.00013941118707857402, "tps": 240200, "wall": 5489.8} {"step": 20121, "train_loss": 3.2981557846069336, "lr": 0.00013939405691152946, "tps": 240001, "wall": 5494.6} {"step": 20122, "train_loss": 3.259949207305908, "lr": 0.00013937692765759332, "tps": 239805, "wall": 5499.4} {"step": 20123, "train_loss": 3.3230013847351074, "lr": 0.0001393597993169598, "tps": 239610, "wall": 5504.1} {"step": 20124, "train_loss": 3.2563252449035645, "lr": 0.00013934267188982279, "tps": 239415, "wall": 5508.9} {"step": 20125, "train_loss": 3.330714225769043, "lr": 0.00013932554537637634, "tps": 239221, "wall": 5513.6} {"step": 20126, "train_loss": 3.314980983734131, "lr": 0.0001393084197768145, "tps": 239027, "wall": 5518.4} {"step": 20127, "train_loss": 3.2899813652038574, "lr": 0.00013929129509133124, "tps": 238833, "wall": 5523.1} {"step": 20128, "train_loss": 3.2524523735046387, "lr": 0.00013927417132012055, "tps": 238640, "wall": 5527.9} {"step": 20129, "train_loss": 3.16758131980896, "lr": 0.0001392570484633764, "tps": 238446, "wall": 5532.6} {"step": 20130, "train_loss": 3.2060446739196777, "lr": 0.00013923992652129283, "tps": 238254, "wall": 5537.4} {"step": 20131, "train_loss": 3.1692757606506348, "lr": 0.0001392228054940637, "tps": 238060, "wall": 5542.2} {"step": 20132, "train_loss": 3.4102702140808105, "lr": 0.00013920568538188302, "tps": 237867, "wall": 5546.9} {"step": 20133, "train_loss": 3.242835760116577, "lr": 0.0001391885661849447, "tps": 237674, "wall": 5551.7} {"step": 20134, "train_loss": 3.2498531341552734, "lr": 0.00013917144790344263, "tps": 237479, "wall": 5556.6} {"step": 20135, "train_loss": 3.378279447555542, "lr": 0.00013915433053757084, "tps": 237287, "wall": 5561.3} {"step": 20136, "train_loss": 3.2394590377807617, "lr": 0.00013913721408752308, "tps": 237096, "wall": 5566.1} {"step": 20137, "train_loss": 3.2622246742248535, "lr": 0.0001391200985534934, "tps": 236906, "wall": 5570.8} {"step": 20138, "train_loss": 3.2424259185791016, "lr": 0.00013910298393567564, "tps": 236715, "wall": 5575.6} {"step": 20139, "train_loss": 3.1410319805145264, "lr": 0.00013908587023426353, "tps": 236525, "wall": 5580.3} {"step": 20140, "train_loss": 3.2170073986053467, "lr": 0.0001390687574494512, "tps": 236336, "wall": 5585.1} {"step": 20141, "train_loss": 3.2061824798583984, "lr": 0.00013905164558143237, "tps": 236147, "wall": 5589.8} {"step": 20142, "train_loss": 3.256087303161621, "lr": 0.00013903453463040075, "tps": 235958, "wall": 5594.6} {"step": 20143, "train_loss": 3.128544807434082, "lr": 0.0001390174245965504, "tps": 235769, "wall": 5599.4} {"step": 20144, "train_loss": 3.233412265777588, "lr": 0.00013900031548007505, "tps": 235581, "wall": 5604.1} {"step": 20145, "train_loss": 3.3198728561401367, "lr": 0.0001389832072811685, "tps": 235393, "wall": 5608.9} {"step": 20146, "train_loss": 3.223142385482788, "lr": 0.00013896610000002453, "tps": 235204, "wall": 5613.7} {"step": 20147, "train_loss": 3.229780673980713, "lr": 0.00013894899363683694, "tps": 235014, "wall": 5618.4} {"step": 20148, "train_loss": 3.231616497039795, "lr": 0.00013893188819179958, "tps": 234827, "wall": 5623.2} {"step": 20149, "train_loss": 3.327247142791748, "lr": 0.00013891478366510622, "tps": 234640, "wall": 5628.0} {"step": 20150, "train_loss": 3.184147357940674, "lr": 0.00013889768005695045, "tps": 234454, "wall": 5632.7} {"step": 20151, "train_loss": 3.2231483459472656, "lr": 0.00013888057736752624, "tps": 234267, "wall": 5637.5} {"step": 20152, "train_loss": 3.2459309101104736, "lr": 0.00013886347559702723, "tps": 234081, "wall": 5642.3} {"step": 20153, "train_loss": 3.2675914764404297, "lr": 0.00013884637474564712, "tps": 233896, "wall": 5647.0} {"step": 20154, "train_loss": 3.264202356338501, "lr": 0.00013882927481357972, "tps": 233711, "wall": 5651.7} {"step": 20155, "train_loss": 3.2471532821655273, "lr": 0.00013881217580101867, "tps": 233526, "wall": 5656.5} {"step": 20156, "train_loss": 3.245576858520508, "lr": 0.00013879507770815763, "tps": 233341, "wall": 5661.3} {"step": 20157, "train_loss": 3.286909818649292, "lr": 0.0001387779805351904, "tps": 233157, "wall": 5666.0} {"step": 20158, "train_loss": 3.221846580505371, "lr": 0.00013876088428231063, "tps": 232973, "wall": 5670.8} {"step": 20159, "train_loss": 3.139765739440918, "lr": 0.00013874378894971186, "tps": 232788, "wall": 5675.6} {"step": 20160, "train_loss": 3.2817537784576416, "lr": 0.0001387266945375879, "tps": 232604, "wall": 5680.3} {"step": 20161, "train_loss": 3.1909196376800537, "lr": 0.00013870960104613231, "tps": 232422, "wall": 5685.1} {"step": 20162, "train_loss": 3.3272929191589355, "lr": 0.0001386925084755388, "tps": 232239, "wall": 5689.8} {"step": 20163, "train_loss": 3.2262396812438965, "lr": 0.00013867541682600096, "tps": 232057, "wall": 5694.6} {"step": 20164, "train_loss": 3.2462377548217773, "lr": 0.00013865832609771234, "tps": 231874, "wall": 5699.3} {"step": 20165, "train_loss": 3.2326364517211914, "lr": 0.00013864123629086668, "tps": 231692, "wall": 5704.1} {"step": 20166, "train_loss": 3.1500487327575684, "lr": 0.00013862414740565746, "tps": 231511, "wall": 5708.9} {"step": 20167, "train_loss": 3.1925101280212402, "lr": 0.00013860705944227823, "tps": 231329, "wall": 5713.6} {"step": 20168, "train_loss": 3.14860200881958, "lr": 0.00013858997240092275, "tps": 231148, "wall": 5718.4} {"step": 20169, "train_loss": 3.2217493057250977, "lr": 0.00013857288628178443, "tps": 230968, "wall": 5723.1} {"step": 20170, "train_loss": 3.1179630756378174, "lr": 0.0001385558010850568, "tps": 230788, "wall": 5727.9} {"step": 20171, "train_loss": 3.255622386932373, "lr": 0.0001385387168109335, "tps": 230608, "wall": 5732.6} {"step": 20172, "train_loss": 3.1789143085479736, "lr": 0.0001385216334596081, "tps": 230426, "wall": 5737.4} {"step": 20173, "train_loss": 3.2840652465820312, "lr": 0.0001385045510312739, "tps": 230247, "wall": 5742.2} {"step": 20174, "train_loss": 3.2928216457366943, "lr": 0.00013848746952612465, "tps": 230068, "wall": 5746.9} {"step": 20175, "train_loss": 3.1887733936309814, "lr": 0.00013847038894435377, "tps": 229890, "wall": 5751.7} {"step": 20176, "train_loss": 3.219806671142578, "lr": 0.00013845330928615463, "tps": 229711, "wall": 5756.4} {"step": 20177, "train_loss": 3.209111213684082, "lr": 0.00013843623055172092, "tps": 229533, "wall": 5761.2} {"step": 20178, "train_loss": 3.232203960418701, "lr": 0.0001384191527412459, "tps": 229355, "wall": 5766.0} {"step": 20179, "train_loss": 3.171365976333618, "lr": 0.00013840207585492323, "tps": 229177, "wall": 5770.7} {"step": 20180, "train_loss": 3.1361119747161865, "lr": 0.00013838499989294627, "tps": 229000, "wall": 5775.5} {"step": 20181, "train_loss": 3.2524948120117188, "lr": 0.00013836792485550837, "tps": 228823, "wall": 5780.2} {"step": 20182, "train_loss": 3.1628122329711914, "lr": 0.00013835085074280308, "tps": 228646, "wall": 5785.0} {"step": 20183, "train_loss": 3.229619026184082, "lr": 0.00013833377755502376, "tps": 228469, "wall": 5789.7} {"step": 20184, "train_loss": 3.126828193664551, "lr": 0.00013831670529236377, "tps": 228290, "wall": 5794.6} {"step": 20185, "train_loss": 3.1475939750671387, "lr": 0.00013829963395501667, "tps": 228115, "wall": 5799.3} {"step": 20186, "train_loss": 3.3013062477111816, "lr": 0.00013828256354317568, "tps": 227939, "wall": 5804.1} {"step": 20187, "train_loss": 3.211092472076416, "lr": 0.00013826549405703418, "tps": 227765, "wall": 5808.8} {"step": 20188, "train_loss": 3.110560894012451, "lr": 0.00013824842549678564, "tps": 227590, "wall": 5813.5} {"step": 20189, "train_loss": 3.35916805267334, "lr": 0.0001382313578626234, "tps": 227415, "wall": 5818.3} {"step": 20190, "train_loss": 3.296027183532715, "lr": 0.00013821429115474065, "tps": 227241, "wall": 5823.0} {"step": 20191, "train_loss": 3.202608585357666, "lr": 0.00013819722537333095, "tps": 227066, "wall": 5827.8} {"step": 20192, "train_loss": 3.16446590423584, "lr": 0.00013818016051858747, "tps": 226892, "wall": 5832.6} {"step": 20193, "train_loss": 3.2076501846313477, "lr": 0.00013816309659070352, "tps": 226718, "wall": 5837.3} {"step": 20194, "train_loss": 3.2459328174591064, "lr": 0.00013814603358987246, "tps": 226546, "wall": 5842.1} {"step": 20195, "train_loss": 3.243391513824463, "lr": 0.00013812897151628753, "tps": 226373, "wall": 5846.8} {"step": 20196, "train_loss": 3.270900011062622, "lr": 0.0001381119103701421, "tps": 226200, "wall": 5851.6} {"step": 20197, "train_loss": 3.307056427001953, "lr": 0.00013809485015162936, "tps": 226025, "wall": 5856.4} {"step": 20198, "train_loss": 3.187182903289795, "lr": 0.00013807779086094256, "tps": 225853, "wall": 5861.2} {"step": 20199, "train_loss": 3.3521432876586914, "lr": 0.000138060732498275, "tps": 225681, "wall": 5865.9} {"step": 20200, "train_loss": 3.3059873580932617, "lr": 0.00013804367506381991, "tps": 225509, "wall": 5870.7} {"step": 20201, "train_loss": 3.324284791946411, "lr": 0.00013802661855777046, "tps": 225338, "wall": 5875.4} {"step": 20202, "train_loss": 3.2065348625183105, "lr": 0.00013800956298031997, "tps": 225167, "wall": 5880.2} {"step": 20203, "train_loss": 3.270657777786255, "lr": 0.00013799250833166157, "tps": 224997, "wall": 5884.9} {"step": 20204, "train_loss": 3.2947044372558594, "lr": 0.0001379754546119884, "tps": 224827, "wall": 5889.7} {"step": 20205, "train_loss": 3.29617977142334, "lr": 0.00013795840182149379, "tps": 224656, "wall": 5894.4} {"step": 20206, "train_loss": 3.2481937408447266, "lr": 0.00013794134996037086, "tps": 224486, "wall": 5899.2} {"step": 20207, "train_loss": 3.198902130126953, "lr": 0.0001379242990288127, "tps": 224316, "wall": 5903.9} {"step": 20208, "train_loss": 3.2844324111938477, "lr": 0.00013790724902701252, "tps": 224147, "wall": 5908.7} {"step": 20209, "train_loss": 3.2008323669433594, "lr": 0.00013789019995516353, "tps": 223978, "wall": 5913.4} {"step": 20210, "train_loss": 3.158738374710083, "lr": 0.0001378731518134587, "tps": 223807, "wall": 5918.2} {"step": 20211, "train_loss": 3.2227649688720703, "lr": 0.00013785610460209134, "tps": 223638, "wall": 5923.0} {"step": 20212, "train_loss": 3.2076117992401123, "lr": 0.00013783905832125443, "tps": 223470, "wall": 5927.8} {"step": 20213, "train_loss": 3.255948543548584, "lr": 0.0001378220129711411, "tps": 223302, "wall": 5932.5} {"step": 20214, "train_loss": 3.273622751235962, "lr": 0.00013780496855194448, "tps": 223135, "wall": 5937.3} {"step": 20215, "train_loss": 3.2296886444091797, "lr": 0.00013778792506385755, "tps": 222967, "wall": 5942.0} {"step": 20216, "train_loss": 3.2282679080963135, "lr": 0.00013777088250707353, "tps": 222800, "wall": 5946.8} {"step": 20217, "train_loss": 3.2660348415374756, "lr": 0.00013775384088178543, "tps": 222633, "wall": 5951.5} {"step": 20218, "train_loss": 3.2741472721099854, "lr": 0.00013773680018818615, "tps": 222466, "wall": 5956.3} {"step": 20219, "train_loss": 3.1821179389953613, "lr": 0.00013771976042646896, "tps": 222299, "wall": 5961.0} {"step": 20220, "train_loss": 3.204150676727295, "lr": 0.00013770272159682674, "tps": 222133, "wall": 5965.8} {"step": 20221, "train_loss": 3.2433881759643555, "lr": 0.00013768568369945254, "tps": 221967, "wall": 5970.6} {"step": 20222, "train_loss": 3.2174429893493652, "lr": 0.00013766864673453937, "tps": 221799, "wall": 5975.4} {"step": 20223, "train_loss": 3.2764861583709717, "lr": 0.00013765161070228022, "tps": 221634, "wall": 5980.1} {"step": 20224, "train_loss": 3.256632089614868, "lr": 0.00013763457560286808, "tps": 221468, "wall": 5984.9} {"step": 20225, "train_loss": 3.272481918334961, "lr": 0.00013761754143649593, "tps": 221304, "wall": 5989.6} {"step": 20226, "train_loss": 3.230292797088623, "lr": 0.00013760050820335677, "tps": 221139, "wall": 5994.4} {"step": 20227, "train_loss": 3.2429630756378174, "lr": 0.0001375834759036434, "tps": 220975, "wall": 5999.1} {"step": 20228, "train_loss": 3.4515178203582764, "lr": 0.00013756644453754893, "tps": 220810, "wall": 6003.9} {"step": 20229, "train_loss": 3.1782100200653076, "lr": 0.00013754941410526632, "tps": 220646, "wall": 6008.7} {"step": 20230, "train_loss": 3.2482752799987793, "lr": 0.00013753238460698826, "tps": 220481, "wall": 6013.5} {"step": 20231, "train_loss": 3.166210412979126, "lr": 0.00013751535604290788, "tps": 220319, "wall": 6018.2} {"step": 20232, "train_loss": 3.218651294708252, "lr": 0.00013749832841321798, "tps": 220156, "wall": 6022.9} {"step": 20233, "train_loss": 3.1080684661865234, "lr": 0.00013748130171811152, "tps": 219994, "wall": 6027.7} {"step": 20234, "train_loss": 3.2003726959228516, "lr": 0.00013746427595778135, "tps": 219831, "wall": 6032.4} {"step": 20235, "train_loss": 3.2368505001068115, "lr": 0.00013744725113242024, "tps": 219666, "wall": 6037.3} {"step": 20236, "train_loss": 3.248305559158325, "lr": 0.00013743022724222126, "tps": 219503, "wall": 6042.0} {"step": 20237, "train_loss": 3.275510311126709, "lr": 0.00013741320428737707, "tps": 219341, "wall": 6046.8} {"step": 20238, "train_loss": 3.2953786849975586, "lr": 0.00013739618226808054, "tps": 219180, "wall": 6051.6} {"step": 20239, "train_loss": 3.1469759941101074, "lr": 0.00013737916118452455, "tps": 219018, "wall": 6056.3} {"step": 20240, "train_loss": 3.2248263359069824, "lr": 0.00013736214103690191, "tps": 218857, "wall": 6061.1} {"step": 20241, "train_loss": 3.2188267707824707, "lr": 0.00013734512182540538, "tps": 218697, "wall": 6065.8} {"step": 20242, "train_loss": 3.254351854324341, "lr": 0.0001373281035502278, "tps": 218537, "wall": 6070.6} {"step": 20243, "train_loss": 3.243912935256958, "lr": 0.000137311086211562, "tps": 218376, "wall": 6075.3} {"step": 20244, "train_loss": 3.2706708908081055, "lr": 0.00013729406980960053, "tps": 218216, "wall": 6080.1} {"step": 20245, "train_loss": 3.2064924240112305, "lr": 0.00013727705434453643, "tps": 218057, "wall": 6084.8} {"step": 20246, "train_loss": 3.3560874462127686, "lr": 0.00013726003981656234, "tps": 217898, "wall": 6089.6} {"step": 20247, "train_loss": 3.366300582885742, "lr": 0.0001372430262258709, "tps": 217736, "wall": 6094.4} {"step": 20248, "train_loss": 3.3433475494384766, "lr": 0.00013722601357265502, "tps": 217577, "wall": 6099.1} {"step": 20249, "train_loss": 3.281816005706787, "lr": 0.00013720900185710728, "tps": 217418, "wall": 6103.9} {"step": 20250, "train_loss": 3.196805715560913, "lr": 0.00013719199107942048, "tps": 217259, "wall": 6108.7} {"step": 20251, "train_loss": 3.3017544746398926, "lr": 0.00013717498123978734, "tps": 217101, "wall": 6113.4} {"step": 20252, "train_loss": 3.2950377464294434, "lr": 0.00013715797233840036, "tps": 216944, "wall": 6118.2} {"step": 20253, "train_loss": 3.2595913410186768, "lr": 0.00013714096437545247, "tps": 216785, "wall": 6122.9} {"step": 20254, "train_loss": 3.2012624740600586, "lr": 0.0001371239573511362, "tps": 216628, "wall": 6127.7} {"step": 20255, "train_loss": 3.2247109413146973, "lr": 0.00013710695126564418, "tps": 216470, "wall": 6132.4} {"step": 20256, "train_loss": 3.178619623184204, "lr": 0.0001370899461191691, "tps": 216313, "wall": 6137.2} {"step": 20257, "train_loss": 3.225890636444092, "lr": 0.00013707294191190366, "tps": 216156, "wall": 6142.0} {"step": 20258, "train_loss": 3.1574206352233887, "lr": 0.0001370559386440403, "tps": 216000, "wall": 6146.7} {"step": 20259, "train_loss": 3.3313140869140625, "lr": 0.00013703893631577188, "tps": 215844, "wall": 6151.5} {"step": 20260, "train_loss": 3.2347660064697266, "lr": 0.00013702193492729086, "tps": 215685, "wall": 6156.3} {"step": 20261, "train_loss": 3.244708776473999, "lr": 0.00013700493447878976, "tps": 215529, "wall": 6161.0} {"step": 20262, "train_loss": 3.2597742080688477, "lr": 0.00013698793497046133, "tps": 215374, "wall": 6165.8} {"step": 20263, "train_loss": 3.164531707763672, "lr": 0.0001369709364024981, "tps": 215218, "wall": 6170.6} {"step": 20264, "train_loss": 3.2013630867004395, "lr": 0.00013695393877509245, "tps": 215063, "wall": 6175.3} {"step": 20265, "train_loss": 3.0804224014282227, "lr": 0.00013693694208843723, "tps": 214908, "wall": 6180.1} {"step": 20266, "train_loss": 3.2250585556030273, "lr": 0.00013691994634272475, "tps": 214753, "wall": 6184.9} {"step": 20267, "train_loss": 3.2178547382354736, "lr": 0.0001369029515381476, "tps": 214598, "wall": 6189.6} {"step": 20268, "train_loss": 3.098438262939453, "lr": 0.00013688595767489834, "tps": 214443, "wall": 6194.4} {"step": 20269, "train_loss": 3.134901285171509, "lr": 0.0001368689647531694, "tps": 214290, "wall": 6199.1} {"step": 20270, "train_loss": 3.3043668270111084, "lr": 0.00013685197277315335, "tps": 214136, "wall": 6203.9} {"step": 20271, "train_loss": 3.1656150817871094, "lr": 0.00013683498173504272, "tps": 213983, "wall": 6208.6} {"step": 20272, "train_loss": 3.2233619689941406, "lr": 0.0001368179916390298, "tps": 213830, "wall": 6213.4} {"step": 20273, "train_loss": 3.2703981399536133, "lr": 0.00013680100248530724, "tps": 213675, "wall": 6218.2} {"step": 20274, "train_loss": 3.265113353729248, "lr": 0.00013678401427406745, "tps": 213522, "wall": 6223.0} {"step": 20275, "train_loss": 3.2685232162475586, "lr": 0.00013676702700550277, "tps": 213370, "wall": 6227.7} {"step": 20276, "train_loss": 3.2954654693603516, "lr": 0.00013675004067980576, "tps": 213216, "wall": 6232.5} {"step": 20277, "train_loss": 3.253481864929199, "lr": 0.00013673305529716886, "tps": 213064, "wall": 6237.3} {"step": 20278, "train_loss": 3.297661542892456, "lr": 0.00013671607085778426, "tps": 212912, "wall": 6242.0} {"step": 20279, "train_loss": 3.1771676540374756, "lr": 0.0001366990873618446, "tps": 212761, "wall": 6246.8} {"step": 20280, "train_loss": 3.3386082649230957, "lr": 0.00013668210480954223, "tps": 212609, "wall": 6251.5} {"step": 20281, "train_loss": 3.1750454902648926, "lr": 0.0001366651232010694, "tps": 212458, "wall": 6256.3} {"step": 20282, "train_loss": 3.1930391788482666, "lr": 0.0001366481425366186, "tps": 212306, "wall": 6261.1} {"step": 20283, "train_loss": 3.189385414123535, "lr": 0.0001366311628163822, "tps": 212155, "wall": 6265.8} {"step": 20284, "train_loss": 3.2626352310180664, "lr": 0.00013661418404055237, "tps": 212005, "wall": 6270.6} {"step": 20285, "train_loss": 3.1602885723114014, "lr": 0.0001365972062093217, "tps": 211852, "wall": 6275.4} {"step": 20286, "train_loss": 3.270695686340332, "lr": 0.00013658022932288227, "tps": 211703, "wall": 6280.2} {"step": 20287, "train_loss": 3.2120676040649414, "lr": 0.0001365632533814266, "tps": 211553, "wall": 6284.9} {"step": 20288, "train_loss": 3.199958086013794, "lr": 0.00013654627838514692, "tps": 211403, "wall": 6289.7} {"step": 20289, "train_loss": 3.2564854621887207, "lr": 0.00013652930433423545, "tps": 211254, "wall": 6294.4} {"step": 20290, "train_loss": 3.2676467895507812, "lr": 0.00013651233122888458, "tps": 211105, "wall": 6299.2} {"step": 20291, "train_loss": 3.1979434490203857, "lr": 0.00013649535906928658, "tps": 210956, "wall": 6303.9} {"step": 20292, "train_loss": 3.166590690612793, "lr": 0.00013647838785563359, "tps": 210807, "wall": 6308.7} {"step": 20293, "train_loss": 3.2532379627227783, "lr": 0.000136461417588118, "tps": 210659, "wall": 6313.4} {"step": 20294, "train_loss": 3.2316739559173584, "lr": 0.00013644444826693195, "tps": 210511, "wall": 6318.2} {"step": 20295, "train_loss": 3.1956021785736084, "lr": 0.0001364274798922677, "tps": 210362, "wall": 6323.0} {"step": 20296, "train_loss": 3.224010467529297, "lr": 0.00013641051246431754, "tps": 210214, "wall": 6327.8} {"step": 20297, "train_loss": 3.2295258045196533, "lr": 0.00013639354598327357, "tps": 210066, "wall": 6332.5} {"step": 20298, "train_loss": 3.2127575874328613, "lr": 0.00013637658044932802, "tps": 209916, "wall": 6337.4} {"step": 20299, "train_loss": 3.1684746742248535, "lr": 0.00013635961586267313, "tps": 209769, "wall": 6342.1} {"step": 20300, "train_loss": 3.2271623611450195, "lr": 0.00013634265222350105, "tps": 209622, "wall": 6346.9} {"step": 20301, "train_loss": 3.2963027954101562, "lr": 0.00013632568953200383, "tps": 209476, "wall": 6351.6} {"step": 20302, "train_loss": 3.0867745876312256, "lr": 0.00013630872778837383, "tps": 209329, "wall": 6356.4} {"step": 20303, "train_loss": 3.223172903060913, "lr": 0.0001362917669928031, "tps": 209183, "wall": 6361.1} {"step": 20304, "train_loss": 3.331897735595703, "lr": 0.00013627480714548367, "tps": 209037, "wall": 6365.9} {"step": 20305, "train_loss": 3.2053465843200684, "lr": 0.00013625784824660784, "tps": 208891, "wall": 6370.6} {"step": 20306, "train_loss": 3.1725687980651855, "lr": 0.00013624089029636756, "tps": 208746, "wall": 6375.4} {"step": 20307, "train_loss": 3.29789400100708, "lr": 0.00013622393329495503, "tps": 208600, "wall": 6380.2} {"step": 20308, "train_loss": 3.2390494346618652, "lr": 0.00013620697724256236, "tps": 208455, "wall": 6384.9} {"step": 20309, "train_loss": 3.21136474609375, "lr": 0.0001361900221393815, "tps": 208310, "wall": 6389.7} {"step": 20310, "train_loss": 3.2240688800811768, "lr": 0.0001361730679856047, "tps": 208163, "wall": 6394.5} {"step": 20311, "train_loss": 3.1440083980560303, "lr": 0.00013615611478142388, "tps": 208019, "wall": 6399.2} {"step": 20312, "train_loss": 3.268683433532715, "lr": 0.0001361391625270311, "tps": 207874, "wall": 6404.0} {"step": 20313, "train_loss": 3.187352180480957, "lr": 0.00013612221122261855, "tps": 207730, "wall": 6408.8} {"step": 20314, "train_loss": 3.2444660663604736, "lr": 0.00013610526086837798, "tps": 207585, "wall": 6413.6} {"step": 20315, "train_loss": 3.3244376182556152, "lr": 0.00013608831146450165, "tps": 207441, "wall": 6418.3} {"step": 20316, "train_loss": 3.1906776428222656, "lr": 0.00013607136301118145, "tps": 207298, "wall": 6423.1} {"step": 20317, "train_loss": 3.3174543380737305, "lr": 0.0001360544155086093, "tps": 207155, "wall": 6427.8} {"step": 20318, "train_loss": 3.2755050659179688, "lr": 0.00013603746895697735, "tps": 207012, "wall": 6432.6} {"step": 20319, "train_loss": 3.1619184017181396, "lr": 0.00013602052335647753, "tps": 206867, "wall": 6437.4} {"step": 20320, "train_loss": 3.3423876762390137, "lr": 0.00013600357870730164, "tps": 206725, "wall": 6442.2} {"step": 20321, "train_loss": 3.25521183013916, "lr": 0.00013598663500964184, "tps": 206582, "wall": 6446.9} {"step": 20322, "train_loss": 3.283172369003296, "lr": 0.00013596969226368997, "tps": 206440, "wall": 6451.7} {"step": 20323, "train_loss": 3.283308267593384, "lr": 0.000135952750469638, "tps": 206296, "wall": 6456.5} {"step": 20324, "train_loss": 3.2007880210876465, "lr": 0.00013593580962767779, "tps": 206154, "wall": 6461.3} {"step": 20325, "train_loss": 3.249699592590332, "lr": 0.0001359188697380013, "tps": 206012, "wall": 6466.0} {"step": 20326, "train_loss": 3.3113203048706055, "lr": 0.00013590193080080033, "tps": 205871, "wall": 6470.8} {"step": 20327, "train_loss": 3.2031075954437256, "lr": 0.00013588499281626693, "tps": 205731, "wall": 6475.5} {"step": 20328, "train_loss": 3.213724136352539, "lr": 0.00013586805578459277, "tps": 205590, "wall": 6480.3} {"step": 20329, "train_loss": 3.382561206817627, "lr": 0.00013585111970596992, "tps": 205449, "wall": 6485.0} {"step": 20330, "train_loss": 3.1960432529449463, "lr": 0.00013583418458059017, "tps": 205309, "wall": 6489.8} {"step": 20331, "train_loss": 3.3261146545410156, "lr": 0.00013581725040864523, "tps": 205168, "wall": 6494.5} {"step": 20332, "train_loss": 3.29312801361084, "lr": 0.00013580031719032708, "tps": 205028, "wall": 6499.3} {"step": 20333, "train_loss": 3.2127182483673096, "lr": 0.00013578338492582748, "tps": 204888, "wall": 6504.1} {"step": 20334, "train_loss": 3.1739041805267334, "lr": 0.00013576645361533825, "tps": 204749, "wall": 6508.8} {"step": 20335, "train_loss": 3.1573305130004883, "lr": 0.00013574952325905122, "tps": 204609, "wall": 6513.6} {"step": 20336, "train_loss": 3.189138412475586, "lr": 0.00013573259385715812, "tps": 204468, "wall": 6518.4} {"step": 20337, "train_loss": 3.254424571990967, "lr": 0.00013571566540985074, "tps": 204329, "wall": 6523.1} {"step": 20338, "train_loss": 3.2075893878936768, "lr": 0.0001356987379173209, "tps": 204191, "wall": 6527.9} {"step": 20339, "train_loss": 3.262329339981079, "lr": 0.00013568181137976035, "tps": 204052, "wall": 6532.6} {"step": 20340, "train_loss": 3.0934128761291504, "lr": 0.00013566488579736067, "tps": 203914, "wall": 6537.4} {"step": 20341, "train_loss": 3.216012477874756, "lr": 0.00013564796117031386, "tps": 203776, "wall": 6542.1} {"step": 20342, "train_loss": 3.3319637775421143, "lr": 0.0001356310374988115, "tps": 203638, "wall": 6546.9} {"step": 20343, "train_loss": 3.356078624725342, "lr": 0.0001356141147830452, "tps": 203500, "wall": 6551.7} {"step": 20344, "train_loss": 3.163996696472168, "lr": 0.00013559719302320687, "tps": 203361, "wall": 6556.4} {"step": 20345, "train_loss": 3.21012544631958, "lr": 0.0001355802722194881, "tps": 203223, "wall": 6561.2} {"step": 20346, "train_loss": 3.222745656967163, "lr": 0.00013556335237208052, "tps": 203086, "wall": 6566.0} {"step": 20347, "train_loss": 3.3061752319335938, "lr": 0.0001355464334811759, "tps": 202949, "wall": 6570.7} {"step": 20348, "train_loss": 3.189617156982422, "lr": 0.0001355295155469658, "tps": 202811, "wall": 6575.5} {"step": 20349, "train_loss": 3.303628444671631, "lr": 0.00013551259856964194, "tps": 202674, "wall": 6580.3} {"step": 20350, "train_loss": 3.1631321907043457, "lr": 0.000135495682549396, "tps": 202538, "wall": 6585.0} {"step": 20351, "train_loss": 3.31057071685791, "lr": 0.00013547876748641944, "tps": 202402, "wall": 6589.8} {"step": 20352, "train_loss": 3.279472827911377, "lr": 0.00013546185338090405, "tps": 202266, "wall": 6594.5} {"step": 20353, "train_loss": 3.1134960651397705, "lr": 0.00013544494023304135, "tps": 202130, "wall": 6599.3} {"step": 20354, "train_loss": 3.345065116882324, "lr": 0.00013542802804302286, "tps": 201994, "wall": 6604.1} {"step": 20355, "train_loss": 3.255680561065674, "lr": 0.00013541111681104035, "tps": 201859, "wall": 6608.8} {"step": 20356, "train_loss": 3.1613245010375977, "lr": 0.00013539420653728524, "tps": 201724, "wall": 6613.6} {"step": 20357, "train_loss": 3.1854352951049805, "lr": 0.00013537729722194912, "tps": 201589, "wall": 6618.3} {"step": 20358, "train_loss": 3.171919345855713, "lr": 0.00013536038886522358, "tps": 201454, "wall": 6623.1} {"step": 20359, "train_loss": 3.229196548461914, "lr": 0.00013534348146730015, "tps": 201319, "wall": 6627.8} {"step": 20360, "train_loss": 3.2945117950439453, "lr": 0.00013532657502837028, "tps": 201184, "wall": 6632.6} {"step": 20361, "train_loss": 3.2512736320495605, "lr": 0.0001353096695486256, "tps": 201048, "wall": 6637.4} {"step": 20362, "train_loss": 3.2097458839416504, "lr": 0.00013529276502825756, "tps": 200914, "wall": 6642.2} {"step": 20363, "train_loss": 3.2547097206115723, "lr": 0.0001352758614674576, "tps": 200780, "wall": 6646.9} {"step": 20364, "train_loss": 3.180023193359375, "lr": 0.00013525895886641736, "tps": 200646, "wall": 6651.7} {"step": 20365, "train_loss": 3.216188907623291, "lr": 0.00013524205722532812, "tps": 200513, "wall": 6656.5} {"step": 20366, "train_loss": 3.2605855464935303, "lr": 0.00013522515654438154, "tps": 200379, "wall": 6661.2} {"step": 20367, "train_loss": 3.209519147872925, "lr": 0.00013520825682376893, "tps": 200246, "wall": 6666.0} {"step": 20368, "train_loss": 3.288983106613159, "lr": 0.0001351913580636817, "tps": 200114, "wall": 6670.7} {"step": 20369, "train_loss": 3.272742748260498, "lr": 0.00013517446026431148, "tps": 199980, "wall": 6675.5} {"step": 20370, "train_loss": 3.1469531059265137, "lr": 0.00013515756342584952, "tps": 199848, "wall": 6680.2} {"step": 20371, "train_loss": 3.1723134517669678, "lr": 0.0001351406675484872, "tps": 199715, "wall": 6685.0} {"step": 20372, "train_loss": 3.1813416481018066, "lr": 0.0001351237726324161, "tps": 199583, "wall": 6689.8} {"step": 20373, "train_loss": 3.2383694648742676, "lr": 0.00013510687867782743, "tps": 199449, "wall": 6694.6} {"step": 20374, "train_loss": 3.2674574851989746, "lr": 0.00013508998568491262, "tps": 199317, "wall": 6699.3} {"step": 20375, "train_loss": 3.2597403526306152, "lr": 0.00013507309365386308, "tps": 199186, "wall": 6704.1} {"step": 20376, "train_loss": 3.176821231842041, "lr": 0.00013505620258487015, "tps": 199054, "wall": 6708.9} {"step": 20377, "train_loss": 3.214625835418701, "lr": 0.00013503931247812507, "tps": 198922, "wall": 6713.6} {"step": 20378, "train_loss": 3.2526955604553223, "lr": 0.00013502242333381933, "tps": 198791, "wall": 6718.4} {"step": 20379, "train_loss": 3.19881534576416, "lr": 0.00013500553515214417, "tps": 198661, "wall": 6723.1} {"step": 20380, "train_loss": 3.2551536560058594, "lr": 0.00013498864793329087, "tps": 198530, "wall": 6727.9} {"step": 20381, "train_loss": 3.279520034790039, "lr": 0.0001349717616774508, "tps": 198399, "wall": 6732.6} {"step": 20382, "train_loss": 3.1907403469085693, "lr": 0.00013495487638481515, "tps": 198269, "wall": 6737.4} {"step": 20383, "train_loss": 3.2413277626037598, "lr": 0.00013493799205557534, "tps": 198139, "wall": 6742.2} {"step": 20384, "train_loss": 3.1696572303771973, "lr": 0.00013492110868992255, "tps": 198009, "wall": 6746.9} {"step": 20385, "train_loss": 3.2510952949523926, "lr": 0.00013490422628804796, "tps": 197879, "wall": 6751.7} {"step": 20386, "train_loss": 3.282480478286743, "lr": 0.00013488734485014297, "tps": 197748, "wall": 6756.5} {"step": 20387, "train_loss": 3.351085662841797, "lr": 0.00013487046437639876, "tps": 197618, "wall": 6761.2} {"step": 20388, "train_loss": 3.1881141662597656, "lr": 0.00013485358486700646, "tps": 197488, "wall": 6766.0} {"step": 20389, "train_loss": 3.336724042892456, "lr": 0.00013483670632215744, "tps": 197360, "wall": 6770.8} {"step": 20390, "train_loss": 3.233491897583008, "lr": 0.0001348198287420428, "tps": 197231, "wall": 6775.5} {"step": 20391, "train_loss": 3.237936496734619, "lr": 0.00013480295212685368, "tps": 197102, "wall": 6780.3} {"step": 20392, "train_loss": 3.233189582824707, "lr": 0.0001347860764767814, "tps": 196973, "wall": 6785.1} {"step": 20393, "train_loss": 3.189460277557373, "lr": 0.00013476920179201707, "tps": 196845, "wall": 6789.8} {"step": 20394, "train_loss": 3.2329859733581543, "lr": 0.00013475232807275175, "tps": 196716, "wall": 6794.6} {"step": 20395, "train_loss": 3.2561731338500977, "lr": 0.00013473545531917668, "tps": 196589, "wall": 6799.3} {"step": 20396, "train_loss": 3.28717041015625, "lr": 0.00013471858353148307, "tps": 196461, "wall": 6804.1} {"step": 20397, "train_loss": 3.2421834468841553, "lr": 0.00013470171270986184, "tps": 196334, "wall": 6808.8} {"step": 20398, "train_loss": 3.201056957244873, "lr": 0.00013468484285450436, "tps": 196207, "wall": 6813.6} {"step": 20399, "train_loss": 3.20231294631958, "lr": 0.00013466797396560155, "tps": 196078, "wall": 6818.4} {"step": 20400, "train_loss": 3.2496254444122314, "lr": 0.00013465110604334444, "tps": 195951, "wall": 6823.1} {"step": 20401, "train_loss": 3.266540765762329, "lr": 0.00013463423908792433, "tps": 195824, "wall": 6827.9} {"step": 20402, "train_loss": 3.201026201248169, "lr": 0.0001346173730995321, "tps": 195697, "wall": 6832.6} {"step": 20403, "train_loss": 3.2766988277435303, "lr": 0.00013460050807835897, "tps": 195570, "wall": 6837.4} {"step": 20404, "train_loss": 3.200808048248291, "lr": 0.0001345836440245959, "tps": 195444, "wall": 6842.2} {"step": 20405, "train_loss": 3.188546657562256, "lr": 0.00013456678093843385, "tps": 195317, "wall": 6846.9} {"step": 20406, "train_loss": 3.162091016769409, "lr": 0.00013454991882006403, "tps": 195191, "wall": 6851.7} {"step": 20407, "train_loss": 3.1675286293029785, "lr": 0.00013453305766967732, "tps": 195066, "wall": 6856.4} {"step": 20408, "train_loss": 3.338846445083618, "lr": 0.0001345161974874647, "tps": 194940, "wall": 6861.2} {"step": 20409, "train_loss": 3.257042407989502, "lr": 0.00013449933827361726, "tps": 194815, "wall": 6865.9} {"step": 20410, "train_loss": 3.218893051147461, "lr": 0.00013448248002832599, "tps": 194689, "wall": 6870.7} {"step": 20411, "train_loss": 3.323065757751465, "lr": 0.00013446562275178168, "tps": 194562, "wall": 6875.5} {"step": 20412, "train_loss": 3.27424955368042, "lr": 0.00013444876644417555, "tps": 194437, "wall": 6880.3} {"step": 20413, "train_loss": 3.148074150085449, "lr": 0.0001344319111056984, "tps": 194312, "wall": 6885.0} {"step": 20414, "train_loss": 3.2871036529541016, "lr": 0.00013441505673654112, "tps": 194188, "wall": 6889.8} {"step": 20415, "train_loss": 3.1993000507354736, "lr": 0.00013439820333689478, "tps": 194063, "wall": 6894.6} {"step": 20416, "train_loss": 3.2343180179595947, "lr": 0.00013438135090695018, "tps": 193939, "wall": 6899.3} {"step": 20417, "train_loss": 3.2107911109924316, "lr": 0.00013436449944689827, "tps": 193814, "wall": 6904.1} {"step": 20418, "train_loss": 3.3212170600891113, "lr": 0.00013434764895692996, "tps": 193691, "wall": 6908.8} {"step": 20419, "train_loss": 3.146495819091797, "lr": 0.00013433079943723608, "tps": 193567, "wall": 6913.6} {"step": 20420, "train_loss": 3.179767608642578, "lr": 0.0001343139508880076, "tps": 193443, "wall": 6918.4} {"step": 20421, "train_loss": 3.213400363922119, "lr": 0.0001342971033094353, "tps": 193319, "wall": 6923.1} {"step": 20422, "train_loss": 3.2168989181518555, "lr": 0.00013428025670171004, "tps": 193195, "wall": 6927.9} {"step": 20423, "train_loss": 3.163872718811035, "lr": 0.00013426341106502268, "tps": 193072, "wall": 6932.7} {"step": 20424, "train_loss": 3.1712327003479004, "lr": 0.00013424656639956405, "tps": 192947, "wall": 6937.5} {"step": 20425, "train_loss": 3.2091634273529053, "lr": 0.00013422972270552488, "tps": 192824, "wall": 6942.3} {"step": 20426, "train_loss": 3.214953660964966, "lr": 0.00013421287998309614, "tps": 192702, "wall": 6947.0} {"step": 20427, "train_loss": 3.1390342712402344, "lr": 0.00013419603823246854, "tps": 192579, "wall": 6951.8} {"step": 20428, "train_loss": 3.2786808013916016, "lr": 0.00013417919745383275, "tps": 192457, "wall": 6956.5} {"step": 20429, "train_loss": 3.1980042457580566, "lr": 0.00013416235764737976, "tps": 192335, "wall": 6961.3} {"step": 20430, "train_loss": 3.2920892238616943, "lr": 0.00013414551881330025, "tps": 192213, "wall": 6966.0} {"step": 20431, "train_loss": 3.23043155670166, "lr": 0.00013412868095178483, "tps": 192092, "wall": 6970.8} {"step": 20432, "train_loss": 3.2872378826141357, "lr": 0.00013411184406302443, "tps": 191969, "wall": 6975.6} {"step": 20433, "train_loss": 3.203054666519165, "lr": 0.00013409500814720972, "tps": 191848, "wall": 6980.3} {"step": 20434, "train_loss": 3.2644495964050293, "lr": 0.00013407817320453135, "tps": 191727, "wall": 6985.0} {"step": 20435, "train_loss": 3.234210252761841, "lr": 0.00013406133923518014, "tps": 191606, "wall": 6989.8} {"step": 20436, "train_loss": 3.222041130065918, "lr": 0.00013404450623934663, "tps": 191483, "wall": 6994.6} {"step": 20437, "train_loss": 3.198563575744629, "lr": 0.00013402767421722173, "tps": 191363, "wall": 6999.4} {"step": 20438, "train_loss": 3.2157928943634033, "lr": 0.00013401084316899597, "tps": 191242, "wall": 7004.2} {"step": 20439, "train_loss": 3.140204906463623, "lr": 0.00013399401309485996, "tps": 191121, "wall": 7008.9} {"step": 20440, "train_loss": 3.192072868347168, "lr": 0.00013397718399500445, "tps": 191000, "wall": 7013.7} {"step": 20441, "train_loss": 3.0238490104675293, "lr": 0.0001339603558696201, "tps": 190880, "wall": 7018.4} {"step": 20442, "train_loss": 3.2246367931365967, "lr": 0.0001339435287188974, "tps": 190761, "wall": 7023.2} {"step": 20443, "train_loss": 3.227820634841919, "lr": 0.00013392670254302715, "tps": 190641, "wall": 7027.9} {"step": 20444, "train_loss": 3.1008141040802, "lr": 0.00013390987734219985, "tps": 190521, "wall": 7032.7} {"step": 20445, "train_loss": 3.2477798461914062, "lr": 0.00013389305311660606, "tps": 190402, "wall": 7037.5} {"step": 20446, "train_loss": 3.2355399131774902, "lr": 0.00013387622986643646, "tps": 190282, "wall": 7042.2} {"step": 20447, "train_loss": 3.2625269889831543, "lr": 0.0001338594075918816, "tps": 190163, "wall": 7047.0} {"step": 20448, "train_loss": 3.2466964721679688, "lr": 0.000133842586293132, "tps": 190044, "wall": 7051.8} {"step": 20449, "train_loss": 3.048534393310547, "lr": 0.00013382576597037834, "tps": 189923, "wall": 7056.6} {"step": 20450, "train_loss": 3.1502387523651123, "lr": 0.000133808946623811, "tps": 189804, "wall": 7061.4} {"step": 20451, "train_loss": 3.2300872802734375, "lr": 0.00013379212825362054, "tps": 189685, "wall": 7066.1} {"step": 20452, "train_loss": 3.17171049118042, "lr": 0.00013377531085999756, "tps": 189567, "wall": 7070.9} {"step": 20453, "train_loss": 3.204139232635498, "lr": 0.0001337584944431325, "tps": 189449, "wall": 7075.6} {"step": 20454, "train_loss": 3.008485794067383, "lr": 0.00013374167900321584, "tps": 189331, "wall": 7080.4} {"step": 20455, "train_loss": 3.2713782787323, "lr": 0.00013372486454043818, "tps": 189212, "wall": 7085.2} {"step": 20456, "train_loss": 3.1297831535339355, "lr": 0.0001337080510549898, "tps": 189094, "wall": 7090.0} {"step": 20457, "train_loss": 3.178770065307617, "lr": 0.00013369123854706144, "tps": 188976, "wall": 7094.7} {"step": 20458, "train_loss": 3.305238962173462, "lr": 0.00013367442701684337, "tps": 188858, "wall": 7099.5} {"step": 20459, "train_loss": 3.2874460220336914, "lr": 0.000133657616464526, "tps": 188741, "wall": 7104.3} {"step": 20460, "train_loss": 3.2907400131225586, "lr": 0.00013364080689029988, "tps": 188623, "wall": 7109.0} {"step": 20461, "train_loss": 3.2028324604034424, "lr": 0.00013362399829435536, "tps": 188507, "wall": 7113.8} {"step": 20462, "train_loss": 3.303443431854248, "lr": 0.0001336071906768828, "tps": 188388, "wall": 7118.6} {"step": 20463, "train_loss": 3.1558051109313965, "lr": 0.00013359038403807275, "tps": 188272, "wall": 7123.3} {"step": 20464, "train_loss": 3.165804386138916, "lr": 0.00013357357837811545, "tps": 188155, "wall": 7128.1} {"step": 20465, "train_loss": 3.241726875305176, "lr": 0.0001335567736972013, "tps": 188038, "wall": 7132.9} {"step": 20466, "train_loss": 3.2791261672973633, "lr": 0.00013353996999552076, "tps": 187922, "wall": 7137.7} {"step": 20467, "train_loss": 3.218547821044922, "lr": 0.00013352316727326412, "tps": 187806, "wall": 7142.4} {"step": 20468, "train_loss": 3.306337594985962, "lr": 0.00013350636553062165, "tps": 187690, "wall": 7147.2} {"step": 20469, "train_loss": 3.2626209259033203, "lr": 0.0001334895647677838, "tps": 187574, "wall": 7151.9} {"step": 20470, "train_loss": 3.1813201904296875, "lr": 0.00013347276498494086, "tps": 187459, "wall": 7156.7} {"step": 20471, "train_loss": 3.14701247215271, "lr": 0.000133455966182283, "tps": 187343, "wall": 7161.5} {"step": 20472, "train_loss": 3.20980167388916, "lr": 0.00013343916836000078, "tps": 187227, "wall": 7166.2} {"step": 20473, "train_loss": 3.1080398559570312, "lr": 0.00013342237151828422, "tps": 187112, "wall": 7171.0} {"step": 20474, "train_loss": 3.2907824516296387, "lr": 0.0001334055756573238, "tps": 186995, "wall": 7175.8} {"step": 20475, "train_loss": 3.3249943256378174, "lr": 0.0001333887807773097, "tps": 186880, "wall": 7180.6} {"step": 20476, "train_loss": 3.1779677867889404, "lr": 0.00013337198687843219, "tps": 186765, "wall": 7185.4} {"step": 20477, "train_loss": 3.1667048931121826, "lr": 0.00013335519396088147, "tps": 186649, "wall": 7190.2} {"step": 20478, "train_loss": 3.300562858581543, "lr": 0.0001333384020248478, "tps": 186534, "wall": 7195.0} {"step": 20479, "train_loss": 3.283839702606201, "lr": 0.00013332161107052138, "tps": 186420, "wall": 7199.7} {"step": 20480, "train_loss": 3.1681466102600098, "lr": 0.0001333048210980925, "tps": 186305, "wall": 7204.5} {"step": 20481, "train_loss": 3.1993980407714844, "lr": 0.0001332880321077513, "tps": 186191, "wall": 7209.3} {"step": 20482, "train_loss": 3.168170928955078, "lr": 0.00013327124409968794, "tps": 186077, "wall": 7214.0} {"step": 20483, "train_loss": 3.1286892890930176, "lr": 0.00013325445707409265, "tps": 185964, "wall": 7218.8} {"step": 20484, "train_loss": 3.138457775115967, "lr": 0.00013323767103115544, "tps": 185850, "wall": 7223.6} {"step": 20485, "train_loss": 3.1955156326293945, "lr": 0.00013322088597106667, "tps": 185737, "wall": 7228.3} {"step": 20486, "train_loss": 3.1871466636657715, "lr": 0.00013320410189401644, "tps": 185623, "wall": 7233.1} {"step": 20487, "train_loss": 3.1292014122009277, "lr": 0.00013318731880019474, "tps": 185508, "wall": 7238.0} {"step": 20488, "train_loss": 3.13114857673645, "lr": 0.00013317053668979187, "tps": 185395, "wall": 7242.7} {"step": 20489, "train_loss": 3.2428677082061768, "lr": 0.00013315375556299786, "tps": 185282, "wall": 7247.5} {"step": 20490, "train_loss": 3.2523298263549805, "lr": 0.00013313697542000275, "tps": 185170, "wall": 7252.2} {"step": 20491, "train_loss": 3.259737014770508, "lr": 0.0001331201962609967, "tps": 185057, "wall": 7257.0} {"step": 20492, "train_loss": 3.109525680541992, "lr": 0.0001331034180861698, "tps": 184944, "wall": 7261.8} {"step": 20493, "train_loss": 3.264265298843384, "lr": 0.00013308664089571202, "tps": 184832, "wall": 7266.6} {"step": 20494, "train_loss": 3.1239004135131836, "lr": 0.00013306986468981352, "tps": 184719, "wall": 7271.3} {"step": 20495, "train_loss": 3.2707977294921875, "lr": 0.0001330530894686643, "tps": 184607, "wall": 7276.1} {"step": 20496, "train_loss": 3.1184704303741455, "lr": 0.00013303631523245435, "tps": 184496, "wall": 7280.9} {"step": 20497, "train_loss": 3.181334972381592, "lr": 0.00013301954198137374, "tps": 184384, "wall": 7285.6} {"step": 20498, "train_loss": 3.243043899536133, "lr": 0.00013300276971561244, "tps": 184272, "wall": 7290.4} {"step": 20499, "train_loss": 3.2486536502838135, "lr": 0.00013298599843536053, "tps": 184158, "wall": 7295.3} {"step": 20500, "train_loss": 3.0620810985565186, "lr": 0.00013296922814080793, "tps": 184047, "wall": 7300.1} {"step": 20501, "train_loss": 3.206723213195801, "lr": 0.00013295245883214454, "tps": 183931, "wall": 7305.0} {"step": 20502, "train_loss": 3.1594579219818115, "lr": 0.0001329356905095605, "tps": 183820, "wall": 7309.7} {"step": 20503, "train_loss": 3.284555673599243, "lr": 0.00013291892317324563, "tps": 183709, "wall": 7314.5} {"step": 20504, "train_loss": 3.1921536922454834, "lr": 0.0001329021568233899, "tps": 183598, "wall": 7319.3} {"step": 20505, "train_loss": 3.1292710304260254, "lr": 0.00013288539146018326, "tps": 183488, "wall": 7324.1} {"step": 20506, "train_loss": 3.0938823223114014, "lr": 0.00013286862708381564, "tps": 183377, "wall": 7328.8} {"step": 20507, "train_loss": 3.2112491130828857, "lr": 0.00013285186369447688, "tps": 183266, "wall": 7333.6} {"step": 20508, "train_loss": 3.2163245677948, "lr": 0.000132835101292357, "tps": 183156, "wall": 7338.4} {"step": 20509, "train_loss": 3.2730329036712646, "lr": 0.00013281833987764576, "tps": 183045, "wall": 7343.2} {"step": 20510, "train_loss": 3.17529559135437, "lr": 0.000132801579450533, "tps": 182935, "wall": 7348.0} {"step": 20511, "train_loss": 3.2258853912353516, "lr": 0.0001327848200112088, "tps": 182825, "wall": 7352.8} {"step": 20512, "train_loss": 3.272282123565674, "lr": 0.00013276806155986285, "tps": 182714, "wall": 7357.6} {"step": 20513, "train_loss": 3.3408632278442383, "lr": 0.00013275130409668492, "tps": 182604, "wall": 7362.4} {"step": 20514, "train_loss": 3.2360267639160156, "lr": 0.00013273454762186506, "tps": 182495, "wall": 7367.1} {"step": 20515, "train_loss": 3.2599542140960693, "lr": 0.00013271779213559287, "tps": 182386, "wall": 7371.9} {"step": 20516, "train_loss": 3.2091426849365234, "lr": 0.00013270103763805832, "tps": 182277, "wall": 7376.7} {"step": 20517, "train_loss": 3.243656873703003, "lr": 0.0001326842841294511, "tps": 182168, "wall": 7381.4} {"step": 20518, "train_loss": 3.296485662460327, "lr": 0.00013266753160996104, "tps": 182059, "wall": 7386.2} {"step": 20519, "train_loss": 3.098538398742676, "lr": 0.00013265078007977793, "tps": 181951, "wall": 7391.0} {"step": 20520, "train_loss": 3.242785930633545, "lr": 0.0001326340295390915, "tps": 181842, "wall": 7395.8} {"step": 20521, "train_loss": 3.2839488983154297, "lr": 0.00013261727998809146, "tps": 181733, "wall": 7400.5} {"step": 20522, "train_loss": 3.152229070663452, "lr": 0.00013260053142696767, "tps": 181624, "wall": 7405.3} {"step": 20523, "train_loss": 3.2234673500061035, "lr": 0.00013258378385590976, "tps": 181516, "wall": 7410.1} {"step": 20524, "train_loss": 3.26762318611145, "lr": 0.00013256703727510745, "tps": 181407, "wall": 7415.0} {"step": 20525, "train_loss": 3.1058900356292725, "lr": 0.00013255029168475051, "tps": 181300, "wall": 7419.7} {"step": 20526, "train_loss": 3.080942153930664, "lr": 0.00013253354708502862, "tps": 181192, "wall": 7424.5} {"step": 20527, "train_loss": 3.136813163757324, "lr": 0.00013251680347613136, "tps": 181085, "wall": 7429.2} {"step": 20528, "train_loss": 3.2174527645111084, "lr": 0.00013250006085824856, "tps": 180977, "wall": 7434.0} {"step": 20529, "train_loss": 3.327327251434326, "lr": 0.0001324833192315698, "tps": 180870, "wall": 7438.8} {"step": 20530, "train_loss": 3.2590479850769043, "lr": 0.00013246657859628463, "tps": 180763, "wall": 7443.5} {"step": 20531, "train_loss": 3.230801582336426, "lr": 0.00013244983895258292, "tps": 180656, "wall": 7448.3} {"step": 20532, "train_loss": 3.184624671936035, "lr": 0.00013243310030065412, "tps": 180549, "wall": 7453.1} {"step": 20533, "train_loss": 3.222454786300659, "lr": 0.00013241636264068785, "tps": 180442, "wall": 7457.9} {"step": 20534, "train_loss": 3.1667044162750244, "lr": 0.00013239962597287383, "tps": 180335, "wall": 7462.7} {"step": 20535, "train_loss": 3.273191452026367, "lr": 0.00013238289029740154, "tps": 180229, "wall": 7467.4} {"step": 20536, "train_loss": 3.1555635929107666, "lr": 0.00013236615561446063, "tps": 180123, "wall": 7472.2} {"step": 20537, "train_loss": 3.219813823699951, "lr": 0.00013234942192424072, "tps": 180015, "wall": 7477.0} {"step": 20538, "train_loss": 3.219275951385498, "lr": 0.00013233268922693115, "tps": 179909, "wall": 7481.8} {"step": 20539, "train_loss": 3.1920058727264404, "lr": 0.00013231595752272174, "tps": 179803, "wall": 7486.5} {"step": 20540, "train_loss": 3.140568494796753, "lr": 0.00013229922681180193, "tps": 179697, "wall": 7491.3} {"step": 20541, "train_loss": 3.194056510925293, "lr": 0.0001322824970943611, "tps": 179592, "wall": 7496.1} {"step": 20542, "train_loss": 3.2782576084136963, "lr": 0.00013226576837058898, "tps": 179486, "wall": 7500.9} {"step": 20543, "train_loss": 3.2246713638305664, "lr": 0.00013224904064067493, "tps": 179381, "wall": 7505.6} {"step": 20544, "train_loss": 3.1974198818206787, "lr": 0.0001322323139048085, "tps": 179276, "wall": 7510.4} {"step": 20545, "train_loss": 3.23329758644104, "lr": 0.0001322155881631792, "tps": 179171, "wall": 7515.2} {"step": 20546, "train_loss": 3.174142360687256, "lr": 0.0001321988634159765, "tps": 179066, "wall": 7519.9} {"step": 20547, "train_loss": 3.264392852783203, "lr": 0.00013218213966338972, "tps": 178960, "wall": 7524.7} {"step": 20548, "train_loss": 3.1992926597595215, "lr": 0.00013216541690560848, "tps": 178856, "wall": 7529.5} {"step": 20549, "train_loss": 3.2965962886810303, "lr": 0.00013214869514282217, "tps": 178750, "wall": 7534.3} {"step": 20550, "train_loss": 3.2726199626922607, "lr": 0.00013213197437522012, "tps": 178645, "wall": 7539.1} {"step": 20551, "train_loss": 3.257071018218994, "lr": 0.00013211525460299188, "tps": 178541, "wall": 7543.9} {"step": 20552, "train_loss": 3.2399120330810547, "lr": 0.00013209853582632673, "tps": 178437, "wall": 7548.6} {"step": 20553, "train_loss": 3.252535343170166, "lr": 0.0001320818180454142, "tps": 178333, "wall": 7553.4} {"step": 20554, "train_loss": 3.2253615856170654, "lr": 0.00013206510126044353, "tps": 178229, "wall": 7558.2} {"step": 20555, "train_loss": 3.253046989440918, "lr": 0.00013204838547160413, "tps": 178124, "wall": 7563.0} {"step": 20556, "train_loss": 3.3098955154418945, "lr": 0.0001320316706790855, "tps": 178021, "wall": 7567.8} {"step": 20557, "train_loss": 3.184098720550537, "lr": 0.00013201495688307678, "tps": 177917, "wall": 7572.5} {"step": 20558, "train_loss": 3.218179702758789, "lr": 0.00013199824408376736, "tps": 177814, "wall": 7577.3} {"step": 20559, "train_loss": 3.269763708114624, "lr": 0.00013198153228134664, "tps": 177711, "wall": 7582.1} {"step": 20560, "train_loss": 3.1808202266693115, "lr": 0.00013196482147600385, "tps": 177608, "wall": 7586.8} {"step": 20561, "train_loss": 3.1357312202453613, "lr": 0.00013194811166792833, "tps": 177505, "wall": 7591.6} {"step": 20562, "train_loss": 3.2133240699768066, "lr": 0.0001319314028573094, "tps": 177401, "wall": 7596.4} {"step": 20563, "train_loss": 3.1482768058776855, "lr": 0.0001319146950443363, "tps": 177298, "wall": 7601.2} {"step": 20564, "train_loss": 3.2519397735595703, "lr": 0.00013189798822919822, "tps": 177195, "wall": 7606.0} {"step": 20565, "train_loss": 3.242807149887085, "lr": 0.0001318812824120846, "tps": 177094, "wall": 7610.7} {"step": 20566, "train_loss": 3.13411545753479, "lr": 0.00013186457759318455, "tps": 176991, "wall": 7615.5} {"step": 20567, "train_loss": 3.2431087493896484, "lr": 0.00013184787377268727, "tps": 176889, "wall": 7620.3} {"step": 20568, "train_loss": 3.256337881088257, "lr": 0.00013183117095078215, "tps": 176787, "wall": 7625.0} {"step": 20569, "train_loss": 3.245828628540039, "lr": 0.00013181446912765817, "tps": 176685, "wall": 7629.8} {"step": 20570, "train_loss": 3.158191204071045, "lr": 0.00013179776830350476, "tps": 176583, "wall": 7634.6} {"step": 20571, "train_loss": 3.2345800399780273, "lr": 0.000131781068478511, "tps": 176481, "wall": 7639.4} {"step": 20572, "train_loss": 3.265153408050537, "lr": 0.00013176436965286597, "tps": 176379, "wall": 7644.1} {"step": 20573, "train_loss": 3.268711566925049, "lr": 0.00013174767182675906, "tps": 176278, "wall": 7648.9} {"step": 20574, "train_loss": 3.218791961669922, "lr": 0.00013173097500037922, "tps": 176176, "wall": 7653.7} {"step": 20575, "train_loss": 3.2943830490112305, "lr": 0.00013171427917391565, "tps": 176074, "wall": 7658.5} {"step": 20576, "train_loss": 3.2818970680236816, "lr": 0.00013169758434755755, "tps": 175973, "wall": 7663.3} {"step": 20577, "train_loss": 3.27758526802063, "lr": 0.00013168089052149402, "tps": 175871, "wall": 7668.1} {"step": 20578, "train_loss": 3.247119665145874, "lr": 0.00013166419769591406, "tps": 175771, "wall": 7672.8} {"step": 20579, "train_loss": 3.1920971870422363, "lr": 0.0001316475058710069, "tps": 175670, "wall": 7677.6} {"step": 20580, "train_loss": 3.254361629486084, "lr": 0.0001316308150469616, "tps": 175570, "wall": 7682.4} {"step": 20581, "train_loss": 3.2085137367248535, "lr": 0.0001316141252239671, "tps": 175469, "wall": 7687.2} {"step": 20582, "train_loss": 3.194784164428711, "lr": 0.0001315974364022127, "tps": 175369, "wall": 7691.9} {"step": 20583, "train_loss": 3.205211639404297, "lr": 0.0001315807485818873, "tps": 175268, "wall": 7696.7} {"step": 20584, "train_loss": 3.282392740249634, "lr": 0.00013156406176317986, "tps": 175168, "wall": 7701.5} {"step": 20585, "train_loss": 3.2439637184143066, "lr": 0.00013154737594627962, "tps": 175068, "wall": 7706.3} {"step": 20586, "train_loss": 3.2239036560058594, "lr": 0.00013153069113137545, "tps": 174968, "wall": 7711.0} {"step": 20587, "train_loss": 3.3419432640075684, "lr": 0.00013151400731865634, "tps": 174868, "wall": 7715.8} {"step": 20588, "train_loss": 3.222358226776123, "lr": 0.00013149732450831145, "tps": 174769, "wall": 7720.6} {"step": 20589, "train_loss": 3.1709940433502197, "lr": 0.00013148064270052955, "tps": 174670, "wall": 7725.3} {"step": 20590, "train_loss": 3.260448932647705, "lr": 0.00013146396189549981, "tps": 174570, "wall": 7730.1} {"step": 20591, "train_loss": 3.3429276943206787, "lr": 0.00013144728209341108, "tps": 174471, "wall": 7734.9} {"step": 20592, "train_loss": 3.2074711322784424, "lr": 0.00013143060329445224, "tps": 174372, "wall": 7739.6} {"step": 20593, "train_loss": 3.2490603923797607, "lr": 0.00013141392549881242, "tps": 174273, "wall": 7744.4} {"step": 20594, "train_loss": 3.2122697830200195, "lr": 0.00013139724870668047, "tps": 174175, "wall": 7749.2} {"step": 20595, "train_loss": 3.2262771129608154, "lr": 0.00013138057291824516, "tps": 174076, "wall": 7753.9} {"step": 20596, "train_loss": 3.1384189128875732, "lr": 0.0001313638981336956, "tps": 173977, "wall": 7758.7} {"step": 20597, "train_loss": 3.2000041007995605, "lr": 0.0001313472243532206, "tps": 173879, "wall": 7763.5} {"step": 20598, "train_loss": 3.258668899536133, "lr": 0.00013133055157700895, "tps": 173780, "wall": 7768.3} {"step": 20599, "train_loss": 3.2727532386779785, "lr": 0.0001313138798052497, "tps": 173682, "wall": 7773.0} {"step": 20600, "train_loss": 3.3201475143432617, "lr": 0.00013129720903813164, "tps": 173582, "wall": 7777.9} {"step": 20601, "train_loss": 3.2087862491607666, "lr": 0.00013128053927584347, "tps": 173484, "wall": 7782.7} {"step": 20602, "train_loss": 3.2247462272644043, "lr": 0.00013126387051857428, "tps": 173386, "wall": 7787.4} {"step": 20603, "train_loss": 3.1715710163116455, "lr": 0.00013124720276651273, "tps": 173288, "wall": 7792.2} {"step": 20604, "train_loss": 3.346311569213867, "lr": 0.0001312305360198476, "tps": 173191, "wall": 7797.0} {"step": 20605, "train_loss": 3.1709847450256348, "lr": 0.0001312138702787678, "tps": 173093, "wall": 7801.8} {"step": 20606, "train_loss": 3.199744462966919, "lr": 0.00013119720554346208, "tps": 172996, "wall": 7806.5} {"step": 20607, "train_loss": 3.1860568523406982, "lr": 0.00013118054181411926, "tps": 172898, "wall": 7811.3} {"step": 20608, "train_loss": 3.2627358436584473, "lr": 0.00013116387909092804, "tps": 172801, "wall": 7816.1} {"step": 20609, "train_loss": 3.154468536376953, "lr": 0.00013114721737407715, "tps": 172704, "wall": 7820.9} {"step": 20610, "train_loss": 3.278287410736084, "lr": 0.00013113055666375546, "tps": 172607, "wall": 7825.6} {"step": 20611, "train_loss": 3.162809371948242, "lr": 0.00013111389696015164, "tps": 172510, "wall": 7830.4} {"step": 20612, "train_loss": 3.2119336128234863, "lr": 0.00013109723826345432, "tps": 172411, "wall": 7835.3} {"step": 20613, "train_loss": 3.25168776512146, "lr": 0.00013108058057385237, "tps": 172315, "wall": 7840.0} {"step": 20614, "train_loss": 3.203745126724243, "lr": 0.00013106392389153443, "tps": 172219, "wall": 7844.8} {"step": 20615, "train_loss": 3.172703742980957, "lr": 0.0001310472682166891, "tps": 172123, "wall": 7849.5} {"step": 20616, "train_loss": 3.110898971557617, "lr": 0.0001310306135495052, "tps": 172027, "wall": 7854.3} {"step": 20617, "train_loss": 3.162977933883667, "lr": 0.00013101395989017126, "tps": 171931, "wall": 7859.1} {"step": 20618, "train_loss": 3.252845048904419, "lr": 0.00013099730723887602, "tps": 171835, "wall": 7863.8} {"step": 20619, "train_loss": 3.2139229774475098, "lr": 0.00013098065559580813, "tps": 171739, "wall": 7868.6} {"step": 20620, "train_loss": 3.308394432067871, "lr": 0.00013096400496115618, "tps": 171643, "wall": 7873.4} {"step": 20621, "train_loss": 3.220479726791382, "lr": 0.00013094735533510871, "tps": 171548, "wall": 7878.2} {"step": 20622, "train_loss": 3.178293228149414, "lr": 0.0001309307067178545, "tps": 171452, "wall": 7882.9} {"step": 20623, "train_loss": 3.175417184829712, "lr": 0.00013091405910958202, "tps": 171357, "wall": 7887.7} {"step": 20624, "train_loss": 3.164930582046509, "lr": 0.00013089741251047995, "tps": 171261, "wall": 7892.5} {"step": 20625, "train_loss": 3.104764461517334, "lr": 0.00013088076692073682, "tps": 171165, "wall": 7897.3} {"step": 20626, "train_loss": 3.2256274223327637, "lr": 0.00013086412234054109, "tps": 171070, "wall": 7902.1} {"step": 20627, "train_loss": 3.348329544067383, "lr": 0.0001308474787700815, "tps": 170976, "wall": 7906.8} {"step": 20628, "train_loss": 3.2159337997436523, "lr": 0.00013083083620954645, "tps": 170881, "wall": 7911.6} {"step": 20629, "train_loss": 3.234346866607666, "lr": 0.0001308141946591245, "tps": 170786, "wall": 7916.4} {"step": 20630, "train_loss": 3.179037094116211, "lr": 0.0001307975541190042, "tps": 170691, "wall": 7921.2} {"step": 20631, "train_loss": 3.293806552886963, "lr": 0.0001307809145893741, "tps": 170596, "wall": 7925.9} {"step": 20632, "train_loss": 3.282930612564087, "lr": 0.0001307642760704225, "tps": 170502, "wall": 7930.7} {"step": 20633, "train_loss": 3.237788677215576, "lr": 0.00013074763856233806, "tps": 170408, "wall": 7935.5} {"step": 20634, "train_loss": 3.195713996887207, "lr": 0.00013073100206530925, "tps": 170314, "wall": 7940.2} {"step": 20635, "train_loss": 3.236327886581421, "lr": 0.0001307143665795244, "tps": 170220, "wall": 7945.0} {"step": 20636, "train_loss": 3.042227029800415, "lr": 0.00013069773210517207, "tps": 170126, "wall": 7949.8} {"step": 20637, "train_loss": 3.2745213508605957, "lr": 0.00013068109864244068, "tps": 170031, "wall": 7954.6} {"step": 20638, "train_loss": 3.166609287261963, "lr": 0.00013066446619151858, "tps": 169938, "wall": 7959.3} {"step": 20639, "train_loss": 3.257261276245117, "lr": 0.0001306478347525943, "tps": 169845, "wall": 7964.1} {"step": 20640, "train_loss": 3.2430543899536133, "lr": 0.00013063120432585618, "tps": 169752, "wall": 7968.9} {"step": 20641, "train_loss": 3.216519355773926, "lr": 0.00013061457491149252, "tps": 169658, "wall": 7973.6} {"step": 20642, "train_loss": 3.2470450401306152, "lr": 0.0001305979465096919, "tps": 169565, "wall": 7978.4} {"step": 20643, "train_loss": 3.222078561782837, "lr": 0.00013058131912064248, "tps": 169472, "wall": 7983.2} {"step": 20644, "train_loss": 3.245574951171875, "lr": 0.0001305646927445328, "tps": 169379, "wall": 7987.9} {"step": 20645, "train_loss": 3.2786002159118652, "lr": 0.00013054806738155113, "tps": 169286, "wall": 7992.7} {"step": 20646, "train_loss": 3.2329823970794678, "lr": 0.0001305314430318857, "tps": 169193, "wall": 7997.5} {"step": 20647, "train_loss": 3.155913829803467, "lr": 0.000130514819695725, "tps": 169100, "wall": 8002.2} {"step": 20648, "train_loss": 3.266810894012451, "lr": 0.00013049819737325725, "tps": 169008, "wall": 8007.0} {"step": 20649, "train_loss": 3.251863718032837, "lr": 0.00013048157606467074, "tps": 168915, "wall": 8011.8} {"step": 20650, "train_loss": 3.3050405979156494, "lr": 0.00013046495577015386, "tps": 168822, "wall": 8016.6} {"step": 20651, "train_loss": 3.3481929302215576, "lr": 0.0001304483364898947, "tps": 168729, "wall": 8021.4} {"step": 20652, "train_loss": 3.225926399230957, "lr": 0.0001304317182240817, "tps": 168636, "wall": 8026.2} {"step": 20653, "train_loss": 3.268740177154541, "lr": 0.00013041510097290302, "tps": 168542, "wall": 8031.1} {"step": 20654, "train_loss": 3.2378015518188477, "lr": 0.00013039848473654688, "tps": 168450, "wall": 8035.9} {"step": 20655, "train_loss": 3.2129268646240234, "lr": 0.0001303818695152016, "tps": 168358, "wall": 8040.6} {"step": 20656, "train_loss": 3.1551899909973145, "lr": 0.00013036525530905535, "tps": 168266, "wall": 8045.4} {"step": 20657, "train_loss": 3.1395821571350098, "lr": 0.00013034864211829627, "tps": 168174, "wall": 8050.2} {"step": 20658, "train_loss": 3.1676993370056152, "lr": 0.0001303320299431127, "tps": 168083, "wall": 8055.0} {"step": 20659, "train_loss": 3.205624580383301, "lr": 0.00013031541878369274, "tps": 167992, "wall": 8059.7} {"step": 20660, "train_loss": 3.15566086769104, "lr": 0.0001302988086402245, "tps": 167900, "wall": 8064.5} {"step": 20661, "train_loss": 3.2559945583343506, "lr": 0.0001302821995128963, "tps": 167810, "wall": 8069.3} {"step": 20662, "train_loss": 3.294163465499878, "lr": 0.00013026559140189616, "tps": 167718, "wall": 8074.1} {"step": 20663, "train_loss": 3.2699644565582275, "lr": 0.0001302489843074122, "tps": 167626, "wall": 8078.9} {"step": 20664, "train_loss": 3.203815460205078, "lr": 0.00013023237822963268, "tps": 167535, "wall": 8083.7} {"step": 20665, "train_loss": 3.3295493125915527, "lr": 0.00013021577316874562, "tps": 167445, "wall": 8088.4} {"step": 20666, "train_loss": 3.227123737335205, "lr": 0.00013019916912493907, "tps": 167354, "wall": 8093.2} {"step": 20667, "train_loss": 3.1471645832061768, "lr": 0.0001301825660984013, "tps": 167264, "wall": 8098.0} {"step": 20668, "train_loss": 3.2587127685546875, "lr": 0.00013016596408932016, "tps": 167173, "wall": 8102.7} {"step": 20669, "train_loss": 3.19454288482666, "lr": 0.00013014936309788393, "tps": 167083, "wall": 8107.5} {"step": 20670, "train_loss": 3.2714083194732666, "lr": 0.00013013276312428057, "tps": 166993, "wall": 8112.3} {"step": 20671, "train_loss": 3.180224895477295, "lr": 0.00013011616416869806, "tps": 166902, "wall": 8117.1} {"step": 20672, "train_loss": 3.1960058212280273, "lr": 0.00013009956623132455, "tps": 166812, "wall": 8121.8} {"step": 20673, "train_loss": 3.1708478927612305, "lr": 0.00013008296931234806, "tps": 166722, "wall": 8126.6} {"step": 20674, "train_loss": 3.193127155303955, "lr": 0.0001300663734119565, "tps": 166632, "wall": 8131.4} {"step": 20675, "train_loss": 3.2022387981414795, "lr": 0.00013004977853033796, "tps": 166541, "wall": 8136.2} {"step": 20676, "train_loss": 3.2778868675231934, "lr": 0.00013003318466768042, "tps": 166452, "wall": 8141.0} {"step": 20677, "train_loss": 3.123178482055664, "lr": 0.00013001659182417175, "tps": 166362, "wall": 8145.8} {"step": 20678, "train_loss": 3.2516746520996094, "lr": 0.00013000000000000004, "tps": 166273, "wall": 8150.5} {"step": 20679, "train_loss": 3.1738243103027344, "lr": 0.0001299834091953532, "tps": 166184, "wall": 8155.3} {"step": 20680, "train_loss": 3.0881152153015137, "lr": 0.00012996681941041915, "tps": 166095, "wall": 8160.1} {"step": 20681, "train_loss": 3.2280659675598145, "lr": 0.00012995023064538586, "tps": 166005, "wall": 8164.9} {"step": 20682, "train_loss": 3.2252273559570312, "lr": 0.0001299336429004413, "tps": 165917, "wall": 8169.6} {"step": 20683, "train_loss": 3.204354763031006, "lr": 0.00012991705617577316, "tps": 165828, "wall": 8174.4} {"step": 20684, "train_loss": 3.1262054443359375, "lr": 0.00012990047047156957, "tps": 165739, "wall": 8179.2} {"step": 20685, "train_loss": 3.2905986309051514, "lr": 0.00012988388578801828, "tps": 165651, "wall": 8183.9} {"step": 20686, "train_loss": 3.238468885421753, "lr": 0.00012986730212530726, "tps": 165563, "wall": 8188.7} {"step": 20687, "train_loss": 3.258206367492676, "lr": 0.0001298507194836243, "tps": 165473, "wall": 8193.5} {"step": 20688, "train_loss": 3.2284419536590576, "lr": 0.00012983413786315723, "tps": 165384, "wall": 8198.3} {"step": 20689, "train_loss": 3.2318267822265625, "lr": 0.00012981755726409398, "tps": 165296, "wall": 8203.1} {"step": 20690, "train_loss": 3.238292932510376, "lr": 0.0001298009776866223, "tps": 165208, "wall": 8207.9} {"step": 20691, "train_loss": 3.213667869567871, "lr": 0.00012978439913093, "tps": 165120, "wall": 8212.6} {"step": 20692, "train_loss": 3.2509846687316895, "lr": 0.00012976782159720494, "tps": 165032, "wall": 8217.4} {"step": 20693, "train_loss": 3.208359479904175, "lr": 0.0001297512450856349, "tps": 164944, "wall": 8222.2} {"step": 20694, "train_loss": 3.233574628829956, "lr": 0.00012973466959640754, "tps": 164857, "wall": 8226.9} {"step": 20695, "train_loss": 3.251230239868164, "lr": 0.00012971809512971082, "tps": 164769, "wall": 8231.7} {"step": 20696, "train_loss": 3.2070088386535645, "lr": 0.00012970152168573237, "tps": 164681, "wall": 8236.5} {"step": 20697, "train_loss": 3.2678685188293457, "lr": 0.00012968494926465996, "tps": 164594, "wall": 8241.3} {"step": 20698, "train_loss": 3.2952795028686523, "lr": 0.00012966837786668132, "tps": 164507, "wall": 8246.0} {"step": 20699, "train_loss": 3.2384181022644043, "lr": 0.00012965180749198424, "tps": 164420, "wall": 8250.8} {"step": 20700, "train_loss": 3.2142174243927, "lr": 0.0001296352381407563, "tps": 164331, "wall": 8255.6} {"step": 20701, "train_loss": 3.1926307678222656, "lr": 0.00012961866981318532, "tps": 164244, "wall": 8260.4} {"step": 20702, "train_loss": 3.269256591796875, "lr": 0.00012960210250945889, "tps": 164157, "wall": 8265.2} {"step": 20703, "train_loss": 3.251858949661255, "lr": 0.0001295855362297648, "tps": 164071, "wall": 8269.9} {"step": 20704, "train_loss": 3.326671600341797, "lr": 0.00012956897097429063, "tps": 163984, "wall": 8274.7} {"step": 20705, "train_loss": 3.2687580585479736, "lr": 0.00012955240674322396, "tps": 163897, "wall": 8279.5} {"step": 20706, "train_loss": 3.23616099357605, "lr": 0.00012953584353675264, "tps": 163811, "wall": 8284.2} {"step": 20707, "train_loss": 3.1682329177856445, "lr": 0.00012951928135506414, "tps": 163725, "wall": 8289.0} {"step": 20708, "train_loss": 3.3064770698547363, "lr": 0.00012950272019834606, "tps": 163639, "wall": 8293.8} {"step": 20709, "train_loss": 3.1507880687713623, "lr": 0.00012948616006678613, "tps": 163553, "wall": 8298.5} {"step": 20710, "train_loss": 3.3139705657958984, "lr": 0.0001294696009605719, "tps": 163467, "wall": 8303.3} {"step": 20711, "train_loss": 3.243286371231079, "lr": 0.00012945304287989082, "tps": 163381, "wall": 8308.0} {"step": 20712, "train_loss": 3.2761974334716797, "lr": 0.00012943648582493066, "tps": 163296, "wall": 8312.8} {"step": 20713, "train_loss": 3.2389752864837646, "lr": 0.00012941992979587888, "tps": 163209, "wall": 8317.6} {"step": 20714, "train_loss": 3.2559638023376465, "lr": 0.00012940337479292296, "tps": 163123, "wall": 8322.4} {"step": 20715, "train_loss": 3.1759796142578125, "lr": 0.0001293868208162506, "tps": 163038, "wall": 8327.1} {"step": 20716, "train_loss": 3.174933433532715, "lr": 0.0001293702678660492, "tps": 162952, "wall": 8331.9} {"step": 20717, "train_loss": 3.116382598876953, "lr": 0.00012935371594250628, "tps": 162867, "wall": 8336.7} {"step": 20718, "train_loss": 3.2445693016052246, "lr": 0.00012933716504580942, "tps": 162781, "wall": 8341.5} {"step": 20719, "train_loss": 3.184401035308838, "lr": 0.00012932061517614604, "tps": 162696, "wall": 8346.2} {"step": 20720, "train_loss": 3.067561388015747, "lr": 0.00012930406633370362, "tps": 162611, "wall": 8351.0} {"step": 20721, "train_loss": 3.176206588745117, "lr": 0.00012928751851866966, "tps": 162527, "wall": 8355.8} {"step": 20722, "train_loss": 3.2602062225341797, "lr": 0.00012927097173123157, "tps": 162441, "wall": 8360.6} {"step": 20723, "train_loss": 3.1199026107788086, "lr": 0.0001292544259715769, "tps": 162356, "wall": 8365.4} {"step": 20724, "train_loss": 3.351511001586914, "lr": 0.00012923788123989294, "tps": 162271, "wall": 8370.1} {"step": 20725, "train_loss": 3.062392234802246, "lr": 0.0001292213375363671, "tps": 162184, "wall": 8375.0} {"step": 20726, "train_loss": 3.352105140686035, "lr": 0.00012920479486118702, "tps": 162100, "wall": 8379.8} {"step": 20727, "train_loss": 3.2091221809387207, "lr": 0.00012918825321453985, "tps": 162015, "wall": 8384.5} {"step": 20728, "train_loss": 3.2394518852233887, "lr": 0.00012917171259661304, "tps": 161931, "wall": 8389.3} {"step": 20729, "train_loss": 3.202681541442871, "lr": 0.00012915517300759403, "tps": 161847, "wall": 8394.1} {"step": 20730, "train_loss": 3.1569771766662598, "lr": 0.00012913863444767012, "tps": 161763, "wall": 8398.9} {"step": 20731, "train_loss": 3.2757480144500732, "lr": 0.00012912209691702862, "tps": 161679, "wall": 8403.6} {"step": 20732, "train_loss": 3.230222225189209, "lr": 0.000129105560415857, "tps": 161595, "wall": 8408.4} {"step": 20733, "train_loss": 3.317377805709839, "lr": 0.00012908902494434253, "tps": 161511, "wall": 8413.2} {"step": 20734, "train_loss": 3.2508437633514404, "lr": 0.00012907249050267237, "tps": 161426, "wall": 8418.0} {"step": 20735, "train_loss": 3.2655982971191406, "lr": 0.00012905595709103407, "tps": 161343, "wall": 8422.7} {"step": 20736, "train_loss": 3.1967897415161133, "lr": 0.00012903942470961482, "tps": 161260, "wall": 8427.5} {"step": 20737, "train_loss": 3.219820022583008, "lr": 0.0001290228933586018, "tps": 161176, "wall": 8432.3} {"step": 20738, "train_loss": 3.213974952697754, "lr": 0.00012900636303818242, "tps": 161092, "wall": 8437.1} {"step": 20739, "train_loss": 3.217221736907959, "lr": 0.00012898983374854382, "tps": 161009, "wall": 8441.9} {"step": 20740, "train_loss": 3.2441651821136475, "lr": 0.00012897330548987342, "tps": 160926, "wall": 8446.6} {"step": 20741, "train_loss": 3.2066574096679688, "lr": 0.0001289567782623583, "tps": 160843, "wall": 8451.4} {"step": 20742, "train_loss": 3.214111566543579, "lr": 0.00012894025206618563, "tps": 160760, "wall": 8456.1} {"step": 20743, "train_loss": 3.218897819519043, "lr": 0.0001289237269015428, "tps": 160678, "wall": 8460.9} {"step": 20744, "train_loss": 3.2098336219787598, "lr": 0.0001289072027686169, "tps": 160595, "wall": 8465.6} {"step": 20745, "train_loss": 3.2015647888183594, "lr": 0.00012889067966759512, "tps": 160512, "wall": 8470.4} {"step": 20746, "train_loss": 3.1089324951171875, "lr": 0.00012887415759866468, "tps": 160430, "wall": 8475.2} {"step": 20747, "train_loss": 3.251631259918213, "lr": 0.00012885763656201275, "tps": 160348, "wall": 8479.9} {"step": 20748, "train_loss": 3.1050755977630615, "lr": 0.0001288411165578263, "tps": 160265, "wall": 8484.7} {"step": 20749, "train_loss": 3.2140040397644043, "lr": 0.00012882459758629274, "tps": 160183, "wall": 8489.5} {"step": 20750, "train_loss": 3.216867446899414, "lr": 0.00012880807964759907, "tps": 160101, "wall": 8494.2} {"step": 20751, "train_loss": 3.17128586769104, "lr": 0.00012879156274193232, "tps": 160018, "wall": 8499.1} {"step": 20752, "train_loss": 3.2278695106506348, "lr": 0.00012877504686947976, "tps": 159936, "wall": 8503.8} {"step": 20753, "train_loss": 3.2696993350982666, "lr": 0.00012875853203042842, "tps": 159854, "wall": 8508.6} {"step": 20754, "train_loss": 3.366973876953125, "lr": 0.0001287420182249653, "tps": 159772, "wall": 8513.3} {"step": 20755, "train_loss": 3.2648348808288574, "lr": 0.00012872550545327757, "tps": 159690, "wall": 8518.1} {"step": 20756, "train_loss": 3.1747875213623047, "lr": 0.00012870899371555217, "tps": 159609, "wall": 8522.9} {"step": 20757, "train_loss": 3.2182180881500244, "lr": 0.00012869248301197633, "tps": 159527, "wall": 8527.6} {"step": 20758, "train_loss": 3.207197666168213, "lr": 0.000128675973342737, "tps": 159446, "wall": 8532.4} {"step": 20759, "train_loss": 3.2614784240722656, "lr": 0.00012865946470802108, "tps": 159365, "wall": 8537.2} {"step": 20760, "train_loss": 3.1996519565582275, "lr": 0.00012864295710801575, "tps": 159283, "wall": 8541.9} {"step": 20761, "train_loss": 3.300274133682251, "lr": 0.00012862645054290795, "tps": 159202, "wall": 8546.7} {"step": 20762, "train_loss": 3.1604294776916504, "lr": 0.0001286099450128846, "tps": 159121, "wall": 8551.5} {"step": 20763, "train_loss": 3.227053642272949, "lr": 0.00012859344051813283, "tps": 159039, "wall": 8556.3} {"step": 20764, "train_loss": 3.20845890045166, "lr": 0.0001285769370588395, "tps": 158958, "wall": 8561.1} {"step": 20765, "train_loss": 3.185720443725586, "lr": 0.0001285604346351915, "tps": 158877, "wall": 8565.8} {"step": 20766, "train_loss": 3.291257381439209, "lr": 0.00012854393324737587, "tps": 158796, "wall": 8570.6} {"step": 20767, "train_loss": 3.258906841278076, "lr": 0.00012852743289557957, "tps": 158716, "wall": 8575.4} {"step": 20768, "train_loss": 3.208167552947998, "lr": 0.00012851093357998936, "tps": 158635, "wall": 8580.2} {"step": 20769, "train_loss": 3.3029587268829346, "lr": 0.0001284944353007923, "tps": 158555, "wall": 8584.9} {"step": 20770, "train_loss": 3.246346950531006, "lr": 0.00012847793805817527, "tps": 158474, "wall": 8589.7} {"step": 20771, "train_loss": 3.09163236618042, "lr": 0.000128461441852325, "tps": 158394, "wall": 8594.5} {"step": 20772, "train_loss": 3.1554598808288574, "lr": 0.00012844494668342855, "tps": 158314, "wall": 8599.2} {"step": 20773, "train_loss": 3.298187017440796, "lr": 0.00012842845255167272, "tps": 158233, "wall": 8604.0} {"step": 20774, "train_loss": 3.15644907951355, "lr": 0.00012841195945724422, "tps": 158153, "wall": 8608.8} {"step": 20775, "train_loss": 3.2517402172088623, "lr": 0.00012839546740033012, "tps": 158074, "wall": 8613.5} {"step": 20776, "train_loss": 3.1324658393859863, "lr": 0.000128378976381117, "tps": 157993, "wall": 8618.3} {"step": 20777, "train_loss": 3.2047934532165527, "lr": 0.0001283624863997919, "tps": 157914, "wall": 8623.1} {"step": 20778, "train_loss": 3.2160298824310303, "lr": 0.00012834599745654147, "tps": 157834, "wall": 8627.9} {"step": 20779, "train_loss": 3.120616912841797, "lr": 0.0001283295095515525, "tps": 157754, "wall": 8632.6} {"step": 20780, "train_loss": 3.1378138065338135, "lr": 0.0001283130226850119, "tps": 157675, "wall": 8637.4} {"step": 20781, "train_loss": 3.296704053878784, "lr": 0.0001282965368571063, "tps": 157595, "wall": 8642.2} {"step": 20782, "train_loss": 3.229853630065918, "lr": 0.00012828005206802243, "tps": 157516, "wall": 8646.9} {"step": 20783, "train_loss": 3.3414344787597656, "lr": 0.00012826356831794716, "tps": 157437, "wall": 8651.7} {"step": 20784, "train_loss": 3.252432346343994, "lr": 0.00012824708560706718, "tps": 157358, "wall": 8656.5} {"step": 20785, "train_loss": 3.2484166622161865, "lr": 0.00012823060393556905, "tps": 157276, "wall": 8661.4} {"step": 20786, "train_loss": 3.076554298400879, "lr": 0.0001282141233036397, "tps": 157198, "wall": 8666.1} {"step": 20787, "train_loss": 3.288846969604492, "lr": 0.00012819764371146576, "tps": 157119, "wall": 8670.9} {"step": 20788, "train_loss": 3.2429990768432617, "lr": 0.00012818116515923378, "tps": 157039, "wall": 8675.7} {"step": 20789, "train_loss": 3.2947230339050293, "lr": 0.00012816468764713062, "tps": 156960, "wall": 8680.5} {"step": 20790, "train_loss": 3.1855297088623047, "lr": 0.0001281482111753428, "tps": 156881, "wall": 8685.3} {"step": 20791, "train_loss": 3.25189471244812, "lr": 0.00012813173574405696, "tps": 156803, "wall": 8690.0} {"step": 20792, "train_loss": 3.226888656616211, "lr": 0.00012811526135345989, "tps": 156724, "wall": 8694.8} {"step": 20793, "train_loss": 3.1900129318237305, "lr": 0.00012809878800373802, "tps": 156646, "wall": 8699.6} {"step": 20794, "train_loss": 3.2492141723632812, "lr": 0.0001280823156950781, "tps": 156568, "wall": 8704.3} {"step": 20795, "train_loss": 3.3018264770507812, "lr": 0.00012806584442766672, "tps": 156490, "wall": 8709.1} {"step": 20796, "train_loss": 3.175161838531494, "lr": 0.00012804937420169034, "tps": 156412, "wall": 8713.8} {"step": 20797, "train_loss": 3.209564447402954, "lr": 0.00012803290501733566, "tps": 156334, "wall": 8718.6} {"step": 20798, "train_loss": 3.103860855102539, "lr": 0.00012801643687478925, "tps": 156256, "wall": 8723.4} {"step": 20799, "train_loss": 3.169995069503784, "lr": 0.00012799996977423756, "tps": 156178, "wall": 8728.1} {"step": 20800, "train_loss": 3.1371562480926514, "lr": 0.00012798350371586722, "tps": 156101, "wall": 8732.9} {"step": 20801, "train_loss": 3.1813342571258545, "lr": 0.00012796703869986475, "tps": 156022, "wall": 8737.7} {"step": 20802, "train_loss": 3.2711753845214844, "lr": 0.00012795057472641657, "tps": 155944, "wall": 8742.5} {"step": 20803, "train_loss": 3.156158208847046, "lr": 0.0001279341117957093, "tps": 155867, "wall": 8747.2} {"step": 20804, "train_loss": 3.255107879638672, "lr": 0.00012791764990792944, "tps": 155790, "wall": 8752.0} {"step": 20805, "train_loss": 3.1989450454711914, "lr": 0.00012790118906326334, "tps": 155712, "wall": 8756.8} {"step": 20806, "train_loss": 3.254640579223633, "lr": 0.0001278847292618976, "tps": 155635, "wall": 8761.5} {"step": 20807, "train_loss": 3.260509729385376, "lr": 0.00012786827050401866, "tps": 155558, "wall": 8766.3} {"step": 20808, "train_loss": 3.1376867294311523, "lr": 0.00012785181278981286, "tps": 155481, "wall": 8771.1} {"step": 20809, "train_loss": 3.227761745452881, "lr": 0.00012783535611946679, "tps": 155404, "wall": 8775.8} {"step": 20810, "train_loss": 3.1798770427703857, "lr": 0.0001278189004931667, "tps": 155327, "wall": 8780.6} {"step": 20811, "train_loss": 3.3529343605041504, "lr": 0.00012780244591109914, "tps": 155250, "wall": 8785.4} {"step": 20812, "train_loss": 3.24111270904541, "lr": 0.0001277859923734505, "tps": 155174, "wall": 8790.1} {"step": 20813, "train_loss": 3.143954038619995, "lr": 0.00012776953988040702, "tps": 155096, "wall": 8795.0} {"step": 20814, "train_loss": 3.126979112625122, "lr": 0.0001277530884321553, "tps": 155020, "wall": 8799.7} {"step": 20815, "train_loss": 3.2375707626342773, "lr": 0.00012773663802888153, "tps": 154943, "wall": 8804.5} {"step": 20816, "train_loss": 3.280104637145996, "lr": 0.00012772018867077212, "tps": 154867, "wall": 8809.2} {"step": 20817, "train_loss": 3.3077826499938965, "lr": 0.00012770374035801343, "tps": 154791, "wall": 8814.0} {"step": 20818, "train_loss": 3.3154022693634033, "lr": 0.00012768729309079176, "tps": 154714, "wall": 8818.8} {"step": 20819, "train_loss": 3.1682024002075195, "lr": 0.00012767084686929342, "tps": 154638, "wall": 8823.5} {"step": 20820, "train_loss": 3.2970268726348877, "lr": 0.00012765440169370472, "tps": 154562, "wall": 8828.3} {"step": 20821, "train_loss": 3.2762489318847656, "lr": 0.00012763795756421192, "tps": 154486, "wall": 8833.1} {"step": 20822, "train_loss": 3.199324369430542, "lr": 0.00012762151448100136, "tps": 154410, "wall": 8837.8} {"step": 20823, "train_loss": 3.192317485809326, "lr": 0.0001276050724442593, "tps": 154335, "wall": 8842.6} {"step": 20824, "train_loss": 3.1747658252716064, "lr": 0.00012758863145417192, "tps": 154259, "wall": 8847.3} {"step": 20825, "train_loss": 3.171611785888672, "lr": 0.00012757219151092558, "tps": 154183, "wall": 8852.1} {"step": 20826, "train_loss": 3.2607674598693848, "lr": 0.00012755575261470646, "tps": 154107, "wall": 8857.0} {"step": 20827, "train_loss": 3.1575021743774414, "lr": 0.0001275393147657007, "tps": 154031, "wall": 8861.7} {"step": 20828, "train_loss": 3.0721564292907715, "lr": 0.00012752287796409468, "tps": 153956, "wall": 8866.5} {"step": 20829, "train_loss": 3.2108638286590576, "lr": 0.00012750644221007446, "tps": 153880, "wall": 8871.2} {"step": 20830, "train_loss": 3.223625659942627, "lr": 0.00012749000750382622, "tps": 153805, "wall": 8876.0} {"step": 20831, "train_loss": 3.0978264808654785, "lr": 0.00012747357384553624, "tps": 153730, "wall": 8880.8} {"step": 20832, "train_loss": 3.227022171020508, "lr": 0.0001274571412353906, "tps": 153655, "wall": 8885.6} {"step": 20833, "train_loss": 3.303910732269287, "lr": 0.00012744070967357545, "tps": 153580, "wall": 8890.3} {"step": 20834, "train_loss": 3.2639524936676025, "lr": 0.00012742427916027699, "tps": 153505, "wall": 8895.1} {"step": 20835, "train_loss": 3.264397144317627, "lr": 0.00012740784969568126, "tps": 153430, "wall": 8899.8} {"step": 20836, "train_loss": 3.2970001697540283, "lr": 0.00012739142127997445, "tps": 153356, "wall": 8904.6} {"step": 20837, "train_loss": 3.176356554031372, "lr": 0.00012737499391334264, "tps": 153281, "wall": 8909.3} {"step": 20838, "train_loss": 3.29410457611084, "lr": 0.00012735856759597187, "tps": 153206, "wall": 8914.1} {"step": 20839, "train_loss": 3.167142868041992, "lr": 0.0001273421423280483, "tps": 153131, "wall": 8918.9} {"step": 20840, "train_loss": 3.154815196990967, "lr": 0.00012732571810975796, "tps": 153057, "wall": 8923.7} {"step": 20841, "train_loss": 3.27652645111084, "lr": 0.00012730929494128682, "tps": 152982, "wall": 8928.5} {"step": 20842, "train_loss": 3.297590494155884, "lr": 0.00012729287282282109, "tps": 152907, "wall": 8933.3} {"step": 20843, "train_loss": 3.2033724784851074, "lr": 0.00012727645175454667, "tps": 152833, "wall": 8938.0} {"step": 20844, "train_loss": 3.1608660221099854, "lr": 0.0001272600317366496, "tps": 152759, "wall": 8942.8} {"step": 20845, "train_loss": 3.297410488128662, "lr": 0.00012724361276931595, "tps": 152685, "wall": 8947.6} {"step": 20846, "train_loss": 3.304265022277832, "lr": 0.00012722719485273168, "tps": 152611, "wall": 8952.3} {"step": 20847, "train_loss": 3.223519802093506, "lr": 0.00012721077798708268, "tps": 152537, "wall": 8957.1} {"step": 20848, "train_loss": 3.2164154052734375, "lr": 0.00012719436217255512, "tps": 152463, "wall": 8961.9} {"step": 20849, "train_loss": 3.158933162689209, "lr": 0.00012717794740933481, "tps": 152389, "wall": 8966.6} {"step": 20850, "train_loss": 3.2048635482788086, "lr": 0.00012716153369760768, "tps": 152316, "wall": 8971.4} {"step": 20851, "train_loss": 3.2603816986083984, "lr": 0.00012714512103755978, "tps": 152241, "wall": 8976.2} {"step": 20852, "train_loss": 3.1920676231384277, "lr": 0.0001271287094293769, "tps": 152168, "wall": 8981.0} {"step": 20853, "train_loss": 3.232215404510498, "lr": 0.0001271122988732451, "tps": 152095, "wall": 8985.7} {"step": 20854, "train_loss": 3.1504149436950684, "lr": 0.00012709588936935022, "tps": 152021, "wall": 8990.5} {"step": 20855, "train_loss": 3.2815375328063965, "lr": 0.00012707948091787802, "tps": 151948, "wall": 8995.3} {"step": 20856, "train_loss": 3.318711042404175, "lr": 0.0001270630735190146, "tps": 151875, "wall": 9000.0} {"step": 20857, "train_loss": 3.0977230072021484, "lr": 0.00012704666717294568, "tps": 151801, "wall": 9004.8} {"step": 20858, "train_loss": 3.156367540359497, "lr": 0.00012703026187985708, "tps": 151728, "wall": 9009.6} {"step": 20859, "train_loss": 3.292454957962036, "lr": 0.00012701385763993478, "tps": 151655, "wall": 9014.4} {"step": 20860, "train_loss": 3.122588634490967, "lr": 0.00012699745445336454, "tps": 151582, "wall": 9019.2} {"step": 20861, "train_loss": 3.2823104858398438, "lr": 0.00012698105232033206, "tps": 151510, "wall": 9023.9} {"step": 20862, "train_loss": 3.214695453643799, "lr": 0.00012696465124102337, "tps": 151437, "wall": 9028.7} {"step": 20863, "train_loss": 3.2345800399780273, "lr": 0.00012694825121562411, "tps": 151364, "wall": 9033.4} {"step": 20864, "train_loss": 3.2211406230926514, "lr": 0.00012693185224432003, "tps": 151291, "wall": 9038.3} {"step": 20865, "train_loss": 3.1947548389434814, "lr": 0.00012691545432729702, "tps": 151218, "wall": 9043.0} {"step": 20866, "train_loss": 3.140665054321289, "lr": 0.0001268990574647408, "tps": 151146, "wall": 9047.8} {"step": 20867, "train_loss": 3.1589887142181396, "lr": 0.00012688266165683705, "tps": 151073, "wall": 9052.6} {"step": 20868, "train_loss": 3.2620491981506348, "lr": 0.00012686626690377157, "tps": 151000, "wall": 9057.4} {"step": 20869, "train_loss": 3.140671491622925, "lr": 0.00012684987320573009, "tps": 150928, "wall": 9062.2} {"step": 20870, "train_loss": 3.217428207397461, "lr": 0.00012683348056289817, "tps": 150856, "wall": 9066.9} {"step": 20871, "train_loss": 3.2042086124420166, "lr": 0.00012681708897546175, "tps": 150784, "wall": 9071.7} {"step": 20872, "train_loss": 3.1300525665283203, "lr": 0.00012680069844360627, "tps": 150712, "wall": 9076.5} {"step": 20873, "train_loss": 3.1613757610321045, "lr": 0.00012678430896751762, "tps": 150640, "wall": 9081.2} {"step": 20874, "train_loss": 3.1537091732025146, "lr": 0.00012676792054738134, "tps": 150568, "wall": 9086.0} {"step": 20875, "train_loss": 3.282578706741333, "lr": 0.00012675153318338303, "tps": 150496, "wall": 9090.8} {"step": 20876, "train_loss": 3.161571502685547, "lr": 0.00012673514687570848, "tps": 150423, "wall": 9095.6} {"step": 20877, "train_loss": 3.2852377891540527, "lr": 0.00012671876162454325, "tps": 150352, "wall": 9100.3} {"step": 20878, "train_loss": 3.2800450325012207, "lr": 0.00012670237743007284, "tps": 150281, "wall": 9105.1} {"step": 20879, "train_loss": 3.2245254516601562, "lr": 0.000126685994292483, "tps": 150209, "wall": 9109.9} {"step": 20880, "train_loss": 3.2461018562316895, "lr": 0.00012666961221195929, "tps": 150138, "wall": 9114.6} {"step": 20881, "train_loss": 3.3453197479248047, "lr": 0.00012665323118868718, "tps": 150066, "wall": 9119.4} {"step": 20882, "train_loss": 3.182499408721924, "lr": 0.00012663685122285242, "tps": 149995, "wall": 9124.2} {"step": 20883, "train_loss": 3.2412242889404297, "lr": 0.0001266204723146404, "tps": 149924, "wall": 9128.9} {"step": 20884, "train_loss": 3.2297677993774414, "lr": 0.0001266040944642367, "tps": 149853, "wall": 9133.7} {"step": 20885, "train_loss": 3.3764231204986572, "lr": 0.00012658771767182691, "tps": 149782, "wall": 9138.5} {"step": 20886, "train_loss": 3.1945695877075195, "lr": 0.00012657134193759653, "tps": 149711, "wall": 9143.2} {"step": 20887, "train_loss": 3.2374649047851562, "lr": 0.00012655496726173097, "tps": 149640, "wall": 9148.0} {"step": 20888, "train_loss": 3.2990102767944336, "lr": 0.00012653859364441584, "tps": 149569, "wall": 9152.8} {"step": 20889, "train_loss": 3.2290244102478027, "lr": 0.00012652222108583655, "tps": 149498, "wall": 9157.6} {"step": 20890, "train_loss": 3.2061362266540527, "lr": 0.00012650584958617865, "tps": 149427, "wall": 9162.4} {"step": 20891, "train_loss": 3.1175291538238525, "lr": 0.00012648947914562753, "tps": 149357, "wall": 9167.1} {"step": 20892, "train_loss": 3.2402732372283936, "lr": 0.0001264731097643686, "tps": 149286, "wall": 9171.9} {"step": 20893, "train_loss": 3.230593681335449, "lr": 0.00012645674144258742, "tps": 149216, "wall": 9176.7} {"step": 20894, "train_loss": 3.2737085819244385, "lr": 0.00012644037418046929, "tps": 149146, "wall": 9181.4} {"step": 20895, "train_loss": 3.235318660736084, "lr": 0.00012642400797819962, "tps": 149076, "wall": 9186.2} {"step": 20896, "train_loss": 3.3579626083374023, "lr": 0.00012640764283596391, "tps": 149006, "wall": 9190.9} {"step": 20897, "train_loss": 3.247743844985962, "lr": 0.0001263912787539475, "tps": 148935, "wall": 9195.7} {"step": 20898, "train_loss": 3.164783477783203, "lr": 0.00012637491573233564, "tps": 148865, "wall": 9200.5} {"step": 20899, "train_loss": 3.3133363723754883, "lr": 0.0001263585537713139, "tps": 148795, "wall": 9205.2} {"step": 20900, "train_loss": 3.2476119995117188, "lr": 0.00012634219287106755, "tps": 148726, "wall": 9210.0} {"step": 20901, "train_loss": 3.1215763092041016, "lr": 0.00012632583303178181, "tps": 148655, "wall": 9214.8} {"step": 20902, "train_loss": 3.2092742919921875, "lr": 0.0001263094742536422, "tps": 148586, "wall": 9219.6} {"step": 20903, "train_loss": 3.31253719329834, "lr": 0.0001262931165368339, "tps": 148516, "wall": 9224.3} {"step": 20904, "train_loss": 3.2026679515838623, "lr": 0.0001262767598815422, "tps": 148446, "wall": 9229.1} {"step": 20905, "train_loss": 3.199768543243408, "lr": 0.00012626040428795245, "tps": 148377, "wall": 9233.8} {"step": 20906, "train_loss": 3.1491780281066895, "lr": 0.00012624404975624995, "tps": 148308, "wall": 9238.6} {"step": 20907, "train_loss": 3.2176456451416016, "lr": 0.00012622769628661988, "tps": 148238, "wall": 9243.4} {"step": 20908, "train_loss": 3.2198987007141113, "lr": 0.0001262113438792476, "tps": 148169, "wall": 9248.1} {"step": 20909, "train_loss": 3.3039872646331787, "lr": 0.00012619499253431818, "tps": 148100, "wall": 9252.9} {"step": 20910, "train_loss": 3.2030248641967773, "lr": 0.00012617864225201707, "tps": 148031, "wall": 9257.6} {"step": 20911, "train_loss": 3.13696026802063, "lr": 0.00012616229303252937, "tps": 147962, "wall": 9262.4} {"step": 20912, "train_loss": 3.2134928703308105, "lr": 0.0001261459448760402, "tps": 147893, "wall": 9267.2} {"step": 20913, "train_loss": 3.321643114089966, "lr": 0.00012612959778273493, "tps": 147824, "wall": 9271.9} {"step": 20914, "train_loss": 3.1822445392608643, "lr": 0.00012611325175279867, "tps": 147754, "wall": 9276.7} {"step": 20915, "train_loss": 3.2325916290283203, "lr": 0.00012609690678641648, "tps": 147686, "wall": 9281.5} {"step": 20916, "train_loss": 3.1603140830993652, "lr": 0.00012608056288377368, "tps": 147617, "wall": 9286.3} {"step": 20917, "train_loss": 3.166170835494995, "lr": 0.00012606422004505534, "tps": 147549, "wall": 9291.0} {"step": 20918, "train_loss": 3.1884899139404297, "lr": 0.00012604787827044653, "tps": 147481, "wall": 9295.8} {"step": 20919, "train_loss": 3.1044509410858154, "lr": 0.00012603153756013256, "tps": 147412, "wall": 9300.5} {"step": 20920, "train_loss": 3.211918830871582, "lr": 0.00012601519791429836, "tps": 147344, "wall": 9305.3} {"step": 20921, "train_loss": 3.211252212524414, "lr": 0.000125998859333129, "tps": 147276, "wall": 9310.0} {"step": 20922, "train_loss": 3.2325732707977295, "lr": 0.00012598252181680977, "tps": 147207, "wall": 9314.8} {"step": 20923, "train_loss": 3.1924500465393066, "lr": 0.0001259661853655256, "tps": 147139, "wall": 9319.6} {"step": 20924, "train_loss": 3.1542012691497803, "lr": 0.00012594984997946147, "tps": 147070, "wall": 9324.4} {"step": 20925, "train_loss": 3.103025197982788, "lr": 0.0001259335156588026, "tps": 147002, "wall": 9329.1} {"step": 20926, "train_loss": 3.132639169692993, "lr": 0.0001259171824037339, "tps": 146934, "wall": 9333.9} {"step": 20927, "train_loss": 3.171902656555176, "lr": 0.00012590085021444054, "tps": 146866, "wall": 9338.7} {"step": 20928, "train_loss": 3.197105646133423, "lr": 0.0001258845190911074, "tps": 146798, "wall": 9343.4} {"step": 20929, "train_loss": 3.2577714920043945, "lr": 0.0001258681890339195, "tps": 146730, "wall": 9348.2} {"step": 20930, "train_loss": 3.2678608894348145, "lr": 0.00012585186004306187, "tps": 146663, "wall": 9353.0} {"step": 20931, "train_loss": 3.1867496967315674, "lr": 0.00012583553211871945, "tps": 146595, "wall": 9357.7} {"step": 20932, "train_loss": 3.1760120391845703, "lr": 0.0001258192052610772, "tps": 146527, "wall": 9362.5} {"step": 20933, "train_loss": 3.211977958679199, "lr": 0.0001258028794703201, "tps": 146460, "wall": 9367.3} {"step": 20934, "train_loss": 3.3225154876708984, "lr": 0.00012578655474663312, "tps": 146392, "wall": 9372.0} {"step": 20935, "train_loss": 3.2517223358154297, "lr": 0.00012577023109020108, "tps": 146325, "wall": 9376.8} {"step": 20936, "train_loss": 3.1874709129333496, "lr": 0.00012575390850120898, "tps": 146258, "wall": 9381.5} {"step": 20937, "train_loss": 3.277486801147461, "lr": 0.00012573758697984175, "tps": 146191, "wall": 9386.3} {"step": 20938, "train_loss": 3.2458548545837402, "lr": 0.00012572126652628414, "tps": 146124, "wall": 9391.0} {"step": 20939, "train_loss": 3.2621936798095703, "lr": 0.00012570494714072124, "tps": 146056, "wall": 9395.9} {"step": 20940, "train_loss": 3.234717845916748, "lr": 0.00012568862882333774, "tps": 145988, "wall": 9400.7} {"step": 20941, "train_loss": 3.1253366470336914, "lr": 0.0001256723115743185, "tps": 145921, "wall": 9405.4} {"step": 20942, "train_loss": 3.1977338790893555, "lr": 0.00012565599539384853, "tps": 145854, "wall": 9410.2} {"step": 20943, "train_loss": 3.1914825439453125, "lr": 0.00012563968028211242, "tps": 145788, "wall": 9414.9} {"step": 20944, "train_loss": 3.1480813026428223, "lr": 0.0001256233662392952, "tps": 145721, "wall": 9419.7} {"step": 20945, "train_loss": 3.149245262145996, "lr": 0.0001256070532655816, "tps": 145655, "wall": 9424.4} {"step": 20946, "train_loss": 3.175133228302002, "lr": 0.00012559074136115635, "tps": 145588, "wall": 9429.2} {"step": 20947, "train_loss": 3.1400296688079834, "lr": 0.00012557443052620436, "tps": 145522, "wall": 9433.9} {"step": 20948, "train_loss": 3.2504305839538574, "lr": 0.0001255581207609103, "tps": 145455, "wall": 9438.7} {"step": 20949, "train_loss": 3.202255964279175, "lr": 0.00012554181206545891, "tps": 145389, "wall": 9443.5} {"step": 20950, "train_loss": 3.2751028537750244, "lr": 0.00012552550444003505, "tps": 145323, "wall": 9448.2} {"step": 20951, "train_loss": 3.1720023155212402, "lr": 0.00012550919788482338, "tps": 145256, "wall": 9453.0} {"step": 20952, "train_loss": 3.242668628692627, "lr": 0.0001254928924000086, "tps": 145189, "wall": 9457.8} {"step": 20953, "train_loss": 3.1067285537719727, "lr": 0.00012547658798577546, "tps": 145123, "wall": 9462.6} {"step": 20954, "train_loss": 3.19991397857666, "lr": 0.00012546028464230865, "tps": 145057, "wall": 9467.3} {"step": 20955, "train_loss": 3.151646852493286, "lr": 0.0001254439823697928, "tps": 144991, "wall": 9472.1} {"step": 20956, "train_loss": 3.1984682083129883, "lr": 0.00012542768116841272, "tps": 144925, "wall": 9476.9} {"step": 20957, "train_loss": 3.1800408363342285, "lr": 0.00012541138103835294, "tps": 144859, "wall": 9481.6} {"step": 20958, "train_loss": 3.23445200920105, "lr": 0.00012539508197979813, "tps": 144794, "wall": 9486.3} {"step": 20959, "train_loss": 3.179119110107422, "lr": 0.000125378783992933, "tps": 144728, "wall": 9491.1} {"step": 20960, "train_loss": 3.230145215988159, "lr": 0.0001253624870779421, "tps": 144663, "wall": 9495.8} {"step": 20961, "train_loss": 3.2151942253112793, "lr": 0.00012534619123501, "tps": 144597, "wall": 9500.6} {"step": 20962, "train_loss": 3.3130698204040527, "lr": 0.00012532989646432148, "tps": 144532, "wall": 9505.4} {"step": 20963, "train_loss": 3.157508611679077, "lr": 0.0001253136027660609, "tps": 144467, "wall": 9510.1} {"step": 20964, "train_loss": 3.216676950454712, "lr": 0.00012529731014041304, "tps": 144400, "wall": 9514.9} {"step": 20965, "train_loss": 3.19075083732605, "lr": 0.00012528101858756238, "tps": 144335, "wall": 9519.7} {"step": 20966, "train_loss": 3.2370455265045166, "lr": 0.0001252647281076934, "tps": 144270, "wall": 9524.4} {"step": 20967, "train_loss": 3.2359843254089355, "lr": 0.00012524843870099074, "tps": 144205, "wall": 9529.2} {"step": 20968, "train_loss": 3.101543664932251, "lr": 0.00012523215036763894, "tps": 144140, "wall": 9533.9} {"step": 20969, "train_loss": 3.195937395095825, "lr": 0.00012521586310782235, "tps": 144075, "wall": 9538.7} {"step": 20970, "train_loss": 3.136078357696533, "lr": 0.0001251995769217257, "tps": 144010, "wall": 9543.4} {"step": 20971, "train_loss": 3.28680419921875, "lr": 0.00012518329180953334, "tps": 143945, "wall": 9548.2} {"step": 20972, "train_loss": 3.132467746734619, "lr": 0.00012516700777142972, "tps": 143881, "wall": 9552.9} {"step": 20973, "train_loss": 3.336954355239868, "lr": 0.00012515072480759947, "tps": 143816, "wall": 9557.7} {"step": 20974, "train_loss": 3.230764150619507, "lr": 0.0001251344429182269, "tps": 143751, "wall": 9562.4} {"step": 20975, "train_loss": 3.2175769805908203, "lr": 0.00012511816210349641, "tps": 143686, "wall": 9567.2} {"step": 20976, "train_loss": 3.2187132835388184, "lr": 0.00012510188236359264, "tps": 143622, "wall": 9572.0} {"step": 20977, "train_loss": 3.146336555480957, "lr": 0.00012508560369869982, "tps": 143556, "wall": 9576.8} {"step": 20978, "train_loss": 3.2876431941986084, "lr": 0.00012506932610900238, "tps": 143492, "wall": 9581.5} {"step": 20979, "train_loss": 3.15682315826416, "lr": 0.0001250530495946848, "tps": 143428, "wall": 9586.3} {"step": 20980, "train_loss": 3.239483594894409, "lr": 0.0001250367741559314, "tps": 143363, "wall": 9591.1} {"step": 20981, "train_loss": 3.175149917602539, "lr": 0.00012502049979292655, "tps": 143299, "wall": 9595.8} {"step": 20982, "train_loss": 3.2593512535095215, "lr": 0.00012500422650585464, "tps": 143235, "wall": 9600.6} {"step": 20983, "train_loss": 3.1915581226348877, "lr": 0.00012498795429489995, "tps": 143171, "wall": 9605.3} {"step": 20984, "train_loss": 3.1677401065826416, "lr": 0.0001249716831602469, "tps": 143107, "wall": 9610.1} {"step": 20985, "train_loss": 3.159802198410034, "lr": 0.00012495541310207978, "tps": 143043, "wall": 9614.8} {"step": 20986, "train_loss": 3.2755937576293945, "lr": 0.00012493914412058275, "tps": 142979, "wall": 9619.6} {"step": 20987, "train_loss": 3.2787351608276367, "lr": 0.00012492287621594037, "tps": 142915, "wall": 9624.3} {"step": 20988, "train_loss": 3.288628101348877, "lr": 0.00012490660938833682, "tps": 142851, "wall": 9629.1} {"step": 20989, "train_loss": 3.265063524246216, "lr": 0.00012489034363795626, "tps": 142788, "wall": 9633.8} {"step": 20990, "train_loss": 3.1480021476745605, "lr": 0.00012487407896498312, "tps": 142723, "wall": 9638.7} {"step": 20991, "train_loss": 3.2417330741882324, "lr": 0.00012485781536960143, "tps": 142660, "wall": 9643.4} {"step": 20992, "train_loss": 3.169431209564209, "lr": 0.00012484155285199565, "tps": 142596, "wall": 9648.2} {"step": 20993, "train_loss": 3.244352340698242, "lr": 0.00012482529141234988, "tps": 142533, "wall": 9652.9} {"step": 20994, "train_loss": 3.17659592628479, "lr": 0.0001248090310508483, "tps": 142469, "wall": 9657.7} {"step": 20995, "train_loss": 3.166095495223999, "lr": 0.00012479277176767525, "tps": 142406, "wall": 9662.4} {"step": 20996, "train_loss": 3.2812397480010986, "lr": 0.00012477651356301484, "tps": 142343, "wall": 9667.2} {"step": 20997, "train_loss": 3.147313117980957, "lr": 0.00012476025643705114, "tps": 142279, "wall": 9672.0} {"step": 20998, "train_loss": 3.318089246749878, "lr": 0.00012474400038996848, "tps": 142216, "wall": 9676.7} {"step": 20999, "train_loss": 3.2246901988983154, "lr": 0.00012472774542195096, "tps": 142153, "wall": 9681.5} {"step": 21000, "train_loss": 3.2413811683654785, "lr": 0.00012471149153318257, "tps": 142089, "wall": 9686.3, "val_loss_monitor": 3.3743893812232275} {"step": 21001, "train_loss": 3.1414949893951416, "lr": 0.0001246952387238477, "tps": 141342, "wall": 9737.9} {"step": 21002, "train_loss": 3.1661603450775146, "lr": 0.00012467898699413028, "tps": 141280, "wall": 9742.7} {"step": 21003, "train_loss": 3.1176390647888184, "lr": 0.00012466273634421438, "tps": 141217, "wall": 9747.5} {"step": 21004, "train_loss": 3.223235607147217, "lr": 0.00012464648677428425, "tps": 141155, "wall": 9752.3} {"step": 21005, "train_loss": 3.155801296234131, "lr": 0.0001246302382845238, "tps": 141092, "wall": 9757.1} {"step": 21006, "train_loss": 3.3176777362823486, "lr": 0.00012461399087511724, "tps": 141030, "wall": 9761.8} {"step": 21007, "train_loss": 3.3044095039367676, "lr": 0.00012459774454624855, "tps": 140968, "wall": 9766.6} {"step": 21008, "train_loss": 3.2461187839508057, "lr": 0.0001245814992981017, "tps": 140907, "wall": 9771.3} {"step": 21009, "train_loss": 3.2263097763061523, "lr": 0.00012456525513086087, "tps": 140845, "wall": 9776.1} {"step": 21010, "train_loss": 3.126614570617676, "lr": 0.00012454901204470996, "tps": 140783, "wall": 9780.8} {"step": 21011, "train_loss": 3.245187759399414, "lr": 0.00012453277003983296, "tps": 140722, "wall": 9785.5} {"step": 21012, "train_loss": 3.0272607803344727, "lr": 0.00012451652911641398, "tps": 140660, "wall": 9790.3} {"step": 21013, "train_loss": 3.2107300758361816, "lr": 0.00012450028927463692, "tps": 140599, "wall": 9795.0} {"step": 21014, "train_loss": 3.1951489448547363, "lr": 0.00012448405051468565, "tps": 140537, "wall": 9799.8} {"step": 21015, "train_loss": 3.1533870697021484, "lr": 0.00012446781283674432, "tps": 140475, "wall": 9804.6} {"step": 21016, "train_loss": 3.134713649749756, "lr": 0.0001244515762409968, "tps": 140414, "wall": 9809.3} {"step": 21017, "train_loss": 3.1562881469726562, "lr": 0.00012443534072762688, "tps": 140353, "wall": 9814.1} {"step": 21018, "train_loss": 3.1408731937408447, "lr": 0.00012441910629681867, "tps": 140291, "wall": 9818.9} {"step": 21019, "train_loss": 3.2273895740509033, "lr": 0.000124402872948756, "tps": 140230, "wall": 9823.6} {"step": 21020, "train_loss": 3.2382516860961914, "lr": 0.0001243866406836227, "tps": 140169, "wall": 9828.4} {"step": 21021, "train_loss": 3.3683812618255615, "lr": 0.00012437040950160277, "tps": 140107, "wall": 9833.2} {"step": 21022, "train_loss": 3.2318825721740723, "lr": 0.00012435417940287992, "tps": 140046, "wall": 9837.9} {"step": 21023, "train_loss": 3.3461992740631104, "lr": 0.00012433795038763822, "tps": 139985, "wall": 9842.7} {"step": 21024, "train_loss": 3.21915864944458, "lr": 0.00012432172245606136, "tps": 139924, "wall": 9847.4} {"step": 21025, "train_loss": 3.2291407585144043, "lr": 0.0001243054956083331, "tps": 139863, "wall": 9852.2} {"step": 21026, "train_loss": 3.2768514156341553, "lr": 0.0001242892698446375, "tps": 139803, "wall": 9856.9} {"step": 21027, "train_loss": 3.1653661727905273, "lr": 0.00012427304516515817, "tps": 139742, "wall": 9861.6} {"step": 21028, "train_loss": 3.189826011657715, "lr": 0.00012425682157007895, "tps": 139681, "wall": 9866.4} {"step": 21029, "train_loss": 3.2073028087615967, "lr": 0.00012424059905958367, "tps": 139621, "wall": 9871.2} {"step": 21030, "train_loss": 3.1858105659484863, "lr": 0.00012422437763385608, "tps": 139559, "wall": 9876.0} {"step": 21031, "train_loss": 3.18884539604187, "lr": 0.00012420815729307985, "tps": 139498, "wall": 9880.8} {"step": 21032, "train_loss": 3.33022141456604, "lr": 0.00012419193803743885, "tps": 139438, "wall": 9885.5} {"step": 21033, "train_loss": 3.2186732292175293, "lr": 0.00012417571986711676, "tps": 139377, "wall": 9890.3} {"step": 21034, "train_loss": 3.1457080841064453, "lr": 0.00012415950278229723, "tps": 139317, "wall": 9895.0} {"step": 21035, "train_loss": 3.217036724090576, "lr": 0.00012414328678316415, "tps": 139257, "wall": 9899.8} {"step": 21036, "train_loss": 3.2493491172790527, "lr": 0.00012412707186990103, "tps": 139196, "wall": 9904.5} {"step": 21037, "train_loss": 3.120047092437744, "lr": 0.00012411085804269162, "tps": 139136, "wall": 9909.3} {"step": 21038, "train_loss": 3.2115378379821777, "lr": 0.00012409464530171963, "tps": 139076, "wall": 9914.0} {"step": 21039, "train_loss": 3.1915841102600098, "lr": 0.00012407843364716862, "tps": 139016, "wall": 9918.8} {"step": 21040, "train_loss": 3.1761298179626465, "lr": 0.00012406222307922236, "tps": 138956, "wall": 9923.5} {"step": 21041, "train_loss": 3.220282793045044, "lr": 0.00012404601359806446, "tps": 138896, "wall": 9928.3} {"step": 21042, "train_loss": 3.1486093997955322, "lr": 0.00012402980520387843, "tps": 138837, "wall": 9933.0} {"step": 21043, "train_loss": 3.2272019386291504, "lr": 0.00012401359789684805, "tps": 138776, "wall": 9937.8} {"step": 21044, "train_loss": 3.121610641479492, "lr": 0.00012399739167715678, "tps": 138716, "wall": 9942.6} {"step": 21045, "train_loss": 3.2291948795318604, "lr": 0.0001239811865449882, "tps": 138656, "wall": 9947.4} {"step": 21046, "train_loss": 3.2208521366119385, "lr": 0.000123964982500526, "tps": 138597, "wall": 9952.1} {"step": 21047, "train_loss": 3.1666951179504395, "lr": 0.0001239487795439537, "tps": 138537, "wall": 9956.9} {"step": 21048, "train_loss": 3.1925277709960938, "lr": 0.00012393257767545472, "tps": 138478, "wall": 9961.6} {"step": 21049, "train_loss": 3.242249011993408, "lr": 0.00012391637689521278, "tps": 138418, "wall": 9966.4} {"step": 21050, "train_loss": 3.1577272415161133, "lr": 0.00012390017720341132, "tps": 138359, "wall": 9971.1} {"step": 21051, "train_loss": 3.3149242401123047, "lr": 0.00012388397860023379, "tps": 138300, "wall": 9975.9} {"step": 21052, "train_loss": 3.2025890350341797, "lr": 0.00012386778108586382, "tps": 138240, "wall": 9980.7} {"step": 21053, "train_loss": 3.1623964309692383, "lr": 0.0001238515846604848, "tps": 138181, "wall": 9985.4} {"step": 21054, "train_loss": 3.2468392848968506, "lr": 0.00012383538932428018, "tps": 138122, "wall": 9990.1} {"step": 21055, "train_loss": 3.2199506759643555, "lr": 0.00012381919507743354, "tps": 138062, "wall": 9995.0} {"step": 21056, "train_loss": 3.2599759101867676, "lr": 0.00012380300192012825, "tps": 138003, "wall": 9999.7} {"step": 21057, "train_loss": 3.0767626762390137, "lr": 0.0001237868098525477, "tps": 137944, "wall": 10004.5} {"step": 21058, "train_loss": 3.2004098892211914, "lr": 0.00012377061887487546, "tps": 137885, "wall": 10009.2} {"step": 21059, "train_loss": 3.304469347000122, "lr": 0.00012375442898729478, "tps": 137825, "wall": 10014.0} {"step": 21060, "train_loss": 3.175568103790283, "lr": 0.00012373824018998918, "tps": 137766, "wall": 10018.8} {"step": 21061, "train_loss": 3.3042097091674805, "lr": 0.00012372205248314198, "tps": 137708, "wall": 10023.5} {"step": 21062, "train_loss": 3.113173246383667, "lr": 0.00012370586586693655, "tps": 137649, "wall": 10028.3} {"step": 21063, "train_loss": 3.230842113494873, "lr": 0.00012368968034155638, "tps": 137590, "wall": 10033.0} {"step": 21064, "train_loss": 3.237622022628784, "lr": 0.00012367349590718465, "tps": 137532, "wall": 10037.8} {"step": 21065, "train_loss": 3.1279547214508057, "lr": 0.00012365731256400476, "tps": 137473, "wall": 10042.5} {"step": 21066, "train_loss": 3.2922539710998535, "lr": 0.0001236411303122001, "tps": 137414, "wall": 10047.3} {"step": 21067, "train_loss": 3.2410011291503906, "lr": 0.00012362494915195389, "tps": 137356, "wall": 10052.1} {"step": 21068, "train_loss": 3.2759485244750977, "lr": 0.00012360876908344945, "tps": 137296, "wall": 10056.9} {"step": 21069, "train_loss": 3.1553795337677, "lr": 0.00012359259010687014, "tps": 137238, "wall": 10061.6} {"step": 21070, "train_loss": 3.277731418609619, "lr": 0.0001235764122223992, "tps": 137180, "wall": 10066.4} {"step": 21071, "train_loss": 3.273055076599121, "lr": 0.00012356023543021974, "tps": 137121, "wall": 10071.2} {"step": 21072, "train_loss": 3.1940715312957764, "lr": 0.0001235440597305153, "tps": 137063, "wall": 10075.9} {"step": 21073, "train_loss": 3.2198119163513184, "lr": 0.00012352788512346894, "tps": 137005, "wall": 10080.6} {"step": 21074, "train_loss": 3.266052722930908, "lr": 0.00012351171160926384, "tps": 136947, "wall": 10085.4} {"step": 21075, "train_loss": 3.1663007736206055, "lr": 0.0001234955391880834, "tps": 136889, "wall": 10090.2} {"step": 21076, "train_loss": 3.1994364261627197, "lr": 0.00012347936786011058, "tps": 136831, "wall": 10094.9} {"step": 21077, "train_loss": 3.168853521347046, "lr": 0.0001234631976255288, "tps": 136773, "wall": 10099.7} {"step": 21078, "train_loss": 3.3612735271453857, "lr": 0.00012344702848452116, "tps": 136715, "wall": 10104.4} {"step": 21079, "train_loss": 3.184464693069458, "lr": 0.00012343086043727072, "tps": 136658, "wall": 10109.2} {"step": 21080, "train_loss": 3.162910223007202, "lr": 0.0001234146934839608, "tps": 136600, "wall": 10113.9} {"step": 21081, "train_loss": 3.2286806106567383, "lr": 0.00012339852762477445, "tps": 136542, "wall": 10118.7} {"step": 21082, "train_loss": 3.148510456085205, "lr": 0.0001233823628598947, "tps": 136484, "wall": 10123.5} {"step": 21083, "train_loss": 3.1341185569763184, "lr": 0.0001233661991895049, "tps": 136427, "wall": 10128.2} {"step": 21084, "train_loss": 3.2627785205841064, "lr": 0.00012335003661378797, "tps": 136369, "wall": 10133.0} {"step": 21085, "train_loss": 3.202695846557617, "lr": 0.000123333875132927, "tps": 136312, "wall": 10137.7} {"step": 21086, "train_loss": 3.2025132179260254, "lr": 0.00012331771474710524, "tps": 136254, "wall": 10142.5} {"step": 21087, "train_loss": 3.086113214492798, "lr": 0.00012330155545650556, "tps": 136197, "wall": 10147.2} {"step": 21088, "train_loss": 3.2725014686584473, "lr": 0.00012328539726131108, "tps": 136139, "wall": 10152.0} {"step": 21089, "train_loss": 3.30767560005188, "lr": 0.00012326924016170486, "tps": 136082, "wall": 10156.7} {"step": 21090, "train_loss": 3.1847729682922363, "lr": 0.00012325308415786997, "tps": 136025, "wall": 10161.5} {"step": 21091, "train_loss": 3.1946794986724854, "lr": 0.0001232369292499893, "tps": 135968, "wall": 10166.2} {"step": 21092, "train_loss": 3.325294017791748, "lr": 0.000123220775438246, "tps": 135911, "wall": 10171.0} {"step": 21093, "train_loss": 3.2027435302734375, "lr": 0.00012320462272282293, "tps": 135852, "wall": 10175.8} {"step": 21094, "train_loss": 3.231304168701172, "lr": 0.00012318847110390316, "tps": 135795, "wall": 10180.6} {"step": 21095, "train_loss": 3.259477138519287, "lr": 0.00012317232058166967, "tps": 135739, "wall": 10185.3} {"step": 21096, "train_loss": 3.2472331523895264, "lr": 0.0001231561711563053, "tps": 135682, "wall": 10190.1} {"step": 21097, "train_loss": 3.2023510932922363, "lr": 0.0001231400228279931, "tps": 135625, "wall": 10194.8} {"step": 21098, "train_loss": 3.23830509185791, "lr": 0.000123123875596916, "tps": 135568, "wall": 10199.6} {"step": 21099, "train_loss": 3.140645980834961, "lr": 0.00012310772946325677, "tps": 135512, "wall": 10204.3} {"step": 21100, "train_loss": 3.2042336463928223, "lr": 0.0001230915844271985, "tps": 135455, "wall": 10209.1} {"step": 21101, "train_loss": 3.2011303901672363, "lr": 0.000123075440488924, "tps": 135398, "wall": 10213.8} {"step": 21102, "train_loss": 3.259782075881958, "lr": 0.00012305929764861614, "tps": 135342, "wall": 10218.6} {"step": 21103, "train_loss": 3.229660987854004, "lr": 0.0001230431559064578, "tps": 135285, "wall": 10223.4} {"step": 21104, "train_loss": 3.1897854804992676, "lr": 0.0001230270152626319, "tps": 135228, "wall": 10228.1} {"step": 21105, "train_loss": 3.23950457572937, "lr": 0.0001230108757173211, "tps": 135172, "wall": 10232.9} {"step": 21106, "train_loss": 3.1927852630615234, "lr": 0.0001229947372707084, "tps": 135115, "wall": 10237.7} {"step": 21107, "train_loss": 3.100492477416992, "lr": 0.00012297859992297663, "tps": 135058, "wall": 10242.4} {"step": 21108, "train_loss": 3.1249704360961914, "lr": 0.00012296246367430843, "tps": 135002, "wall": 10247.2} {"step": 21109, "train_loss": 3.227090358734131, "lr": 0.0001229463285248867, "tps": 134946, "wall": 10252.0} {"step": 21110, "train_loss": 3.252760887145996, "lr": 0.0001229301944748943, "tps": 134890, "wall": 10256.7} {"step": 21111, "train_loss": 3.156312942504883, "lr": 0.0001229140615245138, "tps": 134833, "wall": 10261.5} {"step": 21112, "train_loss": 3.2051727771759033, "lr": 0.00012289792967392813, "tps": 134777, "wall": 10266.2} {"step": 21113, "train_loss": 3.2436344623565674, "lr": 0.0001228817989233199, "tps": 134721, "wall": 10271.0} {"step": 21114, "train_loss": 3.1647181510925293, "lr": 0.00012286566927287198, "tps": 134665, "wall": 10275.7} {"step": 21115, "train_loss": 3.267975330352783, "lr": 0.000122849540722767, "tps": 134609, "wall": 10280.5} {"step": 21116, "train_loss": 3.1264171600341797, "lr": 0.00012283341327318765, "tps": 134553, "wall": 10285.3} {"step": 21117, "train_loss": 3.2082736492156982, "lr": 0.00012281728692431666, "tps": 134497, "wall": 10290.0} {"step": 21118, "train_loss": 3.349858283996582, "lr": 0.00012280116167633673, "tps": 134440, "wall": 10294.9} {"step": 21119, "train_loss": 3.1376700401306152, "lr": 0.00012278503752943042, "tps": 134385, "wall": 10299.6} {"step": 21120, "train_loss": 3.272181749343872, "lr": 0.00012276891448378057, "tps": 134330, "wall": 10304.4} {"step": 21121, "train_loss": 3.2171642780303955, "lr": 0.00012275279253956968, "tps": 134274, "wall": 10309.1} {"step": 21122, "train_loss": 3.089168071746826, "lr": 0.00012273667169698034, "tps": 134218, "wall": 10313.9} {"step": 21123, "train_loss": 3.1984736919403076, "lr": 0.00012272055195619537, "tps": 134163, "wall": 10318.6} {"step": 21124, "train_loss": 3.191232204437256, "lr": 0.0001227044333173972, "tps": 134108, "wall": 10323.4} {"step": 21125, "train_loss": 3.2110819816589355, "lr": 0.0001226883157807684, "tps": 134052, "wall": 10328.1} {"step": 21126, "train_loss": 3.1996116638183594, "lr": 0.00012267219934649173, "tps": 133997, "wall": 10332.9} {"step": 21127, "train_loss": 3.2066240310668945, "lr": 0.00012265608401474962, "tps": 133942, "wall": 10337.6} {"step": 21128, "train_loss": 3.2115719318389893, "lr": 0.00012263996978572461, "tps": 133887, "wall": 10342.4} {"step": 21129, "train_loss": 3.163719654083252, "lr": 0.00012262385665959933, "tps": 133831, "wall": 10347.1} {"step": 21130, "train_loss": 3.2491111755371094, "lr": 0.0001226077446365562, "tps": 133776, "wall": 10351.9} {"step": 21131, "train_loss": 3.2778799533843994, "lr": 0.0001225916337167779, "tps": 133720, "wall": 10356.7} {"step": 21132, "train_loss": 3.2158689498901367, "lr": 0.00012257552390044683, "tps": 133665, "wall": 10361.5} {"step": 21133, "train_loss": 3.1074917316436768, "lr": 0.00012255941518774546, "tps": 133610, "wall": 10366.2} {"step": 21134, "train_loss": 3.164573907852173, "lr": 0.00012254330757885631, "tps": 133555, "wall": 10371.0} {"step": 21135, "train_loss": 3.2432799339294434, "lr": 0.00012252720107396188, "tps": 133500, "wall": 10375.7} {"step": 21136, "train_loss": 3.219557762145996, "lr": 0.00012251109567324453, "tps": 133445, "wall": 10380.5} {"step": 21137, "train_loss": 3.3270773887634277, "lr": 0.00012249499137688682, "tps": 133391, "wall": 10385.3} {"step": 21138, "train_loss": 3.2968995571136475, "lr": 0.00012247888818507115, "tps": 133336, "wall": 10390.0} {"step": 21139, "train_loss": 3.2181971073150635, "lr": 0.0001224627860979798, "tps": 133281, "wall": 10394.8} {"step": 21140, "train_loss": 3.1550912857055664, "lr": 0.00012244668511579538, "tps": 133227, "wall": 10399.5} {"step": 21141, "train_loss": 3.1548011302948, "lr": 0.00012243058523870017, "tps": 133172, "wall": 10404.3} {"step": 21142, "train_loss": 3.220107078552246, "lr": 0.0001224144864668765, "tps": 133117, "wall": 10409.0} {"step": 21143, "train_loss": 3.147615909576416, "lr": 0.00012239838880050692, "tps": 133063, "wall": 10413.8} {"step": 21144, "train_loss": 3.241300582885742, "lr": 0.00012238229223977362, "tps": 133008, "wall": 10418.6} {"step": 21145, "train_loss": 3.186167001724243, "lr": 0.00012236619678485894, "tps": 132953, "wall": 10423.3} {"step": 21146, "train_loss": 3.2381882667541504, "lr": 0.00012235010243594533, "tps": 132899, "wall": 10428.1} {"step": 21147, "train_loss": 3.372809886932373, "lr": 0.000122334009193215, "tps": 132845, "wall": 10432.9} {"step": 21148, "train_loss": 3.2532734870910645, "lr": 0.00012231791705685034, "tps": 132791, "wall": 10437.6} {"step": 21149, "train_loss": 3.1786351203918457, "lr": 0.00012230182602703362, "tps": 132736, "wall": 10442.4} {"step": 21150, "train_loss": 3.1913444995880127, "lr": 0.000122285736103947, "tps": 132682, "wall": 10447.1} {"step": 21151, "train_loss": 3.1225905418395996, "lr": 0.00012226964728777296, "tps": 132628, "wall": 10451.8} {"step": 21152, "train_loss": 3.2770981788635254, "lr": 0.00012225355957869359, "tps": 132575, "wall": 10456.6} {"step": 21153, "train_loss": 3.2313766479492188, "lr": 0.00012223747297689116, "tps": 132520, "wall": 10461.4} {"step": 21154, "train_loss": 3.2747957706451416, "lr": 0.00012222138748254797, "tps": 132466, "wall": 10466.1} {"step": 21155, "train_loss": 3.1863412857055664, "lr": 0.00012220530309584618, "tps": 132413, "wall": 10470.9} {"step": 21156, "train_loss": 3.2478487491607666, "lr": 0.00012218921981696805, "tps": 132358, "wall": 10475.7} {"step": 21157, "train_loss": 3.221402168273926, "lr": 0.00012217313764609572, "tps": 132304, "wall": 10480.4} {"step": 21158, "train_loss": 3.119091272354126, "lr": 0.00012215705658341129, "tps": 132250, "wall": 10485.2} {"step": 21159, "train_loss": 3.241304397583008, "lr": 0.00012214097662909709, "tps": 132197, "wall": 10490.0} {"step": 21160, "train_loss": 3.1900575160980225, "lr": 0.0001221248977833352, "tps": 132143, "wall": 10494.7} {"step": 21161, "train_loss": 3.2858195304870605, "lr": 0.0001221088200463077, "tps": 132089, "wall": 10499.5} {"step": 21162, "train_loss": 3.208690643310547, "lr": 0.00012209274341819684, "tps": 132036, "wall": 10504.2} {"step": 21163, "train_loss": 3.2011899948120117, "lr": 0.0001220766678991847, "tps": 131983, "wall": 10509.0} {"step": 21164, "train_loss": 3.213325262069702, "lr": 0.0001220605934894533, "tps": 131929, "wall": 10513.7} {"step": 21165, "train_loss": 3.2004785537719727, "lr": 0.00012204452018918482, "tps": 131876, "wall": 10518.5} {"step": 21166, "train_loss": 3.2350006103515625, "lr": 0.00012202844799856135, "tps": 131822, "wall": 10523.2} {"step": 21167, "train_loss": 3.147771120071411, "lr": 0.00012201237691776483, "tps": 131769, "wall": 10528.0} {"step": 21168, "train_loss": 3.1898858547210693, "lr": 0.00012199630694697748, "tps": 131716, "wall": 10532.7} {"step": 21169, "train_loss": 3.160799980163574, "lr": 0.00012198023808638128, "tps": 131662, "wall": 10537.5} {"step": 21170, "train_loss": 3.123119354248047, "lr": 0.00012196417033615817, "tps": 131609, "wall": 10542.3} {"step": 21171, "train_loss": 3.275782823562622, "lr": 0.00012194810369649032, "tps": 131556, "wall": 10547.0} {"step": 21172, "train_loss": 3.2202460765838623, "lr": 0.00012193203816755958, "tps": 131503, "wall": 10551.8} {"step": 21173, "train_loss": 3.1496922969818115, "lr": 0.00012191597374954806, "tps": 131449, "wall": 10556.6} {"step": 21174, "train_loss": 3.273519515991211, "lr": 0.00012189991044263774, "tps": 131397, "wall": 10561.3} {"step": 21175, "train_loss": 3.1384811401367188, "lr": 0.00012188384824701047, "tps": 131344, "wall": 10566.1} {"step": 21176, "train_loss": 3.2397217750549316, "lr": 0.00012186778716284832, "tps": 131291, "wall": 10570.8} {"step": 21177, "train_loss": 3.2442641258239746, "lr": 0.00012185172719033317, "tps": 131238, "wall": 10575.6} {"step": 21178, "train_loss": 3.1888136863708496, "lr": 0.00012183566832964694, "tps": 131185, "wall": 10580.3} {"step": 21179, "train_loss": 3.2480628490448, "lr": 0.0001218196105809716, "tps": 131133, "wall": 10585.1} {"step": 21180, "train_loss": 3.2011349201202393, "lr": 0.00012180355394448906, "tps": 131080, "wall": 10589.8} {"step": 21181, "train_loss": 3.122347831726074, "lr": 0.00012178749842038106, "tps": 131027, "wall": 10594.6} {"step": 21182, "train_loss": 3.192446708679199, "lr": 0.0001217714440088297, "tps": 130974, "wall": 10599.4} {"step": 21183, "train_loss": 3.1422007083892822, "lr": 0.00012175539071001671, "tps": 130921, "wall": 10604.2} {"step": 21184, "train_loss": 3.248000144958496, "lr": 0.00012173933852412394, "tps": 130869, "wall": 10608.9} {"step": 21185, "train_loss": 3.273139476776123, "lr": 0.00012172328745133328, "tps": 130816, "wall": 10613.7} {"step": 21186, "train_loss": 3.2380118370056152, "lr": 0.00012170723749182653, "tps": 130764, "wall": 10618.4} {"step": 21187, "train_loss": 3.1094002723693848, "lr": 0.00012169118864578549, "tps": 130711, "wall": 10623.2} {"step": 21188, "train_loss": 3.2244420051574707, "lr": 0.00012167514091339203, "tps": 130659, "wall": 10627.9} {"step": 21189, "train_loss": 3.2685470581054688, "lr": 0.0001216590942948279, "tps": 130607, "wall": 10632.7} {"step": 21190, "train_loss": 3.2129435539245605, "lr": 0.0001216430487902748, "tps": 130555, "wall": 10637.4} {"step": 21191, "train_loss": 3.197504997253418, "lr": 0.00012162700439991459, "tps": 130503, "wall": 10642.2} {"step": 21192, "train_loss": 3.246663808822632, "lr": 0.00012161096112392898, "tps": 130451, "wall": 10646.9} {"step": 21193, "train_loss": 3.24788236618042, "lr": 0.00012159491896249977, "tps": 130398, "wall": 10651.7} {"step": 21194, "train_loss": 3.2385640144348145, "lr": 0.00012157887791580866, "tps": 130346, "wall": 10656.5} {"step": 21195, "train_loss": 3.172478199005127, "lr": 0.00012156283798403728, "tps": 130294, "wall": 10661.3} {"step": 21196, "train_loss": 3.1840670108795166, "lr": 0.00012154679916736745, "tps": 130242, "wall": 10666.0} {"step": 21197, "train_loss": 3.2675225734710693, "lr": 0.00012153076146598079, "tps": 130190, "wall": 10670.8} {"step": 21198, "train_loss": 3.1469240188598633, "lr": 0.00012151472488005895, "tps": 130138, "wall": 10675.5} {"step": 21199, "train_loss": 3.280050754547119, "lr": 0.00012149868940978369, "tps": 130086, "wall": 10680.3} {"step": 21200, "train_loss": 3.1439919471740723, "lr": 0.0001214826550553366, "tps": 130034, "wall": 10685.1} {"step": 21201, "train_loss": 3.193413257598877, "lr": 0.00012146662181689927, "tps": 129983, "wall": 10689.8} {"step": 21202, "train_loss": 3.2687017917633057, "lr": 0.00012145058969465344, "tps": 129931, "wall": 10694.6} {"step": 21203, "train_loss": 3.23435640335083, "lr": 0.00012143455868878064, "tps": 129879, "wall": 10699.3} {"step": 21204, "train_loss": 3.217231273651123, "lr": 0.00012141852879946248, "tps": 129828, "wall": 10704.1} {"step": 21205, "train_loss": 3.2162508964538574, "lr": 0.00012140250002688058, "tps": 129776, "wall": 10708.8} {"step": 21206, "train_loss": 3.2080225944519043, "lr": 0.0001213864723712165, "tps": 129725, "wall": 10713.6} {"step": 21207, "train_loss": 3.189582347869873, "lr": 0.00012137044583265172, "tps": 129673, "wall": 10718.4} {"step": 21208, "train_loss": 3.16296124458313, "lr": 0.00012135442041136795, "tps": 129621, "wall": 10723.2} {"step": 21209, "train_loss": 3.1973791122436523, "lr": 0.00012133839610754658, "tps": 129570, "wall": 10727.9} {"step": 21210, "train_loss": 3.18428111076355, "lr": 0.00012132237292136926, "tps": 129518, "wall": 10732.7} {"step": 21211, "train_loss": 3.169351816177368, "lr": 0.00012130635085301742, "tps": 129467, "wall": 10737.5} {"step": 21212, "train_loss": 3.225834608078003, "lr": 0.00012129032990267253, "tps": 129416, "wall": 10742.2} {"step": 21213, "train_loss": 3.265120029449463, "lr": 0.00012127431007051617, "tps": 129364, "wall": 10747.0} {"step": 21214, "train_loss": 3.1326210498809814, "lr": 0.0001212582913567298, "tps": 129313, "wall": 10751.7} {"step": 21215, "train_loss": 3.176901340484619, "lr": 0.00012124227376149474, "tps": 129262, "wall": 10756.5} {"step": 21216, "train_loss": 3.249265670776367, "lr": 0.00012122625728499264, "tps": 129211, "wall": 10761.3} {"step": 21217, "train_loss": 3.1636931896209717, "lr": 0.00012121024192740483, "tps": 129160, "wall": 10766.0} {"step": 21218, "train_loss": 3.217471122741699, "lr": 0.00012119422768891269, "tps": 129109, "wall": 10770.8} {"step": 21219, "train_loss": 3.1512346267700195, "lr": 0.00012117821456969771, "tps": 129057, "wall": 10775.6} {"step": 21220, "train_loss": 3.1674964427948, "lr": 0.0001211622025699413, "tps": 129007, "wall": 10780.3} {"step": 21221, "train_loss": 3.2963547706604004, "lr": 0.00012114619168982473, "tps": 128956, "wall": 10785.1} {"step": 21222, "train_loss": 3.139901876449585, "lr": 0.00012113018192952953, "tps": 128905, "wall": 10789.8} {"step": 21223, "train_loss": 3.0344924926757812, "lr": 0.00012111417328923696, "tps": 128855, "wall": 10794.6} {"step": 21224, "train_loss": 3.1438026428222656, "lr": 0.00012109816576912831, "tps": 128804, "wall": 10799.3} {"step": 21225, "train_loss": 3.189706802368164, "lr": 0.00012108215936938507, "tps": 128754, "wall": 10804.1} {"step": 21226, "train_loss": 3.253920555114746, "lr": 0.00012106615409018843, "tps": 128703, "wall": 10808.8} {"step": 21227, "train_loss": 3.143179416656494, "lr": 0.00012105014993171979, "tps": 128653, "wall": 10813.6} {"step": 21228, "train_loss": 3.3405604362487793, "lr": 0.00012103414689416039, "tps": 128602, "wall": 10818.3} {"step": 21229, "train_loss": 3.1682233810424805, "lr": 0.00012101814497769149, "tps": 128551, "wall": 10823.1} {"step": 21230, "train_loss": 3.14495587348938, "lr": 0.0001210021441824945, "tps": 128501, "wall": 10827.9} {"step": 21231, "train_loss": 3.162968158721924, "lr": 0.0001209861445087505, "tps": 128451, "wall": 10832.6} {"step": 21232, "train_loss": 3.0680489540100098, "lr": 0.00012097014595664078, "tps": 128400, "wall": 10837.4} {"step": 21233, "train_loss": 3.068777561187744, "lr": 0.00012095414852634668, "tps": 128350, "wall": 10842.1} {"step": 21234, "train_loss": 3.274592399597168, "lr": 0.00012093815221804932, "tps": 128299, "wall": 10846.9} {"step": 21235, "train_loss": 3.245940685272217, "lr": 0.00012092215703192988, "tps": 128249, "wall": 10851.6} {"step": 21236, "train_loss": 3.164155960083008, "lr": 0.00012090616296816968, "tps": 128199, "wall": 10856.4} {"step": 21237, "train_loss": 3.2639660835266113, "lr": 0.0001208901700269498, "tps": 128149, "wall": 10861.1} {"step": 21238, "train_loss": 3.2515883445739746, "lr": 0.0001208741782084514, "tps": 128099, "wall": 10865.9} {"step": 21239, "train_loss": 3.2714691162109375, "lr": 0.00012085818751285571, "tps": 128049, "wall": 10870.6} {"step": 21240, "train_loss": 3.2770919799804688, "lr": 0.00012084219794034386, "tps": 127999, "wall": 10875.4} {"step": 21241, "train_loss": 3.2038679122924805, "lr": 0.00012082620949109689, "tps": 127949, "wall": 10880.2} {"step": 21242, "train_loss": 3.2277493476867676, "lr": 0.00012081022216529602, "tps": 127899, "wall": 10884.9} {"step": 21243, "train_loss": 3.25758957862854, "lr": 0.00012079423596312234, "tps": 127850, "wall": 10889.7} {"step": 21244, "train_loss": 3.2343311309814453, "lr": 0.00012077825088475685, "tps": 127800, "wall": 10894.4} {"step": 21245, "train_loss": 3.1394472122192383, "lr": 0.00012076226693038077, "tps": 127749, "wall": 10899.3} {"step": 21246, "train_loss": 3.1897099018096924, "lr": 0.00012074628410017505, "tps": 127700, "wall": 10904.0} {"step": 21247, "train_loss": 3.254587173461914, "lr": 0.00012073030239432084, "tps": 127650, "wall": 10908.7} {"step": 21248, "train_loss": 3.1935014724731445, "lr": 0.00012071432181299914, "tps": 127601, "wall": 10913.5} {"step": 21249, "train_loss": 3.2465624809265137, "lr": 0.0001206983423563909, "tps": 127551, "wall": 10918.3} {"step": 21250, "train_loss": 3.163729667663574, "lr": 0.00012068236402467727, "tps": 127501, "wall": 10923.0} {"step": 21251, "train_loss": 3.231536865234375, "lr": 0.00012066638681803922, "tps": 127452, "wall": 10927.8} {"step": 21252, "train_loss": 3.0414156913757324, "lr": 0.00012065041073665764, "tps": 127402, "wall": 10932.5} {"step": 21253, "train_loss": 3.1559181213378906, "lr": 0.00012063443578071365, "tps": 127353, "wall": 10937.3} {"step": 21254, "train_loss": 3.283381462097168, "lr": 0.0001206184619503881, "tps": 127304, "wall": 10942.0} {"step": 21255, "train_loss": 3.2807908058166504, "lr": 0.000120602489245862, "tps": 127254, "wall": 10946.8} {"step": 21256, "train_loss": 3.246659278869629, "lr": 0.0001205865176673163, "tps": 127205, "wall": 10951.5} {"step": 21257, "train_loss": 3.106555461883545, "lr": 0.0001205705472149319, "tps": 127155, "wall": 10956.4} {"step": 21258, "train_loss": 3.2637908458709717, "lr": 0.00012055457788888968, "tps": 127106, "wall": 10961.1} {"step": 21259, "train_loss": 3.227661609649658, "lr": 0.00012053860968937064, "tps": 127057, "wall": 10965.9} {"step": 21260, "train_loss": 3.068397045135498, "lr": 0.00012052264261655559, "tps": 127008, "wall": 10970.6} {"step": 21261, "train_loss": 3.1653363704681396, "lr": 0.00012050667667062536, "tps": 126959, "wall": 10975.4} {"step": 21262, "train_loss": 3.2147836685180664, "lr": 0.00012049071185176098, "tps": 126910, "wall": 10980.1} {"step": 21263, "train_loss": 3.203577995300293, "lr": 0.0001204747481601431, "tps": 126861, "wall": 10984.9} {"step": 21264, "train_loss": 3.325342893600464, "lr": 0.00012045878559595276, "tps": 126812, "wall": 10989.6} {"step": 21265, "train_loss": 3.2106103897094727, "lr": 0.00012044282415937064, "tps": 126763, "wall": 10994.4} {"step": 21266, "train_loss": 3.1563944816589355, "lr": 0.00012042686385057758, "tps": 126714, "wall": 10999.2} {"step": 21267, "train_loss": 3.2138619422912598, "lr": 0.0001204109046697544, "tps": 126665, "wall": 11003.9} {"step": 21268, "train_loss": 3.2471113204956055, "lr": 0.00012039494661708191, "tps": 126616, "wall": 11008.7} {"step": 21269, "train_loss": 3.1922197341918945, "lr": 0.0001203789896927408, "tps": 126568, "wall": 11013.4} {"step": 21270, "train_loss": 3.2958316802978516, "lr": 0.00012036303389691193, "tps": 126518, "wall": 11018.3} {"step": 21271, "train_loss": 3.260822296142578, "lr": 0.00012034707922977601, "tps": 126469, "wall": 11023.0} {"step": 21272, "train_loss": 3.136636734008789, "lr": 0.00012033112569151366, "tps": 126421, "wall": 11027.8} {"step": 21273, "train_loss": 3.2261829376220703, "lr": 0.00012031517328230584, "tps": 126372, "wall": 11032.5} {"step": 21274, "train_loss": 3.229283332824707, "lr": 0.0001202992220023331, "tps": 126324, "wall": 11037.3} {"step": 21275, "train_loss": 3.1358532905578613, "lr": 0.00012028327185177608, "tps": 126275, "wall": 11042.0} {"step": 21276, "train_loss": 3.1487579345703125, "lr": 0.00012026732283081565, "tps": 126227, "wall": 11046.8} {"step": 21277, "train_loss": 3.23421573638916, "lr": 0.00012025137493963239, "tps": 126179, "wall": 11051.5} {"step": 21278, "train_loss": 3.132730722427368, "lr": 0.00012023542817840688, "tps": 126130, "wall": 11056.3} {"step": 21279, "train_loss": 3.2737009525299072, "lr": 0.00012021948254731987, "tps": 126082, "wall": 11061.1} {"step": 21280, "train_loss": 3.2052206993103027, "lr": 0.00012020353804655193, "tps": 126034, "wall": 11065.8} {"step": 21281, "train_loss": 3.133671760559082, "lr": 0.00012018759467628373, "tps": 125986, "wall": 11070.5} {"step": 21282, "train_loss": 3.2055163383483887, "lr": 0.00012017165243669591, "tps": 125937, "wall": 11075.4} {"step": 21283, "train_loss": 3.199936866760254, "lr": 0.00012015571132796894, "tps": 125889, "wall": 11080.1} {"step": 21284, "train_loss": 3.1612424850463867, "lr": 0.00012013977135028351, "tps": 125841, "wall": 11084.9} {"step": 21285, "train_loss": 3.2805323600769043, "lr": 0.00012012383250382015, "tps": 125793, "wall": 11089.6} {"step": 21286, "train_loss": 3.227053642272949, "lr": 0.00012010789478875937, "tps": 125745, "wall": 11094.4} {"step": 21287, "train_loss": 3.1658973693847656, "lr": 0.00012009195820528183, "tps": 125697, "wall": 11099.1} {"step": 21288, "train_loss": 3.2627034187316895, "lr": 0.000120076022753568, "tps": 125649, "wall": 11103.9} {"step": 21289, "train_loss": 3.1389315128326416, "lr": 0.0001200600884337983, "tps": 125601, "wall": 11108.6} {"step": 21290, "train_loss": 3.095700979232788, "lr": 0.0001200441552461534, "tps": 125553, "wall": 11113.4} {"step": 21291, "train_loss": 3.1344120502471924, "lr": 0.00012002822319081373, "tps": 125506, "wall": 11118.1} {"step": 21292, "train_loss": 3.2430496215820312, "lr": 0.00012001229226795967, "tps": 125458, "wall": 11122.9} {"step": 21293, "train_loss": 3.1708006858825684, "lr": 0.00011999636247777186, "tps": 125410, "wall": 11127.6} {"step": 21294, "train_loss": 3.210287570953369, "lr": 0.00011998043382043066, "tps": 125362, "wall": 11132.4} {"step": 21295, "train_loss": 3.240084648132324, "lr": 0.00011996450629611645, "tps": 125314, "wall": 11137.2} {"step": 21296, "train_loss": 3.189366102218628, "lr": 0.00011994857990500978, "tps": 125266, "wall": 11142.0} {"step": 21297, "train_loss": 3.239828109741211, "lr": 0.00011993265464729102, "tps": 125219, "wall": 11146.7} {"step": 21298, "train_loss": 3.2318737506866455, "lr": 0.0001199167305231405, "tps": 125171, "wall": 11151.5} {"step": 21299, "train_loss": 3.2473556995391846, "lr": 0.00011990080753273872, "tps": 125124, "wall": 11156.3} {"step": 21300, "train_loss": 3.2260918617248535, "lr": 0.00011988488567626595, "tps": 125076, "wall": 11161.0} {"step": 21301, "train_loss": 3.173725128173828, "lr": 0.0001198689649539027, "tps": 125029, "wall": 11165.8} {"step": 21302, "train_loss": 3.1087231636047363, "lr": 0.00011985304536582918, "tps": 124981, "wall": 11170.6} {"step": 21303, "train_loss": 3.1918320655822754, "lr": 0.00011983712691222575, "tps": 124934, "wall": 11175.3} {"step": 21304, "train_loss": 3.1463782787323, "lr": 0.00011982120959327281, "tps": 124887, "wall": 11180.1} {"step": 21305, "train_loss": 3.2491841316223145, "lr": 0.00011980529340915065, "tps": 124839, "wall": 11184.8} {"step": 21306, "train_loss": 3.2125821113586426, "lr": 0.0001197893783600395, "tps": 124792, "wall": 11189.6} {"step": 21307, "train_loss": 3.208919048309326, "lr": 0.0001197734644461197, "tps": 124745, "wall": 11194.3} {"step": 21308, "train_loss": 3.1795942783355713, "lr": 0.00011975755166757157, "tps": 124697, "wall": 11199.1} {"step": 21309, "train_loss": 3.297840118408203, "lr": 0.00011974164002457521, "tps": 124650, "wall": 11203.9} {"step": 21310, "train_loss": 3.1613662242889404, "lr": 0.00011972572951731104, "tps": 124603, "wall": 11208.6} {"step": 21311, "train_loss": 3.1820790767669678, "lr": 0.00011970982014595929, "tps": 124556, "wall": 11213.4} {"step": 21312, "train_loss": 3.1801795959472656, "lr": 0.00011969391191070001, "tps": 124509, "wall": 11218.1} {"step": 21313, "train_loss": 3.204881191253662, "lr": 0.00011967800481171361, "tps": 124462, "wall": 11222.9} {"step": 21314, "train_loss": 3.203350067138672, "lr": 0.00011966209884918016, "tps": 124415, "wall": 11227.7} {"step": 21315, "train_loss": 3.2268943786621094, "lr": 0.00011964619402327985, "tps": 124369, "wall": 11232.4} {"step": 21316, "train_loss": 3.2731668949127197, "lr": 0.00011963029033419296, "tps": 124322, "wall": 11237.2} {"step": 21317, "train_loss": 3.179032564163208, "lr": 0.00011961438778209948, "tps": 124275, "wall": 11242.0} {"step": 21318, "train_loss": 3.277346134185791, "lr": 0.00011959848636717971, "tps": 124228, "wall": 11246.7} {"step": 21319, "train_loss": 3.2377636432647705, "lr": 0.00011958258608961373, "tps": 124181, "wall": 11251.5} {"step": 21320, "train_loss": 3.1218113899230957, "lr": 0.00011956668694958157, "tps": 124134, "wall": 11256.3} {"step": 21321, "train_loss": 3.1700048446655273, "lr": 0.00011955078894726348, "tps": 124087, "wall": 11261.0} {"step": 21322, "train_loss": 3.256303310394287, "lr": 0.0001195348920828395, "tps": 124041, "wall": 11265.8} {"step": 21323, "train_loss": 3.1822566986083984, "lr": 0.00011951899635648964, "tps": 123994, "wall": 11270.5} {"step": 21324, "train_loss": 3.2162928581237793, "lr": 0.00011950310176839407, "tps": 123948, "wall": 11275.3} {"step": 21325, "train_loss": 3.2042016983032227, "lr": 0.00011948720831873283, "tps": 123901, "wall": 11280.1} {"step": 21326, "train_loss": 3.254281759262085, "lr": 0.0001194713160076859, "tps": 123855, "wall": 11284.8} {"step": 21327, "train_loss": 3.148345947265625, "lr": 0.00011945542483543335, "tps": 123809, "wall": 11289.6} {"step": 21328, "train_loss": 3.2155885696411133, "lr": 0.00011943953480215512, "tps": 123762, "wall": 11294.3} {"step": 21329, "train_loss": 3.2834060192108154, "lr": 0.00011942364590803135, "tps": 123716, "wall": 11299.1} {"step": 21330, "train_loss": 3.1878774166107178, "lr": 0.00011940775815324195, "tps": 123670, "wall": 11303.8} {"step": 21331, "train_loss": 3.1553995609283447, "lr": 0.00011939187153796685, "tps": 123623, "wall": 11308.6} {"step": 21332, "train_loss": 3.218027353286743, "lr": 0.00011937598606238614, "tps": 123577, "wall": 11313.4} {"step": 21333, "train_loss": 3.1678993701934814, "lr": 0.00011936010172667969, "tps": 123530, "wall": 11318.2} {"step": 21334, "train_loss": 3.1585419178009033, "lr": 0.0001193442185310274, "tps": 123484, "wall": 11322.9} {"step": 21335, "train_loss": 3.128370761871338, "lr": 0.0001193283364756093, "tps": 123438, "wall": 11327.7} {"step": 21336, "train_loss": 3.178389549255371, "lr": 0.00011931245556060528, "tps": 123392, "wall": 11332.4} {"step": 21337, "train_loss": 3.2208151817321777, "lr": 0.00011929657578619514, "tps": 123346, "wall": 11337.2} {"step": 21338, "train_loss": 3.201625347137451, "lr": 0.00011928069715255885, "tps": 123301, "wall": 11341.9} {"step": 21339, "train_loss": 3.252293109893799, "lr": 0.00011926481965987632, "tps": 123255, "wall": 11346.7} {"step": 21340, "train_loss": 3.259161949157715, "lr": 0.0001192489433083273, "tps": 123209, "wall": 11351.4} {"step": 21341, "train_loss": 3.1262400150299072, "lr": 0.00011923306809809176, "tps": 123163, "wall": 11356.2} {"step": 21342, "train_loss": 3.1528077125549316, "lr": 0.00011921719402934938, "tps": 123117, "wall": 11361.0} {"step": 21343, "train_loss": 3.1949095726013184, "lr": 0.0001192013211022802, "tps": 123071, "wall": 11365.7} {"step": 21344, "train_loss": 3.260690450668335, "lr": 0.00011918544931706385, "tps": 123026, "wall": 11370.5} {"step": 21345, "train_loss": 3.272170066833496, "lr": 0.00011916957867388015, "tps": 122979, "wall": 11375.3} {"step": 21346, "train_loss": 3.229490280151367, "lr": 0.000119153709172909, "tps": 122933, "wall": 11380.1} {"step": 21347, "train_loss": 3.1365888118743896, "lr": 0.00011913784081433003, "tps": 122888, "wall": 11384.8} {"step": 21348, "train_loss": 3.244128704071045, "lr": 0.00011912197359832304, "tps": 122842, "wall": 11389.6} {"step": 21349, "train_loss": 3.2182536125183105, "lr": 0.00011910610752506785, "tps": 122797, "wall": 11394.4} {"step": 21350, "train_loss": 3.194812297821045, "lr": 0.00011909024259474412, "tps": 122751, "wall": 11399.1} {"step": 21351, "train_loss": 3.1591739654541016, "lr": 0.00011907437880753152, "tps": 122706, "wall": 11403.9} {"step": 21352, "train_loss": 3.2308290004730225, "lr": 0.00011905851616360988, "tps": 122660, "wall": 11408.6} {"step": 21353, "train_loss": 3.1437785625457764, "lr": 0.00011904265466315885, "tps": 122615, "wall": 11413.4} {"step": 21354, "train_loss": 3.218501091003418, "lr": 0.00011902679430635799, "tps": 122570, "wall": 11418.1} {"step": 21355, "train_loss": 3.207712173461914, "lr": 0.00011901093509338715, "tps": 122524, "wall": 11422.9} {"step": 21356, "train_loss": 3.2248475551605225, "lr": 0.0001189950770244259, "tps": 122479, "wall": 11427.6} {"step": 21357, "train_loss": 3.1259233951568604, "lr": 0.00011897922009965381, "tps": 122434, "wall": 11432.4} {"step": 21358, "train_loss": 3.2096920013427734, "lr": 0.00011896336431925066, "tps": 122388, "wall": 11437.2} {"step": 21359, "train_loss": 3.099844455718994, "lr": 0.0001189475096833959, "tps": 122343, "wall": 11441.9} {"step": 21360, "train_loss": 3.301429271697998, "lr": 0.00011893165619226931, "tps": 122298, "wall": 11446.7} {"step": 21361, "train_loss": 3.111109733581543, "lr": 0.00011891580384605036, "tps": 122253, "wall": 11451.5} {"step": 21362, "train_loss": 3.156726598739624, "lr": 0.0001188999526449186, "tps": 122208, "wall": 11456.2} {"step": 21363, "train_loss": 3.1520895957946777, "lr": 0.00011888410258905369, "tps": 122163, "wall": 11461.0} {"step": 21364, "train_loss": 3.2383522987365723, "lr": 0.00011886825367863516, "tps": 122118, "wall": 11465.7} {"step": 21365, "train_loss": 3.1816506385803223, "lr": 0.00011885240591384246, "tps": 122073, "wall": 11470.5} {"step": 21366, "train_loss": 3.19600248336792, "lr": 0.00011883655929485525, "tps": 122029, "wall": 11475.2} {"step": 21367, "train_loss": 3.301074981689453, "lr": 0.00011882071382185294, "tps": 121984, "wall": 11480.0} {"step": 21368, "train_loss": 3.203638792037964, "lr": 0.00011880486949501502, "tps": 121939, "wall": 11484.7} {"step": 21369, "train_loss": 3.1332879066467285, "lr": 0.00011878902631452104, "tps": 121894, "wall": 11489.5} {"step": 21370, "train_loss": 3.1320459842681885, "lr": 0.00011877318428055049, "tps": 121849, "wall": 11494.3} {"step": 21371, "train_loss": 3.2856509685516357, "lr": 0.00011875734339328268, "tps": 121804, "wall": 11499.1} {"step": 21372, "train_loss": 3.2649266719818115, "lr": 0.00011874150365289724, "tps": 121759, "wall": 11503.8} {"step": 21373, "train_loss": 3.3183183670043945, "lr": 0.00011872566505957355, "tps": 121715, "wall": 11508.6} {"step": 21374, "train_loss": 3.1295881271362305, "lr": 0.00011870982761349091, "tps": 121670, "wall": 11513.4} {"step": 21375, "train_loss": 3.2577767372131348, "lr": 0.0001186939913148289, "tps": 121625, "wall": 11518.1} {"step": 21376, "train_loss": 3.124368667602539, "lr": 0.00011867815616376683, "tps": 121581, "wall": 11522.9} {"step": 21377, "train_loss": 3.230968952178955, "lr": 0.00011866232216048402, "tps": 121536, "wall": 11527.6} {"step": 21378, "train_loss": 3.233166217803955, "lr": 0.00011864648930516, "tps": 121492, "wall": 11532.4} {"step": 21379, "train_loss": 3.1455156803131104, "lr": 0.00011863065759797394, "tps": 121447, "wall": 11537.1} {"step": 21380, "train_loss": 3.232067584991455, "lr": 0.00011861482703910533, "tps": 121403, "wall": 11541.9} {"step": 21381, "train_loss": 3.2822232246398926, "lr": 0.00011859899762873348, "tps": 121359, "wall": 11546.7} {"step": 21382, "train_loss": 3.2801380157470703, "lr": 0.00011858316936703759, "tps": 121314, "wall": 11551.4} {"step": 21383, "train_loss": 3.2367653846740723, "lr": 0.00011856734225419707, "tps": 121269, "wall": 11556.2} {"step": 21384, "train_loss": 3.277611494064331, "lr": 0.00011855151629039123, "tps": 121225, "wall": 11561.0} {"step": 21385, "train_loss": 3.243183135986328, "lr": 0.00011853569147579924, "tps": 121181, "wall": 11565.7} {"step": 21386, "train_loss": 3.2736144065856934, "lr": 0.00011851986781060047, "tps": 121137, "wall": 11570.5} {"step": 21387, "train_loss": 3.1632580757141113, "lr": 0.00011850404529497417, "tps": 121093, "wall": 11575.2} {"step": 21388, "train_loss": 3.2001748085021973, "lr": 0.00011848822392909942, "tps": 121049, "wall": 11580.0} {"step": 21389, "train_loss": 3.1962523460388184, "lr": 0.00011847240371315562, "tps": 121005, "wall": 11584.8} {"step": 21390, "train_loss": 3.2211337089538574, "lr": 0.00011845658464732196, "tps": 120961, "wall": 11589.5} {"step": 21391, "train_loss": 3.290121078491211, "lr": 0.00011844076673177753, "tps": 120917, "wall": 11594.3} {"step": 21392, "train_loss": 3.3351237773895264, "lr": 0.00011842494996670163, "tps": 120873, "wall": 11599.0} {"step": 21393, "train_loss": 3.199237823486328, "lr": 0.00011840913435227343, "tps": 120829, "wall": 11603.8} {"step": 21394, "train_loss": 3.112203598022461, "lr": 0.00011839331988867198, "tps": 120785, "wall": 11608.5} {"step": 21395, "train_loss": 3.2891430854797363, "lr": 0.00011837750657607653, "tps": 120741, "wall": 11613.3} {"step": 21396, "train_loss": 3.143739700317383, "lr": 0.00011836169441466611, "tps": 120697, "wall": 11618.1} {"step": 21397, "train_loss": 3.2192304134368896, "lr": 0.00011834588340462002, "tps": 120653, "wall": 11622.9} {"step": 21398, "train_loss": 3.1731202602386475, "lr": 0.00011833007354611725, "tps": 120609, "wall": 11627.6} {"step": 21399, "train_loss": 3.080878257751465, "lr": 0.00011831426483933685, "tps": 120565, "wall": 11632.4} {"step": 21400, "train_loss": 3.1341781616210938, "lr": 0.000118298457284458, "tps": 120522, "wall": 11637.2} {"step": 21401, "train_loss": 3.2936227321624756, "lr": 0.00011828265088165976, "tps": 120478, "wall": 11641.9} {"step": 21402, "train_loss": 3.2434067726135254, "lr": 0.00011826684563112107, "tps": 120434, "wall": 11646.7} {"step": 21403, "train_loss": 3.2300939559936523, "lr": 0.00011825104153302114, "tps": 120391, "wall": 11651.4} {"step": 21404, "train_loss": 3.1629910469055176, "lr": 0.0001182352385875389, "tps": 120347, "wall": 11656.2} {"step": 21405, "train_loss": 3.316013813018799, "lr": 0.0001182194367948533, "tps": 120304, "wall": 11660.9} {"step": 21406, "train_loss": 3.1615288257598877, "lr": 0.00011820363615514352, "tps": 120261, "wall": 11665.7} {"step": 21407, "train_loss": 3.2539076805114746, "lr": 0.00011818783666858841, "tps": 120217, "wall": 11670.4} {"step": 21408, "train_loss": 3.255950450897217, "lr": 0.00011817203833536699, "tps": 120173, "wall": 11675.3} {"step": 21409, "train_loss": 3.2468905448913574, "lr": 0.00011815624115565827, "tps": 120130, "wall": 11680.0} {"step": 21410, "train_loss": 3.201822280883789, "lr": 0.00011814044512964116, "tps": 120087, "wall": 11684.8} {"step": 21411, "train_loss": 3.2043731212615967, "lr": 0.0001181246502574945, "tps": 120044, "wall": 11689.5} {"step": 21412, "train_loss": 3.082106590270996, "lr": 0.00011810885653939742, "tps": 120000, "wall": 11694.3} {"step": 21413, "train_loss": 3.0700016021728516, "lr": 0.00011809306397552866, "tps": 119957, "wall": 11699.0} {"step": 21414, "train_loss": 3.1766204833984375, "lr": 0.00011807727256606722, "tps": 119914, "wall": 11703.8} {"step": 21415, "train_loss": 3.32797908782959, "lr": 0.00011806148231119198, "tps": 119871, "wall": 11708.5} {"step": 21416, "train_loss": 3.254636764526367, "lr": 0.0001180456932110817, "tps": 119828, "wall": 11713.3} {"step": 21417, "train_loss": 3.203623056411743, "lr": 0.0001180299052659154, "tps": 119785, "wall": 11718.1} {"step": 21418, "train_loss": 3.2301383018493652, "lr": 0.00011801411847587185, "tps": 119741, "wall": 11722.8} {"step": 21419, "train_loss": 3.109409809112549, "lr": 0.00011799833284112982, "tps": 119699, "wall": 11727.6} {"step": 21420, "train_loss": 3.143376350402832, "lr": 0.00011798254836186827, "tps": 119656, "wall": 11732.3} {"step": 21421, "train_loss": 3.1888628005981445, "lr": 0.0001179667650382659, "tps": 119612, "wall": 11737.2} {"step": 21422, "train_loss": 3.2872774600982666, "lr": 0.00011795098287050148, "tps": 119569, "wall": 11742.0} {"step": 21423, "train_loss": 3.3595714569091797, "lr": 0.00011793520185875389, "tps": 119526, "wall": 11746.7} {"step": 21424, "train_loss": 3.258817672729492, "lr": 0.00011791942200320187, "tps": 119483, "wall": 11751.5} {"step": 21425, "train_loss": 3.197816848754883, "lr": 0.00011790364330402413, "tps": 119441, "wall": 11756.2} {"step": 21426, "train_loss": 3.1875457763671875, "lr": 0.00011788786576139949, "tps": 119398, "wall": 11760.9} {"step": 21427, "train_loss": 3.2788801193237305, "lr": 0.00011787208937550663, "tps": 119356, "wall": 11765.7} {"step": 21428, "train_loss": 3.2603437900543213, "lr": 0.00011785631414652419, "tps": 119313, "wall": 11770.4} {"step": 21429, "train_loss": 3.202070713043213, "lr": 0.00011784054007463101, "tps": 119270, "wall": 11775.2} {"step": 21430, "train_loss": 3.1447763442993164, "lr": 0.00011782476716000572, "tps": 119228, "wall": 11779.9} {"step": 21431, "train_loss": 3.2196192741394043, "lr": 0.00011780899540282693, "tps": 119185, "wall": 11784.7} {"step": 21432, "train_loss": 3.185129165649414, "lr": 0.00011779322480327346, "tps": 119142, "wall": 11789.5} {"step": 21433, "train_loss": 3.2535557746887207, "lr": 0.00011777745536152376, "tps": 119100, "wall": 11794.3} {"step": 21434, "train_loss": 3.1734838485717773, "lr": 0.00011776168707775668, "tps": 119057, "wall": 11799.1} {"step": 21435, "train_loss": 3.2599973678588867, "lr": 0.00011774591995215072, "tps": 119014, "wall": 11803.8} {"step": 21436, "train_loss": 3.0634939670562744, "lr": 0.00011773015398488445, "tps": 118972, "wall": 11808.6} {"step": 21437, "train_loss": 3.1945836544036865, "lr": 0.0001177143891761366, "tps": 118929, "wall": 11813.4} {"step": 21438, "train_loss": 3.2713816165924072, "lr": 0.00011769862552608568, "tps": 118887, "wall": 11818.1} {"step": 21439, "train_loss": 3.2304818630218506, "lr": 0.00011768286303491018, "tps": 118845, "wall": 11822.9} {"step": 21440, "train_loss": 3.141139507293701, "lr": 0.00011766710170278883, "tps": 118802, "wall": 11827.6} {"step": 21441, "train_loss": 3.262528657913208, "lr": 0.0001176513415299001, "tps": 118760, "wall": 11832.4} {"step": 21442, "train_loss": 3.177079677581787, "lr": 0.00011763558251642242, "tps": 118718, "wall": 11837.2} {"step": 21443, "train_loss": 3.2214012145996094, "lr": 0.00011761982466253445, "tps": 118676, "wall": 11841.9} {"step": 21444, "train_loss": 3.2818102836608887, "lr": 0.00011760406796841468, "tps": 118633, "wall": 11846.7} {"step": 21445, "train_loss": 3.141453742980957, "lr": 0.00011758831243424148, "tps": 118591, "wall": 11851.5} {"step": 21446, "train_loss": 3.2559967041015625, "lr": 0.0001175725580601935, "tps": 118549, "wall": 11856.3} {"step": 21447, "train_loss": 3.226992130279541, "lr": 0.00011755680484644911, "tps": 118507, "wall": 11861.0} {"step": 21448, "train_loss": 3.241514205932617, "lr": 0.00011754105279318672, "tps": 118465, "wall": 11865.8} {"step": 21449, "train_loss": 3.2935001850128174, "lr": 0.0001175253019005849, "tps": 118423, "wall": 11870.5} {"step": 21450, "train_loss": 3.1156997680664062, "lr": 0.00011750955216882191, "tps": 118381, "wall": 11875.3} {"step": 21451, "train_loss": 3.2124950885772705, "lr": 0.00011749380359807634, "tps": 118339, "wall": 11880.1} {"step": 21452, "train_loss": 3.15610933303833, "lr": 0.00011747805618852652, "tps": 118297, "wall": 11884.8} {"step": 21453, "train_loss": 3.1957950592041016, "lr": 0.00011746230994035075, "tps": 118255, "wall": 11889.6} {"step": 21454, "train_loss": 3.2556264400482178, "lr": 0.00011744656485372754, "tps": 118213, "wall": 11894.3} {"step": 21455, "train_loss": 3.1697206497192383, "lr": 0.0001174308209288352, "tps": 118172, "wall": 11899.1} {"step": 21456, "train_loss": 3.200535297393799, "lr": 0.00011741507816585198, "tps": 118130, "wall": 11903.8} {"step": 21457, "train_loss": 3.1788101196289062, "lr": 0.00011739933656495638, "tps": 118088, "wall": 11908.6} {"step": 21458, "train_loss": 3.2867448329925537, "lr": 0.00011738359612632668, "tps": 118047, "wall": 11913.3} {"step": 21459, "train_loss": 3.319739580154419, "lr": 0.00011736785685014107, "tps": 118004, "wall": 11918.2} {"step": 21460, "train_loss": 3.142441749572754, "lr": 0.00011735211873657798, "tps": 117963, "wall": 11922.9} {"step": 21461, "train_loss": 3.191749334335327, "lr": 0.00011733638178581565, "tps": 117921, "wall": 11927.7} {"step": 21462, "train_loss": 3.172248363494873, "lr": 0.00011732064599803227, "tps": 117880, "wall": 11932.5} {"step": 21463, "train_loss": 3.1257286071777344, "lr": 0.00011730491137340624, "tps": 117838, "wall": 11937.2} {"step": 21464, "train_loss": 3.2542903423309326, "lr": 0.00011728917791211575, "tps": 117797, "wall": 11942.0} {"step": 21465, "train_loss": 3.2738513946533203, "lr": 0.0001172734456143389, "tps": 117755, "wall": 11946.7} {"step": 21466, "train_loss": 3.2021865844726562, "lr": 0.00011725771448025411, "tps": 117714, "wall": 11951.5} {"step": 21467, "train_loss": 3.175554037094116, "lr": 0.00011724198451003942, "tps": 117672, "wall": 11956.2} {"step": 21468, "train_loss": 3.2185962200164795, "lr": 0.00011722625570387316, "tps": 117631, "wall": 11961.0} {"step": 21469, "train_loss": 3.2671258449554443, "lr": 0.00011721052806193342, "tps": 117590, "wall": 11965.7} {"step": 21470, "train_loss": 3.2923219203948975, "lr": 0.00011719480158439833, "tps": 117549, "wall": 11970.5} {"step": 21471, "train_loss": 3.2880640029907227, "lr": 0.00011717907627144615, "tps": 117507, "wall": 11975.3} {"step": 21472, "train_loss": 3.3096795082092285, "lr": 0.00011716335212325495, "tps": 117466, "wall": 11980.1} {"step": 21473, "train_loss": 3.1900854110717773, "lr": 0.00011714762914000278, "tps": 117425, "wall": 11984.8} {"step": 21474, "train_loss": 3.251659870147705, "lr": 0.00011713190732186792, "tps": 117384, "wall": 11989.6} {"step": 21475, "train_loss": 3.2097582817077637, "lr": 0.00011711618666902837, "tps": 117343, "wall": 11994.3} {"step": 21476, "train_loss": 3.2115793228149414, "lr": 0.00011710046718166217, "tps": 117302, "wall": 11999.1} {"step": 21477, "train_loss": 3.263169288635254, "lr": 0.00011708474885994749, "tps": 117261, "wall": 12003.8} {"step": 21478, "train_loss": 3.3010191917419434, "lr": 0.00011706903170406236, "tps": 117220, "wall": 12008.6} {"step": 21479, "train_loss": 3.227092981338501, "lr": 0.00011705331571418474, "tps": 117179, "wall": 12013.3} {"step": 21480, "train_loss": 3.175200939178467, "lr": 0.00011703760089049278, "tps": 117138, "wall": 12018.1} {"step": 21481, "train_loss": 3.2618002891540527, "lr": 0.00011702188723316445, "tps": 117097, "wall": 12022.9} {"step": 21482, "train_loss": 3.2059621810913086, "lr": 0.00011700617474237771, "tps": 117056, "wall": 12027.6} {"step": 21483, "train_loss": 3.1700453758239746, "lr": 0.00011699046341831063, "tps": 117015, "wall": 12032.4} {"step": 21484, "train_loss": 3.07541823387146, "lr": 0.00011697475326114116, "tps": 116974, "wall": 12037.2} {"step": 21485, "train_loss": 3.233173370361328, "lr": 0.00011695904427104723, "tps": 116933, "wall": 12041.9} {"step": 21486, "train_loss": 3.2516698837280273, "lr": 0.00011694333644820683, "tps": 116892, "wall": 12046.7} {"step": 21487, "train_loss": 3.185603380203247, "lr": 0.00011692762979279786, "tps": 116852, "wall": 12051.5} {"step": 21488, "train_loss": 3.2480506896972656, "lr": 0.00011691192430499834, "tps": 116811, "wall": 12056.2} {"step": 21489, "train_loss": 3.108774185180664, "lr": 0.0001168962199849861, "tps": 116770, "wall": 12060.9} {"step": 21490, "train_loss": 3.064317464828491, "lr": 0.00011688051683293899, "tps": 116730, "wall": 12065.7} {"step": 21491, "train_loss": 3.196620464324951, "lr": 0.00011686481484903505, "tps": 116689, "wall": 12070.5} {"step": 21492, "train_loss": 3.1737420558929443, "lr": 0.00011684911403345207, "tps": 116649, "wall": 12075.2} {"step": 21493, "train_loss": 3.2047958374023438, "lr": 0.00011683341438636781, "tps": 116608, "wall": 12080.0} {"step": 21494, "train_loss": 3.2378180027008057, "lr": 0.00011681771590796039, "tps": 116568, "wall": 12084.8} {"step": 21495, "train_loss": 3.177433967590332, "lr": 0.00011680201859840729, "tps": 116527, "wall": 12089.5} {"step": 21496, "train_loss": 3.1513512134552, "lr": 0.0001167863224578866, "tps": 116487, "wall": 12094.3} {"step": 21497, "train_loss": 3.1287901401519775, "lr": 0.00011677062748657604, "tps": 116446, "wall": 12099.1} {"step": 21498, "train_loss": 3.2248847484588623, "lr": 0.00011675493368465332, "tps": 116406, "wall": 12103.8} {"step": 21499, "train_loss": 3.2134103775024414, "lr": 0.00011673924105229632, "tps": 116365, "wall": 12108.6} {"step": 21500, "train_loss": 3.2400996685028076, "lr": 0.00011672354958968283, "tps": 116325, "wall": 12113.3} {"step": 21501, "train_loss": 3.1479122638702393, "lr": 0.00011670785929699049, "tps": 116283, "wall": 12118.3} {"step": 21502, "train_loss": 3.2474851608276367, "lr": 0.00011669217017439717, "tps": 116243, "wall": 12123.0} {"step": 21503, "train_loss": 3.2300140857696533, "lr": 0.00011667648222208052, "tps": 116202, "wall": 12127.8} {"step": 21504, "train_loss": 3.2103023529052734, "lr": 0.00011666079544021822, "tps": 116162, "wall": 12132.6} {"step": 21505, "train_loss": 3.2006545066833496, "lr": 0.00011664510982898806, "tps": 116122, "wall": 12137.3} {"step": 21506, "train_loss": 3.2630138397216797, "lr": 0.00011662942538856771, "tps": 116082, "wall": 12142.1} {"step": 21507, "train_loss": 3.182299852371216, "lr": 0.00011661374211913476, "tps": 116041, "wall": 12146.9} {"step": 21508, "train_loss": 3.1064066886901855, "lr": 0.00011659806002086699, "tps": 116001, "wall": 12151.6} {"step": 21509, "train_loss": 3.28889536857605, "lr": 0.00011658237909394194, "tps": 115961, "wall": 12156.5} {"step": 21510, "train_loss": 3.1995604038238525, "lr": 0.00011656669933853734, "tps": 115921, "wall": 12161.2} {"step": 21511, "train_loss": 3.1256370544433594, "lr": 0.00011655102075483077, "tps": 115881, "wall": 12166.0} {"step": 21512, "train_loss": 3.23915958404541, "lr": 0.00011653534334299976, "tps": 115841, "wall": 12170.7} {"step": 21513, "train_loss": 3.149015426635742, "lr": 0.00011651966710322207, "tps": 115801, "wall": 12175.5} {"step": 21514, "train_loss": 3.109100818634033, "lr": 0.00011650399203567517, "tps": 115761, "wall": 12180.3} {"step": 21515, "train_loss": 3.2302026748657227, "lr": 0.00011648831814053658, "tps": 115721, "wall": 12185.0} {"step": 21516, "train_loss": 3.226860523223877, "lr": 0.000116472645417984, "tps": 115681, "wall": 12189.8} {"step": 21517, "train_loss": 3.1830506324768066, "lr": 0.00011645697386819488, "tps": 115642, "wall": 12194.6} {"step": 21518, "train_loss": 3.1677708625793457, "lr": 0.0001164413034913467, "tps": 115602, "wall": 12199.3} {"step": 21519, "train_loss": 3.250108242034912, "lr": 0.0001164256342876171, "tps": 115562, "wall": 12204.1} {"step": 21520, "train_loss": 3.184311866760254, "lr": 0.0001164099662571835, "tps": 115522, "wall": 12208.9} {"step": 21521, "train_loss": 3.1804122924804688, "lr": 0.00011639429940022337, "tps": 115482, "wall": 12213.6} {"step": 21522, "train_loss": 3.21874737739563, "lr": 0.00011637863371691429, "tps": 115442, "wall": 12218.5} {"step": 21523, "train_loss": 3.2354369163513184, "lr": 0.00011636296920743364, "tps": 115403, "wall": 12223.2} {"step": 21524, "train_loss": 3.231954574584961, "lr": 0.00011634730587195881, "tps": 115363, "wall": 12228.0} {"step": 21525, "train_loss": 3.2483458518981934, "lr": 0.00011633164371066738, "tps": 115323, "wall": 12232.7} {"step": 21526, "train_loss": 3.2077574729919434, "lr": 0.0001163159827237367, "tps": 115284, "wall": 12237.5} {"step": 21527, "train_loss": 3.213862895965576, "lr": 0.00011630032291134409, "tps": 115245, "wall": 12242.2} {"step": 21528, "train_loss": 3.2680554389953613, "lr": 0.00011628466427366713, "tps": 115205, "wall": 12247.0} {"step": 21529, "train_loss": 3.160271406173706, "lr": 0.00011626900681088304, "tps": 115166, "wall": 12251.7} {"step": 21530, "train_loss": 3.265815258026123, "lr": 0.00011625335052316927, "tps": 115127, "wall": 12256.5} {"step": 21531, "train_loss": 3.2322945594787598, "lr": 0.00011623769541070322, "tps": 115087, "wall": 12261.3} {"step": 21532, "train_loss": 3.2129271030426025, "lr": 0.00011622204147366207, "tps": 115048, "wall": 12266.0} {"step": 21533, "train_loss": 3.103119373321533, "lr": 0.00011620638871222333, "tps": 115009, "wall": 12270.8} {"step": 21534, "train_loss": 3.1986284255981445, "lr": 0.00011619073712656421, "tps": 114969, "wall": 12275.6} {"step": 21535, "train_loss": 3.1651365756988525, "lr": 0.00011617508671686197, "tps": 114930, "wall": 12280.4} {"step": 21536, "train_loss": 3.191318988800049, "lr": 0.00011615943748329405, "tps": 114890, "wall": 12285.1} {"step": 21537, "train_loss": 3.261758327484131, "lr": 0.00011614378942603763, "tps": 114851, "wall": 12289.9} {"step": 21538, "train_loss": 3.231790542602539, "lr": 0.00011612814254526991, "tps": 114812, "wall": 12294.6} {"step": 21539, "train_loss": 3.1324710845947266, "lr": 0.0001161124968411683, "tps": 114774, "wall": 12299.3} {"step": 21540, "train_loss": 3.2074623107910156, "lr": 0.00011609685231390994, "tps": 114734, "wall": 12304.1} {"step": 21541, "train_loss": 3.0831551551818848, "lr": 0.00011608120896367198, "tps": 114695, "wall": 12308.9} {"step": 21542, "train_loss": 3.202122688293457, "lr": 0.00011606556679063181, "tps": 114657, "wall": 12313.6} {"step": 21543, "train_loss": 3.289245128631592, "lr": 0.00011604992579496647, "tps": 114618, "wall": 12318.4} {"step": 21544, "train_loss": 3.2618465423583984, "lr": 0.00011603428597685315, "tps": 114579, "wall": 12323.1} {"step": 21545, "train_loss": 3.3182132244110107, "lr": 0.00011601864733646912, "tps": 114540, "wall": 12327.9} {"step": 21546, "train_loss": 3.131106376647949, "lr": 0.00011600300987399142, "tps": 114501, "wall": 12332.6} {"step": 21547, "train_loss": 3.263410806655884, "lr": 0.00011598737358959733, "tps": 114462, "wall": 12337.4} {"step": 21548, "train_loss": 3.130114793777466, "lr": 0.00011597173848346385, "tps": 114423, "wall": 12342.2} {"step": 21549, "train_loss": 3.2984676361083984, "lr": 0.00011595610455576814, "tps": 114384, "wall": 12346.9} {"step": 21550, "train_loss": 3.22357439994812, "lr": 0.00011594047180668732, "tps": 114345, "wall": 12351.7} {"step": 21551, "train_loss": 3.143702268600464, "lr": 0.00011592484023639851, "tps": 114307, "wall": 12356.5} {"step": 21552, "train_loss": 3.279284954071045, "lr": 0.00011590920984507864, "tps": 114268, "wall": 12361.2} {"step": 21553, "train_loss": 3.1596217155456543, "lr": 0.00011589358063290494, "tps": 114229, "wall": 12366.0} {"step": 21554, "train_loss": 3.2696738243103027, "lr": 0.00011587795260005441, "tps": 114191, "wall": 12370.7} {"step": 21555, "train_loss": 3.246664047241211, "lr": 0.00011586232574670402, "tps": 114152, "wall": 12375.5} {"step": 21556, "train_loss": 3.182432174682617, "lr": 0.00011584670007303087, "tps": 114114, "wall": 12380.2} {"step": 21557, "train_loss": 3.178546905517578, "lr": 0.00011583107557921194, "tps": 114075, "wall": 12385.0} {"step": 21558, "train_loss": 3.162036418914795, "lr": 0.00011581545226542414, "tps": 114037, "wall": 12389.8} {"step": 21559, "train_loss": 3.1037869453430176, "lr": 0.00011579983013184463, "tps": 113998, "wall": 12394.5} {"step": 21560, "train_loss": 3.1720709800720215, "lr": 0.00011578420917865025, "tps": 113959, "wall": 12399.4} {"step": 21561, "train_loss": 3.1973257064819336, "lr": 0.00011576858940601796, "tps": 113920, "wall": 12404.1} {"step": 21562, "train_loss": 3.295274257659912, "lr": 0.00011575297081412477, "tps": 113882, "wall": 12408.9} {"step": 21563, "train_loss": 3.1795945167541504, "lr": 0.00011573735340314757, "tps": 113844, "wall": 12413.6} {"step": 21564, "train_loss": 3.2237329483032227, "lr": 0.00011572173717326317, "tps": 113805, "wall": 12418.4} {"step": 21565, "train_loss": 3.238373041152954, "lr": 0.00011570612212464868, "tps": 113767, "wall": 12423.2} {"step": 21566, "train_loss": 3.220930576324463, "lr": 0.0001156905082574808, "tps": 113729, "wall": 12427.9} {"step": 21567, "train_loss": 3.2184534072875977, "lr": 0.00011567489557193659, "tps": 113690, "wall": 12432.7} {"step": 21568, "train_loss": 3.255228042602539, "lr": 0.00011565928406819275, "tps": 113652, "wall": 12437.4} {"step": 21569, "train_loss": 3.253814697265625, "lr": 0.00011564367374642615, "tps": 113614, "wall": 12442.2} {"step": 21570, "train_loss": 3.1949310302734375, "lr": 0.00011562806460681373, "tps": 113576, "wall": 12447.0} {"step": 21571, "train_loss": 3.2405505180358887, "lr": 0.00011561245664953222, "tps": 113538, "wall": 12451.7} {"step": 21572, "train_loss": 3.1078357696533203, "lr": 0.00011559684987475839, "tps": 113499, "wall": 12456.5} {"step": 21573, "train_loss": 3.302013874053955, "lr": 0.00011558124428266917, "tps": 113461, "wall": 12461.3} {"step": 21574, "train_loss": 3.2419474124908447, "lr": 0.00011556563987344127, "tps": 113423, "wall": 12466.0} {"step": 21575, "train_loss": 3.1689677238464355, "lr": 0.00011555003664725137, "tps": 113385, "wall": 12470.8} {"step": 21576, "train_loss": 3.173171043395996, "lr": 0.00011553443460427635, "tps": 113347, "wall": 12475.5} {"step": 21577, "train_loss": 3.1614325046539307, "lr": 0.00011551883374469294, "tps": 113309, "wall": 12480.3} {"step": 21578, "train_loss": 3.1952998638153076, "lr": 0.00011550323406867774, "tps": 113271, "wall": 12485.0} {"step": 21579, "train_loss": 3.1388158798217773, "lr": 0.00011548763557640763, "tps": 113233, "wall": 12489.8} {"step": 21580, "train_loss": 3.165844440460205, "lr": 0.00011547203826805926, "tps": 113195, "wall": 12494.6} {"step": 21581, "train_loss": 3.2047841548919678, "lr": 0.00011545644214380922, "tps": 113157, "wall": 12499.3} {"step": 21582, "train_loss": 3.2777352333068848, "lr": 0.00011544084720383433, "tps": 113120, "wall": 12504.1} {"step": 21583, "train_loss": 3.2784430980682373, "lr": 0.00011542525344831113, "tps": 113082, "wall": 12508.8} {"step": 21584, "train_loss": 3.2485220432281494, "lr": 0.00011540966087741634, "tps": 113044, "wall": 12513.6} {"step": 21585, "train_loss": 3.2044596672058105, "lr": 0.00011539406949132658, "tps": 113005, "wall": 12518.5} {"step": 21586, "train_loss": 3.1963086128234863, "lr": 0.00011537847929021839, "tps": 112968, "wall": 12523.2} {"step": 21587, "train_loss": 3.107022285461426, "lr": 0.00011536289027426852, "tps": 112930, "wall": 12528.0} {"step": 21588, "train_loss": 3.211712598800659, "lr": 0.0001153473024436535, "tps": 112892, "wall": 12532.7} {"step": 21589, "train_loss": 3.1869897842407227, "lr": 0.00011533171579854982, "tps": 112855, "wall": 12537.5} {"step": 21590, "train_loss": 3.340569019317627, "lr": 0.00011531613033913423, "tps": 112817, "wall": 12542.3} {"step": 21591, "train_loss": 3.2218074798583984, "lr": 0.00011530054606558312, "tps": 112779, "wall": 12547.0} {"step": 21592, "train_loss": 3.13671875, "lr": 0.00011528496297807306, "tps": 112742, "wall": 12551.8} {"step": 21593, "train_loss": 3.281947374343872, "lr": 0.00011526938107678064, "tps": 112704, "wall": 12556.5} {"step": 21594, "train_loss": 3.1789050102233887, "lr": 0.00011525380036188238, "tps": 112667, "wall": 12561.3} {"step": 21595, "train_loss": 3.1247642040252686, "lr": 0.00011523822083355465, "tps": 112629, "wall": 12566.1} {"step": 21596, "train_loss": 3.19893217086792, "lr": 0.0001152226424919741, "tps": 112592, "wall": 12570.9} {"step": 21597, "train_loss": 3.2706804275512695, "lr": 0.00011520706533731708, "tps": 112554, "wall": 12575.7} {"step": 21598, "train_loss": 3.2990758419036865, "lr": 0.00011519148936976008, "tps": 112516, "wall": 12580.5} {"step": 21599, "train_loss": 3.2366409301757812, "lr": 0.00011517591458947958, "tps": 112479, "wall": 12585.2} {"step": 21600, "train_loss": 3.268458843231201, "lr": 0.00011516034099665196, "tps": 112442, "wall": 12590.0} {"step": 21601, "train_loss": 3.2188708782196045, "lr": 0.00011514476859145371, "tps": 112404, "wall": 12594.7} {"step": 21602, "train_loss": 3.188566207885742, "lr": 0.0001151291973740612, "tps": 112367, "wall": 12599.5} {"step": 21603, "train_loss": 3.141937017440796, "lr": 0.00011511362734465079, "tps": 112330, "wall": 12604.2} {"step": 21604, "train_loss": 3.291520118713379, "lr": 0.0001150980585033989, "tps": 112293, "wall": 12609.0} {"step": 21605, "train_loss": 3.2528076171875, "lr": 0.00011508249085048189, "tps": 112256, "wall": 12613.7} {"step": 21606, "train_loss": 3.2484536170959473, "lr": 0.00011506692438607602, "tps": 112219, "wall": 12618.5} {"step": 21607, "train_loss": 3.2171213626861572, "lr": 0.00011505135911035778, "tps": 112181, "wall": 12623.3} {"step": 21608, "train_loss": 3.2806015014648438, "lr": 0.00011503579502350344, "tps": 112144, "wall": 12628.0} {"step": 21609, "train_loss": 3.1429319381713867, "lr": 0.00011502023212568921, "tps": 112107, "wall": 12632.8} {"step": 21610, "train_loss": 3.1653857231140137, "lr": 0.00011500467041709155, "tps": 112070, "wall": 12637.6} {"step": 21611, "train_loss": 3.2030396461486816, "lr": 0.00011498910989788667, "tps": 112033, "wall": 12642.3} {"step": 21612, "train_loss": 3.1450915336608887, "lr": 0.00011497355056825077, "tps": 111996, "wall": 12647.1} {"step": 21613, "train_loss": 3.2421727180480957, "lr": 0.00011495799242836019, "tps": 111959, "wall": 12651.9} {"step": 21614, "train_loss": 3.1935336589813232, "lr": 0.00011494243547839118, "tps": 111922, "wall": 12656.6} {"step": 21615, "train_loss": 3.2083487510681152, "lr": 0.0001149268797185199, "tps": 111885, "wall": 12661.4} {"step": 21616, "train_loss": 3.13814640045166, "lr": 0.00011491132514892266, "tps": 111848, "wall": 12666.1} {"step": 21617, "train_loss": 3.13362979888916, "lr": 0.00011489577176977561, "tps": 111811, "wall": 12670.9} {"step": 21618, "train_loss": 3.22403621673584, "lr": 0.0001148802195812549, "tps": 111775, "wall": 12675.6} {"step": 21619, "train_loss": 3.2764110565185547, "lr": 0.00011486466858353679, "tps": 111738, "wall": 12680.4} {"step": 21620, "train_loss": 3.331752061843872, "lr": 0.00011484911877679736, "tps": 111701, "wall": 12685.2} {"step": 21621, "train_loss": 3.163407802581787, "lr": 0.00011483357016121283, "tps": 111664, "wall": 12690.0} {"step": 21622, "train_loss": 3.169689178466797, "lr": 0.00011481802273695934, "tps": 111627, "wall": 12694.7} {"step": 21623, "train_loss": 3.1703603267669678, "lr": 0.0001148024765042129, "tps": 111590, "wall": 12699.5} {"step": 21624, "train_loss": 3.1112871170043945, "lr": 0.00011478693146314974, "tps": 111554, "wall": 12704.3} {"step": 21625, "train_loss": 3.207521915435791, "lr": 0.00011477138761394597, "tps": 111517, "wall": 12709.0} {"step": 21626, "train_loss": 3.10904598236084, "lr": 0.00011475584495677751, "tps": 111481, "wall": 12713.8} {"step": 21627, "train_loss": 3.2073445320129395, "lr": 0.00011474030349182059, "tps": 111444, "wall": 12718.5} {"step": 21628, "train_loss": 3.2149312496185303, "lr": 0.00011472476321925121, "tps": 111408, "wall": 12723.3} {"step": 21629, "train_loss": 3.227304697036743, "lr": 0.00011470922413924536, "tps": 111371, "wall": 12728.0} {"step": 21630, "train_loss": 3.1734399795532227, "lr": 0.00011469368625197919, "tps": 111335, "wall": 12732.8} {"step": 21631, "train_loss": 3.227693557739258, "lr": 0.00011467814955762859, "tps": 111298, "wall": 12737.5} {"step": 21632, "train_loss": 3.218263626098633, "lr": 0.00011466261405636958, "tps": 111262, "wall": 12742.3} {"step": 21633, "train_loss": 3.1456727981567383, "lr": 0.00011464707974837823, "tps": 111226, "wall": 12747.1} {"step": 21634, "train_loss": 3.1172285079956055, "lr": 0.00011463154663383049, "tps": 111189, "wall": 12751.8} {"step": 21635, "train_loss": 3.2258284091949463, "lr": 0.0001146160147129022, "tps": 111152, "wall": 12756.7} {"step": 21636, "train_loss": 3.0944087505340576, "lr": 0.00011460048398576945, "tps": 111116, "wall": 12761.4} {"step": 21637, "train_loss": 3.2436563968658447, "lr": 0.00011458495445260807, "tps": 111080, "wall": 12766.2} {"step": 21638, "train_loss": 3.1732847690582275, "lr": 0.0001145694261135941, "tps": 111044, "wall": 12770.9} {"step": 21639, "train_loss": 3.323867082595825, "lr": 0.00011455389896890336, "tps": 111007, "wall": 12775.7} {"step": 21640, "train_loss": 3.093038558959961, "lr": 0.00011453837301871168, "tps": 110971, "wall": 12780.4} {"step": 21641, "train_loss": 3.2675719261169434, "lr": 0.00011452284826319513, "tps": 110935, "wall": 12785.2} {"step": 21642, "train_loss": 3.0801422595977783, "lr": 0.00011450732470252941, "tps": 110899, "wall": 12789.9} {"step": 21643, "train_loss": 3.0957744121551514, "lr": 0.00011449180233689038, "tps": 110863, "wall": 12794.7} {"step": 21644, "train_loss": 3.204270839691162, "lr": 0.00011447628116645399, "tps": 110827, "wall": 12799.5} {"step": 21645, "train_loss": 3.1809310913085938, "lr": 0.00011446076119139596, "tps": 110791, "wall": 12804.2} {"step": 21646, "train_loss": 3.1210763454437256, "lr": 0.00011444524241189212, "tps": 110755, "wall": 12809.0} {"step": 21647, "train_loss": 3.1786065101623535, "lr": 0.00011442972482811831, "tps": 110718, "wall": 12813.7} {"step": 21648, "train_loss": 3.1288506984710693, "lr": 0.00011441420844025032, "tps": 110682, "wall": 12818.5} {"step": 21649, "train_loss": 3.2147560119628906, "lr": 0.00011439869324846384, "tps": 110646, "wall": 12823.3} {"step": 21650, "train_loss": 3.184391736984253, "lr": 0.00011438317925293469, "tps": 110610, "wall": 12828.1} {"step": 21651, "train_loss": 3.324977397918701, "lr": 0.00011436766645383863, "tps": 110574, "wall": 12832.8} {"step": 21652, "train_loss": 3.145591974258423, "lr": 0.00011435215485135127, "tps": 110539, "wall": 12837.5} {"step": 21653, "train_loss": 3.0883193016052246, "lr": 0.00011433664444564851, "tps": 110503, "wall": 12842.3} {"step": 21654, "train_loss": 3.229503631591797, "lr": 0.00011432113523690588, "tps": 110467, "wall": 12847.1} {"step": 21655, "train_loss": 3.1513442993164062, "lr": 0.00011430562722529923, "tps": 110431, "wall": 12851.8} {"step": 21656, "train_loss": 3.1800570487976074, "lr": 0.0001142901204110041, "tps": 110395, "wall": 12856.6} {"step": 21657, "train_loss": 3.164076805114746, "lr": 0.00011427461479419621, "tps": 110359, "wall": 12861.4} {"step": 21658, "train_loss": 3.2858128547668457, "lr": 0.00011425911037505121, "tps": 110324, "wall": 12866.1} {"step": 21659, "train_loss": 3.2008626461029053, "lr": 0.00011424360715374476, "tps": 110288, "wall": 12870.9} {"step": 21660, "train_loss": 3.1580491065979004, "lr": 0.00011422810513045239, "tps": 110252, "wall": 12875.7} {"step": 21661, "train_loss": 3.2147321701049805, "lr": 0.00011421260430534979, "tps": 110216, "wall": 12880.5} {"step": 21662, "train_loss": 3.217116594314575, "lr": 0.00011419710467861257, "tps": 110181, "wall": 12885.2} {"step": 21663, "train_loss": 3.160463809967041, "lr": 0.00011418160625041628, "tps": 110145, "wall": 12889.9} {"step": 21664, "train_loss": 3.126929521560669, "lr": 0.00011416610902093643, "tps": 110110, "wall": 12894.7} {"step": 21665, "train_loss": 3.172809362411499, "lr": 0.00011415061299034862, "tps": 110074, "wall": 12899.5} {"step": 21666, "train_loss": 3.226595163345337, "lr": 0.00011413511815882843, "tps": 110039, "wall": 12904.2} {"step": 21667, "train_loss": 3.271548271179199, "lr": 0.00011411962452655132, "tps": 110003, "wall": 12909.0} {"step": 21668, "train_loss": 3.2218785285949707, "lr": 0.0001141041320936928, "tps": 109968, "wall": 12913.7} {"step": 21669, "train_loss": 3.132389545440674, "lr": 0.00011408864086042845, "tps": 109932, "wall": 12918.5} {"step": 21670, "train_loss": 3.176575183868408, "lr": 0.00011407315082693371, "tps": 109897, "wall": 12923.2} {"step": 21671, "train_loss": 3.2942280769348145, "lr": 0.00011405766199338399, "tps": 109862, "wall": 12928.0} {"step": 21672, "train_loss": 3.2744197845458984, "lr": 0.00011404217435995486, "tps": 109826, "wall": 12932.7} {"step": 21673, "train_loss": 3.2855169773101807, "lr": 0.00011402668792682174, "tps": 109790, "wall": 12937.6} {"step": 21674, "train_loss": 3.3188107013702393, "lr": 0.00011401120269415991, "tps": 109755, "wall": 12942.3} {"step": 21675, "train_loss": 3.237579584121704, "lr": 0.00011399571866214502, "tps": 109720, "wall": 12947.1} {"step": 21676, "train_loss": 3.1561076641082764, "lr": 0.00011398023583095236, "tps": 109685, "wall": 12951.8} {"step": 21677, "train_loss": 3.23522686958313, "lr": 0.00011396475420075723, "tps": 109649, "wall": 12956.6} {"step": 21678, "train_loss": 3.09495210647583, "lr": 0.00011394927377173518, "tps": 109614, "wall": 12961.4} {"step": 21679, "train_loss": 3.2095065116882324, "lr": 0.00011393379454406145, "tps": 109579, "wall": 12966.1} {"step": 21680, "train_loss": 3.2081685066223145, "lr": 0.00011391831651791149, "tps": 109544, "wall": 12970.9} {"step": 21681, "train_loss": 3.258145332336426, "lr": 0.00011390283969346058, "tps": 109509, "wall": 12975.6} {"step": 21682, "train_loss": 3.2094006538391113, "lr": 0.00011388736407088396, "tps": 109474, "wall": 12980.4} {"step": 21683, "train_loss": 3.230562210083008, "lr": 0.0001138718896503571, "tps": 109439, "wall": 12985.1} {"step": 21684, "train_loss": 3.279057502746582, "lr": 0.00011385641643205522, "tps": 109404, "wall": 12989.9} {"step": 21685, "train_loss": 3.184018850326538, "lr": 0.00011384094441615351, "tps": 109369, "wall": 12994.6} {"step": 21686, "train_loss": 3.183178424835205, "lr": 0.00011382547360282742, "tps": 109333, "wall": 12999.4} {"step": 21687, "train_loss": 3.107896327972412, "lr": 0.0001138100039922521, "tps": 109298, "wall": 13004.2} {"step": 21688, "train_loss": 3.299330949783325, "lr": 0.00011379453558460271, "tps": 109263, "wall": 13009.0} {"step": 21689, "train_loss": 3.2302820682525635, "lr": 0.00011377906838005465, "tps": 109228, "wall": 13013.8} {"step": 21690, "train_loss": 3.3133907318115234, "lr": 0.00011376360237878305, "tps": 109193, "wall": 13018.5} {"step": 21691, "train_loss": 3.2594900131225586, "lr": 0.00011374813758096306, "tps": 109159, "wall": 13023.2} {"step": 21692, "train_loss": 3.3056650161743164, "lr": 0.00011373267398676996, "tps": 109124, "wall": 13028.0} {"step": 21693, "train_loss": 3.2781319618225098, "lr": 0.00011371721159637887, "tps": 109089, "wall": 13032.7} {"step": 21694, "train_loss": 3.181691884994507, "lr": 0.00011370175040996491, "tps": 109055, "wall": 13037.5} {"step": 21695, "train_loss": 3.265078067779541, "lr": 0.00011368629042770334, "tps": 109020, "wall": 13042.2} {"step": 21696, "train_loss": 3.295217752456665, "lr": 0.00011367083164976913, "tps": 108985, "wall": 13047.0} {"step": 21697, "train_loss": 3.1313905715942383, "lr": 0.0001136553740763376, "tps": 108950, "wall": 13051.8} {"step": 21698, "train_loss": 3.1858291625976562, "lr": 0.00011363991770758371, "tps": 108915, "wall": 13056.6} {"step": 21699, "train_loss": 3.245698928833008, "lr": 0.00011362446254368255, "tps": 108881, "wall": 13061.3} {"step": 21700, "train_loss": 3.2038397789001465, "lr": 0.00011360900858480926, "tps": 108846, "wall": 13066.1} {"step": 21701, "train_loss": 3.155790328979492, "lr": 0.00011359355583113891, "tps": 108812, "wall": 13070.8} {"step": 21702, "train_loss": 3.193037271499634, "lr": 0.00011357810428284641, "tps": 108777, "wall": 13075.6} {"step": 21703, "train_loss": 3.1800193786621094, "lr": 0.00011356265394010703, "tps": 108743, "wall": 13080.3} {"step": 21704, "train_loss": 3.2361979484558105, "lr": 0.00011354720480309561, "tps": 108708, "wall": 13085.1} {"step": 21705, "train_loss": 3.2226288318634033, "lr": 0.00011353175687198718, "tps": 108674, "wall": 13089.8} {"step": 21706, "train_loss": 3.11875057220459, "lr": 0.00011351631014695681, "tps": 108639, "wall": 13094.6} {"step": 21707, "train_loss": 3.2996063232421875, "lr": 0.00011350086462817943, "tps": 108605, "wall": 13099.3} {"step": 21708, "train_loss": 3.1797361373901367, "lr": 0.00011348542031582998, "tps": 108570, "wall": 13104.1} {"step": 21709, "train_loss": 3.1913440227508545, "lr": 0.00011346997721008352, "tps": 108536, "wall": 13108.8} {"step": 21710, "train_loss": 3.1805593967437744, "lr": 0.0001134545353111149, "tps": 108502, "wall": 13113.6} {"step": 21711, "train_loss": 3.253101348876953, "lr": 0.00011343909461909902, "tps": 108467, "wall": 13118.4} {"step": 21712, "train_loss": 3.24851131439209, "lr": 0.00011342365513421089, "tps": 108432, "wall": 13123.2} {"step": 21713, "train_loss": 3.198197603225708, "lr": 0.00011340821685662537, "tps": 108398, "wall": 13127.9} {"step": 21714, "train_loss": 3.2447257041931152, "lr": 0.00011339277978651727, "tps": 108364, "wall": 13132.7} {"step": 21715, "train_loss": 3.1394102573394775, "lr": 0.0001133773439240616, "tps": 108329, "wall": 13137.5} {"step": 21716, "train_loss": 3.213827133178711, "lr": 0.00011336190926943309, "tps": 108295, "wall": 13142.2} {"step": 21717, "train_loss": 3.3230478763580322, "lr": 0.00011334647582280666, "tps": 108261, "wall": 13147.0} {"step": 21718, "train_loss": 3.22469425201416, "lr": 0.00011333104358435718, "tps": 108227, "wall": 13151.7} {"step": 21719, "train_loss": 3.129373788833618, "lr": 0.00011331561255425929, "tps": 108193, "wall": 13156.5} {"step": 21720, "train_loss": 3.209552764892578, "lr": 0.000113300182732688, "tps": 108159, "wall": 13161.2} {"step": 21721, "train_loss": 3.1172218322753906, "lr": 0.00011328475411981803, "tps": 108124, "wall": 13166.0} {"step": 21722, "train_loss": 3.177797794342041, "lr": 0.00011326932671582406, "tps": 108090, "wall": 13170.8} {"step": 21723, "train_loss": 3.2704215049743652, "lr": 0.00011325390052088099, "tps": 108056, "wall": 13175.6} {"step": 21724, "train_loss": 3.213588237762451, "lr": 0.00011323847553516351, "tps": 108022, "wall": 13180.3} {"step": 21725, "train_loss": 3.213864803314209, "lr": 0.00011322305175884631, "tps": 107988, "wall": 13185.1} {"step": 21726, "train_loss": 3.1408426761627197, "lr": 0.00011320762919210417, "tps": 107954, "wall": 13189.8} {"step": 21727, "train_loss": 3.1986396312713623, "lr": 0.00011319220783511184, "tps": 107920, "wall": 13194.6} {"step": 21728, "train_loss": 3.1678264141082764, "lr": 0.00011317678768804388, "tps": 107886, "wall": 13199.3} {"step": 21729, "train_loss": 3.128048896789551, "lr": 0.00011316136875107511, "tps": 107852, "wall": 13204.1} {"step": 21730, "train_loss": 3.173299789428711, "lr": 0.00011314595102438013, "tps": 107818, "wall": 13208.9} {"step": 21731, "train_loss": 3.2513458728790283, "lr": 0.00011313053450813351, "tps": 107784, "wall": 13213.7} {"step": 21732, "train_loss": 3.247742176055908, "lr": 0.00011311511920251008, "tps": 107750, "wall": 13218.4} {"step": 21733, "train_loss": 3.2484352588653564, "lr": 0.00011309970510768429, "tps": 107716, "wall": 13223.2} {"step": 21734, "train_loss": 3.208085775375366, "lr": 0.00011308429222383088, "tps": 107683, "wall": 13227.9} {"step": 21735, "train_loss": 3.1975886821746826, "lr": 0.00011306888055112436, "tps": 107649, "wall": 13232.7} {"step": 21736, "train_loss": 3.212482213973999, "lr": 0.00011305347008973934, "tps": 107615, "wall": 13237.5} {"step": 21737, "train_loss": 3.18361759185791, "lr": 0.00011303806083985042, "tps": 107581, "wall": 13242.2} {"step": 21738, "train_loss": 3.13497257232666, "lr": 0.00011302265280163213, "tps": 107548, "wall": 13247.0} {"step": 21739, "train_loss": 3.1231606006622314, "lr": 0.000113007245975259, "tps": 107514, "wall": 13251.7} {"step": 21740, "train_loss": 3.2371833324432373, "lr": 0.0001129918403609056, "tps": 107480, "wall": 13256.5} {"step": 21741, "train_loss": 3.301037073135376, "lr": 0.00011297643595874645, "tps": 107447, "wall": 13261.3} {"step": 21742, "train_loss": 3.2547380924224854, "lr": 0.00011296103276895592, "tps": 107413, "wall": 13266.0} {"step": 21743, "train_loss": 3.215202808380127, "lr": 0.0001129456307917087, "tps": 107379, "wall": 13270.8} {"step": 21744, "train_loss": 3.2425007820129395, "lr": 0.00011293023002717915, "tps": 107346, "wall": 13275.5} {"step": 21745, "train_loss": 3.1532700061798096, "lr": 0.00011291483047554167, "tps": 107312, "wall": 13280.3} {"step": 21746, "train_loss": 3.2547643184661865, "lr": 0.00011289943213697085, "tps": 107279, "wall": 13285.1} {"step": 21747, "train_loss": 3.1777617931365967, "lr": 0.00011288403501164109, "tps": 107245, "wall": 13289.8} {"step": 21748, "train_loss": 3.20412540435791, "lr": 0.00011286863909972666, "tps": 107212, "wall": 13294.6} {"step": 21749, "train_loss": 3.1505517959594727, "lr": 0.00011285324440140219, "tps": 107178, "wall": 13299.4} {"step": 21750, "train_loss": 3.086996078491211, "lr": 0.00011283785091684189, "tps": 107145, "wall": 13304.1} {"step": 21751, "train_loss": 3.1828508377075195, "lr": 0.00011282245864622027, "tps": 107111, "wall": 13308.9} {"step": 21752, "train_loss": 3.178882598876953, "lr": 0.00011280706758971167, "tps": 107078, "wall": 13313.6} {"step": 21753, "train_loss": 3.1829419136047363, "lr": 0.00011279167774749029, "tps": 107045, "wall": 13318.4} {"step": 21754, "train_loss": 3.143266201019287, "lr": 0.00011277628911973069, "tps": 107011, "wall": 13323.1} {"step": 21755, "train_loss": 3.2194535732269287, "lr": 0.00011276090170660704, "tps": 106978, "wall": 13327.9} {"step": 21756, "train_loss": 3.2738728523254395, "lr": 0.00011274551550829366, "tps": 106945, "wall": 13332.7} {"step": 21757, "train_loss": 3.1263160705566406, "lr": 0.00011273013052496497, "tps": 106912, "wall": 13337.4} {"step": 21758, "train_loss": 3.2646234035491943, "lr": 0.00011271474675679515, "tps": 106878, "wall": 13342.2} {"step": 21759, "train_loss": 3.208447217941284, "lr": 0.00011269936420395839, "tps": 106845, "wall": 13347.0} {"step": 21760, "train_loss": 3.146717071533203, "lr": 0.00011268398286662911, "tps": 106812, "wall": 13351.7} {"step": 21761, "train_loss": 3.211503028869629, "lr": 0.0001126686027449815, "tps": 106778, "wall": 13356.5} {"step": 21762, "train_loss": 3.2266788482666016, "lr": 0.0001126532238391897, "tps": 106745, "wall": 13361.3} {"step": 21763, "train_loss": 3.075371026992798, "lr": 0.00011263784614942804, "tps": 106712, "wall": 13366.0} {"step": 21764, "train_loss": 3.1961827278137207, "lr": 0.00011262246967587067, "tps": 106679, "wall": 13370.8} {"step": 21765, "train_loss": 3.22434401512146, "lr": 0.00011260709441869171, "tps": 106646, "wall": 13375.5} {"step": 21766, "train_loss": 3.1978046894073486, "lr": 0.00011259172037806547, "tps": 106613, "wall": 13380.3} {"step": 21767, "train_loss": 3.2431154251098633, "lr": 0.00011257634755416599, "tps": 106580, "wall": 13385.1} {"step": 21768, "train_loss": 3.195584774017334, "lr": 0.00011256097594716743, "tps": 106547, "wall": 13389.8} {"step": 21769, "train_loss": 3.1913652420043945, "lr": 0.00011254560555724403, "tps": 106514, "wall": 13394.6} {"step": 21770, "train_loss": 3.1427550315856934, "lr": 0.00011253023638456972, "tps": 106481, "wall": 13399.3} {"step": 21771, "train_loss": 3.330336809158325, "lr": 0.00011251486842931877, "tps": 106449, "wall": 13404.1} {"step": 21772, "train_loss": 3.1234822273254395, "lr": 0.00011249950169166523, "tps": 106416, "wall": 13408.8} {"step": 21773, "train_loss": 3.1170594692230225, "lr": 0.00011248413617178307, "tps": 106383, "wall": 13413.6} {"step": 21774, "train_loss": 3.1564784049987793, "lr": 0.0001124687718698465, "tps": 106349, "wall": 13418.4} {"step": 21775, "train_loss": 3.121570110321045, "lr": 0.00011245340878602948, "tps": 106316, "wall": 13423.2} {"step": 21776, "train_loss": 3.138819694519043, "lr": 0.00011243804692050601, "tps": 106284, "wall": 13427.9} {"step": 21777, "train_loss": 3.230675220489502, "lr": 0.00011242268627345027, "tps": 106251, "wall": 13432.7} {"step": 21778, "train_loss": 3.2132411003112793, "lr": 0.00011240732684503613, "tps": 106218, "wall": 13437.5} {"step": 21779, "train_loss": 3.224519729614258, "lr": 0.00011239196863543755, "tps": 106185, "wall": 13442.2} {"step": 21780, "train_loss": 3.1070382595062256, "lr": 0.0001123766116448286, "tps": 106153, "wall": 13447.0} {"step": 21781, "train_loss": 3.240407943725586, "lr": 0.00011236125587338326, "tps": 106120, "wall": 13451.7} {"step": 21782, "train_loss": 3.270094871520996, "lr": 0.00011234590132127536, "tps": 106087, "wall": 13456.5} {"step": 21783, "train_loss": 3.081233501434326, "lr": 0.00011233054798867897, "tps": 106055, "wall": 13461.2} {"step": 21784, "train_loss": 3.257277011871338, "lr": 0.00011231519587576796, "tps": 106022, "wall": 13466.0} {"step": 21785, "train_loss": 3.267852306365967, "lr": 0.00011229984498271618, "tps": 105990, "wall": 13470.8} {"step": 21786, "train_loss": 3.3406615257263184, "lr": 0.00011228449530969762, "tps": 105956, "wall": 13475.6} {"step": 21787, "train_loss": 3.1565122604370117, "lr": 0.00011226914685688607, "tps": 105924, "wall": 13480.3} {"step": 21788, "train_loss": 3.3055927753448486, "lr": 0.00011225379962445557, "tps": 105892, "wall": 13485.1} {"step": 21789, "train_loss": 3.2606136798858643, "lr": 0.00011223845361257978, "tps": 105859, "wall": 13489.9} {"step": 21790, "train_loss": 3.1080968379974365, "lr": 0.00011222310882143259, "tps": 105826, "wall": 13494.6} {"step": 21791, "train_loss": 3.0779237747192383, "lr": 0.00011220776525118793, "tps": 105794, "wall": 13499.4} {"step": 21792, "train_loss": 3.2571043968200684, "lr": 0.00011219242290201953, "tps": 105762, "wall": 13504.1} {"step": 21793, "train_loss": 3.2645907402038574, "lr": 0.00011217708177410112, "tps": 105729, "wall": 13508.9} {"step": 21794, "train_loss": 3.214735507965088, "lr": 0.00011216174186760664, "tps": 105697, "wall": 13513.6} {"step": 21795, "train_loss": 3.1609115600585938, "lr": 0.00011214640318270977, "tps": 105665, "wall": 13518.4} {"step": 21796, "train_loss": 3.174514055252075, "lr": 0.00011213106571958421, "tps": 105632, "wall": 13523.1} {"step": 21797, "train_loss": 3.1396665573120117, "lr": 0.00011211572947840385, "tps": 105600, "wall": 13527.9} {"step": 21798, "train_loss": 3.1384024620056152, "lr": 0.00011210039445934235, "tps": 105568, "wall": 13532.7} {"step": 21799, "train_loss": 3.2080297470092773, "lr": 0.00011208506066257332, "tps": 105535, "wall": 13537.5} {"step": 21800, "train_loss": 3.2148525714874268, "lr": 0.00011206972808827068, "tps": 105503, "wall": 13542.2} {"step": 21801, "train_loss": 3.1801137924194336, "lr": 0.00011205439673660793, "tps": 105471, "wall": 13547.0} {"step": 21802, "train_loss": 3.1534643173217773, "lr": 0.00011203906660775881, "tps": 105438, "wall": 13551.7} {"step": 21803, "train_loss": 3.124593496322632, "lr": 0.00011202373770189703, "tps": 105406, "wall": 13556.5} {"step": 21804, "train_loss": 3.1735358238220215, "lr": 0.00011200841001919617, "tps": 105374, "wall": 13561.3} {"step": 21805, "train_loss": 3.3009228706359863, "lr": 0.00011199308355982983, "tps": 105342, "wall": 13566.0} {"step": 21806, "train_loss": 3.0908889770507812, "lr": 0.00011197775832397175, "tps": 105310, "wall": 13570.8} {"step": 21807, "train_loss": 3.24627947807312, "lr": 0.0001119624343117954, "tps": 105278, "wall": 13575.5} {"step": 21808, "train_loss": 3.0737340450286865, "lr": 0.0001119471115234745, "tps": 105246, "wall": 13580.3} {"step": 21809, "train_loss": 3.2466330528259277, "lr": 0.00011193178995918259, "tps": 105214, "wall": 13585.0} {"step": 21810, "train_loss": 3.220284938812256, "lr": 0.00011191646961909313, "tps": 105182, "wall": 13589.8} {"step": 21811, "train_loss": 3.1786131858825684, "lr": 0.00011190115050337979, "tps": 105150, "wall": 13594.5} {"step": 21812, "train_loss": 3.1941349506378174, "lr": 0.00011188583261221607, "tps": 105117, "wall": 13599.4} {"step": 21813, "train_loss": 3.2775638103485107, "lr": 0.00011187051594577547, "tps": 105085, "wall": 13604.1} {"step": 21814, "train_loss": 3.325282573699951, "lr": 0.00011185520050423152, "tps": 105054, "wall": 13608.9} {"step": 21815, "train_loss": 3.1078245639801025, "lr": 0.00011183988628775777, "tps": 105022, "wall": 13613.6} {"step": 21816, "train_loss": 3.235459089279175, "lr": 0.00011182457329652754, "tps": 104990, "wall": 13618.4} {"step": 21817, "train_loss": 3.1519181728363037, "lr": 0.00011180926153071447, "tps": 104958, "wall": 13623.1} {"step": 21818, "train_loss": 3.2221519947052, "lr": 0.00011179395099049195, "tps": 104926, "wall": 13627.9} {"step": 21819, "train_loss": 3.2206850051879883, "lr": 0.00011177864167603331, "tps": 104895, "wall": 13632.6} {"step": 21820, "train_loss": 3.1916418075561523, "lr": 0.00011176333358751217, "tps": 104863, "wall": 13637.4} {"step": 21821, "train_loss": 3.3199923038482666, "lr": 0.00011174802672510179, "tps": 104831, "wall": 13642.1} {"step": 21822, "train_loss": 3.225533962249756, "lr": 0.0001117327210889756, "tps": 104799, "wall": 13646.9} {"step": 21823, "train_loss": 3.234989643096924, "lr": 0.00011171741667930704, "tps": 104768, "wall": 13651.6} {"step": 21824, "train_loss": 3.1628973484039307, "lr": 0.0001117021134962694, "tps": 104736, "wall": 13656.4} {"step": 21825, "train_loss": 3.11337947845459, "lr": 0.00011168681154003615, "tps": 104704, "wall": 13661.2} {"step": 21826, "train_loss": 3.2124805450439453, "lr": 0.00011167151081078054, "tps": 104672, "wall": 13666.0} {"step": 21827, "train_loss": 3.20072603225708, "lr": 0.00011165621130867586, "tps": 104641, "wall": 13670.7} {"step": 21828, "train_loss": 3.168382167816162, "lr": 0.00011164091303389554, "tps": 104609, "wall": 13675.5} {"step": 21829, "train_loss": 3.260761022567749, "lr": 0.00011162561598661281, "tps": 104577, "wall": 13680.2} {"step": 21830, "train_loss": 3.2017853260040283, "lr": 0.0001116103201670009, "tps": 104546, "wall": 13685.0} {"step": 21831, "train_loss": 3.2192325592041016, "lr": 0.00011159502557523329, "tps": 104514, "wall": 13689.7} {"step": 21832, "train_loss": 3.238565444946289, "lr": 0.00011157973221148297, "tps": 104483, "wall": 13694.5} {"step": 21833, "train_loss": 3.1227827072143555, "lr": 0.00011156444007592335, "tps": 104452, "wall": 13699.2} {"step": 21834, "train_loss": 3.2221689224243164, "lr": 0.00011154914916872765, "tps": 104420, "wall": 13704.0} {"step": 21835, "train_loss": 3.2683372497558594, "lr": 0.00011153385949006896, "tps": 104389, "wall": 13708.7} {"step": 21836, "train_loss": 3.303711175918579, "lr": 0.00011151857104012066, "tps": 104357, "wall": 13713.5} {"step": 21837, "train_loss": 3.1995677947998047, "lr": 0.00011150328381905586, "tps": 104325, "wall": 13718.3} {"step": 21838, "train_loss": 3.2007365226745605, "lr": 0.00011148799782704766, "tps": 104294, "wall": 13723.1} {"step": 21839, "train_loss": 3.223196506500244, "lr": 0.00011147271306426934, "tps": 104263, "wall": 13727.8} {"step": 21840, "train_loss": 3.2150774002075195, "lr": 0.00011145742953089402, "tps": 104231, "wall": 13732.6} {"step": 21841, "train_loss": 3.1757729053497314, "lr": 0.00011144214722709474, "tps": 104200, "wall": 13737.4} {"step": 21842, "train_loss": 3.3644938468933105, "lr": 0.00011142686615304477, "tps": 104169, "wall": 13742.1} {"step": 21843, "train_loss": 3.1372663974761963, "lr": 0.00011141158630891709, "tps": 104137, "wall": 13746.9} {"step": 21844, "train_loss": 3.192690372467041, "lr": 0.0001113963076948848, "tps": 104106, "wall": 13751.6} {"step": 21845, "train_loss": 3.1687817573547363, "lr": 0.00011138103031112108, "tps": 104075, "wall": 13756.4} {"step": 21846, "train_loss": 3.2170462608337402, "lr": 0.0001113657541577989, "tps": 104044, "wall": 13761.1} {"step": 21847, "train_loss": 3.2162973880767822, "lr": 0.0001113504792350913, "tps": 104012, "wall": 13765.9} {"step": 21848, "train_loss": 3.204481840133667, "lr": 0.00011133520554317138, "tps": 103981, "wall": 13770.7} {"step": 21849, "train_loss": 3.2315053939819336, "lr": 0.00011131993308221212, "tps": 103949, "wall": 13775.5} {"step": 21850, "train_loss": 3.1732239723205566, "lr": 0.00011130466185238655, "tps": 103918, "wall": 13780.3} {"step": 21851, "train_loss": 3.1919384002685547, "lr": 0.00011128939185386767, "tps": 103887, "wall": 13785.0} {"step": 21852, "train_loss": 3.197938919067383, "lr": 0.00011127412308682836, "tps": 103856, "wall": 13789.8} {"step": 21853, "train_loss": 3.198556423187256, "lr": 0.00011125885555144173, "tps": 103825, "wall": 13794.6} {"step": 21854, "train_loss": 3.193311929702759, "lr": 0.00011124358924788069, "tps": 103794, "wall": 13799.3} {"step": 21855, "train_loss": 3.1695172786712646, "lr": 0.0001112283241763181, "tps": 103763, "wall": 13804.1} {"step": 21856, "train_loss": 3.187514543533325, "lr": 0.00011121306033692698, "tps": 103731, "wall": 13808.9} {"step": 21857, "train_loss": 3.1784303188323975, "lr": 0.0001111977977298802, "tps": 103701, "wall": 13813.6} {"step": 21858, "train_loss": 3.1650216579437256, "lr": 0.00011118253635535059, "tps": 103670, "wall": 13818.4} {"step": 21859, "train_loss": 3.1790432929992676, "lr": 0.00011116727621351116, "tps": 103639, "wall": 13823.1} {"step": 21860, "train_loss": 3.1638972759246826, "lr": 0.0001111520173045347, "tps": 103608, "wall": 13827.9} {"step": 21861, "train_loss": 3.241790533065796, "lr": 0.00011113675962859402, "tps": 103577, "wall": 13832.6} {"step": 21862, "train_loss": 3.25809907913208, "lr": 0.00011112150318586211, "tps": 103545, "wall": 13837.5} {"step": 21863, "train_loss": 3.0946719646453857, "lr": 0.00011110624797651168, "tps": 103514, "wall": 13842.2} {"step": 21864, "train_loss": 3.2069292068481445, "lr": 0.00011109099400071547, "tps": 103484, "wall": 13847.0} {"step": 21865, "train_loss": 3.1720101833343506, "lr": 0.00011107574125864645, "tps": 103453, "wall": 13851.7} {"step": 21866, "train_loss": 3.1759963035583496, "lr": 0.00011106048975047731, "tps": 103422, "wall": 13856.5} {"step": 21867, "train_loss": 3.2396459579467773, "lr": 0.00011104523947638086, "tps": 103391, "wall": 13861.3} {"step": 21868, "train_loss": 3.2776291370391846, "lr": 0.00011102999043652984, "tps": 103361, "wall": 13866.0} {"step": 21869, "train_loss": 3.146885871887207, "lr": 0.00011101474263109691, "tps": 103330, "wall": 13870.7} {"step": 21870, "train_loss": 3.1599786281585693, "lr": 0.00011099949606025495, "tps": 103299, "wall": 13875.5} {"step": 21871, "train_loss": 3.173191547393799, "lr": 0.00011098425072417658, "tps": 103269, "wall": 13880.3} {"step": 21872, "train_loss": 3.291832685470581, "lr": 0.00011096900662303444, "tps": 103238, "wall": 13885.0} {"step": 21873, "train_loss": 3.1635921001434326, "lr": 0.00011095376375700139, "tps": 103207, "wall": 13889.8} {"step": 21874, "train_loss": 3.219998359680176, "lr": 0.00011093852212625, "tps": 103177, "wall": 13894.6} {"step": 21875, "train_loss": 3.1948611736297607, "lr": 0.00011092328173095285, "tps": 103145, "wall": 13899.4} {"step": 21876, "train_loss": 3.1512250900268555, "lr": 0.00011090804257128274, "tps": 103115, "wall": 13904.1} {"step": 21877, "train_loss": 3.1398768424987793, "lr": 0.00011089280464741221, "tps": 103084, "wall": 13908.9} {"step": 21878, "train_loss": 3.210358142852783, "lr": 0.00011087756795951383, "tps": 103054, "wall": 13913.6} {"step": 21879, "train_loss": 3.2940971851348877, "lr": 0.00011086233250776032, "tps": 103023, "wall": 13918.4} {"step": 21880, "train_loss": 3.1530957221984863, "lr": 0.00011084709829232425, "tps": 102993, "wall": 13923.2} {"step": 21881, "train_loss": 3.1884851455688477, "lr": 0.00011083186531337806, "tps": 102962, "wall": 13927.9} {"step": 21882, "train_loss": 3.3579940795898438, "lr": 0.00011081663357109446, "tps": 102932, "wall": 13932.7} {"step": 21883, "train_loss": 3.2461097240448, "lr": 0.00011080140306564591, "tps": 102902, "wall": 13937.4} {"step": 21884, "train_loss": 3.2427005767822266, "lr": 0.00011078617379720504, "tps": 102871, "wall": 13942.2} {"step": 21885, "train_loss": 3.207075595855713, "lr": 0.00011077094576594426, "tps": 102841, "wall": 13946.9} {"step": 21886, "train_loss": 3.1820662021636963, "lr": 0.00011075571897203609, "tps": 102811, "wall": 13951.7} {"step": 21887, "train_loss": 3.1947855949401855, "lr": 0.00011074049341565312, "tps": 102780, "wall": 13956.5} {"step": 21888, "train_loss": 3.2254815101623535, "lr": 0.0001107252690969677, "tps": 102750, "wall": 13961.2} {"step": 21889, "train_loss": 3.249760150909424, "lr": 0.00011071004601615232, "tps": 102719, "wall": 13966.0} {"step": 21890, "train_loss": 3.14284610748291, "lr": 0.00011069482417337948, "tps": 102689, "wall": 13970.8} {"step": 21891, "train_loss": 3.1707229614257812, "lr": 0.0001106796035688216, "tps": 102659, "wall": 13975.5} {"step": 21892, "train_loss": 3.2702319622039795, "lr": 0.00011066438420265104, "tps": 102628, "wall": 13980.3} {"step": 21893, "train_loss": 3.251042366027832, "lr": 0.00011064916607504031, "tps": 102598, "wall": 13985.0} {"step": 21894, "train_loss": 3.225119113922119, "lr": 0.00011063394918616174, "tps": 102568, "wall": 13989.8} {"step": 21895, "train_loss": 3.1114535331726074, "lr": 0.00011061873353618763, "tps": 102538, "wall": 13994.6} {"step": 21896, "train_loss": 3.1739535331726074, "lr": 0.0001106035191252905, "tps": 102507, "wall": 13999.3} {"step": 21897, "train_loss": 3.214215040206909, "lr": 0.00011058830595364261, "tps": 102477, "wall": 14004.1} {"step": 21898, "train_loss": 3.257922649383545, "lr": 0.00011057309402141626, "tps": 102447, "wall": 14008.9} {"step": 21899, "train_loss": 3.1720588207244873, "lr": 0.00011055788332878389, "tps": 102417, "wall": 14013.6} {"step": 21900, "train_loss": 3.280646324157715, "lr": 0.00011054267387591774, "tps": 102386, "wall": 14018.5} {"step": 21901, "train_loss": 3.2096986770629883, "lr": 0.00011052746566299004, "tps": 102356, "wall": 14023.2} {"step": 21902, "train_loss": 3.2338507175445557, "lr": 0.00011051225869017317, "tps": 102326, "wall": 14028.0} {"step": 21903, "train_loss": 3.2033655643463135, "lr": 0.00011049705295763933, "tps": 102296, "wall": 14032.8} {"step": 21904, "train_loss": 3.2424156665802, "lr": 0.0001104818484655608, "tps": 102266, "wall": 14037.5} {"step": 21905, "train_loss": 3.183769464492798, "lr": 0.00011046664521410988, "tps": 102236, "wall": 14042.3} {"step": 21906, "train_loss": 3.1556906700134277, "lr": 0.00011045144320345864, "tps": 102206, "wall": 14047.1} {"step": 21907, "train_loss": 3.2311336994171143, "lr": 0.00011043624243377943, "tps": 102176, "wall": 14051.8} {"step": 21908, "train_loss": 3.1947004795074463, "lr": 0.0001104210429052444, "tps": 102146, "wall": 14056.6} {"step": 21909, "train_loss": 3.091714382171631, "lr": 0.00011040584461802565, "tps": 102116, "wall": 14061.4} {"step": 21910, "train_loss": 3.2964231967926025, "lr": 0.00011039064757229552, "tps": 102086, "wall": 14066.1} {"step": 21911, "train_loss": 3.1303021907806396, "lr": 0.00011037545176822606, "tps": 102056, "wall": 14070.9} {"step": 21912, "train_loss": 3.168779134750366, "lr": 0.0001103602572059893, "tps": 102025, "wall": 14075.8} {"step": 21913, "train_loss": 3.3738765716552734, "lr": 0.00011034506388575758, "tps": 101995, "wall": 14080.5} {"step": 21914, "train_loss": 3.1661510467529297, "lr": 0.00011032987180770291, "tps": 101966, "wall": 14085.3} {"step": 21915, "train_loss": 3.150895118713379, "lr": 0.00011031468097199731, "tps": 101936, "wall": 14090.1} {"step": 21916, "train_loss": 3.16791033744812, "lr": 0.00011029949137881299, "tps": 101906, "wall": 14094.8} {"step": 21917, "train_loss": 3.244349241256714, "lr": 0.000110284303028322, "tps": 101876, "wall": 14099.6} {"step": 21918, "train_loss": 3.2099385261535645, "lr": 0.00011026911592069627, "tps": 101846, "wall": 14104.4} {"step": 21919, "train_loss": 3.136436939239502, "lr": 0.00011025393005610802, "tps": 101816, "wall": 14109.1} {"step": 21920, "train_loss": 3.1707100868225098, "lr": 0.00011023874543472912, "tps": 101787, "wall": 14113.9} {"step": 21921, "train_loss": 3.106839418411255, "lr": 0.00011022356205673167, "tps": 101757, "wall": 14118.7} {"step": 21922, "train_loss": 3.2934799194335938, "lr": 0.0001102083799222877, "tps": 101727, "wall": 14123.5} {"step": 21923, "train_loss": 3.1983773708343506, "lr": 0.00011019319903156904, "tps": 101697, "wall": 14128.3} {"step": 21924, "train_loss": 3.247040271759033, "lr": 0.00011017801938474785, "tps": 101667, "wall": 14133.1} {"step": 21925, "train_loss": 3.1029138565063477, "lr": 0.00011016284098199599, "tps": 101637, "wall": 14137.9} {"step": 21926, "train_loss": 3.246509075164795, "lr": 0.00011014766382348533, "tps": 101608, "wall": 14142.6} {"step": 21927, "train_loss": 3.2165589332580566, "lr": 0.00011013248790938795, "tps": 101578, "wall": 14147.4} {"step": 21928, "train_loss": 3.203449010848999, "lr": 0.0001101173132398757, "tps": 101548, "wall": 14152.2} {"step": 21929, "train_loss": 3.294983386993408, "lr": 0.0001101021398151204, "tps": 101519, "wall": 14156.9} {"step": 21930, "train_loss": 3.228532314300537, "lr": 0.00011008696763529409, "tps": 101489, "wall": 14161.7} {"step": 21931, "train_loss": 3.223482847213745, "lr": 0.00011007179670056852, "tps": 101460, "wall": 14166.5} {"step": 21932, "train_loss": 3.187875747680664, "lr": 0.00011005662701111555, "tps": 101430, "wall": 14171.3} {"step": 21933, "train_loss": 3.2376697063446045, "lr": 0.0001100414585671071, "tps": 101400, "wall": 14176.1} {"step": 21934, "train_loss": 3.216228723526001, "lr": 0.00011002629136871498, "tps": 101371, "wall": 14180.9} {"step": 21935, "train_loss": 3.1148853302001953, "lr": 0.00011001112541611091, "tps": 101341, "wall": 14185.6} {"step": 21936, "train_loss": 3.1561529636383057, "lr": 0.00010999596070946683, "tps": 101312, "wall": 14190.4} {"step": 21937, "train_loss": 3.174896240234375, "lr": 0.00010998079724895435, "tps": 101281, "wall": 14195.3} {"step": 21938, "train_loss": 3.185528516769409, "lr": 0.00010996563503474549, "tps": 101252, "wall": 14200.1} {"step": 21939, "train_loss": 3.185380458831787, "lr": 0.0001099504740670118, "tps": 101223, "wall": 14204.9} {"step": 21940, "train_loss": 3.234919548034668, "lr": 0.00010993531434592506, "tps": 101193, "wall": 14209.6} {"step": 21941, "train_loss": 3.189267873764038, "lr": 0.0001099201558716571, "tps": 101164, "wall": 14214.4} {"step": 21942, "train_loss": 3.179884433746338, "lr": 0.00010990499864437955, "tps": 101134, "wall": 14219.2} {"step": 21943, "train_loss": 3.162975311279297, "lr": 0.0001098898426642641, "tps": 101105, "wall": 14224.0} {"step": 21944, "train_loss": 3.2418341636657715, "lr": 0.00010987468793148252, "tps": 101075, "wall": 14228.8} {"step": 21945, "train_loss": 3.169767141342163, "lr": 0.0001098595344462064, "tps": 101046, "wall": 14233.6} {"step": 21946, "train_loss": 3.2694106101989746, "lr": 0.00010984438220860742, "tps": 101016, "wall": 14238.4} {"step": 21947, "train_loss": 3.1965014934539795, "lr": 0.00010982923121885726, "tps": 100987, "wall": 14243.2} {"step": 21948, "train_loss": 3.1218414306640625, "lr": 0.00010981408147712755, "tps": 100958, "wall": 14248.0} {"step": 21949, "train_loss": 3.210394859313965, "lr": 0.00010979893298358983, "tps": 100928, "wall": 14252.8} {"step": 21950, "train_loss": 3.204429864883423, "lr": 0.00010978378573841581, "tps": 100899, "wall": 14257.6} {"step": 21951, "train_loss": 3.1831276416778564, "lr": 0.00010976863974177702, "tps": 100869, "wall": 14262.4} {"step": 21952, "train_loss": 3.2164359092712402, "lr": 0.000109753494993845, "tps": 100840, "wall": 14267.2} {"step": 21953, "train_loss": 3.2166900634765625, "lr": 0.00010973835149479139, "tps": 100811, "wall": 14272.0} {"step": 21954, "train_loss": 3.231135845184326, "lr": 0.00010972320924478772, "tps": 100781, "wall": 14276.8} {"step": 21955, "train_loss": 3.1593170166015625, "lr": 0.00010970806824400543, "tps": 100752, "wall": 14281.6} {"step": 21956, "train_loss": 3.1884069442749023, "lr": 0.00010969292849261616, "tps": 100723, "wall": 14286.4} {"step": 21957, "train_loss": 3.1477913856506348, "lr": 0.00010967778999079133, "tps": 100693, "wall": 14291.2} {"step": 21958, "train_loss": 3.186981201171875, "lr": 0.00010966265273870251, "tps": 100664, "wall": 14296.0} {"step": 21959, "train_loss": 3.255169630050659, "lr": 0.00010964751673652111, "tps": 100635, "wall": 14300.8} {"step": 21960, "train_loss": 3.2276382446289062, "lr": 0.00010963238198441858, "tps": 100606, "wall": 14305.7} {"step": 21961, "train_loss": 3.318863868713379, "lr": 0.00010961724848256645, "tps": 100576, "wall": 14310.5} {"step": 21962, "train_loss": 3.2011523246765137, "lr": 0.00010960211623113612, "tps": 100546, "wall": 14315.4} {"step": 21963, "train_loss": 3.1571080684661865, "lr": 0.00010958698523029889, "tps": 100517, "wall": 14320.2} {"step": 21964, "train_loss": 3.240126132965088, "lr": 0.00010957185548022634, "tps": 100488, "wall": 14325.0} {"step": 21965, "train_loss": 3.213809013366699, "lr": 0.00010955672698108977, "tps": 100458, "wall": 14329.9} {"step": 21966, "train_loss": 3.190131187438965, "lr": 0.00010954159973306052, "tps": 100429, "wall": 14334.8} {"step": 21967, "train_loss": 3.1617274284362793, "lr": 0.0001095264737363101, "tps": 100399, "wall": 14339.6} {"step": 21968, "train_loss": 3.2065882682800293, "lr": 0.00010951134899100972, "tps": 100370, "wall": 14344.5} {"step": 21969, "train_loss": 3.1148128509521484, "lr": 0.00010949622549733071, "tps": 100341, "wall": 14349.3} {"step": 21970, "train_loss": 3.20645809173584, "lr": 0.00010948110325544452, "tps": 100312, "wall": 14354.1} {"step": 21971, "train_loss": 3.206041097640991, "lr": 0.00010946598226552233, "tps": 100282, "wall": 14359.0} {"step": 21972, "train_loss": 3.348024606704712, "lr": 0.00010945086252773542, "tps": 100253, "wall": 14363.8} {"step": 21973, "train_loss": 3.0792784690856934, "lr": 0.0001094357440422552, "tps": 100224, "wall": 14368.7} {"step": 21974, "train_loss": 3.1927998065948486, "lr": 0.00010942062680925278, "tps": 100194, "wall": 14373.6} {"step": 21975, "train_loss": 3.3315021991729736, "lr": 0.00010940551082889957, "tps": 100164, "wall": 14378.5} {"step": 21976, "train_loss": 3.159318208694458, "lr": 0.00010939039610136665, "tps": 100135, "wall": 14383.3} {"step": 21977, "train_loss": 3.2353720664978027, "lr": 0.0001093752826268253, "tps": 100106, "wall": 14388.2} {"step": 21978, "train_loss": 3.146134376525879, "lr": 0.00010936017040544679, "tps": 100077, "wall": 14393.1} {"step": 21979, "train_loss": 3.1026723384857178, "lr": 0.00010934505943740223, "tps": 100047, "wall": 14397.9} {"step": 21980, "train_loss": 3.212472915649414, "lr": 0.0001093299497228628, "tps": 100018, "wall": 14402.8} {"step": 21981, "train_loss": 3.2714154720306396, "lr": 0.00010931484126199971, "tps": 99989, "wall": 14407.7} {"step": 21982, "train_loss": 3.275067090988159, "lr": 0.00010929973405498413, "tps": 99960, "wall": 14412.5} {"step": 21983, "train_loss": 3.1745197772979736, "lr": 0.00010928462810198705, "tps": 99930, "wall": 14417.4} {"step": 21984, "train_loss": 3.187272787094116, "lr": 0.00010926952340317975, "tps": 99901, "wall": 14422.3} {"step": 21985, "train_loss": 3.177610397338867, "lr": 0.00010925441995873331, "tps": 99872, "wall": 14427.1} {"step": 21986, "train_loss": 3.3017635345458984, "lr": 0.00010923931776881871, "tps": 99843, "wall": 14432.0} {"step": 21987, "train_loss": 3.2078163623809814, "lr": 0.00010922421683360719, "tps": 99813, "wall": 14437.0} {"step": 21988, "train_loss": 3.2206859588623047, "lr": 0.00010920911715326974, "tps": 99784, "wall": 14441.9} {"step": 21989, "train_loss": 3.2101328372955322, "lr": 0.00010919401872797732, "tps": 99754, "wall": 14446.8} {"step": 21990, "train_loss": 3.1772468090057373, "lr": 0.00010917892155790111, "tps": 99725, "wall": 14451.7} {"step": 21991, "train_loss": 3.23974609375, "lr": 0.00010916382564321201, "tps": 99696, "wall": 14456.5} {"step": 21992, "train_loss": 3.2750296592712402, "lr": 0.00010914873098408116, "tps": 99667, "wall": 14461.4} {"step": 21993, "train_loss": 3.253086566925049, "lr": 0.0001091336375806795, "tps": 99638, "wall": 14466.3} {"step": 21994, "train_loss": 3.157102584838867, "lr": 0.00010911854543317788, "tps": 99609, "wall": 14471.2} {"step": 21995, "train_loss": 3.1836190223693848, "lr": 0.00010910345454174749, "tps": 99579, "wall": 14476.1} {"step": 21996, "train_loss": 3.1338062286376953, "lr": 0.00010908836490655914, "tps": 99550, "wall": 14481.0} {"step": 21997, "train_loss": 3.1175851821899414, "lr": 0.00010907327652778372, "tps": 99521, "wall": 14485.9} {"step": 21998, "train_loss": 3.127202272415161, "lr": 0.00010905818940559231, "tps": 99492, "wall": 14490.8} {"step": 21999, "train_loss": 3.1974589824676514, "lr": 0.0001090431035401557, "tps": 99462, "wall": 14495.8} {"step": 22000, "train_loss": 3.2438387870788574, "lr": 0.00010902801893164487, "tps": 99433, "wall": 14500.7, "val_loss_monitor": 3.3619413339249795} {"step": 22001, "train_loss": 3.300522804260254, "lr": 0.0001090129355802306, "tps": 99079, "wall": 14553.2} {"step": 22002, "train_loss": 3.2761070728302, "lr": 0.00010899785348608378, "tps": 99050, "wall": 14558.2} {"step": 22003, "train_loss": 3.2131848335266113, "lr": 0.00010898277264937531, "tps": 99021, "wall": 14563.1} {"step": 22004, "train_loss": 3.130627393722534, "lr": 0.00010896769307027602, "tps": 98992, "wall": 14568.0} {"step": 22005, "train_loss": 3.2453386783599854, "lr": 0.00010895261474895661, "tps": 98963, "wall": 14572.9} {"step": 22006, "train_loss": 3.244734764099121, "lr": 0.00010893753768558807, "tps": 98934, "wall": 14577.8} {"step": 22007, "train_loss": 3.3369102478027344, "lr": 0.0001089224618803411, "tps": 98905, "wall": 14582.7} {"step": 22008, "train_loss": 3.179591655731201, "lr": 0.00010890738733338644, "tps": 98876, "wall": 14587.7} {"step": 22009, "train_loss": 3.3430769443511963, "lr": 0.00010889231404489497, "tps": 98848, "wall": 14592.6} {"step": 22010, "train_loss": 3.250434637069702, "lr": 0.00010887724201503737, "tps": 98819, "wall": 14597.5} {"step": 22011, "train_loss": 3.222019672393799, "lr": 0.00010886217124398434, "tps": 98790, "wall": 14602.4} {"step": 22012, "train_loss": 3.2079529762268066, "lr": 0.00010884710173190668, "tps": 98761, "wall": 14607.3} {"step": 22013, "train_loss": 3.282028913497925, "lr": 0.0001088320334789751, "tps": 98732, "wall": 14612.2} {"step": 22014, "train_loss": 3.239337921142578, "lr": 0.00010881696648536018, "tps": 98703, "wall": 14617.2} {"step": 22015, "train_loss": 3.2606306076049805, "lr": 0.00010880190075123273, "tps": 98675, "wall": 14622.1} {"step": 22016, "train_loss": 3.234586000442505, "lr": 0.00010878683627676332, "tps": 98646, "wall": 14627.0} {"step": 22017, "train_loss": 3.2920925617218018, "lr": 0.00010877177306212269, "tps": 98617, "wall": 14632.0} {"step": 22018, "train_loss": 3.3150906562805176, "lr": 0.00010875671110748145, "tps": 98589, "wall": 14636.9} {"step": 22019, "train_loss": 3.270568370819092, "lr": 0.00010874165041301015, "tps": 98560, "wall": 14641.8} {"step": 22020, "train_loss": 3.247408866882324, "lr": 0.0001087265909788795, "tps": 98531, "wall": 14646.7} {"step": 22021, "train_loss": 3.3931286334991455, "lr": 0.00010871153280526, "tps": 98503, "wall": 14651.6} {"step": 22022, "train_loss": 3.3658881187438965, "lr": 0.00010869647589232228, "tps": 98474, "wall": 14656.6} {"step": 22023, "train_loss": 3.247422218322754, "lr": 0.00010868142024023695, "tps": 98446, "wall": 14661.5} {"step": 22024, "train_loss": 3.3021860122680664, "lr": 0.00010866636584917452, "tps": 98417, "wall": 14666.4} {"step": 22025, "train_loss": 3.2482223510742188, "lr": 0.00010865131271930545, "tps": 98388, "wall": 14671.3} {"step": 22026, "train_loss": 3.277570962905884, "lr": 0.00010863626085080039, "tps": 98359, "wall": 14676.3} {"step": 22027, "train_loss": 3.307264804840088, "lr": 0.00010862121024382978, "tps": 98331, "wall": 14681.3} {"step": 22028, "train_loss": 3.251126766204834, "lr": 0.00010860616089856411, "tps": 98302, "wall": 14686.2} {"step": 22029, "train_loss": 3.1375322341918945, "lr": 0.00010859111281517389, "tps": 98274, "wall": 14691.1} {"step": 22030, "train_loss": 3.2036292552948, "lr": 0.0001085760659938296, "tps": 98246, "wall": 14696.0} {"step": 22031, "train_loss": 3.2876834869384766, "lr": 0.00010856102043470157, "tps": 98217, "wall": 14700.9} {"step": 22032, "train_loss": 3.2555794715881348, "lr": 0.0001085459761379604, "tps": 98189, "wall": 14705.9} {"step": 22033, "train_loss": 3.254798173904419, "lr": 0.00010853093310377645, "tps": 98160, "wall": 14710.8} {"step": 22034, "train_loss": 3.3851213455200195, "lr": 0.00010851589133232007, "tps": 98132, "wall": 14715.7} {"step": 22035, "train_loss": 3.3103580474853516, "lr": 0.00010850085082376175, "tps": 98104, "wall": 14720.6} {"step": 22036, "train_loss": 3.2581965923309326, "lr": 0.00010848581157827178, "tps": 98075, "wall": 14725.5} {"step": 22037, "train_loss": 3.250831127166748, "lr": 0.0001084707735960206, "tps": 98047, "wall": 14730.5} {"step": 22038, "train_loss": 3.262296199798584, "lr": 0.00010845573687717854, "tps": 98018, "wall": 14735.5} {"step": 22039, "train_loss": 3.233534574508667, "lr": 0.0001084407014219159, "tps": 97990, "wall": 14740.4} {"step": 22040, "train_loss": 3.3524889945983887, "lr": 0.00010842566723040306, "tps": 97962, "wall": 14745.3} {"step": 22041, "train_loss": 3.3644824028015137, "lr": 0.00010841063430281028, "tps": 97933, "wall": 14750.2} {"step": 22042, "train_loss": 3.3365163803100586, "lr": 0.00010839560263930786, "tps": 97905, "wall": 14755.1} {"step": 22043, "train_loss": 3.2766332626342773, "lr": 0.0001083805722400661, "tps": 97877, "wall": 14760.0} {"step": 22044, "train_loss": 3.3301548957824707, "lr": 0.00010836554310525529, "tps": 97849, "wall": 14765.0} {"step": 22045, "train_loss": 3.2873501777648926, "lr": 0.0001083505152350456, "tps": 97820, "wall": 14769.9} {"step": 22046, "train_loss": 3.171016216278076, "lr": 0.00010833548862960734, "tps": 97792, "wall": 14774.8} {"step": 22047, "train_loss": 3.2161412239074707, "lr": 0.00010832046328911072, "tps": 97764, "wall": 14779.8} {"step": 22048, "train_loss": 3.3285720348358154, "lr": 0.00010830543921372584, "tps": 97736, "wall": 14784.7} {"step": 22049, "train_loss": 3.2456064224243164, "lr": 0.0001082904164036231, "tps": 97708, "wall": 14789.6} {"step": 22050, "train_loss": 3.2650506496429443, "lr": 0.00010827539485897253, "tps": 97680, "wall": 14794.5} {"step": 22051, "train_loss": 3.3277885913848877, "lr": 0.00010826037457994429, "tps": 97651, "wall": 14799.5} {"step": 22052, "train_loss": 3.2077057361602783, "lr": 0.00010824535556670865, "tps": 97623, "wall": 14804.5} {"step": 22053, "train_loss": 3.2994065284729004, "lr": 0.00010823033781943559, "tps": 97595, "wall": 14809.4} {"step": 22054, "train_loss": 3.3644728660583496, "lr": 0.00010821532133829535, "tps": 97567, "wall": 14814.3} {"step": 22055, "train_loss": 3.241414785385132, "lr": 0.00010820030612345802, "tps": 97539, "wall": 14819.2} {"step": 22056, "train_loss": 3.263823986053467, "lr": 0.00010818529217509362, "tps": 97511, "wall": 14824.1} {"step": 22057, "train_loss": 3.2483248710632324, "lr": 0.00010817027949337231, "tps": 97483, "wall": 14829.1} {"step": 22058, "train_loss": 3.262413740158081, "lr": 0.00010815526807846414, "tps": 97455, "wall": 14834.0} {"step": 22059, "train_loss": 3.3953468799591064, "lr": 0.00010814025793053906, "tps": 97427, "wall": 14838.9} {"step": 22060, "train_loss": 3.232074022293091, "lr": 0.00010812524904976729, "tps": 97399, "wall": 14843.8} {"step": 22061, "train_loss": 3.2690181732177734, "lr": 0.00010811024143631874, "tps": 97371, "wall": 14848.8} {"step": 22062, "train_loss": 3.3083906173706055, "lr": 0.00010809523509036333, "tps": 97344, "wall": 14853.7} {"step": 22063, "train_loss": 3.3251681327819824, "lr": 0.00010808023001207123, "tps": 97315, "wall": 14858.7} {"step": 22064, "train_loss": 3.2181477546691895, "lr": 0.00010806522620161236, "tps": 97287, "wall": 14863.7} {"step": 22065, "train_loss": 3.2710657119750977, "lr": 0.00010805022365915661, "tps": 97260, "wall": 14868.6} {"step": 22066, "train_loss": 3.234271764755249, "lr": 0.000108035222384874, "tps": 97232, "wall": 14873.5} {"step": 22067, "train_loss": 3.2971079349517822, "lr": 0.00010802022237893448, "tps": 97204, "wall": 14878.4} {"step": 22068, "train_loss": 3.3773298263549805, "lr": 0.00010800522364150787, "tps": 97176, "wall": 14883.4} {"step": 22069, "train_loss": 3.2452950477600098, "lr": 0.00010799022617276422, "tps": 97148, "wall": 14888.3} {"step": 22070, "train_loss": 3.2197813987731934, "lr": 0.00010797522997287326, "tps": 97121, "wall": 14893.2} {"step": 22071, "train_loss": 3.2866270542144775, "lr": 0.00010796023504200503, "tps": 97093, "wall": 14898.1} {"step": 22072, "train_loss": 3.392150402069092, "lr": 0.00010794524138032934, "tps": 97065, "wall": 14903.1} {"step": 22073, "train_loss": 3.290693759918213, "lr": 0.00010793024898801592, "tps": 97037, "wall": 14908.0} {"step": 22074, "train_loss": 3.2053451538085938, "lr": 0.00010791525786523478, "tps": 97010, "wall": 14912.9} {"step": 22075, "train_loss": 3.2018680572509766, "lr": 0.00010790026801215565, "tps": 96982, "wall": 14917.9} {"step": 22076, "train_loss": 3.340517520904541, "lr": 0.00010788527942894831, "tps": 96954, "wall": 14922.8} {"step": 22077, "train_loss": 3.2608907222747803, "lr": 0.00010787029211578264, "tps": 96927, "wall": 14927.8} {"step": 22078, "train_loss": 3.3067049980163574, "lr": 0.00010785530607282837, "tps": 96899, "wall": 14932.7} {"step": 22079, "train_loss": 3.321134328842163, "lr": 0.00010784032130025518, "tps": 96871, "wall": 14937.6} {"step": 22080, "train_loss": 3.2249932289123535, "lr": 0.00010782533779823298, "tps": 96844, "wall": 14942.5} {"step": 22081, "train_loss": 3.241532325744629, "lr": 0.00010781035556693142, "tps": 96816, "wall": 14947.5} {"step": 22082, "train_loss": 3.357980728149414, "lr": 0.00010779537460652015, "tps": 96789, "wall": 14952.4} {"step": 22083, "train_loss": 3.267833709716797, "lr": 0.00010778039491716905, "tps": 96761, "wall": 14957.4} {"step": 22084, "train_loss": 3.222416400909424, "lr": 0.00010776541649904766, "tps": 96733, "wall": 14962.3} {"step": 22085, "train_loss": 3.38930606842041, "lr": 0.00010775043935232566, "tps": 96706, "wall": 14967.3} {"step": 22086, "train_loss": 3.1887638568878174, "lr": 0.00010773546347717278, "tps": 96678, "wall": 14972.2} {"step": 22087, "train_loss": 3.3016903400421143, "lr": 0.00010772048887375867, "tps": 96650, "wall": 14977.2} {"step": 22088, "train_loss": 3.340055465698242, "lr": 0.0001077055155422529, "tps": 96623, "wall": 14982.1} {"step": 22089, "train_loss": 3.2955873012542725, "lr": 0.00010769054348282517, "tps": 96596, "wall": 14987.0} {"step": 22090, "train_loss": 3.213601589202881, "lr": 0.00010767557269564499, "tps": 96569, "wall": 14991.9} {"step": 22091, "train_loss": 3.388179302215576, "lr": 0.00010766060318088203, "tps": 96541, "wall": 14996.9} {"step": 22092, "train_loss": 3.2424259185791016, "lr": 0.00010764563493870585, "tps": 96514, "wall": 15001.8} {"step": 22093, "train_loss": 3.3427982330322266, "lr": 0.00010763066796928592, "tps": 96487, "wall": 15006.7} {"step": 22094, "train_loss": 3.2368574142456055, "lr": 0.00010761570227279194, "tps": 96459, "wall": 15011.6} {"step": 22095, "train_loss": 3.2846860885620117, "lr": 0.00010760073784939337, "tps": 96432, "wall": 15016.5} {"step": 22096, "train_loss": 3.443984031677246, "lr": 0.00010758577469925964, "tps": 96405, "wall": 15021.5} {"step": 22097, "train_loss": 3.3486509323120117, "lr": 0.00010757081282256043, "tps": 96378, "wall": 15026.4} {"step": 22098, "train_loss": 3.2572126388549805, "lr": 0.00010755585221946512, "tps": 96351, "wall": 15031.3} {"step": 22099, "train_loss": 3.173194646835327, "lr": 0.00010754089289014313, "tps": 96323, "wall": 15036.3} {"step": 22100, "train_loss": 3.288356065750122, "lr": 0.00010752593483476403, "tps": 96296, "wall": 15041.2} {"step": 22101, "train_loss": 3.295186996459961, "lr": 0.00010751097805349726, "tps": 96268, "wall": 15046.2} {"step": 22102, "train_loss": 3.178823232650757, "lr": 0.00010749602254651214, "tps": 96240, "wall": 15051.3} {"step": 22103, "train_loss": 3.2983365058898926, "lr": 0.00010748106831397822, "tps": 96212, "wall": 15056.3} {"step": 22104, "train_loss": 3.2001423835754395, "lr": 0.00010746611535606486, "tps": 96184, "wall": 15061.3} {"step": 22105, "train_loss": 3.262392997741699, "lr": 0.00010745116367294137, "tps": 96158, "wall": 15066.2} {"step": 22106, "train_loss": 3.2252659797668457, "lr": 0.00010743621326477722, "tps": 96131, "wall": 15071.1} {"step": 22107, "train_loss": 3.240771770477295, "lr": 0.00010742126413174172, "tps": 96104, "wall": 15076.0} {"step": 22108, "train_loss": 3.1963090896606445, "lr": 0.00010740631627400425, "tps": 96077, "wall": 15081.0} {"step": 22109, "train_loss": 3.3071467876434326, "lr": 0.00010739136969173415, "tps": 96050, "wall": 15085.9} {"step": 22110, "train_loss": 3.3378686904907227, "lr": 0.00010737642438510063, "tps": 96023, "wall": 15090.8} {"step": 22111, "train_loss": 3.3223228454589844, "lr": 0.00010736148035427314, "tps": 95995, "wall": 15095.8} {"step": 22112, "train_loss": 3.248199462890625, "lr": 0.00010734653759942088, "tps": 95969, "wall": 15100.7} {"step": 22113, "train_loss": 3.220010280609131, "lr": 0.00010733159612071309, "tps": 95942, "wall": 15105.6} {"step": 22114, "train_loss": 3.209016799926758, "lr": 0.00010731665591831912, "tps": 95915, "wall": 15110.5} {"step": 22115, "train_loss": 3.283005952835083, "lr": 0.00010730171699240816, "tps": 95888, "wall": 15115.3} {"step": 22116, "train_loss": 3.2993767261505127, "lr": 0.00010728677934314944, "tps": 95862, "wall": 15120.2} {"step": 22117, "train_loss": 3.256382703781128, "lr": 0.00010727184297071218, "tps": 95835, "wall": 15125.1} {"step": 22118, "train_loss": 3.2748405933380127, "lr": 0.00010725690787526561, "tps": 95809, "wall": 15130.0} {"step": 22119, "train_loss": 3.158039093017578, "lr": 0.00010724197405697882, "tps": 95782, "wall": 15134.9} {"step": 22120, "train_loss": 3.162618637084961, "lr": 0.0001072270415160211, "tps": 95755, "wall": 15139.8} {"step": 22121, "train_loss": 3.1975173950195312, "lr": 0.00010721211025256157, "tps": 95729, "wall": 15144.7} {"step": 22122, "train_loss": 3.3522753715515137, "lr": 0.00010719718026676928, "tps": 95702, "wall": 15149.6} {"step": 22123, "train_loss": 3.275263547897339, "lr": 0.0001071822515588135, "tps": 95676, "wall": 15154.4} {"step": 22124, "train_loss": 3.3104381561279297, "lr": 0.00010716732412886323, "tps": 95649, "wall": 15159.4} {"step": 22125, "train_loss": 3.205179214477539, "lr": 0.00010715239797708767, "tps": 95622, "wall": 15164.3} {"step": 22126, "train_loss": 3.3701043128967285, "lr": 0.00010713747310365585, "tps": 95596, "wall": 15169.1} {"step": 22127, "train_loss": 3.253817319869995, "lr": 0.00010712254950873677, "tps": 95570, "wall": 15174.0} {"step": 22128, "train_loss": 3.4028072357177734, "lr": 0.00010710762719249963, "tps": 95543, "wall": 15178.9} {"step": 22129, "train_loss": 3.2889022827148438, "lr": 0.0001070927061551134, "tps": 95517, "wall": 15183.7} {"step": 22130, "train_loss": 3.3658628463745117, "lr": 0.00010707778639674704, "tps": 95491, "wall": 15188.6} {"step": 22131, "train_loss": 3.367414951324463, "lr": 0.00010706286791756968, "tps": 95464, "wall": 15193.5} {"step": 22132, "train_loss": 3.235501766204834, "lr": 0.00010704795071775025, "tps": 95438, "wall": 15198.4} {"step": 22133, "train_loss": 3.275775671005249, "lr": 0.0001070330347974577, "tps": 95412, "wall": 15203.2} {"step": 22134, "train_loss": 3.2398648262023926, "lr": 0.0001070181201568611, "tps": 95386, "wall": 15208.1} {"step": 22135, "train_loss": 3.293576717376709, "lr": 0.00010700320679612934, "tps": 95359, "wall": 15212.9} {"step": 22136, "train_loss": 3.3556478023529053, "lr": 0.0001069882947154313, "tps": 95333, "wall": 15217.9} {"step": 22137, "train_loss": 3.327406167984009, "lr": 0.00010697338391493605, "tps": 95307, "wall": 15222.7} {"step": 22138, "train_loss": 3.2448723316192627, "lr": 0.00010695847439481243, "tps": 95281, "wall": 15227.6} {"step": 22139, "train_loss": 3.329078197479248, "lr": 0.00010694356615522925, "tps": 95254, "wall": 15232.5} {"step": 22140, "train_loss": 3.3209569454193115, "lr": 0.00010692865919635555, "tps": 95228, "wall": 15237.4} {"step": 22141, "train_loss": 3.1680779457092285, "lr": 0.0001069137535183601, "tps": 95202, "wall": 15242.2} {"step": 22142, "train_loss": 3.278075695037842, "lr": 0.00010689884912141168, "tps": 95176, "wall": 15247.1} {"step": 22143, "train_loss": 3.319228172302246, "lr": 0.00010688394600567932, "tps": 95150, "wall": 15251.9} {"step": 22144, "train_loss": 3.212808609008789, "lr": 0.00010686904417133168, "tps": 95124, "wall": 15256.8} {"step": 22145, "train_loss": 3.3097174167633057, "lr": 0.00010685414361853765, "tps": 95098, "wall": 15261.7} {"step": 22146, "train_loss": 3.314117193222046, "lr": 0.00010683924434746602, "tps": 95072, "wall": 15266.5} {"step": 22147, "train_loss": 3.2932024002075195, "lr": 0.00010682434635828548, "tps": 95046, "wall": 15271.4} {"step": 22148, "train_loss": 3.4029693603515625, "lr": 0.00010680944965116495, "tps": 95019, "wall": 15276.3} {"step": 22149, "train_loss": 3.244741678237915, "lr": 0.00010679455422627309, "tps": 94994, "wall": 15281.2} {"step": 22150, "train_loss": 3.2516098022460938, "lr": 0.00010677966008377857, "tps": 94968, "wall": 15286.0} {"step": 22151, "train_loss": 3.174488067626953, "lr": 0.00010676476722385027, "tps": 94942, "wall": 15290.9} {"step": 22152, "train_loss": 3.1797122955322266, "lr": 0.00010674987564665679, "tps": 94916, "wall": 15295.7} {"step": 22153, "train_loss": 3.2922475337982178, "lr": 0.00010673498535236681, "tps": 94890, "wall": 15300.6} {"step": 22154, "train_loss": 3.290656805038452, "lr": 0.00010672009634114908, "tps": 94865, "wall": 15305.4} {"step": 22155, "train_loss": 3.2414541244506836, "lr": 0.00010670520861317223, "tps": 94839, "wall": 15310.3} {"step": 22156, "train_loss": 3.299609661102295, "lr": 0.00010669032216860486, "tps": 94813, "wall": 15315.1} {"step": 22157, "train_loss": 3.167984962463379, "lr": 0.00010667543700761573, "tps": 94787, "wall": 15320.0} {"step": 22158, "train_loss": 3.362557888031006, "lr": 0.00010666055313037333, "tps": 94762, "wall": 15324.8} {"step": 22159, "train_loss": 3.362337589263916, "lr": 0.00010664567053704626, "tps": 94736, "wall": 15329.7} {"step": 22160, "train_loss": 3.4160401821136475, "lr": 0.00010663078922780326, "tps": 94710, "wall": 15334.5} {"step": 22161, "train_loss": 3.1909749507904053, "lr": 0.00010661590920281275, "tps": 94684, "wall": 15339.4} {"step": 22162, "train_loss": 3.380642890930176, "lr": 0.0001066010304622434, "tps": 94659, "wall": 15344.3} {"step": 22163, "train_loss": 3.4495344161987305, "lr": 0.00010658615300626372, "tps": 94633, "wall": 15349.1} {"step": 22164, "train_loss": 3.322549343109131, "lr": 0.00010657127683504216, "tps": 94607, "wall": 15353.9} {"step": 22165, "train_loss": 3.264204502105713, "lr": 0.00010655640194874739, "tps": 94582, "wall": 15358.8} {"step": 22166, "train_loss": 3.262503147125244, "lr": 0.00010654152834754781, "tps": 94556, "wall": 15363.6} {"step": 22167, "train_loss": 3.2467498779296875, "lr": 0.00010652665603161189, "tps": 94531, "wall": 15368.5} {"step": 22168, "train_loss": 3.212747097015381, "lr": 0.00010651178500110828, "tps": 94505, "wall": 15373.3} {"step": 22169, "train_loss": 3.291161060333252, "lr": 0.00010649691525620518, "tps": 94480, "wall": 15378.1} {"step": 22170, "train_loss": 3.345122814178467, "lr": 0.00010648204679707124, "tps": 94454, "wall": 15383.0} {"step": 22171, "train_loss": 3.2117533683776855, "lr": 0.0001064671796238748, "tps": 94429, "wall": 15387.8} {"step": 22172, "train_loss": 3.2650654315948486, "lr": 0.00010645231373678421, "tps": 94404, "wall": 15392.7} {"step": 22173, "train_loss": 3.312044143676758, "lr": 0.00010643744913596805, "tps": 94378, "wall": 15397.6} {"step": 22174, "train_loss": 3.198469400405884, "lr": 0.0001064225858215946, "tps": 94352, "wall": 15402.4} {"step": 22175, "train_loss": 3.344395160675049, "lr": 0.00010640772379383215, "tps": 94327, "wall": 15407.3} {"step": 22176, "train_loss": 3.2930679321289062, "lr": 0.00010639286305284926, "tps": 94301, "wall": 15412.1} {"step": 22177, "train_loss": 3.283252239227295, "lr": 0.00010637800359881414, "tps": 94276, "wall": 15417.0} {"step": 22178, "train_loss": 3.284393072128296, "lr": 0.00010636314543189505, "tps": 94251, "wall": 15421.8} {"step": 22179, "train_loss": 3.2553791999816895, "lr": 0.00010634828855226051, "tps": 94225, "wall": 15426.6} {"step": 22180, "train_loss": 3.340076446533203, "lr": 0.00010633343296007869, "tps": 94200, "wall": 15431.5} {"step": 22181, "train_loss": 3.292778730392456, "lr": 0.00010631857865551782, "tps": 94175, "wall": 15436.3} {"step": 22182, "train_loss": 3.1647143363952637, "lr": 0.00010630372563874629, "tps": 94149, "wall": 15441.2} {"step": 22183, "train_loss": 3.2718653678894043, "lr": 0.00010628887390993232, "tps": 94124, "wall": 15446.0} {"step": 22184, "train_loss": 3.2894320487976074, "lr": 0.00010627402346924409, "tps": 94099, "wall": 15450.8} {"step": 22185, "train_loss": 3.289137601852417, "lr": 0.00010625917431684994, "tps": 94073, "wall": 15455.7} {"step": 22186, "train_loss": 3.322413444519043, "lr": 0.00010624432645291793, "tps": 94048, "wall": 15460.5} {"step": 22187, "train_loss": 3.312396764755249, "lr": 0.00010622947987761642, "tps": 94023, "wall": 15465.4} {"step": 22188, "train_loss": 3.204343318939209, "lr": 0.0001062146345911135, "tps": 93998, "wall": 15470.2} {"step": 22189, "train_loss": 3.297301769256592, "lr": 0.0001061997905935773, "tps": 93973, "wall": 15475.0} {"step": 22190, "train_loss": 3.2422595024108887, "lr": 0.0001061849478851761, "tps": 93948, "wall": 15479.8} {"step": 22191, "train_loss": 3.325767755508423, "lr": 0.00010617010646607797, "tps": 93923, "wall": 15484.6} {"step": 22192, "train_loss": 3.227382183074951, "lr": 0.00010615526633645097, "tps": 93898, "wall": 15489.5} {"step": 22193, "train_loss": 3.249058723449707, "lr": 0.00010614042749646333, "tps": 93873, "wall": 15494.3} {"step": 22194, "train_loss": 3.189377784729004, "lr": 0.00010612558994628307, "tps": 93848, "wall": 15499.1} {"step": 22195, "train_loss": 3.1847734451293945, "lr": 0.00010611075368607824, "tps": 93823, "wall": 15503.9} {"step": 22196, "train_loss": 3.347623348236084, "lr": 0.000106095918716017, "tps": 93798, "wall": 15508.7} {"step": 22197, "train_loss": 3.3866453170776367, "lr": 0.00010608108503626739, "tps": 93774, "wall": 15513.5} {"step": 22198, "train_loss": 3.300105333328247, "lr": 0.00010606625264699733, "tps": 93748, "wall": 15518.4} {"step": 22199, "train_loss": 3.211594581604004, "lr": 0.000106051421548375, "tps": 93723, "wall": 15523.2} {"step": 22200, "train_loss": 3.2709665298461914, "lr": 0.0001060365917405683, "tps": 93699, "wall": 15528.0} {"step": 22201, "train_loss": 3.2282285690307617, "lr": 0.00010602176322374522, "tps": 93674, "wall": 15532.9} {"step": 22202, "train_loss": 3.3123409748077393, "lr": 0.00010600693599807381, "tps": 93649, "wall": 15537.7} {"step": 22203, "train_loss": 3.2074947357177734, "lr": 0.00010599211006372196, "tps": 93624, "wall": 15542.5} {"step": 22204, "train_loss": 3.255568265914917, "lr": 0.0001059772854208577, "tps": 93599, "wall": 15547.3} {"step": 22205, "train_loss": 3.3164048194885254, "lr": 0.00010596246206964893, "tps": 93575, "wall": 15552.1} {"step": 22206, "train_loss": 3.3337783813476562, "lr": 0.00010594764001026349, "tps": 93550, "wall": 15557.0} {"step": 22207, "train_loss": 3.2742152214050293, "lr": 0.00010593281924286941, "tps": 93525, "wall": 15561.8} {"step": 22208, "train_loss": 3.3289966583251953, "lr": 0.00010591799976763455, "tps": 93500, "wall": 15566.6} {"step": 22209, "train_loss": 3.274599075317383, "lr": 0.00010590318158472667, "tps": 93475, "wall": 15571.4} {"step": 22210, "train_loss": 3.2210211753845215, "lr": 0.0001058883646943138, "tps": 93450, "wall": 15576.3} {"step": 22211, "train_loss": 3.330820322036743, "lr": 0.0001058735490965637, "tps": 93426, "wall": 15581.1} {"step": 22212, "train_loss": 3.2875418663024902, "lr": 0.00010585873479164417, "tps": 93401, "wall": 15585.9} {"step": 22213, "train_loss": 3.1476399898529053, "lr": 0.00010584392177972309, "tps": 93377, "wall": 15590.7} {"step": 22214, "train_loss": 3.3368473052978516, "lr": 0.00010582911006096825, "tps": 93352, "wall": 15595.5} {"step": 22215, "train_loss": 3.1842432022094727, "lr": 0.00010581429963554736, "tps": 93327, "wall": 15600.4} {"step": 22216, "train_loss": 3.2841291427612305, "lr": 0.00010579949050362836, "tps": 93303, "wall": 15605.2} {"step": 22217, "train_loss": 3.368790626525879, "lr": 0.00010578468266537889, "tps": 93278, "wall": 15610.0} {"step": 22218, "train_loss": 3.2004761695861816, "lr": 0.00010576987612096662, "tps": 93254, "wall": 15614.8} {"step": 22219, "train_loss": 3.265087127685547, "lr": 0.0001057550708705595, "tps": 93229, "wall": 15619.6} {"step": 22220, "train_loss": 3.2881569862365723, "lr": 0.00010574026691432507, "tps": 93205, "wall": 15624.4} {"step": 22221, "train_loss": 3.326138496398926, "lr": 0.00010572546425243102, "tps": 93180, "wall": 15629.2} {"step": 22222, "train_loss": 3.38063645362854, "lr": 0.00010571066288504517, "tps": 93156, "wall": 15634.0} {"step": 22223, "train_loss": 3.274261474609375, "lr": 0.00010569586281233503, "tps": 93131, "wall": 15638.9} {"step": 22224, "train_loss": 3.318263530731201, "lr": 0.00010568106403446845, "tps": 93107, "wall": 15643.7} {"step": 22225, "train_loss": 3.2166361808776855, "lr": 0.00010566626655161291, "tps": 93082, "wall": 15648.5} {"step": 22226, "train_loss": 3.2626407146453857, "lr": 0.00010565147036393606, "tps": 93058, "wall": 15653.3} {"step": 22227, "train_loss": 3.2712230682373047, "lr": 0.00010563667547160556, "tps": 93033, "wall": 15658.1} {"step": 22228, "train_loss": 3.27229642868042, "lr": 0.00010562188187478902, "tps": 93009, "wall": 15662.9} {"step": 22229, "train_loss": 3.3862318992614746, "lr": 0.00010560708957365392, "tps": 92985, "wall": 15667.7} {"step": 22230, "train_loss": 3.2898221015930176, "lr": 0.00010559229856836795, "tps": 92960, "wall": 15672.5} {"step": 22231, "train_loss": 3.1947803497314453, "lr": 0.00010557750885909863, "tps": 92936, "wall": 15677.3} {"step": 22232, "train_loss": 3.264127254486084, "lr": 0.00010556272044601341, "tps": 92912, "wall": 15682.1} {"step": 22233, "train_loss": 3.2890737056732178, "lr": 0.00010554793332927995, "tps": 92888, "wall": 15686.9} {"step": 22234, "train_loss": 3.3143043518066406, "lr": 0.00010553314750906569, "tps": 92863, "wall": 15691.7} {"step": 22235, "train_loss": 3.3398168087005615, "lr": 0.00010551836298553807, "tps": 92839, "wall": 15696.6} {"step": 22236, "train_loss": 3.2788949012756348, "lr": 0.00010550357975886466, "tps": 92814, "wall": 15701.4} {"step": 22237, "train_loss": 3.2836039066314697, "lr": 0.00010548879782921291, "tps": 92790, "wall": 15706.2} {"step": 22238, "train_loss": 3.419649124145508, "lr": 0.00010547401719675021, "tps": 92766, "wall": 15711.0} {"step": 22239, "train_loss": 3.2435569763183594, "lr": 0.00010545923786164409, "tps": 92742, "wall": 15715.8} {"step": 22240, "train_loss": 3.295412540435791, "lr": 0.00010544445982406186, "tps": 92718, "wall": 15720.6} {"step": 22241, "train_loss": 3.2007482051849365, "lr": 0.00010542968308417105, "tps": 92693, "wall": 15725.4} {"step": 22242, "train_loss": 3.1805765628814697, "lr": 0.00010541490764213896, "tps": 92669, "wall": 15730.2} {"step": 22243, "train_loss": 3.253786563873291, "lr": 0.00010540013349813299, "tps": 92645, "wall": 15735.0} {"step": 22244, "train_loss": 3.2345004081726074, "lr": 0.00010538536065232052, "tps": 92621, "wall": 15739.8} {"step": 22245, "train_loss": 3.254004716873169, "lr": 0.00010537058910486889, "tps": 92597, "wall": 15744.6} {"step": 22246, "train_loss": 3.1500205993652344, "lr": 0.00010535581885594537, "tps": 92573, "wall": 15749.4} {"step": 22247, "train_loss": 3.201843023300171, "lr": 0.00010534104990571738, "tps": 92549, "wall": 15754.2} {"step": 22248, "train_loss": 3.2455172538757324, "lr": 0.00010532628225435224, "tps": 92525, "wall": 15759.1} {"step": 22249, "train_loss": 3.222198247909546, "lr": 0.00010531151590201707, "tps": 92501, "wall": 15763.9} {"step": 22250, "train_loss": 3.2760417461395264, "lr": 0.00010529675084887932, "tps": 92477, "wall": 15768.7} {"step": 22251, "train_loss": 3.2633578777313232, "lr": 0.0001052819870951062, "tps": 92453, "wall": 15773.5} {"step": 22252, "train_loss": 3.233914375305176, "lr": 0.00010526722464086485, "tps": 92429, "wall": 15778.3} {"step": 22253, "train_loss": 3.2181403636932373, "lr": 0.00010525246348632265, "tps": 92405, "wall": 15783.1} {"step": 22254, "train_loss": 3.409623861312866, "lr": 0.00010523770363164676, "tps": 92381, "wall": 15787.8} {"step": 22255, "train_loss": 3.308178186416626, "lr": 0.00010522294507700432, "tps": 92357, "wall": 15792.6} {"step": 22256, "train_loss": 3.2472918033599854, "lr": 0.00010520818782256261, "tps": 92333, "wall": 15797.4} {"step": 22257, "train_loss": 3.2707583904266357, "lr": 0.00010519343186848872, "tps": 92309, "wall": 15802.2} {"step": 22258, "train_loss": 3.3167619705200195, "lr": 0.00010517867721494989, "tps": 92285, "wall": 15807.0} {"step": 22259, "train_loss": 3.300067901611328, "lr": 0.00010516392386211322, "tps": 92262, "wall": 15811.8} {"step": 22260, "train_loss": 3.305232524871826, "lr": 0.00010514917181014576, "tps": 92237, "wall": 15816.7} {"step": 22261, "train_loss": 3.199702739715576, "lr": 0.00010513442105921476, "tps": 92214, "wall": 15821.5} {"step": 22262, "train_loss": 3.393277883529663, "lr": 0.00010511967160948726, "tps": 92190, "wall": 15826.3} {"step": 22263, "train_loss": 3.3281853199005127, "lr": 0.00010510492346113028, "tps": 92166, "wall": 15831.1} {"step": 22264, "train_loss": 3.2094335556030273, "lr": 0.000105090176614311, "tps": 92142, "wall": 15835.9} {"step": 22265, "train_loss": 3.318147897720337, "lr": 0.00010507543106919642, "tps": 92119, "wall": 15840.6} {"step": 22266, "train_loss": 3.34295654296875, "lr": 0.00010506068682595347, "tps": 92095, "wall": 15845.4} {"step": 22267, "train_loss": 3.2589049339294434, "lr": 0.0001050459438847494, "tps": 92071, "wall": 15850.2} {"step": 22268, "train_loss": 3.2396440505981445, "lr": 0.00010503120224575108, "tps": 92047, "wall": 15855.0} {"step": 22269, "train_loss": 3.3806917667388916, "lr": 0.00010501646190912544, "tps": 92024, "wall": 15859.8} {"step": 22270, "train_loss": 3.3178772926330566, "lr": 0.0001050017228750396, "tps": 92000, "wall": 15864.6} {"step": 22271, "train_loss": 3.3337855339050293, "lr": 0.0001049869851436605, "tps": 91976, "wall": 15869.4} {"step": 22272, "train_loss": 3.2308270931243896, "lr": 0.00010497224871515494, "tps": 91953, "wall": 15874.2} {"step": 22273, "train_loss": 3.258847236633301, "lr": 0.00010495751358969008, "tps": 91929, "wall": 15879.0} {"step": 22274, "train_loss": 3.2760910987854004, "lr": 0.0001049427797674327, "tps": 91905, "wall": 15883.8} {"step": 22275, "train_loss": 3.271066188812256, "lr": 0.00010492804724854967, "tps": 91882, "wall": 15888.6} {"step": 22276, "train_loss": 3.2727808952331543, "lr": 0.00010491331603320804, "tps": 91858, "wall": 15893.4} {"step": 22277, "train_loss": 3.267915964126587, "lr": 0.0001048985861215745, "tps": 91835, "wall": 15898.2} {"step": 22278, "train_loss": 3.24361515045166, "lr": 0.00010488385751381609, "tps": 91811, "wall": 15903.0} {"step": 22279, "train_loss": 3.269735336303711, "lr": 0.00010486913021009954, "tps": 91788, "wall": 15907.8} {"step": 22280, "train_loss": 3.3067808151245117, "lr": 0.00010485440421059167, "tps": 91764, "wall": 15912.6} {"step": 22281, "train_loss": 3.3211798667907715, "lr": 0.00010483967951545941, "tps": 91741, "wall": 15917.3} {"step": 22282, "train_loss": 3.189258575439453, "lr": 0.00010482495612486946, "tps": 91717, "wall": 15922.1} {"step": 22283, "train_loss": 3.3109538555145264, "lr": 0.0001048102340389886, "tps": 91694, "wall": 15926.9} {"step": 22284, "train_loss": 3.2590036392211914, "lr": 0.0001047955132579837, "tps": 91670, "wall": 15931.7} {"step": 22285, "train_loss": 3.4057908058166504, "lr": 0.00010478079378202146, "tps": 91646, "wall": 15936.6} {"step": 22286, "train_loss": 3.277493953704834, "lr": 0.00010476607561126854, "tps": 91623, "wall": 15941.4} {"step": 22287, "train_loss": 3.3475286960601807, "lr": 0.00010475135874589181, "tps": 91599, "wall": 15946.2} {"step": 22288, "train_loss": 3.2493786811828613, "lr": 0.00010473664318605796, "tps": 91576, "wall": 15950.9} {"step": 22289, "train_loss": 3.2673866748809814, "lr": 0.00010472192893193357, "tps": 91553, "wall": 15955.7} {"step": 22290, "train_loss": 3.3701257705688477, "lr": 0.00010470721598368544, "tps": 91529, "wall": 15960.5} {"step": 22291, "train_loss": 3.2144761085510254, "lr": 0.00010469250434148023, "tps": 91506, "wall": 15965.3} {"step": 22292, "train_loss": 3.446164608001709, "lr": 0.00010467779400548452, "tps": 91483, "wall": 15970.1} {"step": 22293, "train_loss": 3.2265806198120117, "lr": 0.00010466308497586503, "tps": 91459, "wall": 15974.9} {"step": 22294, "train_loss": 3.27144718170166, "lr": 0.00010464837725278833, "tps": 91436, "wall": 15979.6} {"step": 22295, "train_loss": 3.17002272605896, "lr": 0.00010463367083642108, "tps": 91413, "wall": 15984.5} {"step": 22296, "train_loss": 3.1964797973632812, "lr": 0.00010461896572692987, "tps": 91390, "wall": 15989.2} {"step": 22297, "train_loss": 3.263814687728882, "lr": 0.00010460426192448119, "tps": 91366, "wall": 15994.0} {"step": 22298, "train_loss": 3.3051083087921143, "lr": 0.00010458955942924171, "tps": 91343, "wall": 15998.9} {"step": 22299, "train_loss": 3.2836849689483643, "lr": 0.00010457485824137795, "tps": 91319, "wall": 16003.6} {"step": 22300, "train_loss": 3.156717300415039, "lr": 0.00010456015836105643, "tps": 91296, "wall": 16008.4} {"step": 22301, "train_loss": 3.2160239219665527, "lr": 0.0001045454597884437, "tps": 91273, "wall": 16013.2} {"step": 22302, "train_loss": 3.2375850677490234, "lr": 0.00010453076252370624, "tps": 91250, "wall": 16018.0} {"step": 22303, "train_loss": 3.2432031631469727, "lr": 0.00010451606656701049, "tps": 91227, "wall": 16022.8} {"step": 22304, "train_loss": 3.2592430114746094, "lr": 0.0001045013719185231, "tps": 91204, "wall": 16027.6} {"step": 22305, "train_loss": 3.2871646881103516, "lr": 0.00010448667857841037, "tps": 91180, "wall": 16032.4} {"step": 22306, "train_loss": 3.25246262550354, "lr": 0.00010447198654683874, "tps": 91157, "wall": 16037.2} {"step": 22307, "train_loss": 3.1754612922668457, "lr": 0.00010445729582397477, "tps": 91134, "wall": 16041.9} {"step": 22308, "train_loss": 3.3430447578430176, "lr": 0.00010444260640998478, "tps": 91111, "wall": 16046.7} {"step": 22309, "train_loss": 3.251408815383911, "lr": 0.00010442791830503513, "tps": 91088, "wall": 16051.5} {"step": 22310, "train_loss": 3.2972042560577393, "lr": 0.00010441323150929235, "tps": 91064, "wall": 16056.4} {"step": 22311, "train_loss": 3.4544806480407715, "lr": 0.00010439854602292269, "tps": 91041, "wall": 16061.2} {"step": 22312, "train_loss": 3.191577434539795, "lr": 0.00010438386184609259, "tps": 91018, "wall": 16066.0} {"step": 22313, "train_loss": 3.280167818069458, "lr": 0.00010436917897896837, "tps": 90995, "wall": 16070.8} {"step": 22314, "train_loss": 3.331414222717285, "lr": 0.00010435449742171628, "tps": 90972, "wall": 16075.5} {"step": 22315, "train_loss": 3.2702348232269287, "lr": 0.00010433981717450278, "tps": 90949, "wall": 16080.3} {"step": 22316, "train_loss": 3.283450126647949, "lr": 0.00010432513823749409, "tps": 90926, "wall": 16085.1} {"step": 22317, "train_loss": 3.236015796661377, "lr": 0.00010431046061085639, "tps": 90903, "wall": 16090.0} {"step": 22318, "train_loss": 3.26802396774292, "lr": 0.00010429578429475615, "tps": 90880, "wall": 16094.7} {"step": 22319, "train_loss": 3.246856689453125, "lr": 0.0001042811092893595, "tps": 90857, "wall": 16099.6} {"step": 22320, "train_loss": 3.4419631958007812, "lr": 0.00010426643559483265, "tps": 90834, "wall": 16104.3} {"step": 22321, "train_loss": 3.359713315963745, "lr": 0.00010425176321134196, "tps": 90811, "wall": 16109.1} {"step": 22322, "train_loss": 3.249788522720337, "lr": 0.00010423709213905353, "tps": 90788, "wall": 16113.9} {"step": 22323, "train_loss": 3.215785264968872, "lr": 0.00010422242237813353, "tps": 90765, "wall": 16118.8} {"step": 22324, "train_loss": 3.303234100341797, "lr": 0.00010420775392874826, "tps": 90742, "wall": 16123.6} {"step": 22325, "train_loss": 3.3379595279693604, "lr": 0.00010419308679106383, "tps": 90719, "wall": 16128.4} {"step": 22326, "train_loss": 3.2652111053466797, "lr": 0.00010417842096524628, "tps": 90696, "wall": 16133.2} {"step": 22327, "train_loss": 3.190962791442871, "lr": 0.00010416375645146192, "tps": 90673, "wall": 16138.0} {"step": 22328, "train_loss": 3.3675315380096436, "lr": 0.00010414909324987681, "tps": 90650, "wall": 16142.8} {"step": 22329, "train_loss": 3.21714448928833, "lr": 0.00010413443136065697, "tps": 90627, "wall": 16147.6} {"step": 22330, "train_loss": 3.3171863555908203, "lr": 0.00010411977078396862, "tps": 90605, "wall": 16152.3} {"step": 22331, "train_loss": 3.2820303440093994, "lr": 0.00010410511151997772, "tps": 90582, "wall": 16157.1} {"step": 22332, "train_loss": 3.2887346744537354, "lr": 0.00010409045356885043, "tps": 90559, "wall": 16161.9} {"step": 22333, "train_loss": 3.2013885974884033, "lr": 0.00010407579693075278, "tps": 90536, "wall": 16166.7} {"step": 22334, "train_loss": 3.271845817565918, "lr": 0.0001040611416058507, "tps": 90513, "wall": 16171.5} {"step": 22335, "train_loss": 3.3390753269195557, "lr": 0.00010404648759431033, "tps": 90490, "wall": 16176.4} {"step": 22336, "train_loss": 3.2026045322418213, "lr": 0.00010403183489629763, "tps": 90468, "wall": 16181.1} {"step": 22337, "train_loss": 3.203960418701172, "lr": 0.00010401718351197858, "tps": 90445, "wall": 16185.9} {"step": 22338, "train_loss": 3.3598484992980957, "lr": 0.00010400253344151913, "tps": 90422, "wall": 16190.7} {"step": 22339, "train_loss": 3.292118787765503, "lr": 0.00010398788468508522, "tps": 90400, "wall": 16195.5} {"step": 22340, "train_loss": 3.215848922729492, "lr": 0.00010397323724284289, "tps": 90377, "wall": 16200.3} {"step": 22341, "train_loss": 3.2858784198760986, "lr": 0.000103958591114958, "tps": 90354, "wall": 16205.1} {"step": 22342, "train_loss": 3.2878024578094482, "lr": 0.00010394394630159641, "tps": 90332, "wall": 16209.8} {"step": 22343, "train_loss": 3.2525787353515625, "lr": 0.0001039293028029241, "tps": 90309, "wall": 16214.6} {"step": 22344, "train_loss": 3.383014678955078, "lr": 0.00010391466061910695, "tps": 90287, "wall": 16219.4} {"step": 22345, "train_loss": 3.3336782455444336, "lr": 0.00010390001975031078, "tps": 90264, "wall": 16224.2} {"step": 22346, "train_loss": 3.1729865074157715, "lr": 0.00010388538019670149, "tps": 90242, "wall": 16228.9} {"step": 22347, "train_loss": 3.2949557304382324, "lr": 0.00010387074195844491, "tps": 90219, "wall": 16233.7} {"step": 22348, "train_loss": 3.250567674636841, "lr": 0.00010385610503570678, "tps": 90196, "wall": 16238.6} {"step": 22349, "train_loss": 3.288356304168701, "lr": 0.00010384146942865302, "tps": 90173, "wall": 16243.4} {"step": 22350, "train_loss": 3.2995448112487793, "lr": 0.0001038268351374494, "tps": 90151, "wall": 16248.2} {"step": 22351, "train_loss": 3.4121975898742676, "lr": 0.0001038122021622616, "tps": 90128, "wall": 16252.9} {"step": 22352, "train_loss": 3.2783560752868652, "lr": 0.00010379757050325554, "tps": 90106, "wall": 16257.7} {"step": 22353, "train_loss": 3.2474653720855713, "lr": 0.00010378294016059684, "tps": 90084, "wall": 16262.5} {"step": 22354, "train_loss": 3.3019115924835205, "lr": 0.00010376831113445132, "tps": 90061, "wall": 16267.3} {"step": 22355, "train_loss": 3.3067407608032227, "lr": 0.00010375368342498464, "tps": 90039, "wall": 16272.1} {"step": 22356, "train_loss": 3.224687099456787, "lr": 0.00010373905703236248, "tps": 90016, "wall": 16276.8} {"step": 22357, "train_loss": 3.1738052368164062, "lr": 0.00010372443195675061, "tps": 89994, "wall": 16281.6} {"step": 22358, "train_loss": 3.4144227504730225, "lr": 0.0001037098081983147, "tps": 89972, "wall": 16286.4} {"step": 22359, "train_loss": 3.219235897064209, "lr": 0.0001036951857572203, "tps": 89949, "wall": 16291.2} {"step": 22360, "train_loss": 3.2816989421844482, "lr": 0.00010368056463363318, "tps": 89926, "wall": 16296.0} {"step": 22361, "train_loss": 3.272515058517456, "lr": 0.00010366594482771894, "tps": 89904, "wall": 16300.8} {"step": 22362, "train_loss": 3.2914113998413086, "lr": 0.00010365132633964312, "tps": 89882, "wall": 16305.6} {"step": 22363, "train_loss": 3.286081314086914, "lr": 0.0001036367091695714, "tps": 89859, "wall": 16310.3} {"step": 22364, "train_loss": 3.28619647026062, "lr": 0.00010362209331766934, "tps": 89837, "wall": 16315.1} {"step": 22365, "train_loss": 3.1418373584747314, "lr": 0.00010360747878410242, "tps": 89815, "wall": 16319.9} {"step": 22366, "train_loss": 3.226651668548584, "lr": 0.00010359286556903636, "tps": 89792, "wall": 16324.7} {"step": 22367, "train_loss": 3.2374978065490723, "lr": 0.00010357825367263662, "tps": 89770, "wall": 16329.5} {"step": 22368, "train_loss": 3.2630860805511475, "lr": 0.00010356364309506868, "tps": 89748, "wall": 16334.3} {"step": 22369, "train_loss": 3.215552806854248, "lr": 0.00010354903383649812, "tps": 89726, "wall": 16339.1} {"step": 22370, "train_loss": 3.3511123657226562, "lr": 0.00010353442589709041, "tps": 89703, "wall": 16343.8} {"step": 22371, "train_loss": 3.278109312057495, "lr": 0.00010351981927701095, "tps": 89681, "wall": 16348.6} {"step": 22372, "train_loss": 3.2520346641540527, "lr": 0.00010350521397642538, "tps": 89659, "wall": 16353.4} {"step": 22373, "train_loss": 3.2850873470306396, "lr": 0.00010349060999549895, "tps": 89637, "wall": 16358.2} {"step": 22374, "train_loss": 3.3081555366516113, "lr": 0.00010347600733439726, "tps": 89614, "wall": 16363.0} {"step": 22375, "train_loss": 3.264714241027832, "lr": 0.0001034614059932857, "tps": 89592, "wall": 16367.8} {"step": 22376, "train_loss": 3.2383460998535156, "lr": 0.00010344680597232952, "tps": 89570, "wall": 16372.6} {"step": 22377, "train_loss": 3.31021785736084, "lr": 0.00010343220727169431, "tps": 89548, "wall": 16377.4} {"step": 22378, "train_loss": 3.317572593688965, "lr": 0.00010341760989154539, "tps": 89526, "wall": 16382.1} {"step": 22379, "train_loss": 3.184108257293701, "lr": 0.000103403013832048, "tps": 89504, "wall": 16386.9} {"step": 22380, "train_loss": 3.1704089641571045, "lr": 0.00010338841909336766, "tps": 89481, "wall": 16391.7} {"step": 22381, "train_loss": 3.1880249977111816, "lr": 0.0001033738256756696, "tps": 89459, "wall": 16396.5} {"step": 22382, "train_loss": 3.2953848838806152, "lr": 0.0001033592335791191, "tps": 89437, "wall": 16401.3} {"step": 22383, "train_loss": 3.2860114574432373, "lr": 0.00010334464280388154, "tps": 89415, "wall": 16406.0} {"step": 22384, "train_loss": 3.3725337982177734, "lr": 0.0001033300533501222, "tps": 89393, "wall": 16410.8} {"step": 22385, "train_loss": 3.257261276245117, "lr": 0.0001033154652180063, "tps": 89371, "wall": 16415.7} {"step": 22386, "train_loss": 3.2008771896362305, "lr": 0.00010330087840769913, "tps": 89349, "wall": 16420.4} {"step": 22387, "train_loss": 3.1834664344787598, "lr": 0.00010328629291936595, "tps": 89327, "wall": 16425.2} {"step": 22388, "train_loss": 3.3688013553619385, "lr": 0.0001032717087531719, "tps": 89305, "wall": 16430.0} {"step": 22389, "train_loss": 3.188066244125366, "lr": 0.0001032571259092823, "tps": 89283, "wall": 16434.7} {"step": 22390, "train_loss": 3.372453451156616, "lr": 0.00010324254438786223, "tps": 89261, "wall": 16439.5} {"step": 22391, "train_loss": 3.3061652183532715, "lr": 0.00010322796418907702, "tps": 89239, "wall": 16444.3} {"step": 22392, "train_loss": 3.257779359817505, "lr": 0.0001032133853130917, "tps": 89217, "wall": 16449.1} {"step": 22393, "train_loss": 3.315512180328369, "lr": 0.00010319880776007145, "tps": 89195, "wall": 16453.8} {"step": 22394, "train_loss": 3.1851024627685547, "lr": 0.00010318423153018147, "tps": 89174, "wall": 16458.6} {"step": 22395, "train_loss": 3.2392284870147705, "lr": 0.00010316965662358684, "tps": 89151, "wall": 16463.4} {"step": 22396, "train_loss": 3.2874531745910645, "lr": 0.00010315508304045258, "tps": 89130, "wall": 16468.2} {"step": 22397, "train_loss": 3.2874093055725098, "lr": 0.00010314051078094395, "tps": 89108, "wall": 16473.0} {"step": 22398, "train_loss": 3.264876365661621, "lr": 0.00010312593984522592, "tps": 89085, "wall": 16477.8} {"step": 22399, "train_loss": 3.241316080093384, "lr": 0.00010311137023346354, "tps": 89064, "wall": 16482.6} {"step": 22400, "train_loss": 3.2929141521453857, "lr": 0.00010309680194582187, "tps": 89042, "wall": 16487.4} {"step": 22401, "train_loss": 3.3088765144348145, "lr": 0.00010308223498246601, "tps": 89020, "wall": 16492.1} {"step": 22402, "train_loss": 3.3228766918182373, "lr": 0.00010306766934356085, "tps": 88998, "wall": 16496.9} {"step": 22403, "train_loss": 3.2716684341430664, "lr": 0.00010305310502927153, "tps": 88976, "wall": 16501.7} {"step": 22404, "train_loss": 3.2440237998962402, "lr": 0.00010303854203976291, "tps": 88955, "wall": 16506.5} {"step": 22405, "train_loss": 3.285393476486206, "lr": 0.0001030239803752, "tps": 88933, "wall": 16511.3} {"step": 22406, "train_loss": 3.3309335708618164, "lr": 0.0001030094200357478, "tps": 88911, "wall": 16516.0} {"step": 22407, "train_loss": 3.3309853076934814, "lr": 0.00010299486102157116, "tps": 88889, "wall": 16520.8} {"step": 22408, "train_loss": 3.1832361221313477, "lr": 0.00010298030333283515, "tps": 88868, "wall": 16525.6} {"step": 22409, "train_loss": 3.26798152923584, "lr": 0.0001029657469697046, "tps": 88846, "wall": 16530.4} {"step": 22410, "train_loss": 3.2647998332977295, "lr": 0.00010295119193234431, "tps": 88824, "wall": 16535.2} {"step": 22411, "train_loss": 3.2481651306152344, "lr": 0.00010293663822091933, "tps": 88802, "wall": 16540.0} {"step": 22412, "train_loss": 3.3365540504455566, "lr": 0.00010292208583559441, "tps": 88780, "wall": 16544.8} {"step": 22413, "train_loss": 3.3189568519592285, "lr": 0.00010290753477653441, "tps": 88759, "wall": 16549.5} {"step": 22414, "train_loss": 3.3371386528015137, "lr": 0.00010289298504390425, "tps": 88737, "wall": 16554.3} {"step": 22415, "train_loss": 3.1945881843566895, "lr": 0.00010287843663786867, "tps": 88715, "wall": 16559.1} {"step": 22416, "train_loss": 3.202432155609131, "lr": 0.00010286388955859246, "tps": 88694, "wall": 16563.9} {"step": 22417, "train_loss": 3.2652859687805176, "lr": 0.0001028493438062405, "tps": 88672, "wall": 16568.6} {"step": 22418, "train_loss": 3.386101722717285, "lr": 0.00010283479938097748, "tps": 88651, "wall": 16573.4} {"step": 22419, "train_loss": 3.203080177307129, "lr": 0.00010282025628296819, "tps": 88629, "wall": 16578.2} {"step": 22420, "train_loss": 3.280043125152588, "lr": 0.0001028057145123774, "tps": 88607, "wall": 16583.0} {"step": 22421, "train_loss": 3.298630714416504, "lr": 0.0001027911740693698, "tps": 88586, "wall": 16587.8} {"step": 22422, "train_loss": 3.2078146934509277, "lr": 0.00010277663495411008, "tps": 88564, "wall": 16592.5} {"step": 22423, "train_loss": 3.2820069789886475, "lr": 0.00010276209716676304, "tps": 88542, "wall": 16597.4} {"step": 22424, "train_loss": 3.4178645610809326, "lr": 0.00010274756070749332, "tps": 88521, "wall": 16602.2} {"step": 22425, "train_loss": 3.1499271392822266, "lr": 0.00010273302557646549, "tps": 88499, "wall": 16606.9} {"step": 22426, "train_loss": 3.1996583938598633, "lr": 0.00010271849177384436, "tps": 88478, "wall": 16611.7} {"step": 22427, "train_loss": 3.3136138916015625, "lr": 0.00010270395929979446, "tps": 88456, "wall": 16616.5} {"step": 22428, "train_loss": 3.2219934463500977, "lr": 0.00010268942815448048, "tps": 88435, "wall": 16621.3} {"step": 22429, "train_loss": 3.2479782104492188, "lr": 0.00010267489833806702, "tps": 88413, "wall": 16626.0} {"step": 22430, "train_loss": 3.2669055461883545, "lr": 0.00010266036985071861, "tps": 88392, "wall": 16630.8} {"step": 22431, "train_loss": 3.200685977935791, "lr": 0.00010264584269259991, "tps": 88370, "wall": 16635.6} {"step": 22432, "train_loss": 3.235652446746826, "lr": 0.00010263131686387548, "tps": 88349, "wall": 16640.4} {"step": 22433, "train_loss": 3.299467086791992, "lr": 0.0001026167923647098, "tps": 88328, "wall": 16645.2} {"step": 22434, "train_loss": 3.2402637004852295, "lr": 0.00010260226919526748, "tps": 88306, "wall": 16649.9} {"step": 22435, "train_loss": 3.232095241546631, "lr": 0.000102587747355713, "tps": 88285, "wall": 16654.7} {"step": 22436, "train_loss": 3.390449285507202, "lr": 0.0001025732268462108, "tps": 88263, "wall": 16659.6} {"step": 22437, "train_loss": 3.278449058532715, "lr": 0.00010255870766692552, "tps": 88241, "wall": 16664.4} {"step": 22438, "train_loss": 3.249481201171875, "lr": 0.00010254418981802154, "tps": 88220, "wall": 16669.2} {"step": 22439, "train_loss": 3.3032541275024414, "lr": 0.00010252967329966328, "tps": 88199, "wall": 16674.0} {"step": 22440, "train_loss": 3.133695125579834, "lr": 0.0001025151581120153, "tps": 88177, "wall": 16678.7} {"step": 22441, "train_loss": 3.2909932136535645, "lr": 0.00010250064425524195, "tps": 88156, "wall": 16683.5} {"step": 22442, "train_loss": 3.26540470123291, "lr": 0.0001024861317295076, "tps": 88134, "wall": 16688.3} {"step": 22443, "train_loss": 3.239859104156494, "lr": 0.00010247162053497681, "tps": 88113, "wall": 16693.1} {"step": 22444, "train_loss": 3.2202353477478027, "lr": 0.00010245711067181377, "tps": 88092, "wall": 16697.9} {"step": 22445, "train_loss": 3.277491807937622, "lr": 0.00010244260214018298, "tps": 88070, "wall": 16702.7} {"step": 22446, "train_loss": 3.25591778755188, "lr": 0.00010242809494024878, "tps": 88049, "wall": 16707.5} {"step": 22447, "train_loss": 3.311278820037842, "lr": 0.0001024135890721754, "tps": 88028, "wall": 16712.3} {"step": 22448, "train_loss": 3.2980597019195557, "lr": 0.0001023990845361273, "tps": 88006, "wall": 16717.1} {"step": 22449, "train_loss": 3.259188175201416, "lr": 0.00010238458133226876, "tps": 87985, "wall": 16721.9} {"step": 22450, "train_loss": 3.2337498664855957, "lr": 0.00010237007946076396, "tps": 87964, "wall": 16726.6} {"step": 22451, "train_loss": 3.265605926513672, "lr": 0.00010235557892177734, "tps": 87943, "wall": 16731.4} {"step": 22452, "train_loss": 3.2223119735717773, "lr": 0.00010234107971547309, "tps": 87922, "wall": 16736.2} {"step": 22453, "train_loss": 3.2060627937316895, "lr": 0.00010232658184201537, "tps": 87900, "wall": 16741.0} {"step": 22454, "train_loss": 3.28938364982605, "lr": 0.00010231208530156858, "tps": 87879, "wall": 16745.7} {"step": 22455, "train_loss": 3.2688417434692383, "lr": 0.00010229759009429684, "tps": 87858, "wall": 16750.5} {"step": 22456, "train_loss": 3.380380868911743, "lr": 0.00010228309622036431, "tps": 87837, "wall": 16755.3} {"step": 22457, "train_loss": 3.2860965728759766, "lr": 0.00010226860367993531, "tps": 87816, "wall": 16760.1} {"step": 22458, "train_loss": 3.1853227615356445, "lr": 0.00010225411247317391, "tps": 87795, "wall": 16764.8} {"step": 22459, "train_loss": 3.30645489692688, "lr": 0.00010223962260024426, "tps": 87774, "wall": 16769.6} {"step": 22460, "train_loss": 3.1856539249420166, "lr": 0.0001022251340613106, "tps": 87753, "wall": 16774.4} {"step": 22461, "train_loss": 3.306410789489746, "lr": 0.00010221064685653699, "tps": 87731, "wall": 16779.2} {"step": 22462, "train_loss": 3.2681853771209717, "lr": 0.00010219616098608744, "tps": 87710, "wall": 16784.0} {"step": 22463, "train_loss": 3.239208698272705, "lr": 0.00010218167645012626, "tps": 87689, "wall": 16788.8} {"step": 22464, "train_loss": 3.2721807956695557, "lr": 0.00010216719324881734, "tps": 87668, "wall": 16793.6} {"step": 22465, "train_loss": 3.241354465484619, "lr": 0.00010215271138232492, "tps": 87647, "wall": 16798.3} {"step": 22466, "train_loss": 3.2476344108581543, "lr": 0.00010213823085081293, "tps": 87626, "wall": 16803.1} {"step": 22467, "train_loss": 3.3467655181884766, "lr": 0.00010212375165444536, "tps": 87605, "wall": 16807.9} {"step": 22468, "train_loss": 3.313138484954834, "lr": 0.00010210927379338642, "tps": 87584, "wall": 16812.6} {"step": 22469, "train_loss": 3.285994529724121, "lr": 0.00010209479726779996, "tps": 87563, "wall": 16817.4} {"step": 22470, "train_loss": 3.398575782775879, "lr": 0.00010208032207784998, "tps": 87542, "wall": 16822.2} {"step": 22471, "train_loss": 3.2515616416931152, "lr": 0.00010206584822370055, "tps": 87521, "wall": 16827.0} {"step": 22472, "train_loss": 3.3568410873413086, "lr": 0.00010205137570551557, "tps": 87500, "wall": 16831.8} {"step": 22473, "train_loss": 3.288569450378418, "lr": 0.00010203690452345891, "tps": 87479, "wall": 16836.6} {"step": 22474, "train_loss": 3.3452630043029785, "lr": 0.00010202243467769466, "tps": 87458, "wall": 16841.4} {"step": 22475, "train_loss": 3.2306251525878906, "lr": 0.00010200796616838664, "tps": 87437, "wall": 16846.2} {"step": 22476, "train_loss": 3.3356800079345703, "lr": 0.0001019934989956987, "tps": 87416, "wall": 16851.0} {"step": 22477, "train_loss": 3.21321702003479, "lr": 0.00010197903315979485, "tps": 87395, "wall": 16855.7} {"step": 22478, "train_loss": 3.3334317207336426, "lr": 0.0001019645686608389, "tps": 87374, "wall": 16860.5} {"step": 22479, "train_loss": 3.2853736877441406, "lr": 0.00010195010549899464, "tps": 87354, "wall": 16865.3} {"step": 22480, "train_loss": 3.3654215335845947, "lr": 0.00010193564367442601, "tps": 87333, "wall": 16870.0} {"step": 22481, "train_loss": 3.299884080886841, "lr": 0.00010192118318729678, "tps": 87312, "wall": 16874.8} {"step": 22482, "train_loss": 3.3559975624084473, "lr": 0.00010190672403777082, "tps": 87291, "wall": 16879.6} {"step": 22483, "train_loss": 3.3029136657714844, "lr": 0.00010189226622601186, "tps": 87270, "wall": 16884.3} {"step": 22484, "train_loss": 3.2241082191467285, "lr": 0.00010187780975218365, "tps": 87250, "wall": 16889.1} {"step": 22485, "train_loss": 3.2443435192108154, "lr": 0.00010186335461645007, "tps": 87229, "wall": 16893.9} {"step": 22486, "train_loss": 3.2679476737976074, "lr": 0.00010184890081897478, "tps": 87208, "wall": 16898.7} {"step": 22487, "train_loss": 3.289116382598877, "lr": 0.00010183444835992148, "tps": 87187, "wall": 16903.5} {"step": 22488, "train_loss": 3.2502710819244385, "lr": 0.00010181999723945401, "tps": 87166, "wall": 16908.3} {"step": 22489, "train_loss": 3.2675881385803223, "lr": 0.00010180554745773601, "tps": 87145, "wall": 16913.1} {"step": 22490, "train_loss": 3.1817479133605957, "lr": 0.00010179109901493106, "tps": 87125, "wall": 16917.8} {"step": 22491, "train_loss": 3.2881011962890625, "lr": 0.00010177665191120302, "tps": 87104, "wall": 16922.6} {"step": 22492, "train_loss": 3.330897092819214, "lr": 0.00010176220614671548, "tps": 87083, "wall": 16927.4} {"step": 22493, "train_loss": 3.445377826690674, "lr": 0.00010174776172163203, "tps": 87063, "wall": 16932.1} {"step": 22494, "train_loss": 3.3305470943450928, "lr": 0.00010173331863611632, "tps": 87042, "wall": 16936.9} {"step": 22495, "train_loss": 3.259042501449585, "lr": 0.00010171887689033201, "tps": 87021, "wall": 16941.7} {"step": 22496, "train_loss": 3.3020477294921875, "lr": 0.00010170443648444264, "tps": 87001, "wall": 16946.5} {"step": 22497, "train_loss": 3.148144483566284, "lr": 0.00010168999741861185, "tps": 86980, "wall": 16951.2} {"step": 22498, "train_loss": 3.331997871398926, "lr": 0.00010167555969300309, "tps": 86959, "wall": 16956.1} {"step": 22499, "train_loss": 3.1669483184814453, "lr": 0.00010166112330778003, "tps": 86938, "wall": 16960.9} {"step": 22500, "train_loss": 3.3025500774383545, "lr": 0.00010164668826310621, "tps": 86918, "wall": 16965.6} {"step": 22501, "train_loss": 3.3202738761901855, "lr": 0.00010163225455914505, "tps": 86897, "wall": 16970.5} {"step": 22502, "train_loss": 3.2820067405700684, "lr": 0.00010161782219606014, "tps": 86876, "wall": 16975.3} {"step": 22503, "train_loss": 3.3013863563537598, "lr": 0.00010160339117401496, "tps": 86855, "wall": 16980.1} {"step": 22504, "train_loss": 3.2458648681640625, "lr": 0.00010158896149317291, "tps": 86835, "wall": 16984.9} {"step": 22505, "train_loss": 3.184373378753662, "lr": 0.00010157453315369756, "tps": 86814, "wall": 16989.7} {"step": 22506, "train_loss": 3.247445821762085, "lr": 0.00010156010615575233, "tps": 86794, "wall": 16994.5} {"step": 22507, "train_loss": 3.384023904800415, "lr": 0.00010154568049950061, "tps": 86773, "wall": 16999.2} {"step": 22508, "train_loss": 3.1895573139190674, "lr": 0.00010153125618510584, "tps": 86753, "wall": 17004.0} {"step": 22509, "train_loss": 3.221353054046631, "lr": 0.00010151683321273134, "tps": 86732, "wall": 17008.8} {"step": 22510, "train_loss": 3.2025258541107178, "lr": 0.00010150241158254061, "tps": 86711, "wall": 17013.6} {"step": 22511, "train_loss": 3.1778316497802734, "lr": 0.00010148799129469699, "tps": 86691, "wall": 17018.4} {"step": 22512, "train_loss": 3.1887152194976807, "lr": 0.00010147357234936374, "tps": 86670, "wall": 17023.2} {"step": 22513, "train_loss": 3.2869656085968018, "lr": 0.00010145915474670437, "tps": 86650, "wall": 17027.9} {"step": 22514, "train_loss": 3.3086977005004883, "lr": 0.00010144473848688209, "tps": 86629, "wall": 17032.8} {"step": 22515, "train_loss": 3.2460899353027344, "lr": 0.00010143032357006017, "tps": 86609, "wall": 17037.5} {"step": 22516, "train_loss": 3.283358573913574, "lr": 0.00010141590999640198, "tps": 86588, "wall": 17042.3} {"step": 22517, "train_loss": 3.1938729286193848, "lr": 0.00010140149776607082, "tps": 86568, "wall": 17047.1} {"step": 22518, "train_loss": 3.3033652305603027, "lr": 0.00010138708687922984, "tps": 86548, "wall": 17051.9} {"step": 22519, "train_loss": 3.304550886154175, "lr": 0.00010137267733604242, "tps": 86527, "wall": 17056.6} {"step": 22520, "train_loss": 3.2300302982330322, "lr": 0.00010135826913667173, "tps": 86507, "wall": 17061.4} {"step": 22521, "train_loss": 3.2792088985443115, "lr": 0.0001013438622812809, "tps": 86487, "wall": 17066.1} {"step": 22522, "train_loss": 3.2581706047058105, "lr": 0.00010132945677003327, "tps": 86466, "wall": 17070.9} {"step": 22523, "train_loss": 3.294844388961792, "lr": 0.00010131505260309198, "tps": 86445, "wall": 17075.8} {"step": 22524, "train_loss": 3.337347984313965, "lr": 0.00010130064978062019, "tps": 86425, "wall": 17080.6} {"step": 22525, "train_loss": 3.2645230293273926, "lr": 0.00010128624830278108, "tps": 86405, "wall": 17085.3} {"step": 22526, "train_loss": 3.265760898590088, "lr": 0.00010127184816973773, "tps": 86385, "wall": 17090.1} {"step": 22527, "train_loss": 3.2453062534332275, "lr": 0.00010125744938165333, "tps": 86364, "wall": 17094.9} {"step": 22528, "train_loss": 3.4160799980163574, "lr": 0.00010124305193869101, "tps": 86344, "wall": 17099.6} {"step": 22529, "train_loss": 3.3278589248657227, "lr": 0.00010122865584101373, "tps": 86324, "wall": 17104.4} {"step": 22530, "train_loss": 3.2619614601135254, "lr": 0.00010121426108878473, "tps": 86304, "wall": 17109.2} {"step": 22531, "train_loss": 3.1657490730285645, "lr": 0.00010119986768216705, "tps": 86283, "wall": 17114.0} {"step": 22532, "train_loss": 3.321486473083496, "lr": 0.00010118547562132356, "tps": 86263, "wall": 17118.7} {"step": 22533, "train_loss": 3.193345546722412, "lr": 0.00010117108490641753, "tps": 86243, "wall": 17123.5} {"step": 22534, "train_loss": 3.211357831954956, "lr": 0.00010115669553761189, "tps": 86223, "wall": 17128.3} {"step": 22535, "train_loss": 3.1627912521362305, "lr": 0.00010114230751506956, "tps": 86202, "wall": 17133.1} {"step": 22536, "train_loss": 3.236966133117676, "lr": 0.00010112792083895364, "tps": 86182, "wall": 17137.9} {"step": 22537, "train_loss": 3.3127224445343018, "lr": 0.00010111353550942708, "tps": 86162, "wall": 17142.6} {"step": 22538, "train_loss": 3.327486038208008, "lr": 0.00010109915152665277, "tps": 86142, "wall": 17147.4} {"step": 22539, "train_loss": 3.3003652095794678, "lr": 0.00010108476889079375, "tps": 86122, "wall": 17152.2} {"step": 22540, "train_loss": 3.4050581455230713, "lr": 0.00010107038760201286, "tps": 86101, "wall": 17157.0} {"step": 22541, "train_loss": 3.3549036979675293, "lr": 0.00010105600766047309, "tps": 86081, "wall": 17161.7} {"step": 22542, "train_loss": 3.275634765625, "lr": 0.00010104162906633732, "tps": 86061, "wall": 17166.5} {"step": 22543, "train_loss": 3.2685813903808594, "lr": 0.00010102725181976836, "tps": 86041, "wall": 17171.3} {"step": 22544, "train_loss": 3.2498998641967773, "lr": 0.00010101287592092916, "tps": 86021, "wall": 17176.1} {"step": 22545, "train_loss": 3.2141408920288086, "lr": 0.00010099850136998254, "tps": 86001, "wall": 17180.8} {"step": 22546, "train_loss": 3.231796979904175, "lr": 0.00010098412816709129, "tps": 85981, "wall": 17185.6} {"step": 22547, "train_loss": 3.2816576957702637, "lr": 0.00010096975631241832, "tps": 85961, "wall": 17190.4} {"step": 22548, "train_loss": 3.1090152263641357, "lr": 0.0001009553858061264, "tps": 85941, "wall": 17195.2} {"step": 22549, "train_loss": 3.274426221847534, "lr": 0.00010094101664837827, "tps": 85920, "wall": 17200.0} {"step": 22550, "train_loss": 3.1442902088165283, "lr": 0.00010092664883933678, "tps": 85900, "wall": 17204.8} {"step": 22551, "train_loss": 3.3573479652404785, "lr": 0.00010091228237916466, "tps": 85880, "wall": 17209.5} {"step": 22552, "train_loss": 3.281050682067871, "lr": 0.00010089791726802458, "tps": 85860, "wall": 17214.3} {"step": 22553, "train_loss": 3.265533447265625, "lr": 0.00010088355350607939, "tps": 85840, "wall": 17219.1} {"step": 22554, "train_loss": 3.286398410797119, "lr": 0.00010086919109349175, "tps": 85820, "wall": 17223.8} {"step": 22555, "train_loss": 3.29856014251709, "lr": 0.00010085483003042431, "tps": 85800, "wall": 17228.6} {"step": 22556, "train_loss": 3.2447311878204346, "lr": 0.00010084047031703985, "tps": 85781, "wall": 17233.4} {"step": 22557, "train_loss": 3.243959665298462, "lr": 0.00010082611195350102, "tps": 85761, "wall": 17238.1} {"step": 22558, "train_loss": 3.2253713607788086, "lr": 0.00010081175493997035, "tps": 85741, "wall": 17242.9} {"step": 22559, "train_loss": 3.2746331691741943, "lr": 0.00010079739927661065, "tps": 85721, "wall": 17247.7} {"step": 22560, "train_loss": 3.2529690265655518, "lr": 0.0001007830449635844, "tps": 85701, "wall": 17252.5} {"step": 22561, "train_loss": 3.325564384460449, "lr": 0.0001007686920010543, "tps": 85681, "wall": 17257.3} {"step": 22562, "train_loss": 3.278045892715454, "lr": 0.00010075434038918292, "tps": 85661, "wall": 17262.1} {"step": 22563, "train_loss": 3.287783145904541, "lr": 0.00010073999012813277, "tps": 85641, "wall": 17266.8} {"step": 22564, "train_loss": 3.297244071960449, "lr": 0.00010072564121806649, "tps": 85621, "wall": 17271.6} {"step": 22565, "train_loss": 3.1998610496520996, "lr": 0.00010071129365914665, "tps": 85601, "wall": 17276.4} {"step": 22566, "train_loss": 3.303279399871826, "lr": 0.00010069694745153562, "tps": 85581, "wall": 17281.1} {"step": 22567, "train_loss": 3.2305033206939697, "lr": 0.00010068260259539613, "tps": 85561, "wall": 17285.9} {"step": 22568, "train_loss": 3.195772409439087, "lr": 0.00010066825909089055, "tps": 85542, "wall": 17290.7} {"step": 22569, "train_loss": 3.358613967895508, "lr": 0.00010065391693818131, "tps": 85522, "wall": 17295.4} {"step": 22570, "train_loss": 3.2150721549987793, "lr": 0.00010063957613743104, "tps": 85502, "wall": 17300.2} {"step": 22571, "train_loss": 3.2256503105163574, "lr": 0.00010062523668880212, "tps": 85482, "wall": 17305.0} {"step": 22572, "train_loss": 3.273289203643799, "lr": 0.00010061089859245689, "tps": 85462, "wall": 17309.8} {"step": 22573, "train_loss": 3.2302443981170654, "lr": 0.00010059656184855792, "tps": 85443, "wall": 17314.5} {"step": 22574, "train_loss": 3.175110340118408, "lr": 0.00010058222645726756, "tps": 85423, "wall": 17319.4} {"step": 22575, "train_loss": 3.3599324226379395, "lr": 0.00010056789241874815, "tps": 85403, "wall": 17324.1} {"step": 22576, "train_loss": 3.226890802383423, "lr": 0.00010055355973316219, "tps": 85383, "wall": 17329.0} {"step": 22577, "train_loss": 3.1731603145599365, "lr": 0.00010053922840067186, "tps": 85363, "wall": 17333.7} {"step": 22578, "train_loss": 3.226168632507324, "lr": 0.0001005248984214397, "tps": 85344, "wall": 17338.5} {"step": 22579, "train_loss": 3.335757255554199, "lr": 0.00010051056979562798, "tps": 85324, "wall": 17343.3} {"step": 22580, "train_loss": 3.154202461242676, "lr": 0.00010049624252339889, "tps": 85304, "wall": 17348.0} {"step": 22581, "train_loss": 3.2314953804016113, "lr": 0.00010048191660491491, "tps": 85284, "wall": 17352.8} {"step": 22582, "train_loss": 3.2523751258850098, "lr": 0.00010046759204033826, "tps": 85265, "wall": 17357.6} {"step": 22583, "train_loss": 3.172584056854248, "lr": 0.00010045326882983109, "tps": 85245, "wall": 17362.4} {"step": 22584, "train_loss": 3.273940086364746, "lr": 0.00010043894697355582, "tps": 85225, "wall": 17367.1} {"step": 22585, "train_loss": 3.2304930686950684, "lr": 0.00010042462647167468, "tps": 85206, "wall": 17371.9} {"step": 22586, "train_loss": 3.219625473022461, "lr": 0.00010041030732434973, "tps": 85186, "wall": 17376.7} {"step": 22587, "train_loss": 3.281581163406372, "lr": 0.00010039598953174336, "tps": 85166, "wall": 17381.5} {"step": 22588, "train_loss": 3.221583366394043, "lr": 0.00010038167309401771, "tps": 85147, "wall": 17386.3} {"step": 22589, "train_loss": 3.3216893672943115, "lr": 0.00010036735801133488, "tps": 85127, "wall": 17391.1} {"step": 22590, "train_loss": 3.187253952026367, "lr": 0.00010035304428385712, "tps": 85108, "wall": 17395.8} {"step": 22591, "train_loss": 3.2643065452575684, "lr": 0.00010033873191174658, "tps": 85088, "wall": 17400.6} {"step": 22592, "train_loss": 3.3265247344970703, "lr": 0.00010032442089516529, "tps": 85068, "wall": 17405.4} {"step": 22593, "train_loss": 3.2449951171875, "lr": 0.00010031011123427547, "tps": 85049, "wall": 17410.1} {"step": 22594, "train_loss": 3.316969156265259, "lr": 0.00010029580292923914, "tps": 85029, "wall": 17414.9} {"step": 22595, "train_loss": 3.2770509719848633, "lr": 0.0001002814959802185, "tps": 85010, "wall": 17419.7} {"step": 22596, "train_loss": 3.245978355407715, "lr": 0.00010026719038737554, "tps": 84990, "wall": 17424.4} {"step": 22597, "train_loss": 3.286482334136963, "lr": 0.00010025288615087227, "tps": 84971, "wall": 17429.2} {"step": 22598, "train_loss": 3.2657008171081543, "lr": 0.00010023858327087084, "tps": 84951, "wall": 17434.0} {"step": 22599, "train_loss": 3.2671923637390137, "lr": 0.00010022428174753322, "tps": 84931, "wall": 17438.8} {"step": 22600, "train_loss": 3.1766300201416016, "lr": 0.00010020998158102135, "tps": 84912, "wall": 17443.6} {"step": 22601, "train_loss": 3.317885160446167, "lr": 0.00010019568277149735, "tps": 84893, "wall": 17448.4} {"step": 22602, "train_loss": 3.2823801040649414, "lr": 0.00010018138531912316, "tps": 84873, "wall": 17453.1} {"step": 22603, "train_loss": 3.2181949615478516, "lr": 0.00010016708922406061, "tps": 84854, "wall": 17457.9} {"step": 22604, "train_loss": 3.301356792449951, "lr": 0.00010015279448647188, "tps": 84834, "wall": 17462.7} {"step": 22605, "train_loss": 3.1894893646240234, "lr": 0.00010013850110651873, "tps": 84815, "wall": 17467.5} {"step": 22606, "train_loss": 3.2570395469665527, "lr": 0.00010012420908436308, "tps": 84795, "wall": 17472.2} {"step": 22607, "train_loss": 3.156742811203003, "lr": 0.00010010991842016693, "tps": 84776, "wall": 17477.0} {"step": 22608, "train_loss": 3.3466687202453613, "lr": 0.00010009562911409212, "tps": 84757, "wall": 17481.8} {"step": 22609, "train_loss": 3.235393524169922, "lr": 0.00010008134116630042, "tps": 84737, "wall": 17486.5} {"step": 22610, "train_loss": 3.343266010284424, "lr": 0.00010006705457695387, "tps": 84718, "wall": 17491.3} {"step": 22611, "train_loss": 3.2471680641174316, "lr": 0.00010005276934621419, "tps": 84698, "wall": 17496.2} {"step": 22612, "train_loss": 3.292264223098755, "lr": 0.0001000384854742432, "tps": 84679, "wall": 17500.9} {"step": 22613, "train_loss": 3.2558655738830566, "lr": 0.00010002420296120277, "tps": 84660, "wall": 17505.7} {"step": 22614, "train_loss": 3.253594160079956, "lr": 0.00010000992180725459, "tps": 84640, "wall": 17510.4} {"step": 22615, "train_loss": 3.2317261695861816, "lr": 9.99956420125606e-05, "tps": 84621, "wall": 17515.2} {"step": 22616, "train_loss": 3.308201551437378, "lr": 9.998136357728243e-05, "tps": 84602, "wall": 17520.0} {"step": 22617, "train_loss": 3.2644736766815186, "lr": 9.996708650158184e-05, "tps": 84582, "wall": 17524.8} {"step": 22618, "train_loss": 3.2318003177642822, "lr": 9.995281078562064e-05, "tps": 84563, "wall": 17529.5} {"step": 22619, "train_loss": 3.3121795654296875, "lr": 9.993853642956048e-05, "tps": 84544, "wall": 17534.3} {"step": 22620, "train_loss": 3.3469362258911133, "lr": 9.992426343356302e-05, "tps": 84525, "wall": 17539.0} {"step": 22621, "train_loss": 3.0957117080688477, "lr": 9.990999179779008e-05, "tps": 84505, "wall": 17543.8} {"step": 22622, "train_loss": 3.2431583404541016, "lr": 9.989572152240323e-05, "tps": 84486, "wall": 17548.6} {"step": 22623, "train_loss": 3.166368007659912, "lr": 9.988145260756409e-05, "tps": 84467, "wall": 17553.4} {"step": 22624, "train_loss": 3.34957218170166, "lr": 9.986718505343439e-05, "tps": 84448, "wall": 17558.2} {"step": 22625, "train_loss": 3.266981601715088, "lr": 9.985291886017575e-05, "tps": 84428, "wall": 17562.9} {"step": 22626, "train_loss": 3.252328872680664, "lr": 9.983865402794968e-05, "tps": 84409, "wall": 17567.7} {"step": 22627, "train_loss": 3.2801084518432617, "lr": 9.982439055691789e-05, "tps": 84390, "wall": 17572.5} {"step": 22628, "train_loss": 3.299112558364868, "lr": 9.981012844724189e-05, "tps": 84371, "wall": 17577.3} {"step": 22629, "train_loss": 3.2548587322235107, "lr": 9.979586769908321e-05, "tps": 84351, "wall": 17582.0} {"step": 22630, "train_loss": 3.2023963928222656, "lr": 9.978160831260351e-05, "tps": 84332, "wall": 17586.8} {"step": 22631, "train_loss": 3.2887556552886963, "lr": 9.97673502879642e-05, "tps": 84313, "wall": 17591.6} {"step": 22632, "train_loss": 3.216169595718384, "lr": 9.975309362532691e-05, "tps": 84294, "wall": 17596.3} {"step": 22633, "train_loss": 3.1537063121795654, "lr": 9.973883832485306e-05, "tps": 84275, "wall": 17601.1} {"step": 22634, "train_loss": 3.205760955810547, "lr": 9.972458438670412e-05, "tps": 84256, "wall": 17605.9} {"step": 22635, "train_loss": 3.2847883701324463, "lr": 9.971033181104163e-05, "tps": 84237, "wall": 17610.6} {"step": 22636, "train_loss": 3.2033286094665527, "lr": 9.969608059802702e-05, "tps": 84217, "wall": 17615.5} {"step": 22637, "train_loss": 3.214331865310669, "lr": 9.968183074782166e-05, "tps": 84198, "wall": 17620.2} {"step": 22638, "train_loss": 3.208252429962158, "lr": 9.966758226058708e-05, "tps": 84179, "wall": 17625.0} {"step": 22639, "train_loss": 3.2644741535186768, "lr": 9.965333513648465e-05, "tps": 84160, "wall": 17629.8} {"step": 22640, "train_loss": 3.3201346397399902, "lr": 9.963908937567568e-05, "tps": 84141, "wall": 17634.5} {"step": 22641, "train_loss": 3.27341890335083, "lr": 9.962484497832171e-05, "tps": 84122, "wall": 17639.3} {"step": 22642, "train_loss": 3.2812886238098145, "lr": 9.961060194458398e-05, "tps": 84103, "wall": 17644.1} {"step": 22643, "train_loss": 3.340738534927368, "lr": 9.95963602746238e-05, "tps": 84084, "wall": 17648.9} {"step": 22644, "train_loss": 3.2450146675109863, "lr": 9.958211996860262e-05, "tps": 84065, "wall": 17653.6} {"step": 22645, "train_loss": 3.283090353012085, "lr": 9.956788102668173e-05, "tps": 84046, "wall": 17658.4} {"step": 22646, "train_loss": 3.3597328662872314, "lr": 9.955364344902231e-05, "tps": 84027, "wall": 17663.2} {"step": 22647, "train_loss": 3.2921905517578125, "lr": 9.953940723578578e-05, "tps": 84008, "wall": 17668.0} {"step": 22648, "train_loss": 3.304067611694336, "lr": 9.952517238713334e-05, "tps": 83989, "wall": 17672.8} {"step": 22649, "train_loss": 3.2805709838867188, "lr": 9.951093890322631e-05, "tps": 83970, "wall": 17677.6} {"step": 22650, "train_loss": 3.3938140869140625, "lr": 9.949670678422588e-05, "tps": 83951, "wall": 17682.4} {"step": 22651, "train_loss": 3.309340000152588, "lr": 9.948247603029322e-05, "tps": 83932, "wall": 17687.1} {"step": 22652, "train_loss": 3.348344326019287, "lr": 9.946824664158963e-05, "tps": 83913, "wall": 17691.9} {"step": 22653, "train_loss": 3.3335673809051514, "lr": 9.94540186182763e-05, "tps": 83894, "wall": 17696.7} {"step": 22654, "train_loss": 3.2114884853363037, "lr": 9.943979196051428e-05, "tps": 83875, "wall": 17701.5} {"step": 22655, "train_loss": 3.3942036628723145, "lr": 9.94255666684649e-05, "tps": 83856, "wall": 17706.2} {"step": 22656, "train_loss": 3.2527308464050293, "lr": 9.941134274228921e-05, "tps": 83837, "wall": 17711.0} {"step": 22657, "train_loss": 3.24114727973938, "lr": 9.939712018214827e-05, "tps": 83818, "wall": 17715.7} {"step": 22658, "train_loss": 3.212851047515869, "lr": 9.938289898820338e-05, "tps": 83800, "wall": 17720.5} {"step": 22659, "train_loss": 3.2952795028686523, "lr": 9.936867916061552e-05, "tps": 83781, "wall": 17725.3} {"step": 22660, "train_loss": 3.2120540142059326, "lr": 9.935446069954572e-05, "tps": 83762, "wall": 17730.0} {"step": 22661, "train_loss": 3.221264600753784, "lr": 9.934024360515518e-05, "tps": 83743, "wall": 17734.8} {"step": 22662, "train_loss": 3.231563091278076, "lr": 9.932602787760488e-05, "tps": 83724, "wall": 17739.6} {"step": 22663, "train_loss": 3.152207136154175, "lr": 9.931181351705582e-05, "tps": 83705, "wall": 17744.4} {"step": 22664, "train_loss": 3.277621269226074, "lr": 9.929760052366912e-05, "tps": 83687, "wall": 17749.1} {"step": 22665, "train_loss": 3.3063411712646484, "lr": 9.928338889760573e-05, "tps": 83668, "wall": 17753.9} {"step": 22666, "train_loss": 3.390178918838501, "lr": 9.926917863902657e-05, "tps": 83649, "wall": 17758.7} {"step": 22667, "train_loss": 3.1531810760498047, "lr": 9.925496974809278e-05, "tps": 83630, "wall": 17763.4} {"step": 22668, "train_loss": 3.2076210975646973, "lr": 9.924076222496513e-05, "tps": 83611, "wall": 17768.2} {"step": 22669, "train_loss": 3.2843832969665527, "lr": 9.922655606980475e-05, "tps": 83593, "wall": 17773.0} {"step": 22670, "train_loss": 3.3576712608337402, "lr": 9.921235128277244e-05, "tps": 83574, "wall": 17777.8} {"step": 22671, "train_loss": 3.2858779430389404, "lr": 9.919814786402912e-05, "tps": 83555, "wall": 17782.5} {"step": 22672, "train_loss": 3.21602725982666, "lr": 9.918394581373575e-05, "tps": 83536, "wall": 17787.3} {"step": 22673, "train_loss": 3.2487287521362305, "lr": 9.916974513205319e-05, "tps": 83518, "wall": 17792.1} {"step": 22674, "train_loss": 3.2746429443359375, "lr": 9.91555458191423e-05, "tps": 83499, "wall": 17796.9} {"step": 22675, "train_loss": 3.227724075317383, "lr": 9.914134787516392e-05, "tps": 83480, "wall": 17801.7} {"step": 22676, "train_loss": 3.274496078491211, "lr": 9.912715130027883e-05, "tps": 83461, "wall": 17806.4} {"step": 22677, "train_loss": 3.4031577110290527, "lr": 9.911295609464797e-05, "tps": 83443, "wall": 17811.2} {"step": 22678, "train_loss": 3.284369707107544, "lr": 9.909876225843208e-05, "tps": 83424, "wall": 17816.0} {"step": 22679, "train_loss": 3.291325092315674, "lr": 9.90845697917919e-05, "tps": 83406, "wall": 17820.7} {"step": 22680, "train_loss": 3.2556254863739014, "lr": 9.907037869488831e-05, "tps": 83387, "wall": 17825.5} {"step": 22681, "train_loss": 3.2108230590820312, "lr": 9.905618896788199e-05, "tps": 83368, "wall": 17830.2} {"step": 22682, "train_loss": 3.2874398231506348, "lr": 9.904200061093369e-05, "tps": 83350, "wall": 17835.0} {"step": 22683, "train_loss": 3.2169013023376465, "lr": 9.902781362420417e-05, "tps": 83331, "wall": 17839.8} {"step": 22684, "train_loss": 3.2064332962036133, "lr": 9.901362800785414e-05, "tps": 83313, "wall": 17844.5} {"step": 22685, "train_loss": 3.1873340606689453, "lr": 9.89994437620442e-05, "tps": 83294, "wall": 17849.3} {"step": 22686, "train_loss": 3.2384629249572754, "lr": 9.89852608869352e-05, "tps": 83275, "wall": 17854.1} {"step": 22687, "train_loss": 3.180866241455078, "lr": 9.897107938268769e-05, "tps": 83256, "wall": 17858.9} {"step": 22688, "train_loss": 3.1799912452697754, "lr": 9.895689924946228e-05, "tps": 83238, "wall": 17863.7} {"step": 22689, "train_loss": 3.1960620880126953, "lr": 9.894272048741973e-05, "tps": 83219, "wall": 17868.5} {"step": 22690, "train_loss": 3.372349262237549, "lr": 9.892854309672059e-05, "tps": 83201, "wall": 17873.2} {"step": 22691, "train_loss": 3.2669289112091064, "lr": 9.89143670775254e-05, "tps": 83182, "wall": 17878.0} {"step": 22692, "train_loss": 3.3102774620056152, "lr": 9.890019242999486e-05, "tps": 83164, "wall": 17882.8} {"step": 22693, "train_loss": 3.253574848175049, "lr": 9.888601915428944e-05, "tps": 83145, "wall": 17887.5} {"step": 22694, "train_loss": 3.2807865142822266, "lr": 9.887184725056981e-05, "tps": 83127, "wall": 17892.3} {"step": 22695, "train_loss": 3.166166305541992, "lr": 9.885767671899646e-05, "tps": 83108, "wall": 17897.1} {"step": 22696, "train_loss": 3.1857292652130127, "lr": 9.884350755972983e-05, "tps": 83090, "wall": 17901.8} {"step": 22697, "train_loss": 3.2152864933013916, "lr": 9.882933977293057e-05, "tps": 83072, "wall": 17906.6} {"step": 22698, "train_loss": 3.2458810806274414, "lr": 9.881517335875909e-05, "tps": 83053, "wall": 17911.4} {"step": 22699, "train_loss": 3.323301315307617, "lr": 9.880100831737582e-05, "tps": 83034, "wall": 17916.2} {"step": 22700, "train_loss": 3.2692525386810303, "lr": 9.878684464894136e-05, "tps": 83016, "wall": 17921.0} {"step": 22701, "train_loss": 3.3093810081481934, "lr": 9.877268235361607e-05, "tps": 82997, "wall": 17925.7} {"step": 22702, "train_loss": 3.1797733306884766, "lr": 9.875852143156034e-05, "tps": 82979, "wall": 17930.6} {"step": 22703, "train_loss": 3.3735580444335938, "lr": 9.87443618829347e-05, "tps": 82960, "wall": 17935.3} {"step": 22704, "train_loss": 3.252140998840332, "lr": 9.873020370789948e-05, "tps": 82942, "wall": 17940.1} {"step": 22705, "train_loss": 3.121044874191284, "lr": 9.871604690661501e-05, "tps": 82924, "wall": 17944.8} {"step": 22706, "train_loss": 3.203427314758301, "lr": 9.870189147924177e-05, "tps": 82905, "wall": 17949.6} {"step": 22707, "train_loss": 3.2350106239318848, "lr": 9.86877374259401e-05, "tps": 82887, "wall": 17954.4} {"step": 22708, "train_loss": 3.2813024520874023, "lr": 9.867358474687022e-05, "tps": 82869, "wall": 17959.1} {"step": 22709, "train_loss": 3.1752970218658447, "lr": 9.865943344219261e-05, "tps": 82850, "wall": 17963.9} {"step": 22710, "train_loss": 3.3366103172302246, "lr": 9.864528351206743e-05, "tps": 82832, "wall": 17968.7} {"step": 22711, "train_loss": 3.151724338531494, "lr": 9.863113495665512e-05, "tps": 82813, "wall": 17973.5} {"step": 22712, "train_loss": 3.183774471282959, "lr": 9.861698777611587e-05, "tps": 82795, "wall": 17978.3} {"step": 22713, "train_loss": 3.244799852371216, "lr": 9.860284197060987e-05, "tps": 82777, "wall": 17983.1} {"step": 22714, "train_loss": 3.2055177688598633, "lr": 9.858869754029752e-05, "tps": 82758, "wall": 17987.8} {"step": 22715, "train_loss": 3.2543320655822754, "lr": 9.857455448533896e-05, "tps": 82740, "wall": 17992.6} {"step": 22716, "train_loss": 3.2301392555236816, "lr": 9.856041280589439e-05, "tps": 82722, "wall": 17997.4} {"step": 22717, "train_loss": 3.3150854110717773, "lr": 9.854627250212407e-05, "tps": 82703, "wall": 18002.1} {"step": 22718, "train_loss": 3.2979183197021484, "lr": 9.853213357418814e-05, "tps": 82685, "wall": 18006.9} {"step": 22719, "train_loss": 3.2008538246154785, "lr": 9.851799602224671e-05, "tps": 82667, "wall": 18011.7} {"step": 22720, "train_loss": 3.2666707038879395, "lr": 9.850385984646008e-05, "tps": 82649, "wall": 18016.4} {"step": 22721, "train_loss": 3.317996025085449, "lr": 9.848972504698828e-05, "tps": 82630, "wall": 18021.2} {"step": 22722, "train_loss": 3.3202524185180664, "lr": 9.84755916239914e-05, "tps": 82612, "wall": 18026.0} {"step": 22723, "train_loss": 3.360680103302002, "lr": 9.846145957762962e-05, "tps": 82594, "wall": 18030.7} {"step": 22724, "train_loss": 3.3235533237457275, "lr": 9.844732890806302e-05, "tps": 82575, "wall": 18035.6} {"step": 22725, "train_loss": 3.237175941467285, "lr": 9.843319961545161e-05, "tps": 82557, "wall": 18040.3} {"step": 22726, "train_loss": 3.3093883991241455, "lr": 9.841907169995552e-05, "tps": 82539, "wall": 18045.1} {"step": 22727, "train_loss": 3.2381138801574707, "lr": 9.840494516173473e-05, "tps": 82521, "wall": 18049.9} {"step": 22728, "train_loss": 3.2215723991394043, "lr": 9.839082000094934e-05, "tps": 82503, "wall": 18054.6} {"step": 22729, "train_loss": 3.420963764190674, "lr": 9.837669621775936e-05, "tps": 82485, "wall": 18059.4} {"step": 22730, "train_loss": 3.268608331680298, "lr": 9.836257381232463e-05, "tps": 82467, "wall": 18064.2} {"step": 22731, "train_loss": 3.4050397872924805, "lr": 9.834845278480534e-05, "tps": 82448, "wall": 18068.9} {"step": 22732, "train_loss": 3.3918304443359375, "lr": 9.833433313536135e-05, "tps": 82430, "wall": 18073.7} {"step": 22733, "train_loss": 3.2886404991149902, "lr": 9.832021486415255e-05, "tps": 82412, "wall": 18078.5} {"step": 22734, "train_loss": 3.180542469024658, "lr": 9.830609797133901e-05, "tps": 82394, "wall": 18083.3} {"step": 22735, "train_loss": 3.3268508911132812, "lr": 9.829198245708056e-05, "tps": 82376, "wall": 18088.0} {"step": 22736, "train_loss": 3.1946985721588135, "lr": 9.827786832153706e-05, "tps": 82358, "wall": 18092.8} {"step": 22737, "train_loss": 3.177875518798828, "lr": 9.826375556486851e-05, "tps": 82339, "wall": 18097.6} {"step": 22738, "train_loss": 3.290635347366333, "lr": 9.824964418723475e-05, "tps": 82321, "wall": 18102.4} {"step": 22739, "train_loss": 3.242842197418213, "lr": 9.823553418879552e-05, "tps": 82303, "wall": 18107.1} {"step": 22740, "train_loss": 3.2398664951324463, "lr": 9.822142556971083e-05, "tps": 82285, "wall": 18111.9} {"step": 22741, "train_loss": 3.2183804512023926, "lr": 9.820731833014038e-05, "tps": 82267, "wall": 18116.7} {"step": 22742, "train_loss": 3.281367063522339, "lr": 9.8193212470244e-05, "tps": 82249, "wall": 18121.4} {"step": 22743, "train_loss": 3.2872438430786133, "lr": 9.817910799018153e-05, "tps": 82231, "wall": 18126.2} {"step": 22744, "train_loss": 3.26710844039917, "lr": 9.816500489011272e-05, "tps": 82213, "wall": 18131.0} {"step": 22745, "train_loss": 3.249239206314087, "lr": 9.815090317019727e-05, "tps": 82195, "wall": 18135.7} {"step": 22746, "train_loss": 3.2209625244140625, "lr": 9.813680283059505e-05, "tps": 82177, "wall": 18140.5} {"step": 22747, "train_loss": 3.3884756565093994, "lr": 9.812270387146566e-05, "tps": 82159, "wall": 18145.3} {"step": 22748, "train_loss": 3.1773738861083984, "lr": 9.810860629296892e-05, "tps": 82141, "wall": 18150.0} {"step": 22749, "train_loss": 3.2151918411254883, "lr": 9.809451009526449e-05, "tps": 82123, "wall": 18154.8} {"step": 22750, "train_loss": 3.230771064758301, "lr": 9.808041527851199e-05, "tps": 82105, "wall": 18159.6} {"step": 22751, "train_loss": 3.317333221435547, "lr": 9.80663218428712e-05, "tps": 82087, "wall": 18164.4} {"step": 22752, "train_loss": 3.2885429859161377, "lr": 9.805222978850169e-05, "tps": 82069, "wall": 18169.2} {"step": 22753, "train_loss": 3.160006046295166, "lr": 9.803813911556306e-05, "tps": 82051, "wall": 18173.9} {"step": 22754, "train_loss": 3.2726199626922607, "lr": 9.802404982421508e-05, "tps": 82033, "wall": 18178.7} {"step": 22755, "train_loss": 3.266498565673828, "lr": 9.800996191461724e-05, "tps": 82016, "wall": 18183.5} {"step": 22756, "train_loss": 3.1931686401367188, "lr": 9.79958753869291e-05, "tps": 81998, "wall": 18188.2} {"step": 22757, "train_loss": 3.257929801940918, "lr": 9.798179024131032e-05, "tps": 81980, "wall": 18193.0} {"step": 22758, "train_loss": 3.2163405418395996, "lr": 9.796770647792045e-05, "tps": 81962, "wall": 18197.8} {"step": 22759, "train_loss": 3.2418689727783203, "lr": 9.795362409691894e-05, "tps": 81944, "wall": 18202.5} {"step": 22760, "train_loss": 3.246692657470703, "lr": 9.793954309846542e-05, "tps": 81926, "wall": 18207.3} {"step": 22761, "train_loss": 3.2192399501800537, "lr": 9.792546348271938e-05, "tps": 81909, "wall": 18212.0} {"step": 22762, "train_loss": 3.1969661712646484, "lr": 9.791138524984023e-05, "tps": 81890, "wall": 18216.9} {"step": 22763, "train_loss": 3.1838274002075195, "lr": 9.789730839998756e-05, "tps": 81873, "wall": 18221.6} {"step": 22764, "train_loss": 3.249938726425171, "lr": 9.788323293332074e-05, "tps": 81855, "wall": 18226.4} {"step": 22765, "train_loss": 3.2910938262939453, "lr": 9.786915884999932e-05, "tps": 81837, "wall": 18231.2} {"step": 22766, "train_loss": 3.1514055728912354, "lr": 9.785508615018268e-05, "tps": 81819, "wall": 18235.9} {"step": 22767, "train_loss": 3.196192741394043, "lr": 9.784101483403016e-05, "tps": 81801, "wall": 18240.7} {"step": 22768, "train_loss": 3.3828718662261963, "lr": 9.78269449017013e-05, "tps": 81784, "wall": 18245.4} {"step": 22769, "train_loss": 3.2383713722229004, "lr": 9.781287635335541e-05, "tps": 81766, "wall": 18250.2} {"step": 22770, "train_loss": 3.2602686882019043, "lr": 9.77988091891518e-05, "tps": 81748, "wall": 18255.0} {"step": 22771, "train_loss": 3.2209722995758057, "lr": 9.778474340925e-05, "tps": 81730, "wall": 18259.7} {"step": 22772, "train_loss": 3.1097617149353027, "lr": 9.777067901380918e-05, "tps": 81713, "wall": 18264.5} {"step": 22773, "train_loss": 3.2237966060638428, "lr": 9.775661600298868e-05, "tps": 81695, "wall": 18269.3} {"step": 22774, "train_loss": 3.240579605102539, "lr": 9.77425543769479e-05, "tps": 81677, "wall": 18274.1} {"step": 22775, "train_loss": 3.1953396797180176, "lr": 9.77284941358461e-05, "tps": 81659, "wall": 18278.9} {"step": 22776, "train_loss": 3.319232225418091, "lr": 9.771443527984245e-05, "tps": 81641, "wall": 18283.7} {"step": 22777, "train_loss": 3.2880632877349854, "lr": 9.770037780909636e-05, "tps": 81624, "wall": 18288.4} {"step": 22778, "train_loss": 3.264549732208252, "lr": 9.768632172376701e-05, "tps": 81606, "wall": 18293.2} {"step": 22779, "train_loss": 3.334653615951538, "lr": 9.767226702401357e-05, "tps": 81588, "wall": 18298.0} {"step": 22780, "train_loss": 3.25398588180542, "lr": 9.765821370999536e-05, "tps": 81571, "wall": 18302.7} {"step": 22781, "train_loss": 3.1904349327087402, "lr": 9.764416178187147e-05, "tps": 81553, "wall": 18307.5} {"step": 22782, "train_loss": 3.271965503692627, "lr": 9.76301112398012e-05, "tps": 81535, "wall": 18312.3} {"step": 22783, "train_loss": 3.291304111480713, "lr": 9.761606208394363e-05, "tps": 81518, "wall": 18317.0} {"step": 22784, "train_loss": 3.1606287956237793, "lr": 9.76020143144579e-05, "tps": 81500, "wall": 18321.8} {"step": 22785, "train_loss": 3.2857298851013184, "lr": 9.75879679315032e-05, "tps": 81482, "wall": 18326.6} {"step": 22786, "train_loss": 3.1540277004241943, "lr": 9.757392293523863e-05, "tps": 81465, "wall": 18331.3} {"step": 22787, "train_loss": 3.2407989501953125, "lr": 9.755987932582322e-05, "tps": 81447, "wall": 18336.2} {"step": 22788, "train_loss": 3.3566112518310547, "lr": 9.754583710341621e-05, "tps": 81429, "wall": 18341.0} {"step": 22789, "train_loss": 3.290369987487793, "lr": 9.753179626817654e-05, "tps": 81412, "wall": 18345.7} {"step": 22790, "train_loss": 3.26304292678833, "lr": 9.751775682026327e-05, "tps": 81394, "wall": 18350.5} {"step": 22791, "train_loss": 3.204782247543335, "lr": 9.750371875983554e-05, "tps": 81377, "wall": 18355.2} {"step": 22792, "train_loss": 3.211439609527588, "lr": 9.748968208705231e-05, "tps": 81359, "wall": 18360.0} {"step": 22793, "train_loss": 3.2466883659362793, "lr": 9.747564680207251e-05, "tps": 81341, "wall": 18364.8} {"step": 22794, "train_loss": 3.3175346851348877, "lr": 9.74616129050553e-05, "tps": 81324, "wall": 18369.6} {"step": 22795, "train_loss": 3.310512065887451, "lr": 9.744758039615955e-05, "tps": 81306, "wall": 18374.3} {"step": 22796, "train_loss": 3.1910510063171387, "lr": 9.743354927554418e-05, "tps": 81289, "wall": 18379.1} {"step": 22797, "train_loss": 3.2014236450195312, "lr": 9.741951954336827e-05, "tps": 81271, "wall": 18383.8} {"step": 22798, "train_loss": 3.1747543811798096, "lr": 9.740549119979066e-05, "tps": 81254, "wall": 18388.6} {"step": 22799, "train_loss": 3.1984100341796875, "lr": 9.739146424497023e-05, "tps": 81236, "wall": 18393.4} {"step": 22800, "train_loss": 3.289248466491699, "lr": 9.737743867906597e-05, "tps": 81219, "wall": 18398.2} {"step": 22801, "train_loss": 3.271174907684326, "lr": 9.736341450223666e-05, "tps": 81201, "wall": 18403.0} {"step": 22802, "train_loss": 3.2418792247772217, "lr": 9.73493917146413e-05, "tps": 81184, "wall": 18407.7} {"step": 22803, "train_loss": 3.224731922149658, "lr": 9.733537031643866e-05, "tps": 81166, "wall": 18412.5} {"step": 22804, "train_loss": 3.263078212738037, "lr": 9.732135030778751e-05, "tps": 81149, "wall": 18417.2} {"step": 22805, "train_loss": 3.1460180282592773, "lr": 9.730733168884681e-05, "tps": 81132, "wall": 18422.0} {"step": 22806, "train_loss": 3.2281525135040283, "lr": 9.729331445977528e-05, "tps": 81114, "wall": 18426.8} {"step": 22807, "train_loss": 3.1822259426116943, "lr": 9.72792986207317e-05, "tps": 81097, "wall": 18431.5} {"step": 22808, "train_loss": 3.2824525833129883, "lr": 9.726528417187487e-05, "tps": 81079, "wall": 18436.3} {"step": 22809, "train_loss": 3.25447678565979, "lr": 9.725127111336359e-05, "tps": 81062, "wall": 18441.0} {"step": 22810, "train_loss": 3.324406385421753, "lr": 9.723725944535645e-05, "tps": 81045, "wall": 18445.8} {"step": 22811, "train_loss": 3.278970956802368, "lr": 9.722324916801238e-05, "tps": 81027, "wall": 18450.6} {"step": 22812, "train_loss": 3.3017914295196533, "lr": 9.720924028148996e-05, "tps": 81010, "wall": 18455.4} {"step": 22813, "train_loss": 3.286959171295166, "lr": 9.719523278594785e-05, "tps": 80992, "wall": 18460.2} {"step": 22814, "train_loss": 3.28332781791687, "lr": 9.718122668154485e-05, "tps": 80975, "wall": 18465.0} {"step": 22815, "train_loss": 3.3442652225494385, "lr": 9.716722196843955e-05, "tps": 80957, "wall": 18469.7} {"step": 22816, "train_loss": 3.1848325729370117, "lr": 9.715321864679057e-05, "tps": 80940, "wall": 18474.5} {"step": 22817, "train_loss": 3.2289679050445557, "lr": 9.71392167167566e-05, "tps": 80923, "wall": 18479.2} {"step": 22818, "train_loss": 3.2736518383026123, "lr": 9.71252161784962e-05, "tps": 80905, "wall": 18484.0} {"step": 22819, "train_loss": 3.343980312347412, "lr": 9.711121703216803e-05, "tps": 80888, "wall": 18488.8} {"step": 22820, "train_loss": 3.259660005569458, "lr": 9.709721927793065e-05, "tps": 80871, "wall": 18493.5} {"step": 22821, "train_loss": 3.3290152549743652, "lr": 9.708322291594257e-05, "tps": 80854, "wall": 18498.3} {"step": 22822, "train_loss": 3.2530088424682617, "lr": 9.706922794636244e-05, "tps": 80836, "wall": 18503.1} {"step": 22823, "train_loss": 3.2865705490112305, "lr": 9.705523436934876e-05, "tps": 80819, "wall": 18507.8} {"step": 22824, "train_loss": 3.2590396404266357, "lr": 9.704124218505997e-05, "tps": 80802, "wall": 18512.6} {"step": 22825, "train_loss": 3.3377606868743896, "lr": 9.702725139365469e-05, "tps": 80784, "wall": 18517.4} {"step": 22826, "train_loss": 3.2901217937469482, "lr": 9.701326199529138e-05, "tps": 80767, "wall": 18522.2} {"step": 22827, "train_loss": 3.1755988597869873, "lr": 9.699927399012841e-05, "tps": 80750, "wall": 18527.0} {"step": 22828, "train_loss": 3.353724956512451, "lr": 9.698528737832439e-05, "tps": 80732, "wall": 18531.7} {"step": 22829, "train_loss": 3.4086430072784424, "lr": 9.697130216003769e-05, "tps": 80715, "wall": 18536.5} {"step": 22830, "train_loss": 3.334733724594116, "lr": 9.695731833542666e-05, "tps": 80698, "wall": 18541.3} {"step": 22831, "train_loss": 3.1537654399871826, "lr": 9.694333590464986e-05, "tps": 80681, "wall": 18546.1} {"step": 22832, "train_loss": 3.2919201850891113, "lr": 9.692935486786562e-05, "tps": 80664, "wall": 18550.8} {"step": 22833, "train_loss": 3.292745590209961, "lr": 9.691537522523222e-05, "tps": 80646, "wall": 18555.6} {"step": 22834, "train_loss": 3.2693231105804443, "lr": 9.690139697690819e-05, "tps": 80629, "wall": 18560.3} {"step": 22835, "train_loss": 3.195749521255493, "lr": 9.688742012305171e-05, "tps": 80612, "wall": 18565.1} {"step": 22836, "train_loss": 3.2385523319244385, "lr": 9.687344466382127e-05, "tps": 80595, "wall": 18569.9} {"step": 22837, "train_loss": 3.2914445400238037, "lr": 9.685947059937512e-05, "tps": 80578, "wall": 18574.7} {"step": 22838, "train_loss": 3.295320510864258, "lr": 9.684549792987146e-05, "tps": 80560, "wall": 18579.4} {"step": 22839, "train_loss": 3.317847967147827, "lr": 9.683152665546876e-05, "tps": 80543, "wall": 18584.2} {"step": 22840, "train_loss": 3.267996072769165, "lr": 9.681755677632515e-05, "tps": 80526, "wall": 18589.0} {"step": 22841, "train_loss": 3.253103017807007, "lr": 9.68035882925989e-05, "tps": 80509, "wall": 18593.7} {"step": 22842, "train_loss": 3.306535482406616, "lr": 9.67896212044483e-05, "tps": 80492, "wall": 18598.5} {"step": 22843, "train_loss": 3.225337505340576, "lr": 9.677565551203154e-05, "tps": 80475, "wall": 18603.3} {"step": 22844, "train_loss": 3.1902260780334473, "lr": 9.67616912155068e-05, "tps": 80458, "wall": 18608.0} {"step": 22845, "train_loss": 3.308988571166992, "lr": 9.674772831503232e-05, "tps": 80441, "wall": 18612.8} {"step": 22846, "train_loss": 3.2790021896362305, "lr": 9.673376681076618e-05, "tps": 80424, "wall": 18617.6} {"step": 22847, "train_loss": 3.3441410064697266, "lr": 9.671980670286665e-05, "tps": 80407, "wall": 18622.3} {"step": 22848, "train_loss": 3.249084949493408, "lr": 9.670584799149182e-05, "tps": 80389, "wall": 18627.1} {"step": 22849, "train_loss": 3.187021255493164, "lr": 9.669189067679976e-05, "tps": 80372, "wall": 18631.9} {"step": 22850, "train_loss": 3.1171627044677734, "lr": 9.66779347589487e-05, "tps": 80355, "wall": 18636.7} {"step": 22851, "train_loss": 3.1855592727661133, "lr": 9.666398023809666e-05, "tps": 80338, "wall": 18641.5} {"step": 22852, "train_loss": 3.217714309692383, "lr": 9.665002711440163e-05, "tps": 80321, "wall": 18646.3} {"step": 22853, "train_loss": 3.3155524730682373, "lr": 9.663607538802186e-05, "tps": 80304, "wall": 18651.1} {"step": 22854, "train_loss": 3.340615749359131, "lr": 9.662212505911531e-05, "tps": 80287, "wall": 18655.8} {"step": 22855, "train_loss": 3.344226837158203, "lr": 9.660817612783993e-05, "tps": 80270, "wall": 18660.6} {"step": 22856, "train_loss": 3.2835464477539062, "lr": 9.659422859435387e-05, "tps": 80253, "wall": 18665.4} {"step": 22857, "train_loss": 3.3506827354431152, "lr": 9.658028245881506e-05, "tps": 80236, "wall": 18670.1} {"step": 22858, "train_loss": 3.291738748550415, "lr": 9.656633772138142e-05, "tps": 80219, "wall": 18674.9} {"step": 22859, "train_loss": 3.2405354976654053, "lr": 9.655239438221106e-05, "tps": 80202, "wall": 18679.7} {"step": 22860, "train_loss": 3.255115032196045, "lr": 9.653845244146177e-05, "tps": 80185, "wall": 18684.4} {"step": 22861, "train_loss": 3.2026655673980713, "lr": 9.652451189929166e-05, "tps": 80168, "wall": 18689.2} {"step": 22862, "train_loss": 3.2479240894317627, "lr": 9.651057275585852e-05, "tps": 80151, "wall": 18694.0} {"step": 22863, "train_loss": 3.2900373935699463, "lr": 9.649663501132027e-05, "tps": 80134, "wall": 18698.8} {"step": 22864, "train_loss": 3.2396836280822754, "lr": 9.648269866583488e-05, "tps": 80117, "wall": 18703.6} {"step": 22865, "train_loss": 3.2204861640930176, "lr": 9.646876371956015e-05, "tps": 80100, "wall": 18708.3} {"step": 22866, "train_loss": 3.276695728302002, "lr": 9.645483017265388e-05, "tps": 80083, "wall": 18713.1} {"step": 22867, "train_loss": 3.233912944793701, "lr": 9.644089802527403e-05, "tps": 80066, "wall": 18717.9} {"step": 22868, "train_loss": 3.296006917953491, "lr": 9.642696727757839e-05, "tps": 80049, "wall": 18722.7} {"step": 22869, "train_loss": 3.3281192779541016, "lr": 9.641303792972471e-05, "tps": 80032, "wall": 18727.5} {"step": 22870, "train_loss": 3.2722229957580566, "lr": 9.639910998187084e-05, "tps": 80015, "wall": 18732.2} {"step": 22871, "train_loss": 3.2651045322418213, "lr": 9.638518343417457e-05, "tps": 79998, "wall": 18737.0} {"step": 22872, "train_loss": 3.2766103744506836, "lr": 9.637125828679353e-05, "tps": 79981, "wall": 18741.8} {"step": 22873, "train_loss": 3.2915163040161133, "lr": 9.635733453988567e-05, "tps": 79964, "wall": 18746.6} {"step": 22874, "train_loss": 3.220240592956543, "lr": 9.634341219360859e-05, "tps": 79948, "wall": 18751.4} {"step": 22875, "train_loss": 3.237273693084717, "lr": 9.632949124811997e-05, "tps": 79930, "wall": 18756.3} {"step": 22876, "train_loss": 3.255676746368408, "lr": 9.631557170357763e-05, "tps": 79914, "wall": 18761.0} {"step": 22877, "train_loss": 3.266052722930908, "lr": 9.630165356013917e-05, "tps": 79897, "wall": 18765.8} {"step": 22878, "train_loss": 3.1465559005737305, "lr": 9.628773681796222e-05, "tps": 79880, "wall": 18770.6} {"step": 22879, "train_loss": 3.3123276233673096, "lr": 9.627382147720454e-05, "tps": 79863, "wall": 18775.4} {"step": 22880, "train_loss": 3.2947964668273926, "lr": 9.625990753802364e-05, "tps": 79846, "wall": 18780.2} {"step": 22881, "train_loss": 3.2944650650024414, "lr": 9.624599500057728e-05, "tps": 79829, "wall": 18785.0} {"step": 22882, "train_loss": 3.3413331508636475, "lr": 9.623208386502295e-05, "tps": 79812, "wall": 18789.8} {"step": 22883, "train_loss": 3.2372007369995117, "lr": 9.621817413151825e-05, "tps": 79795, "wall": 18794.5} {"step": 22884, "train_loss": 3.267338514328003, "lr": 9.620426580022078e-05, "tps": 79778, "wall": 18799.3} {"step": 22885, "train_loss": 3.2774157524108887, "lr": 9.619035887128813e-05, "tps": 79761, "wall": 18804.2} {"step": 22886, "train_loss": 3.2327423095703125, "lr": 9.61764533448777e-05, "tps": 79745, "wall": 18809.0} {"step": 22887, "train_loss": 3.155005693435669, "lr": 9.616254922114719e-05, "tps": 79728, "wall": 18813.8} {"step": 22888, "train_loss": 3.2609598636627197, "lr": 9.614864650025401e-05, "tps": 79711, "wall": 18818.6} {"step": 22889, "train_loss": 3.372368812561035, "lr": 9.613474518235561e-05, "tps": 79694, "wall": 18823.5} {"step": 22890, "train_loss": 3.2922098636627197, "lr": 9.612084526760956e-05, "tps": 79677, "wall": 18828.3} {"step": 22891, "train_loss": 3.3108134269714355, "lr": 9.610694675617329e-05, "tps": 79660, "wall": 18833.1} {"step": 22892, "train_loss": 3.279447555541992, "lr": 9.609304964820417e-05, "tps": 79643, "wall": 18837.9} {"step": 22893, "train_loss": 3.2605175971984863, "lr": 9.607915394385975e-05, "tps": 79626, "wall": 18842.7} {"step": 22894, "train_loss": 3.236114740371704, "lr": 9.606525964329738e-05, "tps": 79609, "wall": 18847.6} {"step": 22895, "train_loss": 3.207021474838257, "lr": 9.605136674667438e-05, "tps": 79592, "wall": 18852.4} {"step": 22896, "train_loss": 3.3311767578125, "lr": 9.603747525414827e-05, "tps": 79575, "wall": 18857.2} {"step": 22897, "train_loss": 3.2839736938476562, "lr": 9.602358516587627e-05, "tps": 79559, "wall": 18862.0} {"step": 22898, "train_loss": 3.2336618900299072, "lr": 9.600969648201588e-05, "tps": 79542, "wall": 18866.8} {"step": 22899, "train_loss": 3.230867862701416, "lr": 9.599580920272436e-05, "tps": 79525, "wall": 18871.7} {"step": 22900, "train_loss": 3.2857444286346436, "lr": 9.598192332815897e-05, "tps": 79508, "wall": 18876.6} {"step": 22901, "train_loss": 3.2071666717529297, "lr": 9.596803885847712e-05, "tps": 79491, "wall": 18881.4} {"step": 22902, "train_loss": 3.2489089965820312, "lr": 9.595415579383603e-05, "tps": 79474, "wall": 18886.2} {"step": 22903, "train_loss": 3.075875759124756, "lr": 9.59402741343929e-05, "tps": 79457, "wall": 18891.0} {"step": 22904, "train_loss": 3.227088212966919, "lr": 9.592639388030512e-05, "tps": 79440, "wall": 18895.8} {"step": 22905, "train_loss": 3.2275495529174805, "lr": 9.591251503172986e-05, "tps": 79424, "wall": 18900.6} {"step": 22906, "train_loss": 3.280003309249878, "lr": 9.58986375888243e-05, "tps": 79407, "wall": 18905.5} {"step": 22907, "train_loss": 3.248936653137207, "lr": 9.588476155174574e-05, "tps": 79390, "wall": 18910.3} {"step": 22908, "train_loss": 3.2071805000305176, "lr": 9.587088692065132e-05, "tps": 79373, "wall": 18915.1} {"step": 22909, "train_loss": 3.397646427154541, "lr": 9.585701369569813e-05, "tps": 79356, "wall": 18920.0} {"step": 22910, "train_loss": 3.229719638824463, "lr": 9.584314187704348e-05, "tps": 79339, "wall": 18924.8} {"step": 22911, "train_loss": 3.343158721923828, "lr": 9.582927146484443e-05, "tps": 79323, "wall": 18929.7} {"step": 22912, "train_loss": 3.3055367469787598, "lr": 9.581540245925805e-05, "tps": 79306, "wall": 18934.5} {"step": 22913, "train_loss": 3.2633988857269287, "lr": 9.580153486044158e-05, "tps": 79289, "wall": 18939.4} {"step": 22914, "train_loss": 3.2174556255340576, "lr": 9.578766866855198e-05, "tps": 79272, "wall": 18944.3} {"step": 22915, "train_loss": 3.2171506881713867, "lr": 9.577380388374643e-05, "tps": 79255, "wall": 18949.1} {"step": 22916, "train_loss": 3.2708067893981934, "lr": 9.575994050618197e-05, "tps": 79238, "wall": 18954.0} {"step": 22917, "train_loss": 3.41855525970459, "lr": 9.574607853601556e-05, "tps": 79221, "wall": 18958.8} {"step": 22918, "train_loss": 3.25119948387146, "lr": 9.573221797340437e-05, "tps": 79205, "wall": 18963.7} {"step": 22919, "train_loss": 3.331394672393799, "lr": 9.571835881850531e-05, "tps": 79188, "wall": 18968.5} {"step": 22920, "train_loss": 3.239692211151123, "lr": 9.570450107147534e-05, "tps": 79171, "wall": 18973.4} {"step": 22921, "train_loss": 3.345694065093994, "lr": 9.56906447324716e-05, "tps": 79154, "wall": 18978.3} {"step": 22922, "train_loss": 3.3425302505493164, "lr": 9.567678980165093e-05, "tps": 79137, "wall": 18983.1} {"step": 22923, "train_loss": 3.3214519023895264, "lr": 9.566293627917026e-05, "tps": 79120, "wall": 18988.0} {"step": 22924, "train_loss": 3.1756012439727783, "lr": 9.564908416518665e-05, "tps": 79104, "wall": 18992.8} {"step": 22925, "train_loss": 3.287411689758301, "lr": 9.563523345985692e-05, "tps": 79087, "wall": 18997.8} {"step": 22926, "train_loss": 3.367919683456421, "lr": 9.562138416333795e-05, "tps": 79070, "wall": 19002.6} {"step": 22927, "train_loss": 3.3097212314605713, "lr": 9.560753627578674e-05, "tps": 79053, "wall": 19007.5} {"step": 22928, "train_loss": 3.1275460720062256, "lr": 9.559368979736005e-05, "tps": 79036, "wall": 19012.3} {"step": 22929, "train_loss": 3.2071173191070557, "lr": 9.557984472821475e-05, "tps": 79020, "wall": 19017.2} {"step": 22930, "train_loss": 3.3599491119384766, "lr": 9.556600106850772e-05, "tps": 79003, "wall": 19022.1} {"step": 22931, "train_loss": 3.282653570175171, "lr": 9.555215881839581e-05, "tps": 78986, "wall": 19026.9} {"step": 22932, "train_loss": 3.223768711090088, "lr": 9.553831797803569e-05, "tps": 78969, "wall": 19031.8} {"step": 22933, "train_loss": 3.20591402053833, "lr": 9.552447854758428e-05, "tps": 78953, "wall": 19036.7} {"step": 22934, "train_loss": 3.282144069671631, "lr": 9.551064052719828e-05, "tps": 78936, "wall": 19041.6} {"step": 22935, "train_loss": 3.176433563232422, "lr": 9.549680391703453e-05, "tps": 78919, "wall": 19046.4} {"step": 22936, "train_loss": 3.29940128326416, "lr": 9.54829687172497e-05, "tps": 78902, "wall": 19051.3} {"step": 22937, "train_loss": 3.221207618713379, "lr": 9.546913492800053e-05, "tps": 78885, "wall": 19056.3} {"step": 22938, "train_loss": 3.1391730308532715, "lr": 9.545530254944376e-05, "tps": 78868, "wall": 19061.2} {"step": 22939, "train_loss": 3.3227391242980957, "lr": 9.544147158173605e-05, "tps": 78852, "wall": 19066.0} {"step": 22940, "train_loss": 3.2196459770202637, "lr": 9.542764202503404e-05, "tps": 78835, "wall": 19070.9} {"step": 22941, "train_loss": 3.284663200378418, "lr": 9.541381387949452e-05, "tps": 78818, "wall": 19075.8} {"step": 22942, "train_loss": 3.147056818008423, "lr": 9.539998714527402e-05, "tps": 78801, "wall": 19080.7} {"step": 22943, "train_loss": 3.181908130645752, "lr": 9.538616182252918e-05, "tps": 78785, "wall": 19085.6} {"step": 22944, "train_loss": 3.236926317214966, "lr": 9.537233791141667e-05, "tps": 78768, "wall": 19090.5} {"step": 22945, "train_loss": 3.1862242221832275, "lr": 9.535851541209308e-05, "tps": 78751, "wall": 19095.4} {"step": 22946, "train_loss": 3.224439859390259, "lr": 9.534469432471491e-05, "tps": 78734, "wall": 19100.2} {"step": 22947, "train_loss": 3.2071757316589355, "lr": 9.533087464943885e-05, "tps": 78718, "wall": 19105.1} {"step": 22948, "train_loss": 3.211763620376587, "lr": 9.531705638642137e-05, "tps": 78701, "wall": 19110.0} {"step": 22949, "train_loss": 3.2753303050994873, "lr": 9.530323953581896e-05, "tps": 78684, "wall": 19114.9} {"step": 22950, "train_loss": 3.305429458618164, "lr": 9.528942409778828e-05, "tps": 78667, "wall": 19119.9} {"step": 22951, "train_loss": 3.3135461807250977, "lr": 9.527561007248566e-05, "tps": 78650, "wall": 19124.8} {"step": 22952, "train_loss": 3.189520835876465, "lr": 9.526179746006777e-05, "tps": 78634, "wall": 19129.7} {"step": 22953, "train_loss": 3.3040785789489746, "lr": 9.524798626069097e-05, "tps": 78617, "wall": 19134.6} {"step": 22954, "train_loss": 3.199070692062378, "lr": 9.523417647451167e-05, "tps": 78600, "wall": 19139.5} {"step": 22955, "train_loss": 3.304279327392578, "lr": 9.522036810168643e-05, "tps": 78584, "wall": 19144.4} {"step": 22956, "train_loss": 3.261164665222168, "lr": 9.52065611423716e-05, "tps": 78567, "wall": 19149.3} {"step": 22957, "train_loss": 3.2001843452453613, "lr": 9.519275559672356e-05, "tps": 78550, "wall": 19154.2} {"step": 22958, "train_loss": 3.313333511352539, "lr": 9.517895146489877e-05, "tps": 78533, "wall": 19159.1} {"step": 22959, "train_loss": 3.2038702964782715, "lr": 9.516514874705359e-05, "tps": 78517, "wall": 19164.0} {"step": 22960, "train_loss": 3.2575881481170654, "lr": 9.51513474433443e-05, "tps": 78500, "wall": 19168.9} {"step": 22961, "train_loss": 3.1481645107269287, "lr": 9.513754755392735e-05, "tps": 78483, "wall": 19173.8} {"step": 22962, "train_loss": 3.1739346981048584, "lr": 9.512374907895902e-05, "tps": 78466, "wall": 19178.8} {"step": 22963, "train_loss": 3.283308506011963, "lr": 9.510995201859555e-05, "tps": 78450, "wall": 19183.7} {"step": 22964, "train_loss": 3.277097463607788, "lr": 9.509615637299336e-05, "tps": 78433, "wall": 19188.6} {"step": 22965, "train_loss": 3.3573951721191406, "lr": 9.508236214230866e-05, "tps": 78416, "wall": 19193.5} {"step": 22966, "train_loss": 3.313673496246338, "lr": 9.506856932669769e-05, "tps": 78400, "wall": 19198.5} {"step": 22967, "train_loss": 3.1355414390563965, "lr": 9.505477792631678e-05, "tps": 78383, "wall": 19203.4} {"step": 22968, "train_loss": 3.181457281112671, "lr": 9.504098794132202e-05, "tps": 78366, "wall": 19208.3} {"step": 22969, "train_loss": 3.174440860748291, "lr": 9.502719937186979e-05, "tps": 78350, "wall": 19213.2} {"step": 22970, "train_loss": 3.2943592071533203, "lr": 9.501341221811619e-05, "tps": 78333, "wall": 19218.1} {"step": 22971, "train_loss": 3.2469370365142822, "lr": 9.499962648021737e-05, "tps": 78317, "wall": 19223.0} {"step": 22972, "train_loss": 3.2757794857025146, "lr": 9.498584215832959e-05, "tps": 78300, "wall": 19228.0} {"step": 22973, "train_loss": 3.339975357055664, "lr": 9.497205925260898e-05, "tps": 78283, "wall": 19232.9} {"step": 22974, "train_loss": 3.200470209121704, "lr": 9.495827776321154e-05, "tps": 78266, "wall": 19237.9} {"step": 22975, "train_loss": 3.1664679050445557, "lr": 9.49444976902936e-05, "tps": 78250, "wall": 19242.8} {"step": 22976, "train_loss": 3.3910417556762695, "lr": 9.493071903401115e-05, "tps": 78233, "wall": 19247.7} {"step": 22977, "train_loss": 3.248185396194458, "lr": 9.49169417945202e-05, "tps": 78216, "wall": 19252.7} {"step": 22978, "train_loss": 3.271888017654419, "lr": 9.490316597197696e-05, "tps": 78200, "wall": 19257.6} {"step": 22979, "train_loss": 3.359086513519287, "lr": 9.488939156653745e-05, "tps": 78183, "wall": 19262.5} {"step": 22980, "train_loss": 3.238905668258667, "lr": 9.487561857835759e-05, "tps": 78167, "wall": 19267.5} {"step": 22981, "train_loss": 3.1702258586883545, "lr": 9.486184700759356e-05, "tps": 78150, "wall": 19272.4} {"step": 22982, "train_loss": 3.3159494400024414, "lr": 9.484807685440133e-05, "tps": 78133, "wall": 19277.3} {"step": 22983, "train_loss": 3.223729372024536, "lr": 9.483430811893676e-05, "tps": 78117, "wall": 19282.2} {"step": 22984, "train_loss": 3.3100805282592773, "lr": 9.4820540801356e-05, "tps": 78100, "wall": 19287.2} {"step": 22985, "train_loss": 3.186718463897705, "lr": 9.48067749018149e-05, "tps": 78084, "wall": 19292.1} {"step": 22986, "train_loss": 3.3083083629608154, "lr": 9.479301042046939e-05, "tps": 78067, "wall": 19297.1} {"step": 22987, "train_loss": 3.1804721355438232, "lr": 9.477924735747547e-05, "tps": 78050, "wall": 19302.0} {"step": 22988, "train_loss": 3.242408037185669, "lr": 9.476548571298897e-05, "tps": 78034, "wall": 19307.0} {"step": 22989, "train_loss": 3.310872793197632, "lr": 9.475172548716587e-05, "tps": 78017, "wall": 19311.9} {"step": 22990, "train_loss": 3.3143060207366943, "lr": 9.473796668016201e-05, "tps": 78001, "wall": 19316.8} {"step": 22991, "train_loss": 3.295586585998535, "lr": 9.472420929213317e-05, "tps": 77984, "wall": 19321.8} {"step": 22992, "train_loss": 3.2501845359802246, "lr": 9.471045332323532e-05, "tps": 77968, "wall": 19326.7} {"step": 22993, "train_loss": 3.1584036350250244, "lr": 9.469669877362425e-05, "tps": 77951, "wall": 19331.6} {"step": 22994, "train_loss": 3.254206895828247, "lr": 9.468294564345568e-05, "tps": 77935, "wall": 19336.6} {"step": 22995, "train_loss": 3.2966578006744385, "lr": 9.466919393288556e-05, "tps": 77918, "wall": 19341.5} {"step": 22996, "train_loss": 3.232262372970581, "lr": 9.465544364206958e-05, "tps": 77902, "wall": 19346.5} {"step": 22997, "train_loss": 3.2249906063079834, "lr": 9.464169477116346e-05, "tps": 77885, "wall": 19351.4} {"step": 22998, "train_loss": 3.319814682006836, "lr": 9.462794732032306e-05, "tps": 77868, "wall": 19356.4} {"step": 22999, "train_loss": 3.264880895614624, "lr": 9.461420128970405e-05, "tps": 77852, "wall": 19361.4} {"step": 23000, "train_loss": 3.2087059020996094, "lr": 9.46004566794621e-05, "tps": 77835, "wall": 19366.3, "val_loss_monitor": 3.33378361972352} {"step": 23001, "train_loss": 3.1936464309692383, "lr": 9.458671348975302e-05, "tps": 77626, "wall": 19419.4} {"step": 23002, "train_loss": 3.4807913303375244, "lr": 9.45729717207324e-05, "tps": 77610, "wall": 19424.3} {"step": 23003, "train_loss": 3.136606216430664, "lr": 9.455923137255593e-05, "tps": 77593, "wall": 19429.3} {"step": 23004, "train_loss": 3.311905860900879, "lr": 9.45454924453793e-05, "tps": 77577, "wall": 19434.3} {"step": 23005, "train_loss": 3.2682442665100098, "lr": 9.453175493935809e-05, "tps": 77560, "wall": 19439.2} {"step": 23006, "train_loss": 3.23888897895813, "lr": 9.451801885464799e-05, "tps": 77544, "wall": 19444.2} {"step": 23007, "train_loss": 3.1927895545959473, "lr": 9.450428419140457e-05, "tps": 77528, "wall": 19449.1} {"step": 23008, "train_loss": 3.2638559341430664, "lr": 9.449055094978334e-05, "tps": 77511, "wall": 19454.1} {"step": 23009, "train_loss": 3.3372626304626465, "lr": 9.447681912993999e-05, "tps": 77495, "wall": 19459.0} {"step": 23010, "train_loss": 3.2680559158325195, "lr": 9.446308873203003e-05, "tps": 77478, "wall": 19464.0} {"step": 23011, "train_loss": 3.2599570751190186, "lr": 9.444935975620894e-05, "tps": 77462, "wall": 19469.0} {"step": 23012, "train_loss": 3.3894286155700684, "lr": 9.443563220263242e-05, "tps": 77446, "wall": 19473.9} {"step": 23013, "train_loss": 3.209015130996704, "lr": 9.442190607145571e-05, "tps": 77429, "wall": 19479.0} {"step": 23014, "train_loss": 3.24252986907959, "lr": 9.440818136283451e-05, "tps": 77413, "wall": 19484.0} {"step": 23015, "train_loss": 3.248326063156128, "lr": 9.439445807692423e-05, "tps": 77396, "wall": 19488.9} {"step": 23016, "train_loss": 3.2875895500183105, "lr": 9.438073621388027e-05, "tps": 77380, "wall": 19493.9} {"step": 23017, "train_loss": 3.256126880645752, "lr": 9.436701577385816e-05, "tps": 77363, "wall": 19498.9} {"step": 23018, "train_loss": 3.288832902908325, "lr": 9.435329675701331e-05, "tps": 77347, "wall": 19503.9} {"step": 23019, "train_loss": 3.340381622314453, "lr": 9.433957916350109e-05, "tps": 77331, "wall": 19508.8} {"step": 23020, "train_loss": 3.2577919960021973, "lr": 9.432586299347691e-05, "tps": 77314, "wall": 19513.8} {"step": 23021, "train_loss": 3.2081525325775146, "lr": 9.431214824709617e-05, "tps": 77298, "wall": 19518.8} {"step": 23022, "train_loss": 3.255197763442993, "lr": 9.429843492451418e-05, "tps": 77282, "wall": 19523.7} {"step": 23023, "train_loss": 3.2278428077697754, "lr": 9.428472302588636e-05, "tps": 77265, "wall": 19528.7} {"step": 23024, "train_loss": 3.153270721435547, "lr": 9.4271012551368e-05, "tps": 77249, "wall": 19533.7} {"step": 23025, "train_loss": 3.3014116287231445, "lr": 9.425730350111435e-05, "tps": 77233, "wall": 19538.7} {"step": 23026, "train_loss": 3.3105764389038086, "lr": 9.424359587528084e-05, "tps": 77216, "wall": 19543.7} {"step": 23027, "train_loss": 3.2041287422180176, "lr": 9.422988967402268e-05, "tps": 77200, "wall": 19548.7} {"step": 23028, "train_loss": 3.340264081954956, "lr": 9.421618489749507e-05, "tps": 77183, "wall": 19553.7} {"step": 23029, "train_loss": 3.3256583213806152, "lr": 9.420248154585337e-05, "tps": 77167, "wall": 19558.6} {"step": 23030, "train_loss": 3.320026397705078, "lr": 9.418877961925271e-05, "tps": 77151, "wall": 19563.6} {"step": 23031, "train_loss": 3.2491300106048584, "lr": 9.417507911784845e-05, "tps": 77135, "wall": 19568.6} {"step": 23032, "train_loss": 3.279284954071045, "lr": 9.416138004179565e-05, "tps": 77118, "wall": 19573.6} {"step": 23033, "train_loss": 3.1296305656433105, "lr": 9.414768239124951e-05, "tps": 77102, "wall": 19578.5} {"step": 23034, "train_loss": 3.3060617446899414, "lr": 9.41339861663653e-05, "tps": 77086, "wall": 19583.5} {"step": 23035, "train_loss": 3.3414087295532227, "lr": 9.41202913672981e-05, "tps": 77069, "wall": 19588.5} {"step": 23036, "train_loss": 3.269350051879883, "lr": 9.410659799420298e-05, "tps": 77053, "wall": 19593.5} {"step": 23037, "train_loss": 3.2502081394195557, "lr": 9.40929060472352e-05, "tps": 77037, "wall": 19598.6} {"step": 23038, "train_loss": 3.2295901775360107, "lr": 9.407921552654978e-05, "tps": 77021, "wall": 19603.5} {"step": 23039, "train_loss": 3.24692964553833, "lr": 9.406552643230175e-05, "tps": 77004, "wall": 19608.5} {"step": 23040, "train_loss": 3.2555480003356934, "lr": 9.405183876464633e-05, "tps": 76988, "wall": 19613.5} {"step": 23041, "train_loss": 3.2328858375549316, "lr": 9.403815252373848e-05, "tps": 76972, "wall": 19618.5} {"step": 23042, "train_loss": 3.264911651611328, "lr": 9.402446770973323e-05, "tps": 76956, "wall": 19623.5} {"step": 23043, "train_loss": 3.224501371383667, "lr": 9.401078432278564e-05, "tps": 76939, "wall": 19628.4} {"step": 23044, "train_loss": 3.181810140609741, "lr": 9.399710236305071e-05, "tps": 76923, "wall": 19633.4} {"step": 23045, "train_loss": 3.3060595989227295, "lr": 9.398342183068338e-05, "tps": 76907, "wall": 19638.4} {"step": 23046, "train_loss": 3.2495157718658447, "lr": 9.396974272583871e-05, "tps": 76891, "wall": 19643.4} {"step": 23047, "train_loss": 3.2898972034454346, "lr": 9.395606504867153e-05, "tps": 76875, "wall": 19648.3} {"step": 23048, "train_loss": 3.2965002059936523, "lr": 9.394238879933697e-05, "tps": 76859, "wall": 19653.3} {"step": 23049, "train_loss": 3.3955295085906982, "lr": 9.392871397798981e-05, "tps": 76842, "wall": 19658.4} {"step": 23050, "train_loss": 3.210233211517334, "lr": 9.391504058478497e-05, "tps": 76826, "wall": 19663.4} {"step": 23051, "train_loss": 3.168081760406494, "lr": 9.39013686198774e-05, "tps": 76810, "wall": 19668.4} {"step": 23052, "train_loss": 3.244011878967285, "lr": 9.388769808342198e-05, "tps": 76794, "wall": 19673.4} {"step": 23053, "train_loss": 3.240227222442627, "lr": 9.387402897557346e-05, "tps": 76778, "wall": 19678.4} {"step": 23054, "train_loss": 3.232398748397827, "lr": 9.386036129648683e-05, "tps": 76762, "wall": 19683.3} {"step": 23055, "train_loss": 3.259312391281128, "lr": 9.384669504631684e-05, "tps": 76745, "wall": 19688.3} {"step": 23056, "train_loss": 3.289579391479492, "lr": 9.383303022521826e-05, "tps": 76729, "wall": 19693.3} {"step": 23057, "train_loss": 3.2549805641174316, "lr": 9.381936683334601e-05, "tps": 76713, "wall": 19698.3} {"step": 23058, "train_loss": 3.293473958969116, "lr": 9.38057048708548e-05, "tps": 76697, "wall": 19703.3} {"step": 23059, "train_loss": 3.2492215633392334, "lr": 9.379204433789932e-05, "tps": 76681, "wall": 19708.3} {"step": 23060, "train_loss": 3.1580300331115723, "lr": 9.377838523463446e-05, "tps": 76665, "wall": 19713.3} {"step": 23061, "train_loss": 3.3514556884765625, "lr": 9.376472756121487e-05, "tps": 76649, "wall": 19718.3} {"step": 23062, "train_loss": 3.2317593097686768, "lr": 9.375107131779522e-05, "tps": 76633, "wall": 19723.3} {"step": 23063, "train_loss": 3.1605262756347656, "lr": 9.373741650453031e-05, "tps": 76616, "wall": 19728.3} {"step": 23064, "train_loss": 3.2817111015319824, "lr": 9.372376312157473e-05, "tps": 76600, "wall": 19733.3} {"step": 23065, "train_loss": 3.30814266204834, "lr": 9.371011116908325e-05, "tps": 76584, "wall": 19738.3} {"step": 23066, "train_loss": 3.1370813846588135, "lr": 9.369646064721049e-05, "tps": 76568, "wall": 19743.3} {"step": 23067, "train_loss": 3.3511035442352295, "lr": 9.368281155611094e-05, "tps": 76552, "wall": 19748.3} {"step": 23068, "train_loss": 3.216972589492798, "lr": 9.366916389593942e-05, "tps": 76536, "wall": 19753.3} {"step": 23069, "train_loss": 3.273970127105713, "lr": 9.365551766685045e-05, "tps": 76520, "wall": 19758.3} {"step": 23070, "train_loss": 3.2656707763671875, "lr": 9.364187286899856e-05, "tps": 76504, "wall": 19763.3} {"step": 23071, "train_loss": 3.204153299331665, "lr": 9.362822950253844e-05, "tps": 76488, "wall": 19768.3} {"step": 23072, "train_loss": 3.152576446533203, "lr": 9.361458756762455e-05, "tps": 76472, "wall": 19773.3} {"step": 23073, "train_loss": 3.3446059226989746, "lr": 9.360094706441139e-05, "tps": 76456, "wall": 19778.3} {"step": 23074, "train_loss": 3.1050479412078857, "lr": 9.358730799305361e-05, "tps": 76440, "wall": 19783.3} {"step": 23075, "train_loss": 3.273426055908203, "lr": 9.357367035370562e-05, "tps": 76424, "wall": 19788.3} {"step": 23076, "train_loss": 3.2083194255828857, "lr": 9.35600341465219e-05, "tps": 76408, "wall": 19793.3} {"step": 23077, "train_loss": 3.266608238220215, "lr": 9.3546399371657e-05, "tps": 76392, "wall": 19798.3} {"step": 23078, "train_loss": 3.238940954208374, "lr": 9.353276602926533e-05, "tps": 76376, "wall": 19803.3} {"step": 23079, "train_loss": 3.281628370285034, "lr": 9.351913411950127e-05, "tps": 76360, "wall": 19808.3} {"step": 23080, "train_loss": 3.223343849182129, "lr": 9.350550364251937e-05, "tps": 76344, "wall": 19813.3} {"step": 23081, "train_loss": 3.2359211444854736, "lr": 9.349187459847394e-05, "tps": 76328, "wall": 19818.3} {"step": 23082, "train_loss": 3.291095733642578, "lr": 9.347824698751937e-05, "tps": 76312, "wall": 19823.3} {"step": 23083, "train_loss": 3.2563252449035645, "lr": 9.34646208098101e-05, "tps": 76296, "wall": 19828.2} {"step": 23084, "train_loss": 3.3139100074768066, "lr": 9.34509960655004e-05, "tps": 76280, "wall": 19833.2} {"step": 23085, "train_loss": 3.1989831924438477, "lr": 9.343737275474473e-05, "tps": 76264, "wall": 19838.3} {"step": 23086, "train_loss": 3.173309326171875, "lr": 9.342375087769736e-05, "tps": 76248, "wall": 19843.3} {"step": 23087, "train_loss": 3.217299699783325, "lr": 9.34101304345125e-05, "tps": 76232, "wall": 19848.3} {"step": 23088, "train_loss": 3.1777422428131104, "lr": 9.339651142534459e-05, "tps": 76217, "wall": 19853.3} {"step": 23089, "train_loss": 3.230462074279785, "lr": 9.338289385034786e-05, "tps": 76201, "wall": 19858.3} {"step": 23090, "train_loss": 3.240365743637085, "lr": 9.33692777096765e-05, "tps": 76184, "wall": 19863.4} {"step": 23091, "train_loss": 3.189673900604248, "lr": 9.335566300348488e-05, "tps": 76168, "wall": 19868.5} {"step": 23092, "train_loss": 3.056304693222046, "lr": 9.334204973192714e-05, "tps": 76152, "wall": 19873.5} {"step": 23093, "train_loss": 3.2725830078125, "lr": 9.332843789515746e-05, "tps": 76136, "wall": 19878.6} {"step": 23094, "train_loss": 3.2342543601989746, "lr": 9.331482749333016e-05, "tps": 76120, "wall": 19883.7} {"step": 23095, "train_loss": 3.1929855346679688, "lr": 9.330121852659933e-05, "tps": 76104, "wall": 19888.8} {"step": 23096, "train_loss": 3.281129837036133, "lr": 9.32876109951191e-05, "tps": 76087, "wall": 19893.9} {"step": 23097, "train_loss": 3.1161913871765137, "lr": 9.327400489904374e-05, "tps": 76071, "wall": 19899.2} {"step": 23098, "train_loss": 3.311535120010376, "lr": 9.32604002385273e-05, "tps": 76054, "wall": 19904.3} {"step": 23099, "train_loss": 3.210512399673462, "lr": 9.324679701372383e-05, "tps": 76038, "wall": 19909.5} {"step": 23100, "train_loss": 3.2108941078186035, "lr": 9.323319522478756e-05, "tps": 76021, "wall": 19914.6} {"step": 23101, "train_loss": 3.2148022651672363, "lr": 9.321959487187247e-05, "tps": 76005, "wall": 19919.8} {"step": 23102, "train_loss": 3.3600645065307617, "lr": 9.320599595513271e-05, "tps": 75989, "wall": 19924.9} {"step": 23103, "train_loss": 3.180677890777588, "lr": 9.319239847472229e-05, "tps": 75972, "wall": 19930.1} {"step": 23104, "train_loss": 3.264772415161133, "lr": 9.31788024307952e-05, "tps": 75956, "wall": 19935.3} {"step": 23105, "train_loss": 3.219369411468506, "lr": 9.316520782350555e-05, "tps": 75939, "wall": 19940.4} {"step": 23106, "train_loss": 3.2290568351745605, "lr": 9.315161465300727e-05, "tps": 75923, "wall": 19945.6} {"step": 23107, "train_loss": 3.2302956581115723, "lr": 9.313802291945431e-05, "tps": 75907, "wall": 19950.8} {"step": 23108, "train_loss": 3.3825631141662598, "lr": 9.312443262300078e-05, "tps": 75890, "wall": 19956.1} {"step": 23109, "train_loss": 3.215409278869629, "lr": 9.31108437638005e-05, "tps": 75873, "wall": 19961.2} {"step": 23110, "train_loss": 3.351588010787964, "lr": 9.30972563420074e-05, "tps": 75857, "wall": 19966.4} {"step": 23111, "train_loss": 3.2662837505340576, "lr": 9.30836703577755e-05, "tps": 75841, "wall": 19971.6} {"step": 23112, "train_loss": 3.2629966735839844, "lr": 9.307008581125865e-05, "tps": 75824, "wall": 19976.8} {"step": 23113, "train_loss": 3.284970760345459, "lr": 9.305650270261068e-05, "tps": 75808, "wall": 19982.0} {"step": 23114, "train_loss": 3.1673619747161865, "lr": 9.304292103198558e-05, "tps": 75792, "wall": 19987.1} {"step": 23115, "train_loss": 3.2262423038482666, "lr": 9.302934079953713e-05, "tps": 75775, "wall": 19992.3} {"step": 23116, "train_loss": 3.2445390224456787, "lr": 9.301576200541912e-05, "tps": 75759, "wall": 19997.5} {"step": 23117, "train_loss": 3.3487086296081543, "lr": 9.30021846497855e-05, "tps": 75743, "wall": 20002.6} {"step": 23118, "train_loss": 3.2489466667175293, "lr": 9.298860873278998e-05, "tps": 75726, "wall": 20007.8} {"step": 23119, "train_loss": 3.1615545749664307, "lr": 9.297503425458632e-05, "tps": 75710, "wall": 20013.0} {"step": 23120, "train_loss": 3.1742262840270996, "lr": 9.29614612153284e-05, "tps": 75693, "wall": 20018.2} {"step": 23121, "train_loss": 3.3160297870635986, "lr": 9.294788961516986e-05, "tps": 75677, "wall": 20023.4} {"step": 23122, "train_loss": 3.2758946418762207, "lr": 9.293431945426457e-05, "tps": 75661, "wall": 20028.7} {"step": 23123, "train_loss": 3.2114248275756836, "lr": 9.292075073276617e-05, "tps": 75644, "wall": 20033.8} {"step": 23124, "train_loss": 3.2985386848449707, "lr": 9.290718345082834e-05, "tps": 75628, "wall": 20039.0} {"step": 23125, "train_loss": 3.2535645961761475, "lr": 9.289361760860485e-05, "tps": 75612, "wall": 20044.2} {"step": 23126, "train_loss": 3.253366470336914, "lr": 9.288005320624936e-05, "tps": 75595, "wall": 20049.4} {"step": 23127, "train_loss": 3.280282497406006, "lr": 9.286649024391542e-05, "tps": 75579, "wall": 20054.6} {"step": 23128, "train_loss": 3.2324485778808594, "lr": 9.285292872175683e-05, "tps": 75563, "wall": 20059.8} {"step": 23129, "train_loss": 3.393017292022705, "lr": 9.283936863992712e-05, "tps": 75546, "wall": 20065.0} {"step": 23130, "train_loss": 3.307879686355591, "lr": 9.282580999857991e-05, "tps": 75530, "wall": 20070.2} {"step": 23131, "train_loss": 3.318528175354004, "lr": 9.281225279786883e-05, "tps": 75514, "wall": 20075.4} {"step": 23132, "train_loss": 3.1875202655792236, "lr": 9.279869703794741e-05, "tps": 75497, "wall": 20080.7} {"step": 23133, "train_loss": 3.2980518341064453, "lr": 9.278514271896921e-05, "tps": 75481, "wall": 20086.0} {"step": 23134, "train_loss": 3.270832061767578, "lr": 9.277158984108785e-05, "tps": 75464, "wall": 20091.2} {"step": 23135, "train_loss": 3.2530622482299805, "lr": 9.275803840445679e-05, "tps": 75448, "wall": 20096.4} {"step": 23136, "train_loss": 3.3468575477600098, "lr": 9.27444884092295e-05, "tps": 75431, "wall": 20101.6} {"step": 23137, "train_loss": 3.213170051574707, "lr": 9.273093985555959e-05, "tps": 75415, "wall": 20106.9} {"step": 23138, "train_loss": 3.286212921142578, "lr": 9.271739274360043e-05, "tps": 75399, "wall": 20112.1} {"step": 23139, "train_loss": 3.2985010147094727, "lr": 9.270384707350557e-05, "tps": 75382, "wall": 20117.4} {"step": 23140, "train_loss": 3.2616467475891113, "lr": 9.269030284542842e-05, "tps": 75366, "wall": 20122.6} {"step": 23141, "train_loss": 3.3019731044769287, "lr": 9.267676005952236e-05, "tps": 75350, "wall": 20127.8} {"step": 23142, "train_loss": 3.3337578773498535, "lr": 9.266321871594091e-05, "tps": 75333, "wall": 20133.1} {"step": 23143, "train_loss": 3.2550973892211914, "lr": 9.264967881483738e-05, "tps": 75316, "wall": 20138.4} {"step": 23144, "train_loss": 3.283456563949585, "lr": 9.263614035636515e-05, "tps": 75300, "wall": 20143.7} {"step": 23145, "train_loss": 3.2845280170440674, "lr": 9.262260334067767e-05, "tps": 75284, "wall": 20149.0} {"step": 23146, "train_loss": 3.183664321899414, "lr": 9.26090677679282e-05, "tps": 75267, "wall": 20154.2} {"step": 23147, "train_loss": 3.1871862411499023, "lr": 9.259553363827008e-05, "tps": 75251, "wall": 20159.4} {"step": 23148, "train_loss": 3.3523006439208984, "lr": 9.258200095185669e-05, "tps": 75235, "wall": 20164.6} {"step": 23149, "train_loss": 3.1953630447387695, "lr": 9.256846970884129e-05, "tps": 75219, "wall": 20169.8} {"step": 23150, "train_loss": 3.321863889694214, "lr": 9.255493990937708e-05, "tps": 75203, "wall": 20175.0} {"step": 23151, "train_loss": 3.2397332191467285, "lr": 9.254141155361747e-05, "tps": 75186, "wall": 20180.3} {"step": 23152, "train_loss": 3.236616611480713, "lr": 9.252788464171565e-05, "tps": 75170, "wall": 20185.5} {"step": 23153, "train_loss": 3.118241786956787, "lr": 9.251435917382481e-05, "tps": 75154, "wall": 20190.7} {"step": 23154, "train_loss": 3.2551090717315674, "lr": 9.250083515009826e-05, "tps": 75137, "wall": 20196.0} {"step": 23155, "train_loss": 3.298953056335449, "lr": 9.248731257068907e-05, "tps": 75121, "wall": 20201.3} {"step": 23156, "train_loss": 3.227238178253174, "lr": 9.247379143575057e-05, "tps": 75105, "wall": 20206.5} {"step": 23157, "train_loss": 3.159268856048584, "lr": 9.246027174543588e-05, "tps": 75089, "wall": 20211.7} {"step": 23158, "train_loss": 3.2948455810546875, "lr": 9.244675349989804e-05, "tps": 75073, "wall": 20217.0} {"step": 23159, "train_loss": 3.3229997158050537, "lr": 9.243323669929035e-05, "tps": 75056, "wall": 20222.2} {"step": 23160, "train_loss": 3.2912344932556152, "lr": 9.241972134376586e-05, "tps": 75040, "wall": 20227.4} {"step": 23161, "train_loss": 3.2428462505340576, "lr": 9.24062074334776e-05, "tps": 75024, "wall": 20232.6} {"step": 23162, "train_loss": 3.253422260284424, "lr": 9.239269496857877e-05, "tps": 75008, "wall": 20237.8} {"step": 23163, "train_loss": 3.1831140518188477, "lr": 9.237918394922242e-05, "tps": 74992, "wall": 20243.1} {"step": 23164, "train_loss": 3.2593531608581543, "lr": 9.236567437556151e-05, "tps": 74976, "wall": 20248.3} {"step": 23165, "train_loss": 3.3145499229431152, "lr": 9.23521662477492e-05, "tps": 74960, "wall": 20253.5} {"step": 23166, "train_loss": 3.162449836730957, "lr": 9.233865956593847e-05, "tps": 74943, "wall": 20258.8} {"step": 23167, "train_loss": 3.243131637573242, "lr": 9.232515433028225e-05, "tps": 74927, "wall": 20264.1} {"step": 23168, "train_loss": 3.1429405212402344, "lr": 9.231165054093363e-05, "tps": 74911, "wall": 20269.3} {"step": 23169, "train_loss": 3.282151222229004, "lr": 9.229814819804555e-05, "tps": 74895, "wall": 20274.6} {"step": 23170, "train_loss": 3.2156896591186523, "lr": 9.228464730177089e-05, "tps": 74879, "wall": 20279.8} {"step": 23171, "train_loss": 3.2431411743164062, "lr": 9.227114785226273e-05, "tps": 74863, "wall": 20285.0} {"step": 23172, "train_loss": 3.173872709274292, "lr": 9.225764984967392e-05, "tps": 74847, "wall": 20290.2} {"step": 23173, "train_loss": 3.2633814811706543, "lr": 9.224415329415728e-05, "tps": 74831, "wall": 20295.4} {"step": 23174, "train_loss": 3.2102560997009277, "lr": 9.223065818586587e-05, "tps": 74815, "wall": 20300.6} {"step": 23175, "train_loss": 3.223637580871582, "lr": 9.221716452495239e-05, "tps": 74799, "wall": 20305.9} {"step": 23176, "train_loss": 3.272371768951416, "lr": 9.220367231156987e-05, "tps": 74783, "wall": 20311.1} {"step": 23177, "train_loss": 3.2325706481933594, "lr": 9.219018154587105e-05, "tps": 74766, "wall": 20316.4} {"step": 23178, "train_loss": 3.1979684829711914, "lr": 9.217669222800871e-05, "tps": 74750, "wall": 20321.7} {"step": 23179, "train_loss": 3.241720199584961, "lr": 9.216320435813577e-05, "tps": 74734, "wall": 20326.9} {"step": 23180, "train_loss": 3.22993803024292, "lr": 9.214971793640496e-05, "tps": 74718, "wall": 20332.1} {"step": 23181, "train_loss": 3.242687463760376, "lr": 9.213623296296907e-05, "tps": 74702, "wall": 20337.4} {"step": 23182, "train_loss": 3.3012020587921143, "lr": 9.212274943798085e-05, "tps": 74686, "wall": 20342.6} {"step": 23183, "train_loss": 3.1898062229156494, "lr": 9.210926736159298e-05, "tps": 74670, "wall": 20347.8} {"step": 23184, "train_loss": 3.251864433288574, "lr": 9.209578673395833e-05, "tps": 74654, "wall": 20353.0} {"step": 23185, "train_loss": 3.218233585357666, "lr": 9.208230755522951e-05, "tps": 74638, "wall": 20358.2} {"step": 23186, "train_loss": 3.2757833003997803, "lr": 9.206882982555915e-05, "tps": 74623, "wall": 20363.5} {"step": 23187, "train_loss": 3.300079107284546, "lr": 9.20553535451001e-05, "tps": 74606, "wall": 20368.7} {"step": 23188, "train_loss": 3.2896928787231445, "lr": 9.204187871400492e-05, "tps": 74591, "wall": 20374.0} {"step": 23189, "train_loss": 3.242745876312256, "lr": 9.202840533242619e-05, "tps": 74574, "wall": 20379.2} {"step": 23190, "train_loss": 3.257129192352295, "lr": 9.201493340051667e-05, "tps": 74558, "wall": 20384.5} {"step": 23191, "train_loss": 3.1836440563201904, "lr": 9.20014629184289e-05, "tps": 74542, "wall": 20389.7} {"step": 23192, "train_loss": 3.2517592906951904, "lr": 9.198799388631542e-05, "tps": 74527, "wall": 20395.0} {"step": 23193, "train_loss": 3.2352850437164307, "lr": 9.197452630432896e-05, "tps": 74511, "wall": 20400.2} {"step": 23194, "train_loss": 3.279022693634033, "lr": 9.196106017262197e-05, "tps": 74495, "wall": 20405.5} {"step": 23195, "train_loss": 3.308093786239624, "lr": 9.194759549134697e-05, "tps": 74479, "wall": 20410.7} {"step": 23196, "train_loss": 3.2388949394226074, "lr": 9.193413226065657e-05, "tps": 74463, "wall": 20415.9} {"step": 23197, "train_loss": 3.269360065460205, "lr": 9.192067048070323e-05, "tps": 74447, "wall": 20421.2} {"step": 23198, "train_loss": 3.238553524017334, "lr": 9.190721015163948e-05, "tps": 74431, "wall": 20426.4} {"step": 23199, "train_loss": 3.330798387527466, "lr": 9.18937512736178e-05, "tps": 74415, "wall": 20431.6} {"step": 23200, "train_loss": 3.2360548973083496, "lr": 9.18802938467906e-05, "tps": 74399, "wall": 20437.0} {"step": 23201, "train_loss": 3.3396596908569336, "lr": 9.18668378713104e-05, "tps": 74383, "wall": 20442.2} {"step": 23202, "train_loss": 3.3236379623413086, "lr": 9.185338334732958e-05, "tps": 74367, "wall": 20447.5} {"step": 23203, "train_loss": 3.223550796508789, "lr": 9.183993027500052e-05, "tps": 74351, "wall": 20452.7} {"step": 23204, "train_loss": 3.235795497894287, "lr": 9.182647865447573e-05, "tps": 74336, "wall": 20457.9} {"step": 23205, "train_loss": 3.257187843322754, "lr": 9.181302848590752e-05, "tps": 74320, "wall": 20463.2} {"step": 23206, "train_loss": 3.303713798522949, "lr": 9.17995797694482e-05, "tps": 74304, "wall": 20468.4} {"step": 23207, "train_loss": 3.228933334350586, "lr": 9.178613250525021e-05, "tps": 74288, "wall": 20473.6} {"step": 23208, "train_loss": 3.231964588165283, "lr": 9.177268669346589e-05, "tps": 74272, "wall": 20478.9} {"step": 23209, "train_loss": 3.3115930557250977, "lr": 9.175924233424741e-05, "tps": 74257, "wall": 20484.1} {"step": 23210, "train_loss": 3.2980735301971436, "lr": 9.174579942774725e-05, "tps": 74241, "wall": 20489.4} {"step": 23211, "train_loss": 3.2504286766052246, "lr": 9.173235797411762e-05, "tps": 74225, "wall": 20494.6} {"step": 23212, "train_loss": 3.321408987045288, "lr": 9.17189179735107e-05, "tps": 74209, "wall": 20499.9} {"step": 23213, "train_loss": 3.215003252029419, "lr": 9.170547942607889e-05, "tps": 74193, "wall": 20505.1} {"step": 23214, "train_loss": 3.2279229164123535, "lr": 9.169204233197435e-05, "tps": 74178, "wall": 20510.4} {"step": 23215, "train_loss": 3.2772960662841797, "lr": 9.167860669134923e-05, "tps": 74162, "wall": 20515.6} {"step": 23216, "train_loss": 3.2604312896728516, "lr": 9.166517250435586e-05, "tps": 74146, "wall": 20520.8} {"step": 23217, "train_loss": 3.3744020462036133, "lr": 9.165173977114631e-05, "tps": 74131, "wall": 20526.0} {"step": 23218, "train_loss": 3.2381057739257812, "lr": 9.163830849187284e-05, "tps": 74115, "wall": 20531.3} {"step": 23219, "train_loss": 3.270683526992798, "lr": 9.162487866668755e-05, "tps": 74099, "wall": 20536.5} {"step": 23220, "train_loss": 3.164527654647827, "lr": 9.161145029574255e-05, "tps": 74083, "wall": 20541.7} {"step": 23221, "train_loss": 3.2425613403320312, "lr": 9.159802337919001e-05, "tps": 74068, "wall": 20547.0} {"step": 23222, "train_loss": 3.301396369934082, "lr": 9.158459791718203e-05, "tps": 74052, "wall": 20552.2} {"step": 23223, "train_loss": 3.300306797027588, "lr": 9.15711739098706e-05, "tps": 74036, "wall": 20557.5} {"step": 23224, "train_loss": 3.198946475982666, "lr": 9.155775135740791e-05, "tps": 74020, "wall": 20562.8} {"step": 23225, "train_loss": 3.1947691440582275, "lr": 9.154433025994598e-05, "tps": 74005, "wall": 20568.0} {"step": 23226, "train_loss": 3.268078088760376, "lr": 9.153091061763676e-05, "tps": 73989, "wall": 20573.2} {"step": 23227, "train_loss": 3.2946105003356934, "lr": 9.151749243063242e-05, "tps": 73973, "wall": 20578.5} {"step": 23228, "train_loss": 3.2887516021728516, "lr": 9.150407569908483e-05, "tps": 73958, "wall": 20583.7} {"step": 23229, "train_loss": 3.2538604736328125, "lr": 9.149066042314599e-05, "tps": 73942, "wall": 20588.9} {"step": 23230, "train_loss": 3.1224777698516846, "lr": 9.147724660296796e-05, "tps": 73927, "wall": 20594.1} {"step": 23231, "train_loss": 3.29133939743042, "lr": 9.146383423870262e-05, "tps": 73911, "wall": 20599.3} {"step": 23232, "train_loss": 3.1887471675872803, "lr": 9.145042333050187e-05, "tps": 73896, "wall": 20604.6} {"step": 23233, "train_loss": 3.247087240219116, "lr": 9.143701387851773e-05, "tps": 73880, "wall": 20609.8} {"step": 23234, "train_loss": 3.239025831222534, "lr": 9.1423605882902e-05, "tps": 73864, "wall": 20615.0} {"step": 23235, "train_loss": 3.244962215423584, "lr": 9.14101993438067e-05, "tps": 73849, "wall": 20620.4} {"step": 23236, "train_loss": 3.190655469894409, "lr": 9.13967942613836e-05, "tps": 73833, "wall": 20625.6} {"step": 23237, "train_loss": 3.2674694061279297, "lr": 9.138339063578449e-05, "tps": 73817, "wall": 20630.9} {"step": 23238, "train_loss": 3.3053832054138184, "lr": 9.136998846716137e-05, "tps": 73802, "wall": 20636.2} {"step": 23239, "train_loss": 3.2436015605926514, "lr": 9.135658775566598e-05, "tps": 73786, "wall": 20641.4} {"step": 23240, "train_loss": 3.24851655960083, "lr": 9.134318850145005e-05, "tps": 73770, "wall": 20646.6} {"step": 23241, "train_loss": 3.2917661666870117, "lr": 9.132979070466553e-05, "tps": 73755, "wall": 20651.9} {"step": 23242, "train_loss": 3.179868221282959, "lr": 9.131639436546406e-05, "tps": 73739, "wall": 20657.1} {"step": 23243, "train_loss": 3.2671000957489014, "lr": 9.130299948399741e-05, "tps": 73724, "wall": 20662.3} {"step": 23244, "train_loss": 3.238438129425049, "lr": 9.12896060604174e-05, "tps": 73709, "wall": 20667.5} {"step": 23245, "train_loss": 3.2952325344085693, "lr": 9.127621409487568e-05, "tps": 73693, "wall": 20672.8} {"step": 23246, "train_loss": 3.1644749641418457, "lr": 9.126282358752393e-05, "tps": 73677, "wall": 20678.1} {"step": 23247, "train_loss": 3.2574045658111572, "lr": 9.124943453851392e-05, "tps": 73662, "wall": 20683.3} {"step": 23248, "train_loss": 3.2353575229644775, "lr": 9.12360469479973e-05, "tps": 73647, "wall": 20688.5} {"step": 23249, "train_loss": 3.2100493907928467, "lr": 9.122266081612563e-05, "tps": 73631, "wall": 20693.7} {"step": 23250, "train_loss": 3.245680093765259, "lr": 9.120927614305069e-05, "tps": 73616, "wall": 20699.0} {"step": 23251, "train_loss": 3.1543307304382324, "lr": 9.119589292892397e-05, "tps": 73600, "wall": 20704.2} {"step": 23252, "train_loss": 3.300447463989258, "lr": 9.11825111738972e-05, "tps": 73585, "wall": 20709.4} {"step": 23253, "train_loss": 3.283635139465332, "lr": 9.116913087812193e-05, "tps": 73569, "wall": 20714.7} {"step": 23254, "train_loss": 3.2884597778320312, "lr": 9.115575204174965e-05, "tps": 73554, "wall": 20719.9} {"step": 23255, "train_loss": 3.18757963180542, "lr": 9.114237466493204e-05, "tps": 73538, "wall": 20725.1} {"step": 23256, "train_loss": 3.278498649597168, "lr": 9.112899874782057e-05, "tps": 73523, "wall": 20730.3} {"step": 23257, "train_loss": 3.255133867263794, "lr": 9.111562429056672e-05, "tps": 73508, "wall": 20735.6} {"step": 23258, "train_loss": 3.2518601417541504, "lr": 9.110225129332213e-05, "tps": 73492, "wall": 20740.9} {"step": 23259, "train_loss": 3.345018148422241, "lr": 9.108887975623819e-05, "tps": 73477, "wall": 20746.1} {"step": 23260, "train_loss": 3.335402727127075, "lr": 9.107550967946635e-05, "tps": 73461, "wall": 20751.4} {"step": 23261, "train_loss": 3.222198486328125, "lr": 9.106214106315815e-05, "tps": 73446, "wall": 20756.6} {"step": 23262, "train_loss": 3.257708787918091, "lr": 9.104877390746501e-05, "tps": 73431, "wall": 20761.8} {"step": 23263, "train_loss": 3.207176446914673, "lr": 9.103540821253826e-05, "tps": 73415, "wall": 20767.0} {"step": 23264, "train_loss": 3.127803325653076, "lr": 9.102204397852945e-05, "tps": 73400, "wall": 20772.3} {"step": 23265, "train_loss": 3.16035795211792, "lr": 9.10086812055899e-05, "tps": 73385, "wall": 20777.5} {"step": 23266, "train_loss": 3.333106756210327, "lr": 9.099531989387092e-05, "tps": 73369, "wall": 20782.7} {"step": 23267, "train_loss": 3.3683958053588867, "lr": 9.098196004352402e-05, "tps": 73354, "wall": 20787.9} {"step": 23268, "train_loss": 3.186213970184326, "lr": 9.096860165470044e-05, "tps": 73339, "wall": 20793.2} {"step": 23269, "train_loss": 3.205827236175537, "lr": 9.095524472755146e-05, "tps": 73323, "wall": 20798.5} {"step": 23270, "train_loss": 3.1033248901367188, "lr": 9.094188926222852e-05, "tps": 73308, "wall": 20803.7} {"step": 23271, "train_loss": 3.2521564960479736, "lr": 9.092853525888277e-05, "tps": 73293, "wall": 20808.9} {"step": 23272, "train_loss": 3.290334701538086, "lr": 9.091518271766563e-05, "tps": 73277, "wall": 20814.2} {"step": 23273, "train_loss": 3.2576944828033447, "lr": 9.090183163872826e-05, "tps": 73262, "wall": 20819.4} {"step": 23274, "train_loss": 3.2284998893737793, "lr": 9.088848202222189e-05, "tps": 73247, "wall": 20824.6} {"step": 23275, "train_loss": 3.2689783573150635, "lr": 9.087513386829781e-05, "tps": 73232, "wall": 20829.8} {"step": 23276, "train_loss": 3.200531005859375, "lr": 9.086178717710724e-05, "tps": 73217, "wall": 20835.0} {"step": 23277, "train_loss": 3.278736114501953, "lr": 9.084844194880123e-05, "tps": 73201, "wall": 20840.3} {"step": 23278, "train_loss": 3.3214478492736816, "lr": 9.083509818353114e-05, "tps": 73186, "wall": 20845.5} {"step": 23279, "train_loss": 3.212398052215576, "lr": 9.082175588144804e-05, "tps": 73171, "wall": 20850.8} {"step": 23280, "train_loss": 3.2659006118774414, "lr": 9.080841504270301e-05, "tps": 73155, "wall": 20856.1} {"step": 23281, "train_loss": 3.2741026878356934, "lr": 9.079507566744731e-05, "tps": 73140, "wall": 20861.3} {"step": 23282, "train_loss": 3.2680115699768066, "lr": 9.078173775583198e-05, "tps": 73125, "wall": 20866.6} {"step": 23283, "train_loss": 3.283533811569214, "lr": 9.076840130800806e-05, "tps": 73110, "wall": 20871.8} {"step": 23284, "train_loss": 3.1366868019104004, "lr": 9.075506632412675e-05, "tps": 73095, "wall": 20877.0} {"step": 23285, "train_loss": 3.1895716190338135, "lr": 9.074173280433902e-05, "tps": 73079, "wall": 20882.2} {"step": 23286, "train_loss": 3.264998197555542, "lr": 9.07284007487959e-05, "tps": 73064, "wall": 20887.5} {"step": 23287, "train_loss": 3.369718074798584, "lr": 9.071507015764849e-05, "tps": 73049, "wall": 20892.7} {"step": 23288, "train_loss": 3.2367336750030518, "lr": 9.070174103104772e-05, "tps": 73034, "wall": 20897.9} {"step": 23289, "train_loss": 3.245745897293091, "lr": 9.068841336914463e-05, "tps": 73019, "wall": 20903.2} {"step": 23290, "train_loss": 3.196507215499878, "lr": 9.067508717209025e-05, "tps": 73004, "wall": 20908.4} {"step": 23291, "train_loss": 3.2947139739990234, "lr": 9.066176244003539e-05, "tps": 72988, "wall": 20913.6} {"step": 23292, "train_loss": 3.3081908226013184, "lr": 9.064843917313113e-05, "tps": 72973, "wall": 20919.0} {"step": 23293, "train_loss": 3.1611533164978027, "lr": 9.063511737152836e-05, "tps": 72958, "wall": 20924.2} {"step": 23294, "train_loss": 3.238394260406494, "lr": 9.062179703537794e-05, "tps": 72943, "wall": 20929.4} {"step": 23295, "train_loss": 3.3110368251800537, "lr": 9.060847816483085e-05, "tps": 72928, "wall": 20934.6} {"step": 23296, "train_loss": 3.3461194038391113, "lr": 9.059516076003791e-05, "tps": 72913, "wall": 20939.8} {"step": 23297, "train_loss": 3.2472496032714844, "lr": 9.058184482114995e-05, "tps": 72898, "wall": 20945.1} {"step": 23298, "train_loss": 3.230473518371582, "lr": 9.056853034831788e-05, "tps": 72883, "wall": 20950.3} {"step": 23299, "train_loss": 3.2735354900360107, "lr": 9.055521734169254e-05, "tps": 72868, "wall": 20955.5} {"step": 23300, "train_loss": 3.2253501415252686, "lr": 9.054190580142462e-05, "tps": 72853, "wall": 20960.7} {"step": 23301, "train_loss": 3.2784128189086914, "lr": 9.052859572766503e-05, "tps": 72838, "wall": 20965.9} {"step": 23302, "train_loss": 3.3216159343719482, "lr": 9.051528712056456e-05, "tps": 72823, "wall": 20971.2} {"step": 23303, "train_loss": 3.316803216934204, "lr": 9.050197998027382e-05, "tps": 72807, "wall": 20976.5} {"step": 23304, "train_loss": 3.2060837745666504, "lr": 9.048867430694373e-05, "tps": 72792, "wall": 20981.7} {"step": 23305, "train_loss": 3.237006187438965, "lr": 9.047537010072489e-05, "tps": 72777, "wall": 20987.0} {"step": 23306, "train_loss": 3.311711072921753, "lr": 9.046206736176812e-05, "tps": 72762, "wall": 20992.2} {"step": 23307, "train_loss": 3.2372984886169434, "lr": 9.044876609022407e-05, "tps": 72747, "wall": 20997.4} {"step": 23308, "train_loss": 3.2950568199157715, "lr": 9.043546628624334e-05, "tps": 72732, "wall": 21002.6} {"step": 23309, "train_loss": 3.317605972290039, "lr": 9.042216794997672e-05, "tps": 72717, "wall": 21007.8} {"step": 23310, "train_loss": 3.200269937515259, "lr": 9.040887108157477e-05, "tps": 72702, "wall": 21013.1} {"step": 23311, "train_loss": 3.306424140930176, "lr": 9.039557568118812e-05, "tps": 72687, "wall": 21018.3} {"step": 23312, "train_loss": 3.27040433883667, "lr": 9.038228174896744e-05, "tps": 72672, "wall": 21023.5} {"step": 23313, "train_loss": 3.259298324584961, "lr": 9.036898928506328e-05, "tps": 72658, "wall": 21028.7} {"step": 23314, "train_loss": 3.3045268058776855, "lr": 9.035569828962615e-05, "tps": 72643, "wall": 21034.0} {"step": 23315, "train_loss": 3.2730250358581543, "lr": 9.034240876280675e-05, "tps": 72627, "wall": 21039.3} {"step": 23316, "train_loss": 3.2093863487243652, "lr": 9.032912070475555e-05, "tps": 72612, "wall": 21044.5} {"step": 23317, "train_loss": 3.3432254791259766, "lr": 9.031583411562307e-05, "tps": 72597, "wall": 21049.8} {"step": 23318, "train_loss": 3.2850146293640137, "lr": 9.030254899555987e-05, "tps": 72582, "wall": 21055.0} {"step": 23319, "train_loss": 3.221841812133789, "lr": 9.02892653447164e-05, "tps": 72567, "wall": 21060.3} {"step": 23320, "train_loss": 3.2550129890441895, "lr": 9.027598316324312e-05, "tps": 72552, "wall": 21065.5} {"step": 23321, "train_loss": 3.3075878620147705, "lr": 9.026270245129055e-05, "tps": 72538, "wall": 21070.7} {"step": 23322, "train_loss": 3.2820820808410645, "lr": 9.024942320900909e-05, "tps": 72523, "wall": 21076.0} {"step": 23323, "train_loss": 3.3211703300476074, "lr": 9.023614543654915e-05, "tps": 72508, "wall": 21081.2} {"step": 23324, "train_loss": 3.2743635177612305, "lr": 9.022286913406125e-05, "tps": 72493, "wall": 21086.4} {"step": 23325, "train_loss": 3.2172155380249023, "lr": 9.020959430169563e-05, "tps": 72478, "wall": 21091.7} {"step": 23326, "train_loss": 3.167175054550171, "lr": 9.01963209396028e-05, "tps": 72463, "wall": 21097.0} {"step": 23327, "train_loss": 3.292896270751953, "lr": 9.018304904793309e-05, "tps": 72448, "wall": 21102.2} {"step": 23328, "train_loss": 3.290435314178467, "lr": 9.016977862683675e-05, "tps": 72433, "wall": 21107.5} {"step": 23329, "train_loss": 3.2483415603637695, "lr": 9.015650967646422e-05, "tps": 72418, "wall": 21112.7} {"step": 23330, "train_loss": 3.138319969177246, "lr": 9.014324219696582e-05, "tps": 72403, "wall": 21118.0} {"step": 23331, "train_loss": 3.2204999923706055, "lr": 9.01299761884917e-05, "tps": 72388, "wall": 21123.2} {"step": 23332, "train_loss": 3.315786838531494, "lr": 9.011671165119231e-05, "tps": 72374, "wall": 21128.4} {"step": 23333, "train_loss": 3.2449166774749756, "lr": 9.010344858521784e-05, "tps": 72359, "wall": 21133.6} {"step": 23334, "train_loss": 3.3086161613464355, "lr": 9.009018699071847e-05, "tps": 72344, "wall": 21138.9} {"step": 23335, "train_loss": 3.377765655517578, "lr": 9.007692686784454e-05, "tps": 72329, "wall": 21144.1} {"step": 23336, "train_loss": 3.2876780033111572, "lr": 9.006366821674623e-05, "tps": 72314, "wall": 21149.4} {"step": 23337, "train_loss": 3.1790666580200195, "lr": 9.005041103757364e-05, "tps": 72300, "wall": 21154.6} {"step": 23338, "train_loss": 3.2524123191833496, "lr": 9.003715533047707e-05, "tps": 72285, "wall": 21159.9} {"step": 23339, "train_loss": 3.259861469268799, "lr": 9.002390109560668e-05, "tps": 72270, "wall": 21165.1} {"step": 23340, "train_loss": 3.240001916885376, "lr": 9.001064833311247e-05, "tps": 72255, "wall": 21170.4} {"step": 23341, "train_loss": 3.1686952114105225, "lr": 8.999739704314474e-05, "tps": 72240, "wall": 21175.6} {"step": 23342, "train_loss": 3.1958425045013428, "lr": 8.998414722585347e-05, "tps": 72225, "wall": 21180.9} {"step": 23343, "train_loss": 3.2130441665649414, "lr": 8.997089888138887e-05, "tps": 72211, "wall": 21186.1} {"step": 23344, "train_loss": 3.161299228668213, "lr": 8.995765200990096e-05, "tps": 72196, "wall": 21191.3} {"step": 23345, "train_loss": 3.2786383628845215, "lr": 8.994440661153976e-05, "tps": 72181, "wall": 21196.6} {"step": 23346, "train_loss": 3.2474288940429688, "lr": 8.99311626864554e-05, "tps": 72166, "wall": 21201.8} {"step": 23347, "train_loss": 3.1754117012023926, "lr": 8.991792023479787e-05, "tps": 72152, "wall": 21207.0} {"step": 23348, "train_loss": 3.1129465103149414, "lr": 8.990467925671713e-05, "tps": 72137, "wall": 21212.3} {"step": 23349, "train_loss": 3.1384191513061523, "lr": 8.989143975236332e-05, "tps": 72122, "wall": 21217.6} {"step": 23350, "train_loss": 3.2411861419677734, "lr": 8.987820172188622e-05, "tps": 72107, "wall": 21222.9} {"step": 23351, "train_loss": 3.285456895828247, "lr": 8.986496516543593e-05, "tps": 72093, "wall": 21228.1} {"step": 23352, "train_loss": 3.225207567214966, "lr": 8.985173008316237e-05, "tps": 72078, "wall": 21233.3} {"step": 23353, "train_loss": 3.1794252395629883, "lr": 8.983849647521538e-05, "tps": 72063, "wall": 21238.6} {"step": 23354, "train_loss": 3.2931900024414062, "lr": 8.982526434174501e-05, "tps": 72048, "wall": 21243.8} {"step": 23355, "train_loss": 3.286663055419922, "lr": 8.98120336829011e-05, "tps": 72034, "wall": 21249.1} {"step": 23356, "train_loss": 3.2927184104919434, "lr": 8.979880449883345e-05, "tps": 72019, "wall": 21254.3} {"step": 23357, "train_loss": 3.1547913551330566, "lr": 8.978557678969205e-05, "tps": 72004, "wall": 21259.5} {"step": 23358, "train_loss": 3.216899871826172, "lr": 8.977235055562666e-05, "tps": 71990, "wall": 21264.7} {"step": 23359, "train_loss": 3.213810443878174, "lr": 8.975912579678707e-05, "tps": 71975, "wall": 21270.0} {"step": 23360, "train_loss": 3.279481887817383, "lr": 8.974590251332323e-05, "tps": 71961, "wall": 21275.2} {"step": 23361, "train_loss": 3.3291592597961426, "lr": 8.973268070538483e-05, "tps": 71946, "wall": 21280.4} {"step": 23362, "train_loss": 3.292781352996826, "lr": 8.971946037312164e-05, "tps": 71931, "wall": 21285.7} {"step": 23363, "train_loss": 3.263613700866699, "lr": 8.970624151668348e-05, "tps": 71917, "wall": 21290.9} {"step": 23364, "train_loss": 3.340017318725586, "lr": 8.969302413622008e-05, "tps": 71902, "wall": 21296.2} {"step": 23365, "train_loss": 3.197936534881592, "lr": 8.967980823188109e-05, "tps": 71888, "wall": 21301.4} {"step": 23366, "train_loss": 3.1362500190734863, "lr": 8.966659380381634e-05, "tps": 71873, "wall": 21306.6} {"step": 23367, "train_loss": 3.218717336654663, "lr": 8.96533808521754e-05, "tps": 71858, "wall": 21311.9} {"step": 23368, "train_loss": 3.224243402481079, "lr": 8.964016937710811e-05, "tps": 71844, "wall": 21317.1} {"step": 23369, "train_loss": 3.2405903339385986, "lr": 8.9626959378764e-05, "tps": 71829, "wall": 21322.3} {"step": 23370, "train_loss": 3.2257144451141357, "lr": 8.961375085729267e-05, "tps": 71815, "wall": 21327.6} {"step": 23371, "train_loss": 3.249894142150879, "lr": 8.960054381284393e-05, "tps": 71800, "wall": 21332.8} {"step": 23372, "train_loss": 3.2356009483337402, "lr": 8.958733824556726e-05, "tps": 71785, "wall": 21338.1} {"step": 23373, "train_loss": 3.2867472171783447, "lr": 8.957413415561222e-05, "tps": 71771, "wall": 21343.3} {"step": 23374, "train_loss": 3.1737871170043945, "lr": 8.95609315431285e-05, "tps": 71756, "wall": 21348.6} {"step": 23375, "train_loss": 3.126683235168457, "lr": 8.954773040826558e-05, "tps": 71742, "wall": 21353.8} {"step": 23376, "train_loss": 3.2290890216827393, "lr": 8.953453075117302e-05, "tps": 71727, "wall": 21359.0} {"step": 23377, "train_loss": 3.043349504470825, "lr": 8.952133257200039e-05, "tps": 71713, "wall": 21364.3} {"step": 23378, "train_loss": 3.228703260421753, "lr": 8.950813587089716e-05, "tps": 71698, "wall": 21369.5} {"step": 23379, "train_loss": 3.254605293273926, "lr": 8.949494064801276e-05, "tps": 71684, "wall": 21374.7} {"step": 23380, "train_loss": 3.1707358360290527, "lr": 8.94817469034968e-05, "tps": 71669, "wall": 21380.0} {"step": 23381, "train_loss": 3.340571880340576, "lr": 8.946855463749867e-05, "tps": 71655, "wall": 21385.2} {"step": 23382, "train_loss": 3.3288209438323975, "lr": 8.945536385016777e-05, "tps": 71640, "wall": 21390.4} {"step": 23383, "train_loss": 3.2260892391204834, "lr": 8.94421745416536e-05, "tps": 71626, "wall": 21395.7} {"step": 23384, "train_loss": 3.3409149646759033, "lr": 8.942898671210551e-05, "tps": 71611, "wall": 21401.0} {"step": 23385, "train_loss": 3.1400809288024902, "lr": 8.941580036167296e-05, "tps": 71597, "wall": 21406.2} {"step": 23386, "train_loss": 3.195006847381592, "lr": 8.94026154905053e-05, "tps": 71582, "wall": 21411.5} {"step": 23387, "train_loss": 3.184535503387451, "lr": 8.938943209875182e-05, "tps": 71568, "wall": 21416.8} {"step": 23388, "train_loss": 3.3057706356048584, "lr": 8.937625018656197e-05, "tps": 71553, "wall": 21422.0} {"step": 23389, "train_loss": 3.183828353881836, "lr": 8.936306975408501e-05, "tps": 71539, "wall": 21427.2} {"step": 23390, "train_loss": 3.348634719848633, "lr": 8.934989080147025e-05, "tps": 71524, "wall": 21432.5} {"step": 23391, "train_loss": 3.2219927310943604, "lr": 8.933671332886704e-05, "tps": 71510, "wall": 21437.7} {"step": 23392, "train_loss": 3.264679431915283, "lr": 8.932353733642458e-05, "tps": 71495, "wall": 21442.9} {"step": 23393, "train_loss": 3.1085028648376465, "lr": 8.931036282429212e-05, "tps": 71481, "wall": 21448.2} {"step": 23394, "train_loss": 3.2139389514923096, "lr": 8.929718979261898e-05, "tps": 71467, "wall": 21453.4} {"step": 23395, "train_loss": 3.3343191146850586, "lr": 8.928401824155437e-05, "tps": 71452, "wall": 21458.7} {"step": 23396, "train_loss": 3.20330548286438, "lr": 8.92708481712474e-05, "tps": 71438, "wall": 21463.9} {"step": 23397, "train_loss": 3.2231760025024414, "lr": 8.925767958184738e-05, "tps": 71423, "wall": 21469.2} {"step": 23398, "train_loss": 3.328195095062256, "lr": 8.924451247350347e-05, "tps": 71409, "wall": 21474.4} {"step": 23399, "train_loss": 3.2645423412323, "lr": 8.923134684636474e-05, "tps": 71395, "wall": 21479.6} {"step": 23400, "train_loss": 3.218979835510254, "lr": 8.92181827005804e-05, "tps": 71380, "wall": 21484.9} {"step": 23401, "train_loss": 3.264688730239868, "lr": 8.920502003629963e-05, "tps": 71366, "wall": 21490.2} {"step": 23402, "train_loss": 3.21707820892334, "lr": 8.919185885367133e-05, "tps": 71351, "wall": 21495.4} {"step": 23403, "train_loss": 3.24940824508667, "lr": 8.917869915284485e-05, "tps": 71337, "wall": 21500.6} {"step": 23404, "train_loss": 3.2282137870788574, "lr": 8.916554093396908e-05, "tps": 71323, "wall": 21505.9} {"step": 23405, "train_loss": 3.2940688133239746, "lr": 8.915238419719316e-05, "tps": 71309, "wall": 21511.1} {"step": 23406, "train_loss": 3.1284244060516357, "lr": 8.913922894266614e-05, "tps": 71294, "wall": 21516.4} {"step": 23407, "train_loss": 3.2454075813293457, "lr": 8.912607517053695e-05, "tps": 71280, "wall": 21521.6} {"step": 23408, "train_loss": 3.3203811645507812, "lr": 8.911292288095472e-05, "tps": 71265, "wall": 21526.9} {"step": 23409, "train_loss": 3.2227985858917236, "lr": 8.909977207406838e-05, "tps": 71251, "wall": 21532.2} {"step": 23410, "train_loss": 3.2021965980529785, "lr": 8.908662275002683e-05, "tps": 71237, "wall": 21537.4} {"step": 23411, "train_loss": 3.3195643424987793, "lr": 8.907347490897917e-05, "tps": 71222, "wall": 21542.7} {"step": 23412, "train_loss": 3.343231678009033, "lr": 8.906032855107426e-05, "tps": 71208, "wall": 21547.9} {"step": 23413, "train_loss": 3.3137693405151367, "lr": 8.904718367646102e-05, "tps": 71194, "wall": 21553.1} {"step": 23414, "train_loss": 3.320803165435791, "lr": 8.903404028528839e-05, "tps": 71179, "wall": 21558.4} {"step": 23415, "train_loss": 3.3671059608459473, "lr": 8.902089837770523e-05, "tps": 71165, "wall": 21563.6} {"step": 23416, "train_loss": 3.273318290710449, "lr": 8.900775795386038e-05, "tps": 71151, "wall": 21568.9} {"step": 23417, "train_loss": 3.3557395935058594, "lr": 8.899461901390277e-05, "tps": 71137, "wall": 21574.1} {"step": 23418, "train_loss": 3.22280216217041, "lr": 8.89814815579812e-05, "tps": 71122, "wall": 21579.5} {"step": 23419, "train_loss": 3.326791286468506, "lr": 8.896834558624447e-05, "tps": 71108, "wall": 21584.7} {"step": 23420, "train_loss": 3.2450060844421387, "lr": 8.895521109884144e-05, "tps": 71094, "wall": 21590.0} {"step": 23421, "train_loss": 3.192756175994873, "lr": 8.894207809592082e-05, "tps": 71079, "wall": 21595.2} {"step": 23422, "train_loss": 3.3778696060180664, "lr": 8.89289465776315e-05, "tps": 71065, "wall": 21600.4} {"step": 23423, "train_loss": 3.2057180404663086, "lr": 8.891581654412214e-05, "tps": 71051, "wall": 21605.6} {"step": 23424, "train_loss": 3.25716495513916, "lr": 8.890268799554145e-05, "tps": 71037, "wall": 21610.9} {"step": 23425, "train_loss": 3.2593905925750732, "lr": 8.888956093203827e-05, "tps": 71023, "wall": 21616.1} {"step": 23426, "train_loss": 3.2728567123413086, "lr": 8.887643535376123e-05, "tps": 71009, "wall": 21621.4} {"step": 23427, "train_loss": 3.1601452827453613, "lr": 8.886331126085896e-05, "tps": 70994, "wall": 21626.6} {"step": 23428, "train_loss": 3.316457986831665, "lr": 8.885018865348027e-05, "tps": 70980, "wall": 21631.8} {"step": 23429, "train_loss": 3.257612943649292, "lr": 8.883706753177371e-05, "tps": 70966, "wall": 21637.2} {"step": 23430, "train_loss": 3.172485113143921, "lr": 8.882394789588792e-05, "tps": 70951, "wall": 21642.4} {"step": 23431, "train_loss": 3.270724296569824, "lr": 8.88108297459716e-05, "tps": 70937, "wall": 21647.7} {"step": 23432, "train_loss": 3.2221415042877197, "lr": 8.879771308217328e-05, "tps": 70923, "wall": 21652.9} {"step": 23433, "train_loss": 3.2343661785125732, "lr": 8.878459790464148e-05, "tps": 70909, "wall": 21658.2} {"step": 23434, "train_loss": 3.269846200942993, "lr": 8.877148421352497e-05, "tps": 70895, "wall": 21663.4} {"step": 23435, "train_loss": 3.206836223602295, "lr": 8.875837200897215e-05, "tps": 70881, "wall": 21668.7} {"step": 23436, "train_loss": 3.276308298110962, "lr": 8.874526129113156e-05, "tps": 70867, "wall": 21673.9} {"step": 23437, "train_loss": 3.2667391300201416, "lr": 8.873215206015179e-05, "tps": 70853, "wall": 21679.1} {"step": 23438, "train_loss": 3.2923662662506104, "lr": 8.871904431618123e-05, "tps": 70838, "wall": 21684.4} {"step": 23439, "train_loss": 3.258707046508789, "lr": 8.870593805936852e-05, "tps": 70824, "wall": 21689.6} {"step": 23440, "train_loss": 3.090630292892456, "lr": 8.869283328986204e-05, "tps": 70810, "wall": 21694.8} {"step": 23441, "train_loss": 3.268126964569092, "lr": 8.867973000781019e-05, "tps": 70796, "wall": 21700.1} {"step": 23442, "train_loss": 3.217305898666382, "lr": 8.866662821336152e-05, "tps": 70782, "wall": 21705.4} {"step": 23443, "train_loss": 3.2558674812316895, "lr": 8.865352790666438e-05, "tps": 70768, "wall": 21710.6} {"step": 23444, "train_loss": 3.3360557556152344, "lr": 8.864042908786714e-05, "tps": 70754, "wall": 21715.8} {"step": 23445, "train_loss": 3.2417550086975098, "lr": 8.862733175711828e-05, "tps": 70740, "wall": 21721.1} {"step": 23446, "train_loss": 3.293473243713379, "lr": 8.86142359145661e-05, "tps": 70726, "wall": 21726.3} {"step": 23447, "train_loss": 3.298370599746704, "lr": 8.860114156035892e-05, "tps": 70712, "wall": 21731.5} {"step": 23448, "train_loss": 3.2064871788024902, "lr": 8.858804869464519e-05, "tps": 70698, "wall": 21736.8} {"step": 23449, "train_loss": 3.299116611480713, "lr": 8.857495731757311e-05, "tps": 70684, "wall": 21742.0} {"step": 23450, "train_loss": 3.1959638595581055, "lr": 8.856186742929102e-05, "tps": 70670, "wall": 21747.3} {"step": 23451, "train_loss": 3.2638750076293945, "lr": 8.854877902994722e-05, "tps": 70656, "wall": 21752.5} {"step": 23452, "train_loss": 3.2473695278167725, "lr": 8.853569211968999e-05, "tps": 70641, "wall": 21757.8} {"step": 23453, "train_loss": 3.3696560859680176, "lr": 8.852260669866746e-05, "tps": 70627, "wall": 21763.1} {"step": 23454, "train_loss": 3.195640802383423, "lr": 8.850952276702805e-05, "tps": 70613, "wall": 21768.3} {"step": 23455, "train_loss": 3.22572660446167, "lr": 8.849644032491986e-05, "tps": 70599, "wall": 21773.6} {"step": 23456, "train_loss": 3.136382579803467, "lr": 8.848335937249105e-05, "tps": 70585, "wall": 21778.8} {"step": 23457, "train_loss": 3.186744213104248, "lr": 8.847027990988992e-05, "tps": 70571, "wall": 21784.0} {"step": 23458, "train_loss": 3.245967149734497, "lr": 8.845720193726453e-05, "tps": 70558, "wall": 21789.3} {"step": 23459, "train_loss": 3.233734130859375, "lr": 8.844412545476311e-05, "tps": 70544, "wall": 21794.5} {"step": 23460, "train_loss": 3.2455577850341797, "lr": 8.843105046253375e-05, "tps": 70530, "wall": 21799.8} {"step": 23461, "train_loss": 3.1992146968841553, "lr": 8.841797696072454e-05, "tps": 70516, "wall": 21805.0} {"step": 23462, "train_loss": 3.2164106369018555, "lr": 8.840490494948365e-05, "tps": 70502, "wall": 21810.3} {"step": 23463, "train_loss": 3.232668876647949, "lr": 8.83918344289591e-05, "tps": 70488, "wall": 21815.5} {"step": 23464, "train_loss": 3.2154786586761475, "lr": 8.837876539929894e-05, "tps": 70474, "wall": 21820.8} {"step": 23465, "train_loss": 3.2590389251708984, "lr": 8.836569786065128e-05, "tps": 70460, "wall": 21826.0} {"step": 23466, "train_loss": 3.1996517181396484, "lr": 8.835263181316411e-05, "tps": 70446, "wall": 21831.3} {"step": 23467, "train_loss": 3.273120403289795, "lr": 8.833956725698543e-05, "tps": 70432, "wall": 21836.5} {"step": 23468, "train_loss": 3.2903335094451904, "lr": 8.832650419226327e-05, "tps": 70418, "wall": 21841.7} {"step": 23469, "train_loss": 3.319699764251709, "lr": 8.831344261914562e-05, "tps": 70404, "wall": 21846.9} {"step": 23470, "train_loss": 3.211801528930664, "lr": 8.830038253778033e-05, "tps": 70390, "wall": 21852.2} {"step": 23471, "train_loss": 3.1475095748901367, "lr": 8.828732394831554e-05, "tps": 70377, "wall": 21857.4} {"step": 23472, "train_loss": 3.362638473510742, "lr": 8.827426685089902e-05, "tps": 70363, "wall": 21862.7} {"step": 23473, "train_loss": 3.34146785736084, "lr": 8.826121124567869e-05, "tps": 70349, "wall": 21867.9} {"step": 23474, "train_loss": 3.1593008041381836, "lr": 8.824815713280255e-05, "tps": 70335, "wall": 21873.1} {"step": 23475, "train_loss": 3.2278103828430176, "lr": 8.823510451241837e-05, "tps": 70321, "wall": 21878.4} {"step": 23476, "train_loss": 3.2915382385253906, "lr": 8.822205338467408e-05, "tps": 70307, "wall": 21883.7} {"step": 23477, "train_loss": 3.202122211456299, "lr": 8.82090037497175e-05, "tps": 70293, "wall": 21888.9} {"step": 23478, "train_loss": 3.171238899230957, "lr": 8.819595560769643e-05, "tps": 70280, "wall": 21894.1} {"step": 23479, "train_loss": 3.172868013381958, "lr": 8.818290895875874e-05, "tps": 70266, "wall": 21899.3} {"step": 23480, "train_loss": 3.1593363285064697, "lr": 8.816986380305216e-05, "tps": 70252, "wall": 21904.6} {"step": 23481, "train_loss": 3.201911211013794, "lr": 8.81568201407245e-05, "tps": 70238, "wall": 21909.8} {"step": 23482, "train_loss": 3.28525710105896, "lr": 8.814377797192354e-05, "tps": 70225, "wall": 21915.0} {"step": 23483, "train_loss": 3.1778342723846436, "lr": 8.813073729679698e-05, "tps": 70211, "wall": 21920.2} {"step": 23484, "train_loss": 3.282172441482544, "lr": 8.811769811549254e-05, "tps": 70197, "wall": 21925.4} {"step": 23485, "train_loss": 3.192923069000244, "lr": 8.810466042815798e-05, "tps": 70183, "wall": 21930.6} {"step": 23486, "train_loss": 3.284644365310669, "lr": 8.809162423494097e-05, "tps": 70169, "wall": 21936.0} {"step": 23487, "train_loss": 3.330338716506958, "lr": 8.807858953598914e-05, "tps": 70156, "wall": 21941.2} {"step": 23488, "train_loss": 3.2891018390655518, "lr": 8.806555633145022e-05, "tps": 70142, "wall": 21946.4} {"step": 23489, "train_loss": 3.335035800933838, "lr": 8.80525246214718e-05, "tps": 70128, "wall": 21951.6} {"step": 23490, "train_loss": 3.252599000930786, "lr": 8.803949440620147e-05, "tps": 70115, "wall": 21956.8} {"step": 23491, "train_loss": 3.0933492183685303, "lr": 8.802646568578696e-05, "tps": 70101, "wall": 21962.0} {"step": 23492, "train_loss": 3.2401604652404785, "lr": 8.801343846037573e-05, "tps": 70088, "wall": 21967.2} {"step": 23493, "train_loss": 3.190502643585205, "lr": 8.800041273011545e-05, "tps": 70074, "wall": 21972.4} {"step": 23494, "train_loss": 3.30775785446167, "lr": 8.798738849515367e-05, "tps": 70060, "wall": 21977.5} {"step": 23495, "train_loss": 3.233844041824341, "lr": 8.79743657556378e-05, "tps": 70047, "wall": 21982.7} {"step": 23496, "train_loss": 3.171060562133789, "lr": 8.796134451171554e-05, "tps": 70033, "wall": 21987.9} {"step": 23497, "train_loss": 3.203618288040161, "lr": 8.794832476353427e-05, "tps": 70020, "wall": 21993.1} {"step": 23498, "train_loss": 3.352806568145752, "lr": 8.793530651124151e-05, "tps": 70006, "wall": 21998.4} {"step": 23499, "train_loss": 3.209132671356201, "lr": 8.792228975498478e-05, "tps": 69992, "wall": 22003.6} {"step": 23500, "train_loss": 3.270888090133667, "lr": 8.79092744949115e-05, "tps": 69979, "wall": 22008.8} {"step": 23501, "train_loss": 3.3264379501342773, "lr": 8.789626073116905e-05, "tps": 69965, "wall": 22014.1} {"step": 23502, "train_loss": 3.2430291175842285, "lr": 8.788324846390497e-05, "tps": 69952, "wall": 22019.3} {"step": 23503, "train_loss": 3.326106548309326, "lr": 8.787023769326657e-05, "tps": 69938, "wall": 22024.4} {"step": 23504, "train_loss": 3.282078742980957, "lr": 8.785722841940123e-05, "tps": 69925, "wall": 22029.6} {"step": 23505, "train_loss": 3.3567357063293457, "lr": 8.784422064245642e-05, "tps": 69911, "wall": 22034.8} {"step": 23506, "train_loss": 3.2177233695983887, "lr": 8.783121436257941e-05, "tps": 69898, "wall": 22040.0} {"step": 23507, "train_loss": 3.2664794921875, "lr": 8.781820957991751e-05, "tps": 69884, "wall": 22045.2} {"step": 23508, "train_loss": 3.212045192718506, "lr": 8.780520629461812e-05, "tps": 69871, "wall": 22050.4} {"step": 23509, "train_loss": 3.1825811862945557, "lr": 8.779220450682852e-05, "tps": 69857, "wall": 22055.5} {"step": 23510, "train_loss": 3.2609376907348633, "lr": 8.777920421669592e-05, "tps": 69844, "wall": 22060.8} {"step": 23511, "train_loss": 3.3125967979431152, "lr": 8.776620542436772e-05, "tps": 69830, "wall": 22065.9} {"step": 23512, "train_loss": 3.2895987033843994, "lr": 8.775320812999101e-05, "tps": 69817, "wall": 22071.1} {"step": 23513, "train_loss": 3.2080259323120117, "lr": 8.774021233371322e-05, "tps": 69804, "wall": 22076.3} {"step": 23514, "train_loss": 3.283773899078369, "lr": 8.77272180356814e-05, "tps": 69790, "wall": 22081.4} {"step": 23515, "train_loss": 3.3259594440460205, "lr": 8.771422523604278e-05, "tps": 69777, "wall": 22086.6} {"step": 23516, "train_loss": 3.272155523300171, "lr": 8.770123393494462e-05, "tps": 69764, "wall": 22091.7} {"step": 23517, "train_loss": 3.2272400856018066, "lr": 8.768824413253406e-05, "tps": 69750, "wall": 22096.9} {"step": 23518, "train_loss": 3.3093581199645996, "lr": 8.767525582895823e-05, "tps": 69737, "wall": 22102.1} {"step": 23519, "train_loss": 3.2299962043762207, "lr": 8.766226902436423e-05, "tps": 69724, "wall": 22107.2} {"step": 23520, "train_loss": 3.1520626544952393, "lr": 8.764928371889918e-05, "tps": 69710, "wall": 22112.4} {"step": 23521, "train_loss": 3.3186659812927246, "lr": 8.763629991271023e-05, "tps": 69697, "wall": 22117.6} {"step": 23522, "train_loss": 3.2780613899230957, "lr": 8.762331760594447e-05, "tps": 69683, "wall": 22122.8} {"step": 23523, "train_loss": 3.2649500370025635, "lr": 8.761033679874885e-05, "tps": 69670, "wall": 22128.0} {"step": 23524, "train_loss": 3.271915912628174, "lr": 8.759735749127056e-05, "tps": 69657, "wall": 22133.1} {"step": 23525, "train_loss": 3.274559736251831, "lr": 8.758437968365657e-05, "tps": 69643, "wall": 22138.3} {"step": 23526, "train_loss": 3.2563114166259766, "lr": 8.757140337605382e-05, "tps": 69630, "wall": 22143.4} {"step": 23527, "train_loss": 3.241875410079956, "lr": 8.755842856860945e-05, "tps": 69617, "wall": 22148.6} {"step": 23528, "train_loss": 3.336747169494629, "lr": 8.754545526147036e-05, "tps": 69604, "wall": 22153.7} {"step": 23529, "train_loss": 3.3244919776916504, "lr": 8.753248345478345e-05, "tps": 69591, "wall": 22158.9} {"step": 23530, "train_loss": 3.211348056793213, "lr": 8.751951314869582e-05, "tps": 69578, "wall": 22164.0} {"step": 23531, "train_loss": 3.2740025520324707, "lr": 8.750654434335429e-05, "tps": 69564, "wall": 22169.1} {"step": 23532, "train_loss": 3.3315672874450684, "lr": 8.749357703890575e-05, "tps": 69551, "wall": 22174.3} {"step": 23533, "train_loss": 3.221449851989746, "lr": 8.748061123549718e-05, "tps": 69538, "wall": 22179.5} {"step": 23534, "train_loss": 3.239097833633423, "lr": 8.746764693327543e-05, "tps": 69525, "wall": 22184.7} {"step": 23535, "train_loss": 3.3000922203063965, "lr": 8.745468413238728e-05, "tps": 69511, "wall": 22189.8} {"step": 23536, "train_loss": 3.182516098022461, "lr": 8.744172283297969e-05, "tps": 69498, "wall": 22194.9} {"step": 23537, "train_loss": 3.2168774604797363, "lr": 8.742876303519937e-05, "tps": 69485, "wall": 22200.0} {"step": 23538, "train_loss": 3.229933023452759, "lr": 8.741580473919327e-05, "tps": 69472, "wall": 22205.1} {"step": 23539, "train_loss": 3.299752712249756, "lr": 8.740284794510812e-05, "tps": 69459, "wall": 22210.2} {"step": 23540, "train_loss": 3.2809348106384277, "lr": 8.738989265309059e-05, "tps": 69446, "wall": 22215.4} {"step": 23541, "train_loss": 3.2456307411193848, "lr": 8.73769388632876e-05, "tps": 69433, "wall": 22220.5} {"step": 23542, "train_loss": 3.251725196838379, "lr": 8.736398657584584e-05, "tps": 69420, "wall": 22225.6} {"step": 23543, "train_loss": 3.1821351051330566, "lr": 8.735103579091193e-05, "tps": 69407, "wall": 22230.7} {"step": 23544, "train_loss": 3.264186382293701, "lr": 8.733808650863273e-05, "tps": 69394, "wall": 22235.8} {"step": 23545, "train_loss": 3.2443418502807617, "lr": 8.732513872915488e-05, "tps": 69381, "wall": 22241.0} {"step": 23546, "train_loss": 3.215557813644409, "lr": 8.731219245262497e-05, "tps": 69368, "wall": 22246.1} {"step": 23547, "train_loss": 3.2362170219421387, "lr": 8.729924767918976e-05, "tps": 69355, "wall": 22251.2} {"step": 23548, "train_loss": 3.2581419944763184, "lr": 8.728630440899587e-05, "tps": 69342, "wall": 22256.3} {"step": 23549, "train_loss": 3.185624837875366, "lr": 8.727336264218985e-05, "tps": 69329, "wall": 22261.4} {"step": 23550, "train_loss": 3.2751219272613525, "lr": 8.726042237891841e-05, "tps": 69316, "wall": 22266.5} {"step": 23551, "train_loss": 3.257707118988037, "lr": 8.724748361932807e-05, "tps": 69303, "wall": 22271.6} {"step": 23552, "train_loss": 3.3171498775482178, "lr": 8.723454636356538e-05, "tps": 69290, "wall": 22276.7} {"step": 23553, "train_loss": 3.170403242111206, "lr": 8.722161061177697e-05, "tps": 69277, "wall": 22281.8} {"step": 23554, "train_loss": 3.2258412837982178, "lr": 8.72086763641093e-05, "tps": 69265, "wall": 22286.9} {"step": 23555, "train_loss": 3.2598094940185547, "lr": 8.719574362070899e-05, "tps": 69252, "wall": 22291.9} {"step": 23556, "train_loss": 3.2082104682922363, "lr": 8.718281238172245e-05, "tps": 69238, "wall": 22297.2} {"step": 23557, "train_loss": 3.2924556732177734, "lr": 8.716988264729616e-05, "tps": 69225, "wall": 22302.3} {"step": 23558, "train_loss": 3.3299560546875, "lr": 8.71569544175767e-05, "tps": 69213, "wall": 22307.4} {"step": 23559, "train_loss": 3.1864864826202393, "lr": 8.714402769271042e-05, "tps": 69200, "wall": 22312.5} {"step": 23560, "train_loss": 3.2294137477874756, "lr": 8.713110247284373e-05, "tps": 69187, "wall": 22317.5} {"step": 23561, "train_loss": 3.2138609886169434, "lr": 8.711817875812316e-05, "tps": 69174, "wall": 22322.6} {"step": 23562, "train_loss": 3.1686885356903076, "lr": 8.710525654869504e-05, "tps": 69161, "wall": 22327.7} {"step": 23563, "train_loss": 3.287519693374634, "lr": 8.709233584470574e-05, "tps": 69148, "wall": 22332.8} {"step": 23564, "train_loss": 3.2520346641540527, "lr": 8.707941664630166e-05, "tps": 69135, "wall": 22337.9} {"step": 23565, "train_loss": 3.2754626274108887, "lr": 8.706649895362917e-05, "tps": 69123, "wall": 22343.0} {"step": 23566, "train_loss": 3.356241464614868, "lr": 8.70535827668345e-05, "tps": 69110, "wall": 22348.1} {"step": 23567, "train_loss": 3.256491184234619, "lr": 8.70406680860641e-05, "tps": 69097, "wall": 22353.2} {"step": 23568, "train_loss": 3.224130868911743, "lr": 8.70277549114642e-05, "tps": 69084, "wall": 22358.4} {"step": 23569, "train_loss": 3.227374315261841, "lr": 8.701484324318103e-05, "tps": 69071, "wall": 22363.5} {"step": 23570, "train_loss": 3.2707698345184326, "lr": 8.700193308136097e-05, "tps": 69058, "wall": 22368.6} {"step": 23571, "train_loss": 3.246257781982422, "lr": 8.698902442615015e-05, "tps": 69046, "wall": 22373.7} {"step": 23572, "train_loss": 3.166020393371582, "lr": 8.697611727769492e-05, "tps": 69033, "wall": 22378.8} {"step": 23573, "train_loss": 3.344223976135254, "lr": 8.696321163614143e-05, "tps": 69020, "wall": 22383.9} {"step": 23574, "train_loss": 3.212385654449463, "lr": 8.695030750163581e-05, "tps": 69007, "wall": 22389.0} {"step": 23575, "train_loss": 3.178680896759033, "lr": 8.693740487432439e-05, "tps": 68995, "wall": 22394.0} {"step": 23576, "train_loss": 3.290407180786133, "lr": 8.69245037543532e-05, "tps": 68982, "wall": 22399.1} {"step": 23577, "train_loss": 3.21881365776062, "lr": 8.691160414186839e-05, "tps": 68969, "wall": 22404.2} {"step": 23578, "train_loss": 3.244373321533203, "lr": 8.689870603701617e-05, "tps": 68957, "wall": 22409.2} {"step": 23579, "train_loss": 3.2313406467437744, "lr": 8.688580943994265e-05, "tps": 68944, "wall": 22414.2} {"step": 23580, "train_loss": 3.3282828330993652, "lr": 8.68729143507938e-05, "tps": 68931, "wall": 22419.4} {"step": 23581, "train_loss": 3.3379523754119873, "lr": 8.686002076971584e-05, "tps": 68918, "wall": 22424.5} {"step": 23582, "train_loss": 3.2048532962799072, "lr": 8.684712869685476e-05, "tps": 68906, "wall": 22429.5} {"step": 23583, "train_loss": 3.2076148986816406, "lr": 8.683423813235656e-05, "tps": 68893, "wall": 22434.7} {"step": 23584, "train_loss": 3.2585201263427734, "lr": 8.682134907636738e-05, "tps": 68880, "wall": 22439.7} {"step": 23585, "train_loss": 3.2646541595458984, "lr": 8.680846152903314e-05, "tps": 68868, "wall": 22444.8} {"step": 23586, "train_loss": 3.1510963439941406, "lr": 8.679557549049982e-05, "tps": 68855, "wall": 22449.9} {"step": 23587, "train_loss": 3.214374542236328, "lr": 8.678269096091347e-05, "tps": 68842, "wall": 22455.1} {"step": 23588, "train_loss": 3.0833520889282227, "lr": 8.676980794042e-05, "tps": 68829, "wall": 22460.1} {"step": 23589, "train_loss": 3.3175878524780273, "lr": 8.675692642916531e-05, "tps": 68817, "wall": 22465.2} {"step": 23590, "train_loss": 3.2235193252563477, "lr": 8.674404642729541e-05, "tps": 68804, "wall": 22470.2} {"step": 23591, "train_loss": 3.2458925247192383, "lr": 8.673116793495612e-05, "tps": 68792, "wall": 22475.3} {"step": 23592, "train_loss": 3.338808059692383, "lr": 8.67182909522934e-05, "tps": 68779, "wall": 22480.4} {"step": 23593, "train_loss": 3.2712020874023438, "lr": 8.670541547945312e-05, "tps": 68766, "wall": 22485.5} {"step": 23594, "train_loss": 3.1835856437683105, "lr": 8.669254151658104e-05, "tps": 68754, "wall": 22490.6} {"step": 23595, "train_loss": 3.232274055480957, "lr": 8.667966906382312e-05, "tps": 68741, "wall": 22495.6} {"step": 23596, "train_loss": 3.289155960083008, "lr": 8.666679812132509e-05, "tps": 68729, "wall": 22500.7} {"step": 23597, "train_loss": 3.236560583114624, "lr": 8.665392868923276e-05, "tps": 68716, "wall": 22505.7} {"step": 23598, "train_loss": 3.1952643394470215, "lr": 8.664106076769198e-05, "tps": 68704, "wall": 22510.8} {"step": 23599, "train_loss": 3.150947093963623, "lr": 8.66281943568485e-05, "tps": 68691, "wall": 22515.9} {"step": 23600, "train_loss": 3.2149288654327393, "lr": 8.661532945684798e-05, "tps": 68678, "wall": 22521.0} {"step": 23601, "train_loss": 3.2727766036987305, "lr": 8.660246606783627e-05, "tps": 68666, "wall": 22526.1} {"step": 23602, "train_loss": 3.2512106895446777, "lr": 8.658960418995907e-05, "tps": 68653, "wall": 22531.2} {"step": 23603, "train_loss": 3.254991292953491, "lr": 8.657674382336196e-05, "tps": 68640, "wall": 22536.4} {"step": 23604, "train_loss": 3.2184152603149414, "lr": 8.656388496819079e-05, "tps": 68628, "wall": 22541.5} {"step": 23605, "train_loss": 3.1510400772094727, "lr": 8.655102762459112e-05, "tps": 68615, "wall": 22546.5} {"step": 23606, "train_loss": 3.2857046127319336, "lr": 8.653817179270862e-05, "tps": 68602, "wall": 22551.6} {"step": 23607, "train_loss": 3.2701902389526367, "lr": 8.652531747268897e-05, "tps": 68590, "wall": 22556.7} {"step": 23608, "train_loss": 3.327559471130371, "lr": 8.651246466467768e-05, "tps": 68577, "wall": 22561.8} {"step": 23609, "train_loss": 3.148545742034912, "lr": 8.649961336882047e-05, "tps": 68565, "wall": 22567.0} {"step": 23610, "train_loss": 3.1851425170898438, "lr": 8.648676358526286e-05, "tps": 68552, "wall": 22572.1} {"step": 23611, "train_loss": 3.2185659408569336, "lr": 8.647391531415037e-05, "tps": 68539, "wall": 22577.2} {"step": 23612, "train_loss": 3.285897731781006, "lr": 8.646106855562863e-05, "tps": 68527, "wall": 22582.3} {"step": 23613, "train_loss": 3.280200719833374, "lr": 8.644822330984315e-05, "tps": 68514, "wall": 22587.4} {"step": 23614, "train_loss": 3.330280303955078, "lr": 8.643537957693936e-05, "tps": 68501, "wall": 22592.6} {"step": 23615, "train_loss": 3.152167797088623, "lr": 8.642253735706285e-05, "tps": 68489, "wall": 22597.7} {"step": 23616, "train_loss": 3.3483922481536865, "lr": 8.640969665035908e-05, "tps": 68476, "wall": 22602.9} {"step": 23617, "train_loss": 3.227351665496826, "lr": 8.639685745697344e-05, "tps": 68463, "wall": 22608.0} {"step": 23618, "train_loss": 3.251025438308716, "lr": 8.638401977705149e-05, "tps": 68451, "wall": 22613.1} {"step": 23619, "train_loss": 3.25205659866333, "lr": 8.637118361073857e-05, "tps": 68438, "wall": 22618.2} {"step": 23620, "train_loss": 3.265552282333374, "lr": 8.635834895818006e-05, "tps": 68425, "wall": 22623.4} {"step": 23621, "train_loss": 3.319243907928467, "lr": 8.634551581952148e-05, "tps": 68413, "wall": 22628.5} {"step": 23622, "train_loss": 3.237478733062744, "lr": 8.633268419490811e-05, "tps": 68400, "wall": 22633.7} {"step": 23623, "train_loss": 3.193844795227051, "lr": 8.631985408448526e-05, "tps": 68388, "wall": 22638.8} {"step": 23624, "train_loss": 3.2488977909088135, "lr": 8.63070254883984e-05, "tps": 68375, "wall": 22643.9} {"step": 23625, "train_loss": 3.263514518737793, "lr": 8.629419840679274e-05, "tps": 68362, "wall": 22649.1} {"step": 23626, "train_loss": 3.254181385040283, "lr": 8.628137283981369e-05, "tps": 68350, "wall": 22654.3} {"step": 23627, "train_loss": 3.27262020111084, "lr": 8.626854878760648e-05, "tps": 68337, "wall": 22659.5} {"step": 23628, "train_loss": 3.330892324447632, "lr": 8.625572625031632e-05, "tps": 68324, "wall": 22664.6} {"step": 23629, "train_loss": 3.2559754848480225, "lr": 8.62429052280886e-05, "tps": 68312, "wall": 22669.7} {"step": 23630, "train_loss": 3.348827838897705, "lr": 8.623008572106846e-05, "tps": 68299, "wall": 22674.9} {"step": 23631, "train_loss": 3.3744139671325684, "lr": 8.621726772940111e-05, "tps": 68286, "wall": 22680.0} {"step": 23632, "train_loss": 3.3423843383789062, "lr": 8.620445125323185e-05, "tps": 68274, "wall": 22685.1} {"step": 23633, "train_loss": 3.244685649871826, "lr": 8.619163629270578e-05, "tps": 68261, "wall": 22690.2} {"step": 23634, "train_loss": 3.1609091758728027, "lr": 8.617882284796805e-05, "tps": 68249, "wall": 22695.4} {"step": 23635, "train_loss": 3.243448257446289, "lr": 8.61660109191639e-05, "tps": 68236, "wall": 22700.5} {"step": 23636, "train_loss": 3.169931411743164, "lr": 8.615320050643845e-05, "tps": 68224, "wall": 22705.6} {"step": 23637, "train_loss": 3.2372934818267822, "lr": 8.61403916099367e-05, "tps": 68211, "wall": 22710.7} {"step": 23638, "train_loss": 3.3117480278015137, "lr": 8.612758422980391e-05, "tps": 68199, "wall": 22715.9} {"step": 23639, "train_loss": 3.265279769897461, "lr": 8.611477836618507e-05, "tps": 68186, "wall": 22721.0} {"step": 23640, "train_loss": 3.1986663341522217, "lr": 8.610197401922521e-05, "tps": 68174, "wall": 22726.1} {"step": 23641, "train_loss": 3.29276704788208, "lr": 8.608917118906951e-05, "tps": 68161, "wall": 22731.2} {"step": 23642, "train_loss": 3.3053622245788574, "lr": 8.60763698758629e-05, "tps": 68149, "wall": 22736.3} {"step": 23643, "train_loss": 3.213111162185669, "lr": 8.606357007975037e-05, "tps": 68137, "wall": 22741.4} {"step": 23644, "train_loss": 3.22391414642334, "lr": 8.605077180087701e-05, "tps": 68124, "wall": 22746.5} {"step": 23645, "train_loss": 3.29913330078125, "lr": 8.60379750393877e-05, "tps": 68112, "wall": 22751.6} {"step": 23646, "train_loss": 3.2122795581817627, "lr": 8.602517979542753e-05, "tps": 68099, "wall": 22756.7} {"step": 23647, "train_loss": 3.3325705528259277, "lr": 8.601238606914135e-05, "tps": 68087, "wall": 22761.8} {"step": 23648, "train_loss": 3.213131904602051, "lr": 8.599959386067407e-05, "tps": 68075, "wall": 22766.9} {"step": 23649, "train_loss": 3.216306209564209, "lr": 8.598680317017071e-05, "tps": 68062, "wall": 22772.0} {"step": 23650, "train_loss": 3.3174986839294434, "lr": 8.597401399777604e-05, "tps": 68050, "wall": 22777.2} {"step": 23651, "train_loss": 3.3358445167541504, "lr": 8.596122634363498e-05, "tps": 68037, "wall": 22782.3} {"step": 23652, "train_loss": 3.280545711517334, "lr": 8.594844020789243e-05, "tps": 68025, "wall": 22787.4} {"step": 23653, "train_loss": 3.378051280975342, "lr": 8.593565559069323e-05, "tps": 68013, "wall": 22792.4} {"step": 23654, "train_loss": 3.225104808807373, "lr": 8.592287249218212e-05, "tps": 68001, "wall": 22797.5} {"step": 23655, "train_loss": 3.2786240577697754, "lr": 8.591009091250397e-05, "tps": 67988, "wall": 22802.6} {"step": 23656, "train_loss": 3.295016050338745, "lr": 8.589731085180362e-05, "tps": 67976, "wall": 22807.6} {"step": 23657, "train_loss": 3.2806997299194336, "lr": 8.58845323102257e-05, "tps": 67964, "wall": 22812.7} {"step": 23658, "train_loss": 3.3020691871643066, "lr": 8.587175528791513e-05, "tps": 67952, "wall": 22817.7} {"step": 23659, "train_loss": 3.329418182373047, "lr": 8.585897978501656e-05, "tps": 67940, "wall": 22822.8} {"step": 23660, "train_loss": 3.246610164642334, "lr": 8.584620580167466e-05, "tps": 67927, "wall": 22827.8} {"step": 23661, "train_loss": 3.2817397117614746, "lr": 8.583343333803428e-05, "tps": 67915, "wall": 22832.9} {"step": 23662, "train_loss": 3.343111753463745, "lr": 8.582066239423996e-05, "tps": 67903, "wall": 22838.0} {"step": 23663, "train_loss": 3.1661648750305176, "lr": 8.580789297043647e-05, "tps": 67891, "wall": 22843.1} {"step": 23664, "train_loss": 3.2305407524108887, "lr": 8.579512506676844e-05, "tps": 67879, "wall": 22848.1} {"step": 23665, "train_loss": 3.1806321144104004, "lr": 8.578235868338045e-05, "tps": 67866, "wall": 22853.2} {"step": 23666, "train_loss": 3.2819371223449707, "lr": 8.576959382041721e-05, "tps": 67854, "wall": 22858.3} {"step": 23667, "train_loss": 3.265839099884033, "lr": 8.575683047802325e-05, "tps": 67842, "wall": 22863.3} {"step": 23668, "train_loss": 3.2870712280273438, "lr": 8.574406865634315e-05, "tps": 67830, "wall": 22868.4} {"step": 23669, "train_loss": 3.2911300659179688, "lr": 8.573130835552156e-05, "tps": 67818, "wall": 22873.4} {"step": 23670, "train_loss": 3.294344425201416, "lr": 8.571854957570296e-05, "tps": 67806, "wall": 22878.5} {"step": 23671, "train_loss": 3.2952218055725098, "lr": 8.570579231703186e-05, "tps": 67794, "wall": 22883.5} {"step": 23672, "train_loss": 3.280992031097412, "lr": 8.569303657965283e-05, "tps": 67782, "wall": 22888.5} {"step": 23673, "train_loss": 3.2472083568573, "lr": 8.568028236371035e-05, "tps": 67770, "wall": 22893.6} {"step": 23674, "train_loss": 3.174016237258911, "lr": 8.566752966934887e-05, "tps": 67757, "wall": 22898.7} {"step": 23675, "train_loss": 3.183290958404541, "lr": 8.565477849671293e-05, "tps": 67745, "wall": 22903.7} {"step": 23676, "train_loss": 3.208803653717041, "lr": 8.564202884594692e-05, "tps": 67733, "wall": 22908.7} {"step": 23677, "train_loss": 3.331775665283203, "lr": 8.562928071719522e-05, "tps": 67721, "wall": 22913.8} {"step": 23678, "train_loss": 3.165672779083252, "lr": 8.561653411060237e-05, "tps": 67709, "wall": 22918.8} {"step": 23679, "train_loss": 3.1672747135162354, "lr": 8.56037890263126e-05, "tps": 67697, "wall": 22923.8} {"step": 23680, "train_loss": 3.1927993297576904, "lr": 8.559104546447047e-05, "tps": 67685, "wall": 22928.8} {"step": 23681, "train_loss": 3.134709119796753, "lr": 8.557830342522022e-05, "tps": 67673, "wall": 22933.9} {"step": 23682, "train_loss": 3.219592332839966, "lr": 8.55655629087062e-05, "tps": 67661, "wall": 22938.9} {"step": 23683, "train_loss": 3.3217906951904297, "lr": 8.55528239150728e-05, "tps": 67649, "wall": 22943.9} {"step": 23684, "train_loss": 3.348832130432129, "lr": 8.554008644446426e-05, "tps": 67637, "wall": 22949.0} {"step": 23685, "train_loss": 3.2590627670288086, "lr": 8.552735049702485e-05, "tps": 67625, "wall": 22954.0} {"step": 23686, "train_loss": 3.2119081020355225, "lr": 8.551461607289899e-05, "tps": 67613, "wall": 22959.1} {"step": 23687, "train_loss": 3.2949957847595215, "lr": 8.550188317223076e-05, "tps": 67601, "wall": 22964.2} {"step": 23688, "train_loss": 3.2590694427490234, "lr": 8.548915179516449e-05, "tps": 67589, "wall": 22969.2} {"step": 23689, "train_loss": 3.266369342803955, "lr": 8.547642194184443e-05, "tps": 67577, "wall": 22974.2} {"step": 23690, "train_loss": 3.274390697479248, "lr": 8.546369361241462e-05, "tps": 67565, "wall": 22979.2} {"step": 23691, "train_loss": 3.312689781188965, "lr": 8.545096680701947e-05, "tps": 67554, "wall": 22984.2} {"step": 23692, "train_loss": 3.2307233810424805, "lr": 8.543824152580304e-05, "tps": 67542, "wall": 22989.3} {"step": 23693, "train_loss": 3.1376590728759766, "lr": 8.542551776890944e-05, "tps": 67530, "wall": 22994.3} {"step": 23694, "train_loss": 3.1931724548339844, "lr": 8.54127955364829e-05, "tps": 67518, "wall": 22999.3} {"step": 23695, "train_loss": 3.336393117904663, "lr": 8.54000748286675e-05, "tps": 67506, "wall": 23004.3} {"step": 23696, "train_loss": 3.1135051250457764, "lr": 8.538735564560724e-05, "tps": 67494, "wall": 23009.3} {"step": 23697, "train_loss": 3.187152862548828, "lr": 8.53746379874464e-05, "tps": 67482, "wall": 23014.3} {"step": 23698, "train_loss": 3.312297821044922, "lr": 8.536192185432894e-05, "tps": 67470, "wall": 23019.4} {"step": 23699, "train_loss": 3.2697031497955322, "lr": 8.534920724639883e-05, "tps": 67458, "wall": 23024.4} {"step": 23700, "train_loss": 3.294743776321411, "lr": 8.533649416380028e-05, "tps": 67447, "wall": 23029.4} {"step": 23701, "train_loss": 3.2022297382354736, "lr": 8.53237826066772e-05, "tps": 67435, "wall": 23034.4} {"step": 23702, "train_loss": 3.2516372203826904, "lr": 8.53110725751735e-05, "tps": 67423, "wall": 23039.4} {"step": 23703, "train_loss": 3.2612996101379395, "lr": 8.529836406943334e-05, "tps": 67411, "wall": 23044.4} {"step": 23704, "train_loss": 3.1668150424957275, "lr": 8.528565708960054e-05, "tps": 67399, "wall": 23049.4} {"step": 23705, "train_loss": 3.1572182178497314, "lr": 8.527295163581917e-05, "tps": 67388, "wall": 23054.4} {"step": 23706, "train_loss": 3.1981682777404785, "lr": 8.52602477082331e-05, "tps": 67376, "wall": 23059.4} {"step": 23707, "train_loss": 3.262606620788574, "lr": 8.524754530698615e-05, "tps": 67364, "wall": 23064.5} {"step": 23708, "train_loss": 3.224386692047119, "lr": 8.523484443222237e-05, "tps": 67352, "wall": 23069.5} {"step": 23709, "train_loss": 3.230637788772583, "lr": 8.522214508408555e-05, "tps": 67341, "wall": 23074.5} {"step": 23710, "train_loss": 3.3396034240722656, "lr": 8.520944726271951e-05, "tps": 67329, "wall": 23079.6} {"step": 23711, "train_loss": 3.1607046127319336, "lr": 8.51967509682682e-05, "tps": 67317, "wall": 23084.6} {"step": 23712, "train_loss": 3.197958469390869, "lr": 8.51840562008754e-05, "tps": 67305, "wall": 23089.6} {"step": 23713, "train_loss": 3.2732081413269043, "lr": 8.517136296068487e-05, "tps": 67293, "wall": 23094.6} {"step": 23714, "train_loss": 3.2148616313934326, "lr": 8.515867124784043e-05, "tps": 67281, "wall": 23099.6} {"step": 23715, "train_loss": 3.316941976547241, "lr": 8.514598106248587e-05, "tps": 67270, "wall": 23104.6} {"step": 23716, "train_loss": 3.313769817352295, "lr": 8.513329240476492e-05, "tps": 67258, "wall": 23109.6} {"step": 23717, "train_loss": 3.2079110145568848, "lr": 8.512060527482135e-05, "tps": 67246, "wall": 23114.6} {"step": 23718, "train_loss": 3.1486921310424805, "lr": 8.510791967279889e-05, "tps": 67235, "wall": 23119.6} {"step": 23719, "train_loss": 3.2605741024017334, "lr": 8.509523559884113e-05, "tps": 67223, "wall": 23124.5} {"step": 23720, "train_loss": 3.2947404384613037, "lr": 8.508255305309191e-05, "tps": 67211, "wall": 23129.5} {"step": 23721, "train_loss": 3.226015567779541, "lr": 8.50698720356948e-05, "tps": 67200, "wall": 23134.5} {"step": 23722, "train_loss": 3.2468833923339844, "lr": 8.505719254679345e-05, "tps": 67188, "wall": 23139.6} {"step": 23723, "train_loss": 3.3172926902770996, "lr": 8.504451458653157e-05, "tps": 67176, "wall": 23144.6} {"step": 23724, "train_loss": 3.303539276123047, "lr": 8.503183815505269e-05, "tps": 67165, "wall": 23149.6} {"step": 23725, "train_loss": 3.182847261428833, "lr": 8.501916325250049e-05, "tps": 67153, "wall": 23154.6} {"step": 23726, "train_loss": 3.1501927375793457, "lr": 8.500648987901851e-05, "tps": 67141, "wall": 23159.5} {"step": 23727, "train_loss": 3.2582550048828125, "lr": 8.499381803475027e-05, "tps": 67130, "wall": 23164.5} {"step": 23728, "train_loss": 3.234398365020752, "lr": 8.49811477198394e-05, "tps": 67118, "wall": 23169.5} {"step": 23729, "train_loss": 3.2366058826446533, "lr": 8.49684789344294e-05, "tps": 67106, "wall": 23174.5} {"step": 23730, "train_loss": 3.2948460578918457, "lr": 8.495581167866374e-05, "tps": 67095, "wall": 23179.5} {"step": 23731, "train_loss": 3.262737512588501, "lr": 8.4943145952686e-05, "tps": 67083, "wall": 23184.4} {"step": 23732, "train_loss": 3.3806164264678955, "lr": 8.493048175663959e-05, "tps": 67072, "wall": 23189.4} {"step": 23733, "train_loss": 3.243351697921753, "lr": 8.491781909066793e-05, "tps": 67060, "wall": 23194.4} {"step": 23734, "train_loss": 3.2265408039093018, "lr": 8.490515795491461e-05, "tps": 67048, "wall": 23199.4} {"step": 23735, "train_loss": 3.305464267730713, "lr": 8.489249834952296e-05, "tps": 67037, "wall": 23204.4} {"step": 23736, "train_loss": 3.2812294960021973, "lr": 8.487984027463633e-05, "tps": 67025, "wall": 23209.4} {"step": 23737, "train_loss": 3.362818717956543, "lr": 8.486718373039823e-05, "tps": 67014, "wall": 23214.4} {"step": 23738, "train_loss": 3.191164493560791, "lr": 8.485452871695199e-05, "tps": 67002, "wall": 23219.4} {"step": 23739, "train_loss": 3.2511961460113525, "lr": 8.484187523444092e-05, "tps": 66991, "wall": 23224.3} {"step": 23740, "train_loss": 3.24015736579895, "lr": 8.482922328300843e-05, "tps": 66979, "wall": 23229.3} {"step": 23741, "train_loss": 3.376743793487549, "lr": 8.481657286279779e-05, "tps": 66968, "wall": 23234.3} {"step": 23742, "train_loss": 3.3101930618286133, "lr": 8.480392397395234e-05, "tps": 66956, "wall": 23239.3} {"step": 23743, "train_loss": 3.3278865814208984, "lr": 8.479127661661536e-05, "tps": 66945, "wall": 23244.2} {"step": 23744, "train_loss": 3.2288384437561035, "lr": 8.477863079093008e-05, "tps": 66933, "wall": 23249.2} {"step": 23745, "train_loss": 3.1903252601623535, "lr": 8.476598649703984e-05, "tps": 66922, "wall": 23254.2} {"step": 23746, "train_loss": 3.2339820861816406, "lr": 8.47533437350878e-05, "tps": 66910, "wall": 23259.2} {"step": 23747, "train_loss": 3.0968408584594727, "lr": 8.474070250521716e-05, "tps": 66898, "wall": 23264.2} {"step": 23748, "train_loss": 3.2609660625457764, "lr": 8.47280628075712e-05, "tps": 66887, "wall": 23269.2} {"step": 23749, "train_loss": 3.275865077972412, "lr": 8.47154246422931e-05, "tps": 66875, "wall": 23274.1} {"step": 23750, "train_loss": 3.1617910861968994, "lr": 8.470278800952591e-05, "tps": 66864, "wall": 23279.1} {"step": 23751, "train_loss": 3.2659356594085693, "lr": 8.469015290941289e-05, "tps": 66853, "wall": 23284.1} {"step": 23752, "train_loss": 3.278978109359741, "lr": 8.467751934209716e-05, "tps": 66841, "wall": 23289.0} {"step": 23753, "train_loss": 3.2559776306152344, "lr": 8.466488730772176e-05, "tps": 66830, "wall": 23294.0} {"step": 23754, "train_loss": 3.1849007606506348, "lr": 8.465225680642988e-05, "tps": 66818, "wall": 23298.9} {"step": 23755, "train_loss": 3.155135154724121, "lr": 8.463962783836456e-05, "tps": 66807, "wall": 23303.9} {"step": 23756, "train_loss": 3.223726749420166, "lr": 8.46270004036688e-05, "tps": 66796, "wall": 23308.9} {"step": 23757, "train_loss": 3.2435834407806396, "lr": 8.461437450248577e-05, "tps": 66784, "wall": 23313.8} {"step": 23758, "train_loss": 3.272137403488159, "lr": 8.460175013495838e-05, "tps": 66773, "wall": 23318.8} {"step": 23759, "train_loss": 3.1956684589385986, "lr": 8.458912730122974e-05, "tps": 66761, "wall": 23323.8} {"step": 23760, "train_loss": 3.276736259460449, "lr": 8.457650600144278e-05, "tps": 66750, "wall": 23328.7} {"step": 23761, "train_loss": 3.351013660430908, "lr": 8.456388623574043e-05, "tps": 66738, "wall": 23333.8} {"step": 23762, "train_loss": 3.292202949523926, "lr": 8.455126800426576e-05, "tps": 66727, "wall": 23338.7} {"step": 23763, "train_loss": 3.2129220962524414, "lr": 8.453865130716166e-05, "tps": 66716, "wall": 23343.7} {"step": 23764, "train_loss": 3.2156519889831543, "lr": 8.4526036144571e-05, "tps": 66704, "wall": 23348.6} {"step": 23765, "train_loss": 3.335423231124878, "lr": 8.451342251663676e-05, "tps": 66693, "wall": 23353.6} {"step": 23766, "train_loss": 3.176978588104248, "lr": 8.450081042350182e-05, "tps": 66682, "wall": 23358.5} {"step": 23767, "train_loss": 3.2668981552124023, "lr": 8.448819986530898e-05, "tps": 66670, "wall": 23363.5} {"step": 23768, "train_loss": 3.2794294357299805, "lr": 8.44755908422012e-05, "tps": 66659, "wall": 23368.4} {"step": 23769, "train_loss": 3.311728000640869, "lr": 8.446298335432124e-05, "tps": 66648, "wall": 23373.4} {"step": 23770, "train_loss": 3.2702550888061523, "lr": 8.445037740181188e-05, "tps": 66636, "wall": 23378.4} {"step": 23771, "train_loss": 3.1883058547973633, "lr": 8.443777298481605e-05, "tps": 66625, "wall": 23383.4} {"step": 23772, "train_loss": 3.1608974933624268, "lr": 8.442517010347646e-05, "tps": 66613, "wall": 23388.3} {"step": 23773, "train_loss": 3.1879494190216064, "lr": 8.441256875793581e-05, "tps": 66602, "wall": 23393.3} {"step": 23774, "train_loss": 3.2902801036834717, "lr": 8.439996894833697e-05, "tps": 66591, "wall": 23398.3} {"step": 23775, "train_loss": 3.23394775390625, "lr": 8.438737067482265e-05, "tps": 66579, "wall": 23403.2} {"step": 23776, "train_loss": 3.2368388175964355, "lr": 8.437477393753544e-05, "tps": 66568, "wall": 23408.2} {"step": 23777, "train_loss": 3.1909098625183105, "lr": 8.436217873661819e-05, "tps": 66557, "wall": 23413.1} {"step": 23778, "train_loss": 3.2147393226623535, "lr": 8.434958507221347e-05, "tps": 66546, "wall": 23418.1} {"step": 23779, "train_loss": 3.283839225769043, "lr": 8.433699294446404e-05, "tps": 66534, "wall": 23423.0} {"step": 23780, "train_loss": 3.1456832885742188, "lr": 8.432440235351251e-05, "tps": 66523, "wall": 23428.0} {"step": 23781, "train_loss": 3.2732763290405273, "lr": 8.431181329950142e-05, "tps": 66512, "wall": 23432.9} {"step": 23782, "train_loss": 3.2310256958007812, "lr": 8.429922578257349e-05, "tps": 66500, "wall": 23438.0} {"step": 23783, "train_loss": 3.2675507068634033, "lr": 8.428663980287129e-05, "tps": 66489, "wall": 23442.9} {"step": 23784, "train_loss": 3.4658241271972656, "lr": 8.427405536053732e-05, "tps": 66478, "wall": 23447.9} {"step": 23785, "train_loss": 3.2808239459991455, "lr": 8.426147245571423e-05, "tps": 66467, "wall": 23452.8} {"step": 23786, "train_loss": 3.2427704334259033, "lr": 8.424889108854454e-05, "tps": 66455, "wall": 23457.7} {"step": 23787, "train_loss": 3.1941781044006348, "lr": 8.423631125917071e-05, "tps": 66444, "wall": 23462.7} {"step": 23788, "train_loss": 3.3765296936035156, "lr": 8.422373296773533e-05, "tps": 66433, "wall": 23467.6} {"step": 23789, "train_loss": 3.2126870155334473, "lr": 8.421115621438086e-05, "tps": 66422, "wall": 23472.5} {"step": 23790, "train_loss": 3.121096134185791, "lr": 8.41985809992497e-05, "tps": 66411, "wall": 23477.5} {"step": 23791, "train_loss": 3.1235873699188232, "lr": 8.418600732248441e-05, "tps": 66400, "wall": 23482.4} {"step": 23792, "train_loss": 3.186272144317627, "lr": 8.417343518422738e-05, "tps": 66388, "wall": 23487.4} {"step": 23793, "train_loss": 3.2017855644226074, "lr": 8.416086458462099e-05, "tps": 66377, "wall": 23492.3} {"step": 23794, "train_loss": 3.1251676082611084, "lr": 8.414829552380769e-05, "tps": 66366, "wall": 23497.4} {"step": 23795, "train_loss": 3.217907190322876, "lr": 8.413572800192981e-05, "tps": 66354, "wall": 23502.3} {"step": 23796, "train_loss": 3.3788280487060547, "lr": 8.412316201912981e-05, "tps": 66343, "wall": 23507.2} {"step": 23797, "train_loss": 3.259774923324585, "lr": 8.411059757554998e-05, "tps": 66332, "wall": 23512.2} {"step": 23798, "train_loss": 3.1875805854797363, "lr": 8.40980346713326e-05, "tps": 66321, "wall": 23517.1} {"step": 23799, "train_loss": 3.2592685222625732, "lr": 8.408547330662009e-05, "tps": 66310, "wall": 23522.0} {"step": 23800, "train_loss": 3.1719179153442383, "lr": 8.40729134815547e-05, "tps": 66299, "wall": 23527.0} {"step": 23801, "train_loss": 3.231842041015625, "lr": 8.406035519627864e-05, "tps": 66288, "wall": 23531.9} {"step": 23802, "train_loss": 3.338927745819092, "lr": 8.404779845093427e-05, "tps": 66277, "wall": 23536.9} {"step": 23803, "train_loss": 3.1518568992614746, "lr": 8.403524324566378e-05, "tps": 66265, "wall": 23541.8} {"step": 23804, "train_loss": 3.2463932037353516, "lr": 8.402268958060941e-05, "tps": 66254, "wall": 23546.7} {"step": 23805, "train_loss": 3.25917911529541, "lr": 8.40101374559134e-05, "tps": 66243, "wall": 23551.7} {"step": 23806, "train_loss": 3.1841931343078613, "lr": 8.399758687171789e-05, "tps": 66232, "wall": 23556.7} {"step": 23807, "train_loss": 3.200910806655884, "lr": 8.398503782816503e-05, "tps": 66221, "wall": 23561.6} {"step": 23808, "train_loss": 3.245865821838379, "lr": 8.397249032539707e-05, "tps": 66210, "wall": 23566.6} {"step": 23809, "train_loss": 3.2502336502075195, "lr": 8.395994436355612e-05, "tps": 66199, "wall": 23571.5} {"step": 23810, "train_loss": 3.1797971725463867, "lr": 8.39473999427842e-05, "tps": 66188, "wall": 23576.4} {"step": 23811, "train_loss": 3.2278285026550293, "lr": 8.393485706322357e-05, "tps": 66177, "wall": 23581.4} {"step": 23812, "train_loss": 3.2949600219726562, "lr": 8.392231572501616e-05, "tps": 66165, "wall": 23586.3} {"step": 23813, "train_loss": 3.281562566757202, "lr": 8.39097759283042e-05, "tps": 66154, "wall": 23591.2} {"step": 23814, "train_loss": 3.1925055980682373, "lr": 8.389723767322963e-05, "tps": 66143, "wall": 23596.2} {"step": 23815, "train_loss": 3.2820394039154053, "lr": 8.388470095993448e-05, "tps": 66132, "wall": 23601.1} {"step": 23816, "train_loss": 3.293281316757202, "lr": 8.387216578856087e-05, "tps": 66121, "wall": 23606.0} {"step": 23817, "train_loss": 3.333280563354492, "lr": 8.385963215925071e-05, "tps": 66110, "wall": 23611.0} {"step": 23818, "train_loss": 3.309156894683838, "lr": 8.384710007214596e-05, "tps": 66099, "wall": 23615.9} {"step": 23819, "train_loss": 3.1376307010650635, "lr": 8.383456952738865e-05, "tps": 66088, "wall": 23620.9} {"step": 23820, "train_loss": 3.0530052185058594, "lr": 8.382204052512075e-05, "tps": 66077, "wall": 23625.8} {"step": 23821, "train_loss": 3.2777390480041504, "lr": 8.380951306548406e-05, "tps": 66066, "wall": 23630.8} {"step": 23822, "train_loss": 3.177680015563965, "lr": 8.379698714862063e-05, "tps": 66055, "wall": 23635.7} {"step": 23823, "train_loss": 3.2628302574157715, "lr": 8.378446277467228e-05, "tps": 66044, "wall": 23640.6} {"step": 23824, "train_loss": 3.162100076675415, "lr": 8.377193994378087e-05, "tps": 66033, "wall": 23645.5} {"step": 23825, "train_loss": 3.336120128631592, "lr": 8.375941865608836e-05, "tps": 66022, "wall": 23650.4} {"step": 23826, "train_loss": 3.154064655303955, "lr": 8.37468989117365e-05, "tps": 66011, "wall": 23655.4} {"step": 23827, "train_loss": 3.190376043319702, "lr": 8.373438071086712e-05, "tps": 66000, "wall": 23660.4} {"step": 23828, "train_loss": 3.1655242443084717, "lr": 8.372186405362207e-05, "tps": 65989, "wall": 23665.3} {"step": 23829, "train_loss": 3.245354413986206, "lr": 8.370934894014315e-05, "tps": 65978, "wall": 23670.2} {"step": 23830, "train_loss": 3.278303861618042, "lr": 8.3696835370572e-05, "tps": 65967, "wall": 23675.1} {"step": 23831, "train_loss": 3.2237191200256348, "lr": 8.368432334505056e-05, "tps": 65956, "wall": 23680.1} {"step": 23832, "train_loss": 3.2562742233276367, "lr": 8.36718128637204e-05, "tps": 65945, "wall": 23685.1} {"step": 23833, "train_loss": 3.1463282108306885, "lr": 8.365930392672341e-05, "tps": 65934, "wall": 23690.0} {"step": 23834, "train_loss": 3.1762232780456543, "lr": 8.364679653420116e-05, "tps": 65923, "wall": 23694.9} {"step": 23835, "train_loss": 3.2847423553466797, "lr": 8.363429068629535e-05, "tps": 65912, "wall": 23699.8} {"step": 23836, "train_loss": 3.150374412536621, "lr": 8.36217863831477e-05, "tps": 65901, "wall": 23704.8} {"step": 23837, "train_loss": 3.32218599319458, "lr": 8.360928362489988e-05, "tps": 65890, "wall": 23709.7} {"step": 23838, "train_loss": 3.249098777770996, "lr": 8.359678241169338e-05, "tps": 65879, "wall": 23714.6} {"step": 23839, "train_loss": 3.110015869140625, "lr": 8.358428274366997e-05, "tps": 65868, "wall": 23719.5} {"step": 23840, "train_loss": 3.2992615699768066, "lr": 8.357178462097117e-05, "tps": 65857, "wall": 23724.5} {"step": 23841, "train_loss": 3.207911729812622, "lr": 8.355928804373854e-05, "tps": 65847, "wall": 23729.4} {"step": 23842, "train_loss": 3.221749782562256, "lr": 8.354679301211373e-05, "tps": 65836, "wall": 23734.3} {"step": 23843, "train_loss": 3.337146043777466, "lr": 8.353429952623823e-05, "tps": 65824, "wall": 23739.3} {"step": 23844, "train_loss": 3.28714656829834, "lr": 8.35218075862535e-05, "tps": 65814, "wall": 23744.3} {"step": 23845, "train_loss": 3.1149842739105225, "lr": 8.35093171923012e-05, "tps": 65803, "wall": 23749.2} {"step": 23846, "train_loss": 3.300642728805542, "lr": 8.349682834452271e-05, "tps": 65792, "wall": 23754.1} {"step": 23847, "train_loss": 3.166787624359131, "lr": 8.34843410430595e-05, "tps": 65781, "wall": 23759.0} {"step": 23848, "train_loss": 3.2295007705688477, "lr": 8.34718552880531e-05, "tps": 65770, "wall": 23764.0} {"step": 23849, "train_loss": 3.2055132389068604, "lr": 8.345937107964485e-05, "tps": 65759, "wall": 23768.9} {"step": 23850, "train_loss": 3.242169141769409, "lr": 8.34468884179763e-05, "tps": 65748, "wall": 23773.8} {"step": 23851, "train_loss": 3.18057918548584, "lr": 8.343440730318878e-05, "tps": 65737, "wall": 23778.7} {"step": 23852, "train_loss": 3.1237566471099854, "lr": 8.342192773542361e-05, "tps": 65727, "wall": 23783.7} {"step": 23853, "train_loss": 3.1243603229522705, "lr": 8.340944971482232e-05, "tps": 65716, "wall": 23788.6} {"step": 23854, "train_loss": 3.298391342163086, "lr": 8.339697324152616e-05, "tps": 65705, "wall": 23793.5} {"step": 23855, "train_loss": 3.2512924671173096, "lr": 8.338449831567647e-05, "tps": 65694, "wall": 23798.5} {"step": 23856, "train_loss": 3.4047913551330566, "lr": 8.337202493741456e-05, "tps": 65683, "wall": 23803.4} {"step": 23857, "train_loss": 3.1371235847473145, "lr": 8.335955310688173e-05, "tps": 65672, "wall": 23808.3} {"step": 23858, "train_loss": 3.28786563873291, "lr": 8.334708282421928e-05, "tps": 65661, "wall": 23813.3} {"step": 23859, "train_loss": 3.285080909729004, "lr": 8.33346140895685e-05, "tps": 65651, "wall": 23818.2} {"step": 23860, "train_loss": 3.1395270824432373, "lr": 8.332214690307056e-05, "tps": 65640, "wall": 23823.1} {"step": 23861, "train_loss": 3.172205924987793, "lr": 8.330968126486678e-05, "tps": 65629, "wall": 23828.0} {"step": 23862, "train_loss": 3.2667088508605957, "lr": 8.329721717509831e-05, "tps": 65618, "wall": 23832.9} {"step": 23863, "train_loss": 3.1744492053985596, "lr": 8.32847546339063e-05, "tps": 65607, "wall": 23837.8} {"step": 23864, "train_loss": 3.216397523880005, "lr": 8.327229364143208e-05, "tps": 65597, "wall": 23842.8} {"step": 23865, "train_loss": 3.1961827278137207, "lr": 8.325983419781668e-05, "tps": 65586, "wall": 23847.7} {"step": 23866, "train_loss": 3.3076086044311523, "lr": 8.32473763032012e-05, "tps": 65575, "wall": 23852.6} {"step": 23867, "train_loss": 3.2329277992248535, "lr": 8.323491995772694e-05, "tps": 65564, "wall": 23857.6} {"step": 23868, "train_loss": 3.2837533950805664, "lr": 8.322246516153488e-05, "tps": 65553, "wall": 23862.5} {"step": 23869, "train_loss": 3.1982288360595703, "lr": 8.32100119147661e-05, "tps": 65543, "wall": 23867.4} {"step": 23870, "train_loss": 3.3083133697509766, "lr": 8.319756021756175e-05, "tps": 65532, "wall": 23872.3} {"step": 23871, "train_loss": 3.2943203449249268, "lr": 8.318511007006283e-05, "tps": 65521, "wall": 23877.2} {"step": 23872, "train_loss": 3.2384562492370605, "lr": 8.317266147241034e-05, "tps": 65510, "wall": 23882.1} {"step": 23873, "train_loss": 3.243530511856079, "lr": 8.316021442474537e-05, "tps": 65500, "wall": 23887.1} {"step": 23874, "train_loss": 3.2024669647216797, "lr": 8.314776892720887e-05, "tps": 65489, "wall": 23892.0} {"step": 23875, "train_loss": 3.318636178970337, "lr": 8.313532497994192e-05, "tps": 65478, "wall": 23896.9} {"step": 23876, "train_loss": 3.2611947059631348, "lr": 8.312288258308537e-05, "tps": 65467, "wall": 23901.8} {"step": 23877, "train_loss": 3.264619827270508, "lr": 8.311044173678019e-05, "tps": 65457, "wall": 23906.7} {"step": 23878, "train_loss": 3.1729912757873535, "lr": 8.309800244116737e-05, "tps": 65446, "wall": 23911.7} {"step": 23879, "train_loss": 3.2221896648406982, "lr": 8.308556469638778e-05, "tps": 65435, "wall": 23916.6} {"step": 23880, "train_loss": 3.10601544380188, "lr": 8.307312850258227e-05, "tps": 65424, "wall": 23921.5} {"step": 23881, "train_loss": 3.2349250316619873, "lr": 8.306069385989182e-05, "tps": 65414, "wall": 23926.5} {"step": 23882, "train_loss": 3.3532087802886963, "lr": 8.304826076845724e-05, "tps": 65403, "wall": 23931.4} {"step": 23883, "train_loss": 3.190944194793701, "lr": 8.303582922841931e-05, "tps": 65392, "wall": 23936.3} {"step": 23884, "train_loss": 3.273754119873047, "lr": 8.302339923991899e-05, "tps": 65382, "wall": 23941.2} {"step": 23885, "train_loss": 3.207282066345215, "lr": 8.301097080309702e-05, "tps": 65371, "wall": 23946.1} {"step": 23886, "train_loss": 3.2369680404663086, "lr": 8.299854391809408e-05, "tps": 65360, "wall": 23951.0} {"step": 23887, "train_loss": 3.2558341026306152, "lr": 8.298611858505114e-05, "tps": 65350, "wall": 23955.9} {"step": 23888, "train_loss": 3.237807035446167, "lr": 8.297369480410885e-05, "tps": 65339, "wall": 23960.8} {"step": 23889, "train_loss": 3.220409870147705, "lr": 8.296127257540792e-05, "tps": 65328, "wall": 23965.8} {"step": 23890, "train_loss": 3.3572769165039062, "lr": 8.294885189908915e-05, "tps": 65318, "wall": 23970.7} {"step": 23891, "train_loss": 3.1931381225585938, "lr": 8.293643277529313e-05, "tps": 65307, "wall": 23975.6} {"step": 23892, "train_loss": 3.2890167236328125, "lr": 8.29240152041607e-05, "tps": 65296, "wall": 23980.6} {"step": 23893, "train_loss": 3.2553577423095703, "lr": 8.291159918583243e-05, "tps": 65286, "wall": 23985.5} {"step": 23894, "train_loss": 3.1880581378936768, "lr": 8.28991847204489e-05, "tps": 65275, "wall": 23990.4} {"step": 23895, "train_loss": 3.2760794162750244, "lr": 8.288677180815092e-05, "tps": 65264, "wall": 23995.3} {"step": 23896, "train_loss": 3.2962071895599365, "lr": 8.287436044907897e-05, "tps": 65254, "wall": 24000.2} {"step": 23897, "train_loss": 3.257452964782715, "lr": 8.286195064337366e-05, "tps": 65243, "wall": 24005.1} {"step": 23898, "train_loss": 3.3640799522399902, "lr": 8.284954239117561e-05, "tps": 65232, "wall": 24010.0} {"step": 23899, "train_loss": 3.1871066093444824, "lr": 8.28371356926254e-05, "tps": 65222, "wall": 24014.9} {"step": 23900, "train_loss": 3.2219698429107666, "lr": 8.282473054786346e-05, "tps": 65211, "wall": 24019.8} {"step": 23901, "train_loss": 3.2423527240753174, "lr": 8.281232695703045e-05, "tps": 65201, "wall": 24024.7} {"step": 23902, "train_loss": 3.292449951171875, "lr": 8.279992492026682e-05, "tps": 65190, "wall": 24029.6} {"step": 23903, "train_loss": 3.2469747066497803, "lr": 8.278752443771303e-05, "tps": 65179, "wall": 24034.6} {"step": 23904, "train_loss": 3.2500739097595215, "lr": 8.277512550950964e-05, "tps": 65169, "wall": 24039.5} {"step": 23905, "train_loss": 3.2824525833129883, "lr": 8.276272813579702e-05, "tps": 65158, "wall": 24044.5} {"step": 23906, "train_loss": 3.278343439102173, "lr": 8.27503323167156e-05, "tps": 65148, "wall": 24049.4} {"step": 23907, "train_loss": 3.13602352142334, "lr": 8.273793805240591e-05, "tps": 65137, "wall": 24054.3} {"step": 23908, "train_loss": 3.244561195373535, "lr": 8.272554534300821e-05, "tps": 65126, "wall": 24059.2} {"step": 23909, "train_loss": 3.195128917694092, "lr": 8.271315418866304e-05, "tps": 65116, "wall": 24064.1} {"step": 23910, "train_loss": 3.1833393573760986, "lr": 8.270076458951066e-05, "tps": 65105, "wall": 24069.0} {"step": 23911, "train_loss": 3.3113951683044434, "lr": 8.268837654569139e-05, "tps": 65095, "wall": 24073.9} {"step": 23912, "train_loss": 3.3138766288757324, "lr": 8.26759900573457e-05, "tps": 65084, "wall": 24078.8} {"step": 23913, "train_loss": 3.231644630432129, "lr": 8.266360512461378e-05, "tps": 65074, "wall": 24083.7} {"step": 23914, "train_loss": 3.233438491821289, "lr": 8.265122174763595e-05, "tps": 65063, "wall": 24088.6} {"step": 23915, "train_loss": 3.2212705612182617, "lr": 8.263883992655258e-05, "tps": 65053, "wall": 24093.5} {"step": 23916, "train_loss": 3.1759285926818848, "lr": 8.262645966150382e-05, "tps": 65042, "wall": 24098.5} {"step": 23917, "train_loss": 3.22678804397583, "lr": 8.261408095262993e-05, "tps": 65032, "wall": 24103.4} {"step": 23918, "train_loss": 3.257326602935791, "lr": 8.260170380007119e-05, "tps": 65021, "wall": 24108.3} {"step": 23919, "train_loss": 3.2407712936401367, "lr": 8.258932820396783e-05, "tps": 65011, "wall": 24113.2} {"step": 23920, "train_loss": 3.2317066192626953, "lr": 8.257695416445989e-05, "tps": 65000, "wall": 24118.1} {"step": 23921, "train_loss": 3.197671890258789, "lr": 8.256458168168773e-05, "tps": 64989, "wall": 24123.0} {"step": 23922, "train_loss": 3.2482187747955322, "lr": 8.255221075579142e-05, "tps": 64979, "wall": 24127.9} {"step": 23923, "train_loss": 3.3629214763641357, "lr": 8.253984138691105e-05, "tps": 64968, "wall": 24132.8} {"step": 23924, "train_loss": 3.2854413986206055, "lr": 8.252747357518684e-05, "tps": 64958, "wall": 24137.7} {"step": 23925, "train_loss": 3.2204246520996094, "lr": 8.251510732075885e-05, "tps": 64947, "wall": 24142.6} {"step": 23926, "train_loss": 3.351327896118164, "lr": 8.250274262376712e-05, "tps": 64937, "wall": 24147.5} {"step": 23927, "train_loss": 3.3661911487579346, "lr": 8.249037948435178e-05, "tps": 64927, "wall": 24152.4} {"step": 23928, "train_loss": 3.2838902473449707, "lr": 8.247801790265286e-05, "tps": 64916, "wall": 24157.4} {"step": 23929, "train_loss": 3.3640785217285156, "lr": 8.246565787881039e-05, "tps": 64905, "wall": 24162.3} {"step": 23930, "train_loss": 3.255384922027588, "lr": 8.245329941296442e-05, "tps": 64895, "wall": 24167.2} {"step": 23931, "train_loss": 3.202198028564453, "lr": 8.244094250525488e-05, "tps": 64884, "wall": 24172.1} {"step": 23932, "train_loss": 3.3026232719421387, "lr": 8.242858715582178e-05, "tps": 64874, "wall": 24177.1} {"step": 23933, "train_loss": 3.1607725620269775, "lr": 8.241623336480513e-05, "tps": 64863, "wall": 24182.0} {"step": 23934, "train_loss": 3.3242835998535156, "lr": 8.240388113234476e-05, "tps": 64853, "wall": 24186.9} {"step": 23935, "train_loss": 3.2560763359069824, "lr": 8.239153045858075e-05, "tps": 64843, "wall": 24191.8} {"step": 23936, "train_loss": 3.2247154712677, "lr": 8.23791813436529e-05, "tps": 64832, "wall": 24196.7} {"step": 23937, "train_loss": 3.2230944633483887, "lr": 8.236683378770108e-05, "tps": 64822, "wall": 24201.6} {"step": 23938, "train_loss": 3.1536989212036133, "lr": 8.235448779086528e-05, "tps": 64811, "wall": 24206.5} {"step": 23939, "train_loss": 3.27502179145813, "lr": 8.234214335328529e-05, "tps": 64801, "wall": 24211.4} {"step": 23940, "train_loss": 3.205533981323242, "lr": 8.232980047510088e-05, "tps": 64790, "wall": 24216.4} {"step": 23941, "train_loss": 3.244232654571533, "lr": 8.231745915645197e-05, "tps": 64780, "wall": 24221.3} {"step": 23942, "train_loss": 3.1692099571228027, "lr": 8.230511939747836e-05, "tps": 64769, "wall": 24226.2} {"step": 23943, "train_loss": 3.2612287998199463, "lr": 8.229278119831974e-05, "tps": 64759, "wall": 24231.1} {"step": 23944, "train_loss": 3.2524096965789795, "lr": 8.2280444559116e-05, "tps": 64749, "wall": 24236.0} {"step": 23945, "train_loss": 3.256239891052246, "lr": 8.226810948000681e-05, "tps": 64738, "wall": 24241.0} {"step": 23946, "train_loss": 3.3487181663513184, "lr": 8.225577596113197e-05, "tps": 64728, "wall": 24245.9} {"step": 23947, "train_loss": 3.32505202293396, "lr": 8.224344400263113e-05, "tps": 64717, "wall": 24250.8} {"step": 23948, "train_loss": 3.2620997428894043, "lr": 8.223111360464397e-05, "tps": 64707, "wall": 24255.7} {"step": 23949, "train_loss": 3.206990957260132, "lr": 8.221878476731024e-05, "tps": 64696, "wall": 24260.7} {"step": 23950, "train_loss": 3.221207618713379, "lr": 8.22064574907696e-05, "tps": 64686, "wall": 24265.7} {"step": 23951, "train_loss": 3.256920576095581, "lr": 8.21941317751616e-05, "tps": 64675, "wall": 24270.7} {"step": 23952, "train_loss": 3.058711528778076, "lr": 8.218180762062597e-05, "tps": 64664, "wall": 24275.7} {"step": 23953, "train_loss": 3.223097324371338, "lr": 8.216948502730229e-05, "tps": 64653, "wall": 24280.8} {"step": 23954, "train_loss": 3.303295612335205, "lr": 8.215716399533009e-05, "tps": 64643, "wall": 24285.9} {"step": 23955, "train_loss": 3.2312965393066406, "lr": 8.214484452484905e-05, "tps": 64632, "wall": 24290.9} {"step": 23956, "train_loss": 3.1986844539642334, "lr": 8.213252661599864e-05, "tps": 64621, "wall": 24296.0} {"step": 23957, "train_loss": 3.1334495544433594, "lr": 8.212021026891843e-05, "tps": 64610, "wall": 24301.1} {"step": 23958, "train_loss": 3.1970834732055664, "lr": 8.210789548374795e-05, "tps": 64599, "wall": 24306.2} {"step": 23959, "train_loss": 3.2649271488189697, "lr": 8.20955822606267e-05, "tps": 64589, "wall": 24311.3} {"step": 23960, "train_loss": 3.288182258605957, "lr": 8.20832705996941e-05, "tps": 64578, "wall": 24316.4} {"step": 23961, "train_loss": 3.2129929065704346, "lr": 8.207096050108972e-05, "tps": 64567, "wall": 24321.5} {"step": 23962, "train_loss": 3.317009925842285, "lr": 8.205865196495291e-05, "tps": 64556, "wall": 24326.6} {"step": 23963, "train_loss": 3.28338885307312, "lr": 8.204634499142321e-05, "tps": 64545, "wall": 24331.6} {"step": 23964, "train_loss": 3.225609302520752, "lr": 8.203403958063996e-05, "tps": 64534, "wall": 24336.8} {"step": 23965, "train_loss": 3.2436628341674805, "lr": 8.202173573274254e-05, "tps": 64523, "wall": 24341.9} {"step": 23966, "train_loss": 3.200159788131714, "lr": 8.200943344787042e-05, "tps": 64513, "wall": 24347.0} {"step": 23967, "train_loss": 3.268965244293213, "lr": 8.19971327261629e-05, "tps": 64502, "wall": 24352.1} {"step": 23968, "train_loss": 3.241307258605957, "lr": 8.198483356775926e-05, "tps": 64491, "wall": 24357.2} {"step": 23969, "train_loss": 3.235158681869507, "lr": 8.197253597279893e-05, "tps": 64480, "wall": 24362.3} {"step": 23970, "train_loss": 3.269061803817749, "lr": 8.196023994142122e-05, "tps": 64469, "wall": 24367.4} {"step": 23971, "train_loss": 3.2180416584014893, "lr": 8.194794547376531e-05, "tps": 64458, "wall": 24372.5} {"step": 23972, "train_loss": 3.2983286380767822, "lr": 8.19356525699706e-05, "tps": 64448, "wall": 24377.7} {"step": 23973, "train_loss": 3.3171937465667725, "lr": 8.192336123017626e-05, "tps": 64437, "wall": 24382.8} {"step": 23974, "train_loss": 3.2116522789001465, "lr": 8.191107145452152e-05, "tps": 64426, "wall": 24387.9} {"step": 23975, "train_loss": 3.2287209033966064, "lr": 8.189878324314568e-05, "tps": 64415, "wall": 24393.0} {"step": 23976, "train_loss": 3.205397129058838, "lr": 8.188649659618793e-05, "tps": 64404, "wall": 24398.1} {"step": 23977, "train_loss": 3.0960769653320312, "lr": 8.187421151378732e-05, "tps": 64394, "wall": 24403.2} {"step": 23978, "train_loss": 3.134847402572632, "lr": 8.186192799608318e-05, "tps": 64383, "wall": 24408.3} {"step": 23979, "train_loss": 3.2475674152374268, "lr": 8.18496460432146e-05, "tps": 64372, "wall": 24413.4} {"step": 23980, "train_loss": 3.1728110313415527, "lr": 8.183736565532065e-05, "tps": 64361, "wall": 24418.5} {"step": 23981, "train_loss": 3.2640483379364014, "lr": 8.182508683254056e-05, "tps": 64351, "wall": 24423.6} {"step": 23982, "train_loss": 3.256349563598633, "lr": 8.181280957501329e-05, "tps": 64340, "wall": 24428.7} {"step": 23983, "train_loss": 3.2409024238586426, "lr": 8.180053388287803e-05, "tps": 64329, "wall": 24433.8} {"step": 23984, "train_loss": 3.336055040359497, "lr": 8.178825975627382e-05, "tps": 64318, "wall": 24438.9} {"step": 23985, "train_loss": 3.2800230979919434, "lr": 8.177598719533963e-05, "tps": 64308, "wall": 24444.0} {"step": 23986, "train_loss": 3.325984477996826, "lr": 8.176371620021458e-05, "tps": 64297, "wall": 24449.1} {"step": 23987, "train_loss": 3.236827850341797, "lr": 8.175144677103763e-05, "tps": 64286, "wall": 24454.2} {"step": 23988, "train_loss": 3.347593307495117, "lr": 8.173917890794773e-05, "tps": 64275, "wall": 24459.3} {"step": 23989, "train_loss": 3.2458128929138184, "lr": 8.172691261108392e-05, "tps": 64265, "wall": 24464.4} {"step": 23990, "train_loss": 3.2273988723754883, "lr": 8.171464788058514e-05, "tps": 64254, "wall": 24469.5} {"step": 23991, "train_loss": 3.211820125579834, "lr": 8.170238471659026e-05, "tps": 64243, "wall": 24474.6} {"step": 23992, "train_loss": 3.2831926345825195, "lr": 8.169012311923829e-05, "tps": 64232, "wall": 24479.7} {"step": 23993, "train_loss": 3.168623447418213, "lr": 8.167786308866809e-05, "tps": 64222, "wall": 24484.8} {"step": 23994, "train_loss": 3.0860238075256348, "lr": 8.16656046250185e-05, "tps": 64211, "wall": 24489.9} {"step": 23995, "train_loss": 3.170144557952881, "lr": 8.165334772842848e-05, "tps": 64201, "wall": 24495.0} {"step": 23996, "train_loss": 3.317824125289917, "lr": 8.164109239903679e-05, "tps": 64190, "wall": 24500.0} {"step": 23997, "train_loss": 3.32759428024292, "lr": 8.162883863698226e-05, "tps": 64179, "wall": 24505.1} {"step": 23998, "train_loss": 3.1523921489715576, "lr": 8.161658644240378e-05, "tps": 64169, "wall": 24510.3} {"step": 23999, "train_loss": 3.2508726119995117, "lr": 8.160433581544006e-05, "tps": 64158, "wall": 24515.3} {"step": 24000, "train_loss": 3.258211135864258, "lr": 8.159208675622994e-05, "tps": 64147, "wall": 24520.5, "val_loss_monitor": 3.321788123588601} {"step": 24001, "train_loss": 3.3179445266723633, "lr": 8.157983926491218e-05, "tps": 64006, "wall": 24575.5} {"step": 24002, "train_loss": 3.235521078109741, "lr": 8.15675933416254e-05, "tps": 63995, "wall": 24580.7} {"step": 24003, "train_loss": 3.310946464538574, "lr": 8.155534898650848e-05, "tps": 63984, "wall": 24585.9} {"step": 24004, "train_loss": 3.1866188049316406, "lr": 8.154310619970004e-05, "tps": 63974, "wall": 24591.0} {"step": 24005, "train_loss": 3.3282477855682373, "lr": 8.153086498133873e-05, "tps": 63963, "wall": 24596.1} {"step": 24006, "train_loss": 3.3150477409362793, "lr": 8.151862533156335e-05, "tps": 63953, "wall": 24601.2} {"step": 24007, "train_loss": 3.172457456588745, "lr": 8.150638725051245e-05, "tps": 63942, "wall": 24606.3} {"step": 24008, "train_loss": 3.2550907135009766, "lr": 8.149415073832467e-05, "tps": 63931, "wall": 24611.4} {"step": 24009, "train_loss": 3.163425922393799, "lr": 8.148191579513869e-05, "tps": 63921, "wall": 24616.6} {"step": 24010, "train_loss": 3.276440143585205, "lr": 8.146968242109303e-05, "tps": 63910, "wall": 24621.7} {"step": 24011, "train_loss": 3.2610888481140137, "lr": 8.145745061632627e-05, "tps": 63900, "wall": 24626.7} {"step": 24012, "train_loss": 3.2974233627319336, "lr": 8.144522038097703e-05, "tps": 63889, "wall": 24631.8} {"step": 24013, "train_loss": 3.2796823978424072, "lr": 8.143299171518387e-05, "tps": 63878, "wall": 24637.0} {"step": 24014, "train_loss": 3.2339258193969727, "lr": 8.142076461908521e-05, "tps": 63868, "wall": 24642.1} {"step": 24015, "train_loss": 3.181210517883301, "lr": 8.140853909281966e-05, "tps": 63857, "wall": 24647.2} {"step": 24016, "train_loss": 3.209588050842285, "lr": 8.139631513652568e-05, "tps": 63847, "wall": 24652.3} {"step": 24017, "train_loss": 3.2083497047424316, "lr": 8.138409275034171e-05, "tps": 63836, "wall": 24657.4} {"step": 24018, "train_loss": 3.1437344551086426, "lr": 8.137187193440627e-05, "tps": 63826, "wall": 24662.5} {"step": 24019, "train_loss": 3.247269630432129, "lr": 8.135965268885773e-05, "tps": 63815, "wall": 24667.6} {"step": 24020, "train_loss": 3.27468204498291, "lr": 8.13474350138346e-05, "tps": 63805, "wall": 24672.6} {"step": 24021, "train_loss": 3.229468822479248, "lr": 8.13352189094752e-05, "tps": 63794, "wall": 24677.7} {"step": 24022, "train_loss": 3.2776308059692383, "lr": 8.132300437591789e-05, "tps": 63784, "wall": 24682.8} {"step": 24023, "train_loss": 3.2454140186309814, "lr": 8.131079141330116e-05, "tps": 63773, "wall": 24687.9} {"step": 24024, "train_loss": 3.164177417755127, "lr": 8.129858002176329e-05, "tps": 63762, "wall": 24693.0} {"step": 24025, "train_loss": 3.2426350116729736, "lr": 8.12863702014426e-05, "tps": 63752, "wall": 24698.2} {"step": 24026, "train_loss": 3.248096466064453, "lr": 8.127416195247741e-05, "tps": 63741, "wall": 24703.3} {"step": 24027, "train_loss": 3.1360507011413574, "lr": 8.126195527500597e-05, "tps": 63731, "wall": 24708.4} {"step": 24028, "train_loss": 3.2834315299987793, "lr": 8.124975016916666e-05, "tps": 63720, "wall": 24713.5} {"step": 24029, "train_loss": 3.243295192718506, "lr": 8.123754663509768e-05, "tps": 63710, "wall": 24718.6} {"step": 24030, "train_loss": 3.2568087577819824, "lr": 8.122534467293723e-05, "tps": 63699, "wall": 24723.7} {"step": 24031, "train_loss": 3.17763352394104, "lr": 8.121314428282363e-05, "tps": 63689, "wall": 24728.8} {"step": 24032, "train_loss": 3.3391566276550293, "lr": 8.120094546489505e-05, "tps": 63678, "wall": 24733.9} {"step": 24033, "train_loss": 3.2724838256835938, "lr": 8.118874821928961e-05, "tps": 63668, "wall": 24739.0} {"step": 24034, "train_loss": 3.251758098602295, "lr": 8.117655254614561e-05, "tps": 63658, "wall": 24744.1} {"step": 24035, "train_loss": 3.246293067932129, "lr": 8.116435844560109e-05, "tps": 63647, "wall": 24749.2} {"step": 24036, "train_loss": 3.1022515296936035, "lr": 8.115216591779422e-05, "tps": 63637, "wall": 24754.2} {"step": 24037, "train_loss": 3.1807327270507812, "lr": 8.113997496286317e-05, "tps": 63626, "wall": 24759.4} {"step": 24038, "train_loss": 3.184596061706543, "lr": 8.112778558094597e-05, "tps": 63615, "wall": 24764.6} {"step": 24039, "train_loss": 3.2197892665863037, "lr": 8.11155977721807e-05, "tps": 63605, "wall": 24769.7} {"step": 24040, "train_loss": 3.2456698417663574, "lr": 8.110341153670548e-05, "tps": 63594, "wall": 24774.8} {"step": 24041, "train_loss": 3.265808343887329, "lr": 8.10912268746583e-05, "tps": 63584, "wall": 24779.9} {"step": 24042, "train_loss": 3.2329792976379395, "lr": 8.107904378617725e-05, "tps": 63574, "wall": 24785.0} {"step": 24043, "train_loss": 3.253767490386963, "lr": 8.106686227140033e-05, "tps": 63563, "wall": 24790.1} {"step": 24044, "train_loss": 3.21820068359375, "lr": 8.105468233046547e-05, "tps": 63553, "wall": 24795.2} {"step": 24045, "train_loss": 3.328834056854248, "lr": 8.10425039635107e-05, "tps": 63542, "wall": 24800.2} {"step": 24046, "train_loss": 3.124793291091919, "lr": 8.103032717067399e-05, "tps": 63532, "wall": 24805.3} {"step": 24047, "train_loss": 3.1953043937683105, "lr": 8.101815195209319e-05, "tps": 63522, "wall": 24810.4} {"step": 24048, "train_loss": 3.1287143230438232, "lr": 8.100597830790633e-05, "tps": 63511, "wall": 24815.5} {"step": 24049, "train_loss": 3.240938663482666, "lr": 8.099380623825125e-05, "tps": 63501, "wall": 24820.7} {"step": 24050, "train_loss": 3.403535842895508, "lr": 8.098163574326583e-05, "tps": 63490, "wall": 24825.8} {"step": 24051, "train_loss": 3.204904556274414, "lr": 8.0969466823088e-05, "tps": 63480, "wall": 24830.9} {"step": 24052, "train_loss": 3.2373390197753906, "lr": 8.095729947785559e-05, "tps": 63469, "wall": 24836.0} {"step": 24053, "train_loss": 3.2411582469940186, "lr": 8.094513370770636e-05, "tps": 63459, "wall": 24841.1} {"step": 24054, "train_loss": 3.1859703063964844, "lr": 8.09329695127782e-05, "tps": 63449, "wall": 24846.2} {"step": 24055, "train_loss": 3.3205947875976562, "lr": 8.092080689320891e-05, "tps": 63438, "wall": 24851.3} {"step": 24056, "train_loss": 3.227062702178955, "lr": 8.090864584913618e-05, "tps": 63428, "wall": 24856.4} {"step": 24057, "train_loss": 3.2354655265808105, "lr": 8.089648638069788e-05, "tps": 63417, "wall": 24861.5} {"step": 24058, "train_loss": 3.2348289489746094, "lr": 8.088432848803172e-05, "tps": 63407, "wall": 24866.6} {"step": 24059, "train_loss": 3.453648328781128, "lr": 8.087217217127536e-05, "tps": 63397, "wall": 24871.7} {"step": 24060, "train_loss": 3.2207753658294678, "lr": 8.086001743056661e-05, "tps": 63386, "wall": 24876.9} {"step": 24061, "train_loss": 3.2783427238464355, "lr": 8.084786426604307e-05, "tps": 63376, "wall": 24882.0} {"step": 24062, "train_loss": 3.316763162612915, "lr": 8.083571267784248e-05, "tps": 63365, "wall": 24887.1} {"step": 24063, "train_loss": 3.1716105937957764, "lr": 8.08235626661025e-05, "tps": 63355, "wall": 24892.2} {"step": 24064, "train_loss": 3.193815231323242, "lr": 8.081141423096063e-05, "tps": 63345, "wall": 24897.4} {"step": 24065, "train_loss": 3.305377721786499, "lr": 8.079926737255468e-05, "tps": 63334, "wall": 24902.5} {"step": 24066, "train_loss": 3.274604320526123, "lr": 8.078712209102214e-05, "tps": 63324, "wall": 24907.6} {"step": 24067, "train_loss": 3.254100799560547, "lr": 8.077497838650058e-05, "tps": 63314, "wall": 24912.6} {"step": 24068, "train_loss": 3.3388352394104004, "lr": 8.076283625912764e-05, "tps": 63303, "wall": 24917.7} {"step": 24069, "train_loss": 3.206312417984009, "lr": 8.075069570904082e-05, "tps": 63293, "wall": 24922.8} {"step": 24070, "train_loss": 3.206958770751953, "lr": 8.07385567363776e-05, "tps": 63283, "wall": 24927.9} {"step": 24071, "train_loss": 3.158966302871704, "lr": 8.072641934127558e-05, "tps": 63272, "wall": 24933.0} {"step": 24072, "train_loss": 3.2320914268493652, "lr": 8.071428352387225e-05, "tps": 63262, "wall": 24938.2} {"step": 24073, "train_loss": 3.2198381423950195, "lr": 8.070214928430498e-05, "tps": 63251, "wall": 24943.3} {"step": 24074, "train_loss": 3.2629241943359375, "lr": 8.069001662271136e-05, "tps": 63241, "wall": 24948.4} {"step": 24075, "train_loss": 3.2036690711975098, "lr": 8.067788553922875e-05, "tps": 63231, "wall": 24953.6} {"step": 24076, "train_loss": 3.307929039001465, "lr": 8.066575603399455e-05, "tps": 63220, "wall": 24958.7} {"step": 24077, "train_loss": 3.2702322006225586, "lr": 8.065362810714627e-05, "tps": 63210, "wall": 24963.8} {"step": 24078, "train_loss": 3.214366912841797, "lr": 8.064150175882115e-05, "tps": 63200, "wall": 24968.9} {"step": 24079, "train_loss": 3.2723236083984375, "lr": 8.06293769891567e-05, "tps": 63190, "wall": 24973.9} {"step": 24080, "train_loss": 3.1601433753967285, "lr": 8.061725379829021e-05, "tps": 63179, "wall": 24979.0} {"step": 24081, "train_loss": 3.3018250465393066, "lr": 8.060513218635896e-05, "tps": 63169, "wall": 24984.1} {"step": 24082, "train_loss": 3.320192813873291, "lr": 8.059301215350035e-05, "tps": 63159, "wall": 24989.2} {"step": 24083, "train_loss": 3.179143190383911, "lr": 8.058089369985166e-05, "tps": 63149, "wall": 24994.3} {"step": 24084, "train_loss": 3.0670459270477295, "lr": 8.05687768255501e-05, "tps": 63138, "wall": 24999.5} {"step": 24085, "train_loss": 3.3133459091186523, "lr": 8.055666153073303e-05, "tps": 63128, "wall": 25004.6} {"step": 24086, "train_loss": 3.281993865966797, "lr": 8.05445478155376e-05, "tps": 63118, "wall": 25009.8} {"step": 24087, "train_loss": 3.208714008331299, "lr": 8.053243568010107e-05, "tps": 63107, "wall": 25014.9} {"step": 24088, "train_loss": 3.1962826251983643, "lr": 8.052032512456069e-05, "tps": 63097, "wall": 25020.0} {"step": 24089, "train_loss": 3.1836118698120117, "lr": 8.050821614905362e-05, "tps": 63087, "wall": 25025.1} {"step": 24090, "train_loss": 3.1922473907470703, "lr": 8.049610875371697e-05, "tps": 63076, "wall": 25030.2} {"step": 24091, "train_loss": 3.243997097015381, "lr": 8.048400293868799e-05, "tps": 63066, "wall": 25035.3} {"step": 24092, "train_loss": 3.204221725463867, "lr": 8.04718987041038e-05, "tps": 63056, "wall": 25040.4} {"step": 24093, "train_loss": 3.213002920150757, "lr": 8.045979605010139e-05, "tps": 63046, "wall": 25045.5} {"step": 24094, "train_loss": 3.2879481315612793, "lr": 8.044769497681806e-05, "tps": 63035, "wall": 25050.6} {"step": 24095, "train_loss": 3.2050201892852783, "lr": 8.04355954843907e-05, "tps": 63025, "wall": 25055.7} {"step": 24096, "train_loss": 3.316969394683838, "lr": 8.042349757295654e-05, "tps": 63015, "wall": 25060.9} {"step": 24097, "train_loss": 3.1553237438201904, "lr": 8.041140124265253e-05, "tps": 63005, "wall": 25066.0} {"step": 24098, "train_loss": 3.221137762069702, "lr": 8.039930649361568e-05, "tps": 62994, "wall": 25071.1} {"step": 24099, "train_loss": 3.2704601287841797, "lr": 8.03872133259831e-05, "tps": 62984, "wall": 25076.2} {"step": 24100, "train_loss": 3.2403597831726074, "lr": 8.037512173989172e-05, "tps": 62974, "wall": 25081.3} {"step": 24101, "train_loss": 3.1560122966766357, "lr": 8.036303173547845e-05, "tps": 62964, "wall": 25086.4} {"step": 24102, "train_loss": 3.2678780555725098, "lr": 8.035094331288035e-05, "tps": 62954, "wall": 25091.5} {"step": 24103, "train_loss": 3.3047804832458496, "lr": 8.033885647223434e-05, "tps": 62944, "wall": 25096.6} {"step": 24104, "train_loss": 3.1173343658447266, "lr": 8.032677121367726e-05, "tps": 62933, "wall": 25101.7} {"step": 24105, "train_loss": 3.215348243713379, "lr": 8.031468753734612e-05, "tps": 62923, "wall": 25106.8} {"step": 24106, "train_loss": 3.2275054454803467, "lr": 8.030260544337778e-05, "tps": 62913, "wall": 25111.9} {"step": 24107, "train_loss": 3.2018966674804688, "lr": 8.029052493190901e-05, "tps": 62903, "wall": 25117.1} {"step": 24108, "train_loss": 3.3009378910064697, "lr": 8.027844600307678e-05, "tps": 62893, "wall": 25122.1} {"step": 24109, "train_loss": 3.315490961074829, "lr": 8.026636865701788e-05, "tps": 62882, "wall": 25127.3} {"step": 24110, "train_loss": 3.2860469818115234, "lr": 8.025429289386908e-05, "tps": 62872, "wall": 25132.4} {"step": 24111, "train_loss": 3.331995964050293, "lr": 8.024221871376723e-05, "tps": 62862, "wall": 25137.6} {"step": 24112, "train_loss": 3.191967010498047, "lr": 8.02301461168491e-05, "tps": 62852, "wall": 25142.7} {"step": 24113, "train_loss": 3.2614548206329346, "lr": 8.021807510325139e-05, "tps": 62841, "wall": 25147.8} {"step": 24114, "train_loss": 3.282705783843994, "lr": 8.020600567311094e-05, "tps": 62831, "wall": 25152.8} {"step": 24115, "train_loss": 3.3160524368286133, "lr": 8.019393782656435e-05, "tps": 62821, "wall": 25157.9} {"step": 24116, "train_loss": 3.1498095989227295, "lr": 8.018187156374846e-05, "tps": 62811, "wall": 25163.0} {"step": 24117, "train_loss": 3.229288101196289, "lr": 8.016980688479991e-05, "tps": 62801, "wall": 25168.1} {"step": 24118, "train_loss": 3.208364248275757, "lr": 8.015774378985528e-05, "tps": 62791, "wall": 25173.2} {"step": 24119, "train_loss": 3.21451473236084, "lr": 8.014568227905134e-05, "tps": 62781, "wall": 25178.4} {"step": 24120, "train_loss": 3.165170192718506, "lr": 8.013362235252469e-05, "tps": 62770, "wall": 25183.5} {"step": 24121, "train_loss": 3.174226999282837, "lr": 8.012156401041189e-05, "tps": 62760, "wall": 25188.7} {"step": 24122, "train_loss": 3.290787935256958, "lr": 8.010950725284963e-05, "tps": 62750, "wall": 25193.7} {"step": 24123, "train_loss": 3.1782524585723877, "lr": 8.009745207997441e-05, "tps": 62740, "wall": 25198.8} {"step": 24124, "train_loss": 3.306576728820801, "lr": 8.00853984919228e-05, "tps": 62730, "wall": 25203.9} {"step": 24125, "train_loss": 3.195796489715576, "lr": 8.00733464888314e-05, "tps": 62720, "wall": 25209.0} {"step": 24126, "train_loss": 3.11198353767395, "lr": 8.006129607083672e-05, "tps": 62710, "wall": 25214.1} {"step": 24127, "train_loss": 3.209230422973633, "lr": 8.004924723807519e-05, "tps": 62700, "wall": 25219.2} {"step": 24128, "train_loss": 3.1733450889587402, "lr": 8.00371999906834e-05, "tps": 62690, "wall": 25224.3} {"step": 24129, "train_loss": 3.292426109313965, "lr": 8.00251543287978e-05, "tps": 62680, "wall": 25229.4} {"step": 24130, "train_loss": 3.2618181705474854, "lr": 8.001311025255473e-05, "tps": 62670, "wall": 25234.5} {"step": 24131, "train_loss": 3.2825565338134766, "lr": 8.000106776209081e-05, "tps": 62659, "wall": 25239.7} {"step": 24132, "train_loss": 3.470691680908203, "lr": 7.998902685754231e-05, "tps": 62649, "wall": 25244.8} {"step": 24133, "train_loss": 3.2133700847625732, "lr": 7.997698753904572e-05, "tps": 62639, "wall": 25249.9} {"step": 24134, "train_loss": 3.280092477798462, "lr": 7.996494980673743e-05, "tps": 62629, "wall": 25255.0} {"step": 24135, "train_loss": 3.1717703342437744, "lr": 7.995291366075369e-05, "tps": 62619, "wall": 25260.1} {"step": 24136, "train_loss": 3.192317008972168, "lr": 7.994087910123096e-05, "tps": 62609, "wall": 25265.2} {"step": 24137, "train_loss": 3.2558844089508057, "lr": 7.992884612830553e-05, "tps": 62599, "wall": 25270.3} {"step": 24138, "train_loss": 3.255722761154175, "lr": 7.991681474211367e-05, "tps": 62589, "wall": 25275.4} {"step": 24139, "train_loss": 3.133040428161621, "lr": 7.990478494279177e-05, "tps": 62579, "wall": 25280.5} {"step": 24140, "train_loss": 3.227952241897583, "lr": 7.989275673047604e-05, "tps": 62569, "wall": 25285.6} {"step": 24141, "train_loss": 3.2006640434265137, "lr": 7.988073010530269e-05, "tps": 62559, "wall": 25290.7} {"step": 24142, "train_loss": 3.2435855865478516, "lr": 7.986870506740805e-05, "tps": 62549, "wall": 25295.8} {"step": 24143, "train_loss": 3.292451858520508, "lr": 7.98566816169283e-05, "tps": 62539, "wall": 25301.0} {"step": 24144, "train_loss": 3.0953283309936523, "lr": 7.984465975399959e-05, "tps": 62528, "wall": 25306.1} {"step": 24145, "train_loss": 3.376555919647217, "lr": 7.983263947875823e-05, "tps": 62519, "wall": 25311.2} {"step": 24146, "train_loss": 3.154231071472168, "lr": 7.98206207913403e-05, "tps": 62509, "wall": 25316.3} {"step": 24147, "train_loss": 3.1726272106170654, "lr": 7.980860369188189e-05, "tps": 62499, "wall": 25321.4} {"step": 24148, "train_loss": 3.262000799179077, "lr": 7.979658818051927e-05, "tps": 62489, "wall": 25326.5} {"step": 24149, "train_loss": 3.243520975112915, "lr": 7.978457425738843e-05, "tps": 62479, "wall": 25331.6} {"step": 24150, "train_loss": 3.209449291229248, "lr": 7.977256192262559e-05, "tps": 62469, "wall": 25336.7} {"step": 24151, "train_loss": 3.27665376663208, "lr": 7.976055117636674e-05, "tps": 62459, "wall": 25341.8} {"step": 24152, "train_loss": 3.1643049716949463, "lr": 7.97485420187479e-05, "tps": 62449, "wall": 25346.9} {"step": 24153, "train_loss": 3.33551287651062, "lr": 7.973653444990521e-05, "tps": 62439, "wall": 25352.0} {"step": 24154, "train_loss": 3.25955867767334, "lr": 7.972452846997463e-05, "tps": 62428, "wall": 25357.2} {"step": 24155, "train_loss": 3.306251287460327, "lr": 7.971252407909216e-05, "tps": 62419, "wall": 25362.3} {"step": 24156, "train_loss": 3.1678085327148438, "lr": 7.970052127739385e-05, "tps": 62408, "wall": 25367.4} {"step": 24157, "train_loss": 3.319828510284424, "lr": 7.968852006501564e-05, "tps": 62399, "wall": 25372.5} {"step": 24158, "train_loss": 3.2759923934936523, "lr": 7.967652044209338e-05, "tps": 62389, "wall": 25377.6} {"step": 24159, "train_loss": 3.2992448806762695, "lr": 7.966452240876314e-05, "tps": 62379, "wall": 25382.7} {"step": 24160, "train_loss": 3.1827433109283447, "lr": 7.96525259651608e-05, "tps": 62369, "wall": 25387.8} {"step": 24161, "train_loss": 3.140462875366211, "lr": 7.96405311114222e-05, "tps": 62359, "wall": 25392.9} {"step": 24162, "train_loss": 3.1797335147857666, "lr": 7.962853784768326e-05, "tps": 62349, "wall": 25398.0} {"step": 24163, "train_loss": 3.149583339691162, "lr": 7.96165461740799e-05, "tps": 62339, "wall": 25403.0} {"step": 24164, "train_loss": 3.2461819648742676, "lr": 7.960455609074782e-05, "tps": 62329, "wall": 25408.1} {"step": 24165, "train_loss": 3.2223916053771973, "lr": 7.959256759782297e-05, "tps": 62319, "wall": 25413.2} {"step": 24166, "train_loss": 3.246840000152588, "lr": 7.95805806954411e-05, "tps": 62309, "wall": 25418.4} {"step": 24167, "train_loss": 3.1428797245025635, "lr": 7.956859538373798e-05, "tps": 62299, "wall": 25423.5} {"step": 24168, "train_loss": 3.2494986057281494, "lr": 7.955661166284946e-05, "tps": 62289, "wall": 25428.6} {"step": 24169, "train_loss": 3.13838267326355, "lr": 7.954462953291118e-05, "tps": 62279, "wall": 25433.7} {"step": 24170, "train_loss": 3.209009885787964, "lr": 7.953264899405898e-05, "tps": 62269, "wall": 25438.8} {"step": 24171, "train_loss": 3.272660255432129, "lr": 7.952067004642854e-05, "tps": 62260, "wall": 25443.9} {"step": 24172, "train_loss": 3.2142012119293213, "lr": 7.950869269015549e-05, "tps": 62250, "wall": 25449.0} {"step": 24173, "train_loss": 3.2209086418151855, "lr": 7.949671692537562e-05, "tps": 62240, "wall": 25454.1} {"step": 24174, "train_loss": 3.26547908782959, "lr": 7.948474275222457e-05, "tps": 62230, "wall": 25459.1} {"step": 24175, "train_loss": 3.294734001159668, "lr": 7.94727701708379e-05, "tps": 62220, "wall": 25464.2} {"step": 24176, "train_loss": 3.28450345993042, "lr": 7.946079918135129e-05, "tps": 62210, "wall": 25469.3} {"step": 24177, "train_loss": 3.302013874053955, "lr": 7.944882978390041e-05, "tps": 62200, "wall": 25474.4} {"step": 24178, "train_loss": 3.0723509788513184, "lr": 7.94368619786207e-05, "tps": 62190, "wall": 25479.6} {"step": 24179, "train_loss": 3.382762908935547, "lr": 7.942489576564789e-05, "tps": 62181, "wall": 25484.6} {"step": 24180, "train_loss": 3.2751173973083496, "lr": 7.941293114511745e-05, "tps": 62171, "wall": 25489.8} {"step": 24181, "train_loss": 3.2336697578430176, "lr": 7.94009681171649e-05, "tps": 62161, "wall": 25494.9} {"step": 24182, "train_loss": 3.2946479320526123, "lr": 7.938900668192585e-05, "tps": 62151, "wall": 25499.9} {"step": 24183, "train_loss": 3.2101285457611084, "lr": 7.937704683953573e-05, "tps": 62141, "wall": 25505.1} {"step": 24184, "train_loss": 3.222860336303711, "lr": 7.936508859012997e-05, "tps": 62131, "wall": 25510.1} {"step": 24185, "train_loss": 3.2275781631469727, "lr": 7.935313193384415e-05, "tps": 62121, "wall": 25515.2} {"step": 24186, "train_loss": 3.2046995162963867, "lr": 7.934117687081362e-05, "tps": 62112, "wall": 25520.3} {"step": 24187, "train_loss": 3.276721715927124, "lr": 7.932922340117386e-05, "tps": 62102, "wall": 25525.4} {"step": 24188, "train_loss": 3.159611701965332, "lr": 7.931727152506032e-05, "tps": 62092, "wall": 25530.5} {"step": 24189, "train_loss": 3.199941635131836, "lr": 7.930532124260825e-05, "tps": 62082, "wall": 25535.6} {"step": 24190, "train_loss": 3.2177188396453857, "lr": 7.929337255395317e-05, "tps": 62072, "wall": 25540.8} {"step": 24191, "train_loss": 3.201174736022949, "lr": 7.92814254592304e-05, "tps": 62062, "wall": 25545.9} {"step": 24192, "train_loss": 3.221118927001953, "lr": 7.926947995857523e-05, "tps": 62052, "wall": 25551.0} {"step": 24193, "train_loss": 3.280484199523926, "lr": 7.925753605212302e-05, "tps": 62043, "wall": 25556.1} {"step": 24194, "train_loss": 3.208768367767334, "lr": 7.9245593740009e-05, "tps": 62033, "wall": 25561.2} {"step": 24195, "train_loss": 3.1579055786132812, "lr": 7.923365302236855e-05, "tps": 62023, "wall": 25566.3} {"step": 24196, "train_loss": 3.245619058609009, "lr": 7.922171389933692e-05, "tps": 62013, "wall": 25571.3} {"step": 24197, "train_loss": 3.265636682510376, "lr": 7.920977637104924e-05, "tps": 62003, "wall": 25576.4} {"step": 24198, "train_loss": 3.383852481842041, "lr": 7.919784043764092e-05, "tps": 61994, "wall": 25581.5} {"step": 24199, "train_loss": 3.3356971740722656, "lr": 7.918590609924707e-05, "tps": 61984, "wall": 25586.6} {"step": 24200, "train_loss": 3.308636426925659, "lr": 7.917397335600284e-05, "tps": 61974, "wall": 25591.7} {"step": 24201, "train_loss": 3.2073915004730225, "lr": 7.916204220804348e-05, "tps": 61964, "wall": 25596.9} {"step": 24202, "train_loss": 3.2869744300842285, "lr": 7.915011265550419e-05, "tps": 61954, "wall": 25602.0} {"step": 24203, "train_loss": 3.150601863861084, "lr": 7.913818469851992e-05, "tps": 61945, "wall": 25607.1} {"step": 24204, "train_loss": 3.205369710922241, "lr": 7.9126258337226e-05, "tps": 61935, "wall": 25612.2} {"step": 24205, "train_loss": 3.3716044425964355, "lr": 7.911433357175746e-05, "tps": 61925, "wall": 25617.2} {"step": 24206, "train_loss": 3.204921245574951, "lr": 7.910241040224931e-05, "tps": 61915, "wall": 25622.3} {"step": 24207, "train_loss": 3.391988754272461, "lr": 7.909048882883673e-05, "tps": 61906, "wall": 25627.5} {"step": 24208, "train_loss": 3.2253339290618896, "lr": 7.90785688516547e-05, "tps": 61896, "wall": 25632.5} {"step": 24209, "train_loss": 3.2026290893554688, "lr": 7.906665047083824e-05, "tps": 61886, "wall": 25637.6} {"step": 24210, "train_loss": 3.2293543815612793, "lr": 7.905473368652242e-05, "tps": 61876, "wall": 25642.7} {"step": 24211, "train_loss": 3.202409505844116, "lr": 7.904281849884214e-05, "tps": 61867, "wall": 25647.8} {"step": 24212, "train_loss": 3.2502670288085938, "lr": 7.903090490793252e-05, "tps": 61857, "wall": 25653.0} {"step": 24213, "train_loss": 3.2127599716186523, "lr": 7.90189929139284e-05, "tps": 61847, "wall": 25658.1} {"step": 24214, "train_loss": 3.2402498722076416, "lr": 7.900708251696473e-05, "tps": 61837, "wall": 25663.2} {"step": 24215, "train_loss": 3.261162281036377, "lr": 7.89951737171765e-05, "tps": 61828, "wall": 25668.3} {"step": 24216, "train_loss": 3.3076446056365967, "lr": 7.898326651469856e-05, "tps": 61818, "wall": 25673.4} {"step": 24217, "train_loss": 3.263214588165283, "lr": 7.897136090966577e-05, "tps": 61808, "wall": 25678.5} {"step": 24218, "train_loss": 3.228116750717163, "lr": 7.895945690221309e-05, "tps": 61798, "wall": 25683.6} {"step": 24219, "train_loss": 3.2135512828826904, "lr": 7.894755449247529e-05, "tps": 61789, "wall": 25688.7} {"step": 24220, "train_loss": 3.2227210998535156, "lr": 7.89356536805872e-05, "tps": 61779, "wall": 25693.7} {"step": 24221, "train_loss": 3.2544901371002197, "lr": 7.89237544666837e-05, "tps": 61769, "wall": 25698.9} {"step": 24222, "train_loss": 3.2270941734313965, "lr": 7.891185685089952e-05, "tps": 61760, "wall": 25703.9} {"step": 24223, "train_loss": 3.3336637020111084, "lr": 7.889996083336942e-05, "tps": 61750, "wall": 25709.0} {"step": 24224, "train_loss": 3.259113311767578, "lr": 7.888806641422825e-05, "tps": 61740, "wall": 25714.1} {"step": 24225, "train_loss": 3.1067795753479004, "lr": 7.88761735936107e-05, "tps": 61730, "wall": 25719.3} {"step": 24226, "train_loss": 3.2771434783935547, "lr": 7.886428237165145e-05, "tps": 61721, "wall": 25724.4} {"step": 24227, "train_loss": 3.378018379211426, "lr": 7.885239274848527e-05, "tps": 61711, "wall": 25729.4} {"step": 24228, "train_loss": 3.1572422981262207, "lr": 7.884050472424678e-05, "tps": 61702, "wall": 25734.5} {"step": 24229, "train_loss": 3.231166362762451, "lr": 7.882861829907074e-05, "tps": 61692, "wall": 25739.6} {"step": 24230, "train_loss": 3.1884279251098633, "lr": 7.881673347309175e-05, "tps": 61682, "wall": 25744.7} {"step": 24231, "train_loss": 3.1280856132507324, "lr": 7.880485024644439e-05, "tps": 61673, "wall": 25749.8} {"step": 24232, "train_loss": 3.2711241245269775, "lr": 7.879296861926337e-05, "tps": 61663, "wall": 25754.8} {"step": 24233, "train_loss": 3.265181541442871, "lr": 7.878108859168326e-05, "tps": 61653, "wall": 25759.9} {"step": 24234, "train_loss": 3.214761257171631, "lr": 7.876921016383855e-05, "tps": 61644, "wall": 25765.0} {"step": 24235, "train_loss": 3.2829184532165527, "lr": 7.875733333586392e-05, "tps": 61634, "wall": 25770.1} {"step": 24236, "train_loss": 3.2108023166656494, "lr": 7.874545810789388e-05, "tps": 61624, "wall": 25775.2} {"step": 24237, "train_loss": 3.2117507457733154, "lr": 7.873358448006285e-05, "tps": 61615, "wall": 25780.4} {"step": 24238, "train_loss": 3.216564655303955, "lr": 7.872171245250549e-05, "tps": 61605, "wall": 25785.4} {"step": 24239, "train_loss": 3.253319501876831, "lr": 7.87098420253562e-05, "tps": 61595, "wall": 25790.5} {"step": 24240, "train_loss": 3.2294259071350098, "lr": 7.869797319874943e-05, "tps": 61586, "wall": 25795.6} {"step": 24241, "train_loss": 3.2103118896484375, "lr": 7.86861059728197e-05, "tps": 61576, "wall": 25800.6} {"step": 24242, "train_loss": 3.235428810119629, "lr": 7.867424034770142e-05, "tps": 61567, "wall": 25805.7} {"step": 24243, "train_loss": 3.2228925228118896, "lr": 7.866237632352891e-05, "tps": 61557, "wall": 25810.8} {"step": 24244, "train_loss": 3.2910406589508057, "lr": 7.865051390043672e-05, "tps": 61548, "wall": 25815.9} {"step": 24245, "train_loss": 3.234518527984619, "lr": 7.863865307855917e-05, "tps": 61538, "wall": 25820.9} {"step": 24246, "train_loss": 3.2237548828125, "lr": 7.862679385803053e-05, "tps": 61529, "wall": 25826.0} {"step": 24247, "train_loss": 3.2571749687194824, "lr": 7.861493623898528e-05, "tps": 61519, "wall": 25831.1} {"step": 24248, "train_loss": 3.3469998836517334, "lr": 7.860308022155762e-05, "tps": 61509, "wall": 25836.3} {"step": 24249, "train_loss": 3.25711989402771, "lr": 7.859122580588199e-05, "tps": 61500, "wall": 25841.3} {"step": 24250, "train_loss": 3.2847061157226562, "lr": 7.857937299209258e-05, "tps": 61490, "wall": 25846.4} {"step": 24251, "train_loss": 3.1754539012908936, "lr": 7.856752178032364e-05, "tps": 61481, "wall": 25851.5} {"step": 24252, "train_loss": 3.2388713359832764, "lr": 7.855567217070951e-05, "tps": 61471, "wall": 25856.6} {"step": 24253, "train_loss": 3.1651391983032227, "lr": 7.85438241633844e-05, "tps": 61462, "wall": 25861.7} {"step": 24254, "train_loss": 3.2124552726745605, "lr": 7.853197775848241e-05, "tps": 61452, "wall": 25866.7} {"step": 24255, "train_loss": 3.2981014251708984, "lr": 7.852013295613792e-05, "tps": 61442, "wall": 25871.8} {"step": 24256, "train_loss": 3.162914991378784, "lr": 7.850828975648502e-05, "tps": 61433, "wall": 25876.9} {"step": 24257, "train_loss": 3.200251817703247, "lr": 7.849644815965778e-05, "tps": 61423, "wall": 25882.0} {"step": 24258, "train_loss": 3.2712507247924805, "lr": 7.84846081657905e-05, "tps": 61414, "wall": 25887.1} {"step": 24259, "train_loss": 3.1857340335845947, "lr": 7.847276977501722e-05, "tps": 61404, "wall": 25892.1} {"step": 24260, "train_loss": 3.3024239540100098, "lr": 7.846093298747205e-05, "tps": 61395, "wall": 25897.3} {"step": 24261, "train_loss": 3.2978618144989014, "lr": 7.844909780328913e-05, "tps": 61385, "wall": 25902.3} {"step": 24262, "train_loss": 3.220452070236206, "lr": 7.843726422260245e-05, "tps": 61376, "wall": 25907.4} {"step": 24263, "train_loss": 3.2478489875793457, "lr": 7.842543224554609e-05, "tps": 61366, "wall": 25912.5} {"step": 24264, "train_loss": 3.1410436630249023, "lr": 7.841360187225411e-05, "tps": 61357, "wall": 25917.6} {"step": 24265, "train_loss": 3.3143696784973145, "lr": 7.84017731028605e-05, "tps": 61347, "wall": 25922.7} {"step": 24266, "train_loss": 3.2966115474700928, "lr": 7.838994593749927e-05, "tps": 61338, "wall": 25927.8} {"step": 24267, "train_loss": 3.2618908882141113, "lr": 7.837812037630441e-05, "tps": 61328, "wall": 25932.9} {"step": 24268, "train_loss": 3.1754794120788574, "lr": 7.83662964194098e-05, "tps": 61319, "wall": 25937.9} {"step": 24269, "train_loss": 3.172844648361206, "lr": 7.835447406694953e-05, "tps": 61309, "wall": 25943.0} {"step": 24270, "train_loss": 3.2001407146453857, "lr": 7.834265331905744e-05, "tps": 61300, "wall": 25948.1} {"step": 24271, "train_loss": 3.243865489959717, "lr": 7.833083417586733e-05, "tps": 61290, "wall": 25953.2} {"step": 24272, "train_loss": 3.263073205947876, "lr": 7.831901663751331e-05, "tps": 61281, "wall": 25958.3} {"step": 24273, "train_loss": 3.279761791229248, "lr": 7.83072007041291e-05, "tps": 61271, "wall": 25963.4} {"step": 24274, "train_loss": 3.1858925819396973, "lr": 7.829538637584855e-05, "tps": 61262, "wall": 25968.5} {"step": 24275, "train_loss": 3.255887031555176, "lr": 7.828357365280556e-05, "tps": 61252, "wall": 25973.6} {"step": 24276, "train_loss": 3.3329882621765137, "lr": 7.827176253513394e-05, "tps": 61243, "wall": 25978.7} {"step": 24277, "train_loss": 3.1645936965942383, "lr": 7.82599530229674e-05, "tps": 61233, "wall": 25983.7} {"step": 24278, "train_loss": 3.1528820991516113, "lr": 7.824814511643983e-05, "tps": 61224, "wall": 25988.8} {"step": 24279, "train_loss": 3.276386260986328, "lr": 7.823633881568493e-05, "tps": 61214, "wall": 25993.9} {"step": 24280, "train_loss": 3.1764297485351562, "lr": 7.822453412083642e-05, "tps": 61205, "wall": 25998.9} {"step": 24281, "train_loss": 3.178882598876953, "lr": 7.821273103202809e-05, "tps": 61196, "wall": 26004.0} {"step": 24282, "train_loss": 3.2107701301574707, "lr": 7.820092954939357e-05, "tps": 61186, "wall": 26009.1} {"step": 24283, "train_loss": 3.221057415008545, "lr": 7.818912967306666e-05, "tps": 61177, "wall": 26014.1} {"step": 24284, "train_loss": 3.269796371459961, "lr": 7.817733140318093e-05, "tps": 61167, "wall": 26019.3} {"step": 24285, "train_loss": 3.2474260330200195, "lr": 7.816553473987004e-05, "tps": 61158, "wall": 26024.3} {"step": 24286, "train_loss": 3.3188114166259766, "lr": 7.815373968326766e-05, "tps": 61149, "wall": 26029.4} {"step": 24287, "train_loss": 3.239682197570801, "lr": 7.814194623350742e-05, "tps": 61139, "wall": 26034.5} {"step": 24288, "train_loss": 3.4103150367736816, "lr": 7.813015439072285e-05, "tps": 61130, "wall": 26039.6} {"step": 24289, "train_loss": 3.2352540493011475, "lr": 7.811836415504759e-05, "tps": 61120, "wall": 26044.7} {"step": 24290, "train_loss": 3.2248144149780273, "lr": 7.81065755266152e-05, "tps": 61111, "wall": 26049.8} {"step": 24291, "train_loss": 3.2709391117095947, "lr": 7.809478850555912e-05, "tps": 61101, "wall": 26054.8} {"step": 24292, "train_loss": 3.2208545207977295, "lr": 7.808300309201299e-05, "tps": 61092, "wall": 26059.9} {"step": 24293, "train_loss": 3.1806905269622803, "lr": 7.807121928611033e-05, "tps": 61083, "wall": 26065.0} {"step": 24294, "train_loss": 3.228328227996826, "lr": 7.80594370879845e-05, "tps": 61073, "wall": 26070.0} {"step": 24295, "train_loss": 3.1644093990325928, "lr": 7.804765649776909e-05, "tps": 61064, "wall": 26075.1} {"step": 24296, "train_loss": 3.2201247215270996, "lr": 7.80358775155975e-05, "tps": 61054, "wall": 26080.2} {"step": 24297, "train_loss": 3.222318649291992, "lr": 7.802410014160315e-05, "tps": 61045, "wall": 26085.3} {"step": 24298, "train_loss": 3.2054243087768555, "lr": 7.80123243759195e-05, "tps": 61036, "wall": 26090.4} {"step": 24299, "train_loss": 3.2627861499786377, "lr": 7.800055021867993e-05, "tps": 61026, "wall": 26095.5} {"step": 24300, "train_loss": 3.213407516479492, "lr": 7.798877767001775e-05, "tps": 61017, "wall": 26100.5} {"step": 24301, "train_loss": 3.206162929534912, "lr": 7.797700673006644e-05, "tps": 61008, "wall": 26105.6} {"step": 24302, "train_loss": 3.227323532104492, "lr": 7.796523739895923e-05, "tps": 60998, "wall": 26110.7} {"step": 24303, "train_loss": 3.27595591545105, "lr": 7.795346967682955e-05, "tps": 60989, "wall": 26115.7} {"step": 24304, "train_loss": 3.233773946762085, "lr": 7.794170356381064e-05, "tps": 60980, "wall": 26120.8} {"step": 24305, "train_loss": 3.2977778911590576, "lr": 7.792993906003574e-05, "tps": 60970, "wall": 26125.9} {"step": 24306, "train_loss": 3.381220579147339, "lr": 7.791817616563825e-05, "tps": 60961, "wall": 26131.0} {"step": 24307, "train_loss": 3.15419340133667, "lr": 7.790641488075132e-05, "tps": 60952, "wall": 26136.0} {"step": 24308, "train_loss": 3.3615734577178955, "lr": 7.789465520550819e-05, "tps": 60942, "wall": 26141.2} {"step": 24309, "train_loss": 3.244131088256836, "lr": 7.788289714004212e-05, "tps": 60933, "wall": 26146.2} {"step": 24310, "train_loss": 3.3363399505615234, "lr": 7.787114068448629e-05, "tps": 60924, "wall": 26151.3} {"step": 24311, "train_loss": 3.254946708679199, "lr": 7.78593858389738e-05, "tps": 60914, "wall": 26156.4} {"step": 24312, "train_loss": 3.2674670219421387, "lr": 7.784763260363795e-05, "tps": 60905, "wall": 26161.5} {"step": 24313, "train_loss": 3.2618556022644043, "lr": 7.783588097861176e-05, "tps": 60896, "wall": 26166.5} {"step": 24314, "train_loss": 3.229905605316162, "lr": 7.782413096402842e-05, "tps": 60886, "wall": 26171.6} {"step": 24315, "train_loss": 3.1581127643585205, "lr": 7.781238256002101e-05, "tps": 60877, "wall": 26176.6} {"step": 24316, "train_loss": 3.246307134628296, "lr": 7.780063576672267e-05, "tps": 60868, "wall": 26181.7} {"step": 24317, "train_loss": 3.1949477195739746, "lr": 7.778889058426632e-05, "tps": 60859, "wall": 26186.7} {"step": 24318, "train_loss": 3.200939178466797, "lr": 7.777714701278522e-05, "tps": 60849, "wall": 26191.8} {"step": 24319, "train_loss": 3.224188804626465, "lr": 7.776540505241221e-05, "tps": 60840, "wall": 26197.0} {"step": 24320, "train_loss": 3.1659092903137207, "lr": 7.775366470328043e-05, "tps": 60831, "wall": 26202.1} {"step": 24321, "train_loss": 3.275510311126709, "lr": 7.774192596552283e-05, "tps": 60821, "wall": 26207.1} {"step": 24322, "train_loss": 3.1294522285461426, "lr": 7.773018883927236e-05, "tps": 60812, "wall": 26212.2} {"step": 24323, "train_loss": 3.244356632232666, "lr": 7.771845332466203e-05, "tps": 60803, "wall": 26217.2} {"step": 24324, "train_loss": 3.3004515171051025, "lr": 7.770671942182477e-05, "tps": 60794, "wall": 26222.3} {"step": 24325, "train_loss": 3.178178310394287, "lr": 7.769498713089344e-05, "tps": 60784, "wall": 26227.4} {"step": 24326, "train_loss": 3.1971192359924316, "lr": 7.768325645200107e-05, "tps": 60775, "wall": 26232.5} {"step": 24327, "train_loss": 3.1822187900543213, "lr": 7.767152738528043e-05, "tps": 60766, "wall": 26237.5} {"step": 24328, "train_loss": 3.274200201034546, "lr": 7.765979993086441e-05, "tps": 60757, "wall": 26242.6} {"step": 24329, "train_loss": 3.14558482170105, "lr": 7.76480740888859e-05, "tps": 60747, "wall": 26247.7} {"step": 24330, "train_loss": 3.2374954223632812, "lr": 7.763634985947775e-05, "tps": 60738, "wall": 26252.7} {"step": 24331, "train_loss": 3.266634941101074, "lr": 7.762462724277263e-05, "tps": 60729, "wall": 26257.9} {"step": 24332, "train_loss": 3.3577094078063965, "lr": 7.761290623890351e-05, "tps": 60720, "wall": 26262.9} {"step": 24333, "train_loss": 3.306457042694092, "lr": 7.760118684800308e-05, "tps": 60710, "wall": 26268.0} {"step": 24334, "train_loss": 3.244532823562622, "lr": 7.758946907020408e-05, "tps": 60701, "wall": 26273.0} {"step": 24335, "train_loss": 3.204072952270508, "lr": 7.757775290563932e-05, "tps": 60692, "wall": 26278.1} {"step": 24336, "train_loss": 3.200242757797241, "lr": 7.75660383544414e-05, "tps": 60683, "wall": 26283.1} {"step": 24337, "train_loss": 3.2232251167297363, "lr": 7.75543254167432e-05, "tps": 60674, "wall": 26288.2} {"step": 24338, "train_loss": 3.2634570598602295, "lr": 7.754261409267727e-05, "tps": 60664, "wall": 26293.4} {"step": 24339, "train_loss": 3.2173402309417725, "lr": 7.753090438237629e-05, "tps": 60655, "wall": 26298.5} {"step": 24340, "train_loss": 3.216454029083252, "lr": 7.751919628597298e-05, "tps": 60646, "wall": 26303.5} {"step": 24341, "train_loss": 3.203461170196533, "lr": 7.75074898035999e-05, "tps": 60637, "wall": 26308.6} {"step": 24342, "train_loss": 3.254420757293701, "lr": 7.749578493538966e-05, "tps": 60627, "wall": 26313.6} {"step": 24343, "train_loss": 3.1785826683044434, "lr": 7.748408168147492e-05, "tps": 60618, "wall": 26318.8} {"step": 24344, "train_loss": 3.24218487739563, "lr": 7.74723800419882e-05, "tps": 60609, "wall": 26323.9} {"step": 24345, "train_loss": 3.1940243244171143, "lr": 7.746068001706204e-05, "tps": 60600, "wall": 26328.9} {"step": 24346, "train_loss": 3.30722713470459, "lr": 7.744898160682903e-05, "tps": 60591, "wall": 26334.0} {"step": 24347, "train_loss": 3.298119068145752, "lr": 7.743728481142169e-05, "tps": 60581, "wall": 26339.1} {"step": 24348, "train_loss": 3.1532649993896484, "lr": 7.742558963097245e-05, "tps": 60572, "wall": 26344.1} {"step": 24349, "train_loss": 3.2738208770751953, "lr": 7.741389606561389e-05, "tps": 60563, "wall": 26349.2} {"step": 24350, "train_loss": 3.302574634552002, "lr": 7.740220411547843e-05, "tps": 60554, "wall": 26354.3} {"step": 24351, "train_loss": 3.238969564437866, "lr": 7.739051378069846e-05, "tps": 60545, "wall": 26359.3} {"step": 24352, "train_loss": 3.2474405765533447, "lr": 7.737882506140653e-05, "tps": 60536, "wall": 26364.4} {"step": 24353, "train_loss": 3.310311794281006, "lr": 7.736713795773498e-05, "tps": 60527, "wall": 26369.4} {"step": 24354, "train_loss": 3.228912830352783, "lr": 7.735545246981614e-05, "tps": 60517, "wall": 26374.5} {"step": 24355, "train_loss": 3.2006301879882812, "lr": 7.734376859778251e-05, "tps": 60508, "wall": 26379.6} {"step": 24356, "train_loss": 3.3421995639801025, "lr": 7.733208634176634e-05, "tps": 60499, "wall": 26384.7} {"step": 24357, "train_loss": 3.1748719215393066, "lr": 7.732040570190007e-05, "tps": 60490, "wall": 26389.7} {"step": 24358, "train_loss": 3.2021265029907227, "lr": 7.730872667831596e-05, "tps": 60481, "wall": 26394.8} {"step": 24359, "train_loss": 3.2282509803771973, "lr": 7.729704927114627e-05, "tps": 60472, "wall": 26399.9} {"step": 24360, "train_loss": 3.121108055114746, "lr": 7.728537348052337e-05, "tps": 60463, "wall": 26404.9} {"step": 24361, "train_loss": 3.1471238136291504, "lr": 7.727369930657946e-05, "tps": 60453, "wall": 26410.0} {"step": 24362, "train_loss": 3.0927860736846924, "lr": 7.726202674944682e-05, "tps": 60444, "wall": 26415.0} {"step": 24363, "train_loss": 3.2615275382995605, "lr": 7.725035580925768e-05, "tps": 60435, "wall": 26420.1} {"step": 24364, "train_loss": 3.291524887084961, "lr": 7.723868648614416e-05, "tps": 60426, "wall": 26425.2} {"step": 24365, "train_loss": 3.2252907752990723, "lr": 7.722701878023859e-05, "tps": 60417, "wall": 26430.2} {"step": 24366, "train_loss": 3.1762535572052, "lr": 7.721535269167307e-05, "tps": 60408, "wall": 26435.3} {"step": 24367, "train_loss": 3.219167947769165, "lr": 7.720368822057969e-05, "tps": 60399, "wall": 26440.4} {"step": 24368, "train_loss": 3.3198349475860596, "lr": 7.719202536709074e-05, "tps": 60390, "wall": 26445.5} {"step": 24369, "train_loss": 3.2388014793395996, "lr": 7.718036413133822e-05, "tps": 60381, "wall": 26450.6} {"step": 24370, "train_loss": 3.231933116912842, "lr": 7.716870451345424e-05, "tps": 60371, "wall": 26455.6} {"step": 24371, "train_loss": 3.184004783630371, "lr": 7.715704651357092e-05, "tps": 60362, "wall": 26460.7} {"step": 24372, "train_loss": 3.310314893722534, "lr": 7.714539013182034e-05, "tps": 60353, "wall": 26465.8} {"step": 24373, "train_loss": 3.2962422370910645, "lr": 7.713373536833443e-05, "tps": 60344, "wall": 26470.8} {"step": 24374, "train_loss": 3.217505931854248, "lr": 7.712208222324535e-05, "tps": 60335, "wall": 26475.9} {"step": 24375, "train_loss": 3.1326236724853516, "lr": 7.711043069668505e-05, "tps": 60326, "wall": 26481.0} {"step": 24376, "train_loss": 3.1611409187316895, "lr": 7.709878078878549e-05, "tps": 60317, "wall": 26486.0} {"step": 24377, "train_loss": 3.239629030227661, "lr": 7.708713249967871e-05, "tps": 60308, "wall": 26491.1} {"step": 24378, "train_loss": 3.221170663833618, "lr": 7.707548582949662e-05, "tps": 60299, "wall": 26496.1} {"step": 24379, "train_loss": 3.11395001411438, "lr": 7.706384077837112e-05, "tps": 60290, "wall": 26501.2} {"step": 24380, "train_loss": 3.288054943084717, "lr": 7.70521973464342e-05, "tps": 60281, "wall": 26506.3} {"step": 24381, "train_loss": 3.211483955383301, "lr": 7.704055553381769e-05, "tps": 60272, "wall": 26511.4} {"step": 24382, "train_loss": 3.2178125381469727, "lr": 7.702891534065353e-05, "tps": 60263, "wall": 26516.5} {"step": 24383, "train_loss": 3.2277863025665283, "lr": 7.701727676707356e-05, "tps": 60254, "wall": 26521.5} {"step": 24384, "train_loss": 3.249505043029785, "lr": 7.700563981320959e-05, "tps": 60245, "wall": 26526.6} {"step": 24385, "train_loss": 3.182420253753662, "lr": 7.699400447919347e-05, "tps": 60236, "wall": 26531.6} {"step": 24386, "train_loss": 3.2486114501953125, "lr": 7.698237076515704e-05, "tps": 60227, "wall": 26536.7} {"step": 24387, "train_loss": 3.365377902984619, "lr": 7.697073867123197e-05, "tps": 60218, "wall": 26541.7} {"step": 24388, "train_loss": 3.154906988143921, "lr": 7.69591081975502e-05, "tps": 60209, "wall": 26546.8} {"step": 24389, "train_loss": 3.302900791168213, "lr": 7.694747934424337e-05, "tps": 60200, "wall": 26551.8} {"step": 24390, "train_loss": 3.3899266719818115, "lr": 7.693585211144317e-05, "tps": 60190, "wall": 26557.0} {"step": 24391, "train_loss": 3.138331890106201, "lr": 7.692422649928145e-05, "tps": 60181, "wall": 26562.0} {"step": 24392, "train_loss": 3.188474178314209, "lr": 7.691260250788982e-05, "tps": 60172, "wall": 26567.1} {"step": 24393, "train_loss": 3.315248966217041, "lr": 7.690098013739992e-05, "tps": 60163, "wall": 26572.2} {"step": 24394, "train_loss": 3.175758123397827, "lr": 7.68893593879435e-05, "tps": 60154, "wall": 26577.2} {"step": 24395, "train_loss": 3.1971986293792725, "lr": 7.687774025965219e-05, "tps": 60145, "wall": 26582.3} {"step": 24396, "train_loss": 3.2165274620056152, "lr": 7.68661227526575e-05, "tps": 60136, "wall": 26587.3} {"step": 24397, "train_loss": 3.3261756896972656, "lr": 7.685450686709117e-05, "tps": 60127, "wall": 26592.4} {"step": 24398, "train_loss": 3.1999762058258057, "lr": 7.684289260308469e-05, "tps": 60119, "wall": 26597.5} {"step": 24399, "train_loss": 3.3806188106536865, "lr": 7.68312799607697e-05, "tps": 60110, "wall": 26602.5} {"step": 24400, "train_loss": 3.238415241241455, "lr": 7.681966894027775e-05, "tps": 60101, "wall": 26607.6} {"step": 24401, "train_loss": 3.1820459365844727, "lr": 7.680805954174026e-05, "tps": 60092, "wall": 26612.7} {"step": 24402, "train_loss": 3.2066946029663086, "lr": 7.679645176528886e-05, "tps": 60082, "wall": 26617.8} {"step": 24403, "train_loss": 3.121744155883789, "lr": 7.678484561105502e-05, "tps": 60073, "wall": 26622.9} {"step": 24404, "train_loss": 3.251258373260498, "lr": 7.677324107917015e-05, "tps": 60064, "wall": 26627.9} {"step": 24405, "train_loss": 3.252243757247925, "lr": 7.67616381697658e-05, "tps": 60056, "wall": 26633.0} {"step": 24406, "train_loss": 3.2117860317230225, "lr": 7.675003688297336e-05, "tps": 60047, "wall": 26638.0} {"step": 24407, "train_loss": 3.3097472190856934, "lr": 7.673843721892417e-05, "tps": 60038, "wall": 26643.1} {"step": 24408, "train_loss": 3.197824001312256, "lr": 7.672683917774982e-05, "tps": 60029, "wall": 26648.2} {"step": 24409, "train_loss": 3.3114113807678223, "lr": 7.671524275958155e-05, "tps": 60020, "wall": 26653.2} {"step": 24410, "train_loss": 3.2502689361572266, "lr": 7.670364796455072e-05, "tps": 60011, "wall": 26658.3} {"step": 24411, "train_loss": 3.177910804748535, "lr": 7.669205479278876e-05, "tps": 60002, "wall": 26663.3} {"step": 24412, "train_loss": 3.277700901031494, "lr": 7.668046324442697e-05, "tps": 59993, "wall": 26668.4} {"step": 24413, "train_loss": 3.22880220413208, "lr": 7.66688733195966e-05, "tps": 59984, "wall": 26673.4} {"step": 24414, "train_loss": 3.22983717918396, "lr": 7.665728501842903e-05, "tps": 59975, "wall": 26678.5} {"step": 24415, "train_loss": 3.237694263458252, "lr": 7.664569834105544e-05, "tps": 59966, "wall": 26683.6} {"step": 24416, "train_loss": 3.192026138305664, "lr": 7.663411328760717e-05, "tps": 59957, "wall": 26688.6} {"step": 24417, "train_loss": 3.212604522705078, "lr": 7.662252985821544e-05, "tps": 59948, "wall": 26693.7} {"step": 24418, "train_loss": 3.278733730316162, "lr": 7.661094805301137e-05, "tps": 59940, "wall": 26698.7} {"step": 24419, "train_loss": 3.2575883865356445, "lr": 7.659936787212633e-05, "tps": 59931, "wall": 26703.8} {"step": 24420, "train_loss": 3.278994083404541, "lr": 7.658778931569137e-05, "tps": 59922, "wall": 26708.8} {"step": 24421, "train_loss": 3.317491054534912, "lr": 7.657621238383767e-05, "tps": 59913, "wall": 26713.9} {"step": 24422, "train_loss": 3.2346763610839844, "lr": 7.656463707669643e-05, "tps": 59904, "wall": 26718.9} {"step": 24423, "train_loss": 3.2646067142486572, "lr": 7.655306339439876e-05, "tps": 59895, "wall": 26723.9} {"step": 24424, "train_loss": 3.2434871196746826, "lr": 7.654149133707566e-05, "tps": 59886, "wall": 26729.0} {"step": 24425, "train_loss": 3.150473117828369, "lr": 7.65299209048584e-05, "tps": 59878, "wall": 26734.0} {"step": 24426, "train_loss": 3.2282028198242188, "lr": 7.651835209787793e-05, "tps": 59869, "wall": 26739.1} {"step": 24427, "train_loss": 3.123724937438965, "lr": 7.650678491626529e-05, "tps": 59860, "wall": 26744.2} {"step": 24428, "train_loss": 3.244828224182129, "lr": 7.649521936015158e-05, "tps": 59851, "wall": 26749.3} {"step": 24429, "train_loss": 3.247370719909668, "lr": 7.648365542966782e-05, "tps": 59842, "wall": 26754.3} {"step": 24430, "train_loss": 3.179889678955078, "lr": 7.647209312494491e-05, "tps": 59833, "wall": 26759.4} {"step": 24431, "train_loss": 3.282754898071289, "lr": 7.646053244611396e-05, "tps": 59824, "wall": 26764.4} {"step": 24432, "train_loss": 3.29773211479187, "lr": 7.644897339330586e-05, "tps": 59815, "wall": 26769.5} {"step": 24433, "train_loss": 3.2393064498901367, "lr": 7.643741596665148e-05, "tps": 59807, "wall": 26774.5} {"step": 24434, "train_loss": 3.2345774173736572, "lr": 7.642586016628189e-05, "tps": 59798, "wall": 26779.6} {"step": 24435, "train_loss": 3.153482437133789, "lr": 7.641430599232786e-05, "tps": 59789, "wall": 26784.6} {"step": 24436, "train_loss": 3.32755708694458, "lr": 7.64027534449204e-05, "tps": 59780, "wall": 26789.7} {"step": 24437, "train_loss": 3.1829566955566406, "lr": 7.639120252419032e-05, "tps": 59771, "wall": 26794.7} {"step": 24438, "train_loss": 3.2021846771240234, "lr": 7.637965323026842e-05, "tps": 59762, "wall": 26799.8} {"step": 24439, "train_loss": 3.3468916416168213, "lr": 7.636810556328562e-05, "tps": 59754, "wall": 26804.9} {"step": 24440, "train_loss": 3.162459135055542, "lr": 7.635655952337269e-05, "tps": 59745, "wall": 26810.0} {"step": 24441, "train_loss": 3.1502060890197754, "lr": 7.634501511066039e-05, "tps": 59736, "wall": 26815.0} {"step": 24442, "train_loss": 3.127384901046753, "lr": 7.633347232527954e-05, "tps": 59727, "wall": 26820.1} {"step": 24443, "train_loss": 3.1589341163635254, "lr": 7.632193116736093e-05, "tps": 59718, "wall": 26825.2} {"step": 24444, "train_loss": 3.292146921157837, "lr": 7.63103916370352e-05, "tps": 59709, "wall": 26830.2} {"step": 24445, "train_loss": 3.278226613998413, "lr": 7.629885373443316e-05, "tps": 59701, "wall": 26835.3} {"step": 24446, "train_loss": 3.265542984008789, "lr": 7.628731745968548e-05, "tps": 59692, "wall": 26840.3} {"step": 24447, "train_loss": 3.2688236236572266, "lr": 7.62757828129228e-05, "tps": 59683, "wall": 26845.3} {"step": 24448, "train_loss": 3.2779016494750977, "lr": 7.62642497942759e-05, "tps": 59674, "wall": 26850.4} {"step": 24449, "train_loss": 3.165417432785034, "lr": 7.625271840387532e-05, "tps": 59665, "wall": 26855.5} {"step": 24450, "train_loss": 3.193523645401001, "lr": 7.624118864185168e-05, "tps": 59657, "wall": 26860.6} {"step": 24451, "train_loss": 3.347106695175171, "lr": 7.62296605083357e-05, "tps": 59648, "wall": 26865.6} {"step": 24452, "train_loss": 3.2402658462524414, "lr": 7.621813400345783e-05, "tps": 59639, "wall": 26870.7} {"step": 24453, "train_loss": 3.2639572620391846, "lr": 7.620660912734878e-05, "tps": 59630, "wall": 26875.7} {"step": 24454, "train_loss": 3.287614583969116, "lr": 7.619508588013904e-05, "tps": 59621, "wall": 26880.7} {"step": 24455, "train_loss": 3.2013697624206543, "lr": 7.618356426195907e-05, "tps": 59613, "wall": 26885.8} {"step": 24456, "train_loss": 3.1998162269592285, "lr": 7.617204427293954e-05, "tps": 59604, "wall": 26890.8} {"step": 24457, "train_loss": 3.2850565910339355, "lr": 7.616052591321089e-05, "tps": 59595, "wall": 26895.9} {"step": 24458, "train_loss": 3.2112176418304443, "lr": 7.614900918290351e-05, "tps": 59586, "wall": 26900.9} {"step": 24459, "train_loss": 3.1958847045898438, "lr": 7.613749408214799e-05, "tps": 59578, "wall": 26906.0} {"step": 24460, "train_loss": 3.156428098678589, "lr": 7.612598061107472e-05, "tps": 59569, "wall": 26911.0} {"step": 24461, "train_loss": 3.332127094268799, "lr": 7.611446876981407e-05, "tps": 59560, "wall": 26916.1} {"step": 24462, "train_loss": 3.188897132873535, "lr": 7.610295855849656e-05, "tps": 59551, "wall": 26921.2} {"step": 24463, "train_loss": 3.297445774078369, "lr": 7.609144997725252e-05, "tps": 59543, "wall": 26926.2} {"step": 24464, "train_loss": 3.278934955596924, "lr": 7.607994302621227e-05, "tps": 59534, "wall": 26931.3} {"step": 24465, "train_loss": 3.3150687217712402, "lr": 7.606843770550627e-05, "tps": 59525, "wall": 26936.4} {"step": 24466, "train_loss": 3.2384321689605713, "lr": 7.605693401526477e-05, "tps": 59516, "wall": 26941.5} {"step": 24467, "train_loss": 3.206493854522705, "lr": 7.604543195561808e-05, "tps": 59507, "wall": 26946.6} {"step": 24468, "train_loss": 3.2288708686828613, "lr": 7.603393152669658e-05, "tps": 59499, "wall": 26951.6} {"step": 24469, "train_loss": 3.199897527694702, "lr": 7.602243272863043e-05, "tps": 59490, "wall": 26956.7} {"step": 24470, "train_loss": 3.252495288848877, "lr": 7.601093556155e-05, "tps": 59481, "wall": 26961.7} {"step": 24471, "train_loss": 3.1933281421661377, "lr": 7.599944002558548e-05, "tps": 59473, "wall": 26966.8} {"step": 24472, "train_loss": 3.1943087577819824, "lr": 7.598794612086704e-05, "tps": 59464, "wall": 26971.9} {"step": 24473, "train_loss": 3.164233446121216, "lr": 7.597645384752501e-05, "tps": 59455, "wall": 26977.0} {"step": 24474, "train_loss": 3.1997110843658447, "lr": 7.596496320568946e-05, "tps": 59446, "wall": 26982.0} {"step": 24475, "train_loss": 3.3153555393218994, "lr": 7.59534741954906e-05, "tps": 59438, "wall": 26987.1} {"step": 24476, "train_loss": 3.3460583686828613, "lr": 7.59419868170586e-05, "tps": 59429, "wall": 26992.1} {"step": 24477, "train_loss": 3.296278715133667, "lr": 7.593050107052355e-05, "tps": 59420, "wall": 26997.2} {"step": 24478, "train_loss": 3.2182939052581787, "lr": 7.591901695601556e-05, "tps": 59412, "wall": 27002.2} {"step": 24479, "train_loss": 3.2646961212158203, "lr": 7.590753447366478e-05, "tps": 59403, "wall": 27007.3} {"step": 24480, "train_loss": 3.126868963241577, "lr": 7.589605362360124e-05, "tps": 59394, "wall": 27012.3} {"step": 24481, "train_loss": 3.151520252227783, "lr": 7.588457440595495e-05, "tps": 59385, "wall": 27017.4} {"step": 24482, "train_loss": 3.097609281539917, "lr": 7.587309682085606e-05, "tps": 59377, "wall": 27022.4} {"step": 24483, "train_loss": 3.183361291885376, "lr": 7.586162086843452e-05, "tps": 59368, "wall": 27027.5} {"step": 24484, "train_loss": 3.3048901557922363, "lr": 7.585014654882028e-05, "tps": 59359, "wall": 27032.5} {"step": 24485, "train_loss": 3.2677836418151855, "lr": 7.583867386214343e-05, "tps": 59351, "wall": 27037.6} {"step": 24486, "train_loss": 3.2062902450561523, "lr": 7.582720280853387e-05, "tps": 59342, "wall": 27042.7} {"step": 24487, "train_loss": 3.31184983253479, "lr": 7.581573338812152e-05, "tps": 59333, "wall": 27047.7} {"step": 24488, "train_loss": 3.249296188354492, "lr": 7.58042656010364e-05, "tps": 59325, "wall": 27052.8} {"step": 24489, "train_loss": 3.1656713485717773, "lr": 7.579279944740829e-05, "tps": 59316, "wall": 27057.8} {"step": 24490, "train_loss": 3.1897401809692383, "lr": 7.578133492736724e-05, "tps": 59307, "wall": 27062.9} {"step": 24491, "train_loss": 3.2692441940307617, "lr": 7.576987204104297e-05, "tps": 59299, "wall": 27067.9} {"step": 24492, "train_loss": 3.2556049823760986, "lr": 7.575841078856538e-05, "tps": 59290, "wall": 27073.0} {"step": 24493, "train_loss": 3.2237894535064697, "lr": 7.574695117006436e-05, "tps": 59281, "wall": 27078.0} {"step": 24494, "train_loss": 3.2235350608825684, "lr": 7.573549318566968e-05, "tps": 59273, "wall": 27083.1} {"step": 24495, "train_loss": 3.2601335048675537, "lr": 7.572403683551109e-05, "tps": 59264, "wall": 27088.2} {"step": 24496, "train_loss": 3.1722421646118164, "lr": 7.571258211971846e-05, "tps": 59255, "wall": 27093.2} {"step": 24497, "train_loss": 3.2779455184936523, "lr": 7.570112903842151e-05, "tps": 59247, "wall": 27098.4} {"step": 24498, "train_loss": 3.208961248397827, "lr": 7.568967759174993e-05, "tps": 59238, "wall": 27103.4} {"step": 24499, "train_loss": 3.1925055980682373, "lr": 7.567822777983352e-05, "tps": 59229, "wall": 27108.5} {"step": 24500, "train_loss": 3.2743725776672363, "lr": 7.566677960280198e-05, "tps": 59221, "wall": 27113.5} {"step": 24501, "train_loss": 3.263162136077881, "lr": 7.565533306078492e-05, "tps": 59212, "wall": 27118.8} {"step": 24502, "train_loss": 3.1778769493103027, "lr": 7.564388815391208e-05, "tps": 59203, "wall": 27123.8} {"step": 24503, "train_loss": 3.1070127487182617, "lr": 7.563244488231309e-05, "tps": 59194, "wall": 27128.9} {"step": 24504, "train_loss": 3.247523069381714, "lr": 7.562100324611755e-05, "tps": 59186, "wall": 27134.0} {"step": 24505, "train_loss": 3.118292808532715, "lr": 7.560956324545515e-05, "tps": 59177, "wall": 27139.0} {"step": 24506, "train_loss": 3.246899127960205, "lr": 7.559812488045532e-05, "tps": 59169, "wall": 27144.1} {"step": 24507, "train_loss": 3.2368204593658447, "lr": 7.558668815124784e-05, "tps": 59160, "wall": 27149.1} {"step": 24508, "train_loss": 3.273982048034668, "lr": 7.557525305796215e-05, "tps": 59151, "wall": 27154.2} {"step": 24509, "train_loss": 3.2222471237182617, "lr": 7.556381960072778e-05, "tps": 59143, "wall": 27159.3} {"step": 24510, "train_loss": 3.12979793548584, "lr": 7.555238777967431e-05, "tps": 59134, "wall": 27164.4} {"step": 24511, "train_loss": 3.2141876220703125, "lr": 7.55409575949312e-05, "tps": 59125, "wall": 27169.5} {"step": 24512, "train_loss": 3.150981903076172, "lr": 7.552952904662789e-05, "tps": 59117, "wall": 27174.5} {"step": 24513, "train_loss": 3.3620200157165527, "lr": 7.551810213489396e-05, "tps": 59108, "wall": 27179.6} {"step": 24514, "train_loss": 3.2067997455596924, "lr": 7.550667685985876e-05, "tps": 59100, "wall": 27184.7} {"step": 24515, "train_loss": 3.176429510116577, "lr": 7.549525322165172e-05, "tps": 59091, "wall": 27189.7} {"step": 24516, "train_loss": 3.1952319145202637, "lr": 7.54838312204023e-05, "tps": 59082, "wall": 27194.8} {"step": 24517, "train_loss": 3.19187593460083, "lr": 7.547241085623984e-05, "tps": 59074, "wall": 27199.9} {"step": 24518, "train_loss": 3.1753311157226562, "lr": 7.546099212929372e-05, "tps": 59065, "wall": 27204.9} {"step": 24519, "train_loss": 3.2578110694885254, "lr": 7.544957503969333e-05, "tps": 59056, "wall": 27210.0} {"step": 24520, "train_loss": 3.256721258163452, "lr": 7.543815958756796e-05, "tps": 59048, "wall": 27215.1} {"step": 24521, "train_loss": 3.3080108165740967, "lr": 7.542674577304692e-05, "tps": 59039, "wall": 27220.3} {"step": 24522, "train_loss": 3.256010055541992, "lr": 7.541533359625954e-05, "tps": 59031, "wall": 27225.3} {"step": 24523, "train_loss": 3.161173105239868, "lr": 7.540392305733506e-05, "tps": 59022, "wall": 27230.4} {"step": 24524, "train_loss": 3.081350564956665, "lr": 7.539251415640281e-05, "tps": 59013, "wall": 27235.5} {"step": 24525, "train_loss": 3.179103374481201, "lr": 7.538110689359196e-05, "tps": 59005, "wall": 27240.5} {"step": 24526, "train_loss": 3.1432652473449707, "lr": 7.536970126903174e-05, "tps": 58996, "wall": 27245.6} {"step": 24527, "train_loss": 3.246229648590088, "lr": 7.535829728285139e-05, "tps": 58988, "wall": 27250.7} {"step": 24528, "train_loss": 3.239413022994995, "lr": 7.534689493518007e-05, "tps": 58979, "wall": 27255.7} {"step": 24529, "train_loss": 3.1504437923431396, "lr": 7.53354942261469e-05, "tps": 58971, "wall": 27260.8} {"step": 24530, "train_loss": 3.2578186988830566, "lr": 7.532409515588121e-05, "tps": 58962, "wall": 27265.9} {"step": 24531, "train_loss": 3.230461597442627, "lr": 7.531269772451189e-05, "tps": 58954, "wall": 27270.9} {"step": 24532, "train_loss": 3.255507469177246, "lr": 7.530130193216815e-05, "tps": 58945, "wall": 27276.0} {"step": 24533, "train_loss": 3.2667291164398193, "lr": 7.528990777897916e-05, "tps": 58936, "wall": 27281.1} {"step": 24534, "train_loss": 3.340045928955078, "lr": 7.527851526507386e-05, "tps": 58928, "wall": 27286.1} {"step": 24535, "train_loss": 3.1913981437683105, "lr": 7.52671243905814e-05, "tps": 58919, "wall": 27291.2} {"step": 24536, "train_loss": 3.2805533409118652, "lr": 7.525573515563079e-05, "tps": 58911, "wall": 27296.3} {"step": 24537, "train_loss": 3.235963821411133, "lr": 7.524434756035098e-05, "tps": 58902, "wall": 27301.4} {"step": 24538, "train_loss": 3.3275158405303955, "lr": 7.52329616048711e-05, "tps": 58894, "wall": 27306.4} {"step": 24539, "train_loss": 3.294024705886841, "lr": 7.522157728932007e-05, "tps": 58885, "wall": 27311.5} {"step": 24540, "train_loss": 3.2370665073394775, "lr": 7.521019461382677e-05, "tps": 58877, "wall": 27316.6} {"step": 24541, "train_loss": 3.2114100456237793, "lr": 7.519881357852028e-05, "tps": 58868, "wall": 27321.6} {"step": 24542, "train_loss": 3.2738137245178223, "lr": 7.518743418352946e-05, "tps": 58860, "wall": 27326.7} {"step": 24543, "train_loss": 3.2135701179504395, "lr": 7.517605642898318e-05, "tps": 58851, "wall": 27331.8} {"step": 24544, "train_loss": 3.0651583671569824, "lr": 7.516468031501041e-05, "tps": 58842, "wall": 27336.9} {"step": 24545, "train_loss": 3.1881961822509766, "lr": 7.515330584173999e-05, "tps": 58834, "wall": 27342.0} {"step": 24546, "train_loss": 3.281620740890503, "lr": 7.514193300930068e-05, "tps": 58825, "wall": 27347.0} {"step": 24547, "train_loss": 3.1760518550872803, "lr": 7.513056181782145e-05, "tps": 58817, "wall": 27352.1} {"step": 24548, "train_loss": 3.2054145336151123, "lr": 7.511919226743103e-05, "tps": 58808, "wall": 27357.1} {"step": 24549, "train_loss": 3.246846914291382, "lr": 7.510782435825823e-05, "tps": 58800, "wall": 27362.2} {"step": 24550, "train_loss": 3.2598230838775635, "lr": 7.509645809043188e-05, "tps": 58791, "wall": 27367.3} {"step": 24551, "train_loss": 3.1698923110961914, "lr": 7.508509346408064e-05, "tps": 58783, "wall": 27372.3} {"step": 24552, "train_loss": 3.1766104698181152, "lr": 7.507373047933334e-05, "tps": 58774, "wall": 27377.4} {"step": 24553, "train_loss": 3.2567996978759766, "lr": 7.506236913631866e-05, "tps": 58766, "wall": 27382.5} {"step": 24554, "train_loss": 3.3434557914733887, "lr": 7.505100943516527e-05, "tps": 58757, "wall": 27387.5} {"step": 24555, "train_loss": 3.246525764465332, "lr": 7.503965137600191e-05, "tps": 58749, "wall": 27392.6} {"step": 24556, "train_loss": 3.193218231201172, "lr": 7.502829495895724e-05, "tps": 58740, "wall": 27397.7} {"step": 24557, "train_loss": 3.2572343349456787, "lr": 7.501694018415986e-05, "tps": 58732, "wall": 27402.8} {"step": 24558, "train_loss": 3.336852550506592, "lr": 7.500558705173843e-05, "tps": 58723, "wall": 27407.9} {"step": 24559, "train_loss": 3.21696400642395, "lr": 7.499423556182158e-05, "tps": 58715, "wall": 27412.9} {"step": 24560, "train_loss": 3.2498679161071777, "lr": 7.498288571453783e-05, "tps": 58707, "wall": 27418.0} {"step": 24561, "train_loss": 3.1381335258483887, "lr": 7.497153751001581e-05, "tps": 58698, "wall": 27423.0} {"step": 24562, "train_loss": 3.2650227546691895, "lr": 7.496019094838409e-05, "tps": 58690, "wall": 27428.1} {"step": 24563, "train_loss": 3.294156312942505, "lr": 7.494884602977113e-05, "tps": 58681, "wall": 27433.1} {"step": 24564, "train_loss": 3.222541093826294, "lr": 7.493750275430552e-05, "tps": 58673, "wall": 27438.2} {"step": 24565, "train_loss": 3.148573160171509, "lr": 7.492616112211567e-05, "tps": 58664, "wall": 27443.2} {"step": 24566, "train_loss": 3.2763097286224365, "lr": 7.491482113333018e-05, "tps": 58656, "wall": 27448.3} {"step": 24567, "train_loss": 3.3051278591156006, "lr": 7.490348278807744e-05, "tps": 58648, "wall": 27453.3} {"step": 24568, "train_loss": 3.1852962970733643, "lr": 7.489214608648585e-05, "tps": 58639, "wall": 27458.5} {"step": 24569, "train_loss": 3.303938150405884, "lr": 7.488081102868392e-05, "tps": 58631, "wall": 27463.5} {"step": 24570, "train_loss": 3.1435508728027344, "lr": 7.486947761480004e-05, "tps": 58622, "wall": 27468.6} {"step": 24571, "train_loss": 3.1420555114746094, "lr": 7.485814584496248e-05, "tps": 58614, "wall": 27473.7} {"step": 24572, "train_loss": 3.3226919174194336, "lr": 7.484681571929977e-05, "tps": 58605, "wall": 27478.8} {"step": 24573, "train_loss": 3.2544333934783936, "lr": 7.483548723794018e-05, "tps": 58597, "wall": 27483.8} {"step": 24574, "train_loss": 3.248533010482788, "lr": 7.4824160401012e-05, "tps": 58589, "wall": 27488.9} {"step": 24575, "train_loss": 3.1965017318725586, "lr": 7.481283520864363e-05, "tps": 58580, "wall": 27493.9} {"step": 24576, "train_loss": 3.21755313873291, "lr": 7.480151166096332e-05, "tps": 58572, "wall": 27499.0} {"step": 24577, "train_loss": 3.2603607177734375, "lr": 7.479018975809928e-05, "tps": 58563, "wall": 27504.0} {"step": 24578, "train_loss": 3.2053229808807373, "lr": 7.477886950017989e-05, "tps": 58555, "wall": 27509.1} {"step": 24579, "train_loss": 3.2542529106140137, "lr": 7.47675508873333e-05, "tps": 58547, "wall": 27514.1} {"step": 24580, "train_loss": 3.213331460952759, "lr": 7.475623391968772e-05, "tps": 58538, "wall": 27519.2} {"step": 24581, "train_loss": 3.2780208587646484, "lr": 7.474491859737143e-05, "tps": 58530, "wall": 27524.3} {"step": 24582, "train_loss": 3.1844794750213623, "lr": 7.473360492051256e-05, "tps": 58521, "wall": 27529.4} {"step": 24583, "train_loss": 3.293550491333008, "lr": 7.472229288923922e-05, "tps": 58513, "wall": 27534.4} {"step": 24584, "train_loss": 3.410538911819458, "lr": 7.471098250367965e-05, "tps": 58505, "wall": 27539.5} {"step": 24585, "train_loss": 3.2032995223999023, "lr": 7.46996737639619e-05, "tps": 58496, "wall": 27544.6} {"step": 24586, "train_loss": 3.2395458221435547, "lr": 7.468836667021413e-05, "tps": 58488, "wall": 27549.6} {"step": 24587, "train_loss": 3.296144485473633, "lr": 7.46770612225644e-05, "tps": 58480, "wall": 27554.7} {"step": 24588, "train_loss": 3.2346646785736084, "lr": 7.466575742114074e-05, "tps": 58471, "wall": 27559.8} {"step": 24589, "train_loss": 3.2638051509857178, "lr": 7.465445526607131e-05, "tps": 58463, "wall": 27564.9} {"step": 24590, "train_loss": 3.303718090057373, "lr": 7.464315475748407e-05, "tps": 58454, "wall": 27569.9} {"step": 24591, "train_loss": 3.235354423522949, "lr": 7.463185589550696e-05, "tps": 58446, "wall": 27575.0} {"step": 24592, "train_loss": 3.2156107425689697, "lr": 7.462055868026813e-05, "tps": 58437, "wall": 27580.2} {"step": 24593, "train_loss": 3.2071681022644043, "lr": 7.460926311189546e-05, "tps": 58429, "wall": 27585.3} {"step": 24594, "train_loss": 3.2782928943634033, "lr": 7.459796919051691e-05, "tps": 58421, "wall": 27590.4} {"step": 24595, "train_loss": 3.210015296936035, "lr": 7.458667691626044e-05, "tps": 58412, "wall": 27595.4} {"step": 24596, "train_loss": 3.2877209186553955, "lr": 7.457538628925396e-05, "tps": 58404, "wall": 27600.5} {"step": 24597, "train_loss": 3.18424654006958, "lr": 7.456409730962535e-05, "tps": 58396, "wall": 27605.5} {"step": 24598, "train_loss": 3.21875, "lr": 7.455280997750254e-05, "tps": 58387, "wall": 27610.6} {"step": 24599, "train_loss": 3.256692886352539, "lr": 7.454152429301336e-05, "tps": 58379, "wall": 27615.7} {"step": 24600, "train_loss": 3.2307119369506836, "lr": 7.453024025628563e-05, "tps": 58370, "wall": 27620.8} {"step": 24601, "train_loss": 3.2213473320007324, "lr": 7.451895786744725e-05, "tps": 58362, "wall": 27625.9} {"step": 24602, "train_loss": 3.187718629837036, "lr": 7.450767712662594e-05, "tps": 58354, "wall": 27630.9} {"step": 24603, "train_loss": 3.2072315216064453, "lr": 7.449639803394958e-05, "tps": 58345, "wall": 27636.0} {"step": 24604, "train_loss": 3.2862133979797363, "lr": 7.448512058954589e-05, "tps": 58337, "wall": 27641.1} {"step": 24605, "train_loss": 3.198984146118164, "lr": 7.447384479354258e-05, "tps": 58329, "wall": 27646.2} {"step": 24606, "train_loss": 3.1312384605407715, "lr": 7.44625706460675e-05, "tps": 58320, "wall": 27651.2} {"step": 24607, "train_loss": 3.1866979598999023, "lr": 7.445129814724827e-05, "tps": 58312, "wall": 27656.3} {"step": 24608, "train_loss": 3.144362688064575, "lr": 7.444002729721256e-05, "tps": 58304, "wall": 27661.4} {"step": 24609, "train_loss": 3.387698173522949, "lr": 7.442875809608816e-05, "tps": 58295, "wall": 27666.4} {"step": 24610, "train_loss": 3.2387571334838867, "lr": 7.441749054400266e-05, "tps": 58287, "wall": 27671.5} {"step": 24611, "train_loss": 3.3561742305755615, "lr": 7.440622464108364e-05, "tps": 58279, "wall": 27676.5} {"step": 24612, "train_loss": 3.2201180458068848, "lr": 7.439496038745886e-05, "tps": 58271, "wall": 27681.6} {"step": 24613, "train_loss": 3.2451260089874268, "lr": 7.438369778325581e-05, "tps": 58262, "wall": 27686.7} {"step": 24614, "train_loss": 3.1421003341674805, "lr": 7.437243682860207e-05, "tps": 58254, "wall": 27691.7} {"step": 24615, "train_loss": 3.200380325317383, "lr": 7.436117752362532e-05, "tps": 58246, "wall": 27696.8} {"step": 24616, "train_loss": 3.3228509426116943, "lr": 7.434991986845299e-05, "tps": 58237, "wall": 27701.9} {"step": 24617, "train_loss": 3.2917604446411133, "lr": 7.433866386321262e-05, "tps": 58229, "wall": 27706.9} {"step": 24618, "train_loss": 3.215120792388916, "lr": 7.432740950803178e-05, "tps": 58221, "wall": 27712.0} {"step": 24619, "train_loss": 3.186504364013672, "lr": 7.431615680303795e-05, "tps": 58213, "wall": 27717.0} {"step": 24620, "train_loss": 3.1916632652282715, "lr": 7.430490574835852e-05, "tps": 58204, "wall": 27722.1} {"step": 24621, "train_loss": 3.309960126876831, "lr": 7.429365634412105e-05, "tps": 58196, "wall": 27727.1} {"step": 24622, "train_loss": 3.2458529472351074, "lr": 7.428240859045287e-05, "tps": 58188, "wall": 27732.2} {"step": 24623, "train_loss": 3.0656661987304688, "lr": 7.42711624874815e-05, "tps": 58180, "wall": 27737.3} {"step": 24624, "train_loss": 3.1998789310455322, "lr": 7.425991803533427e-05, "tps": 58171, "wall": 27742.3} {"step": 24625, "train_loss": 3.17006254196167, "lr": 7.424867523413854e-05, "tps": 58163, "wall": 27747.4} {"step": 24626, "train_loss": 3.173616647720337, "lr": 7.423743408402175e-05, "tps": 58155, "wall": 27752.4} {"step": 24627, "train_loss": 3.264791965484619, "lr": 7.422619458511117e-05, "tps": 58146, "wall": 27757.6} {"step": 24628, "train_loss": 3.1885552406311035, "lr": 7.421495673753413e-05, "tps": 58138, "wall": 27762.7} {"step": 24629, "train_loss": 3.2284111976623535, "lr": 7.420372054141797e-05, "tps": 58130, "wall": 27767.7} {"step": 24630, "train_loss": 3.2482566833496094, "lr": 7.419248599688997e-05, "tps": 58122, "wall": 27772.8} {"step": 24631, "train_loss": 3.305173873901367, "lr": 7.41812531040773e-05, "tps": 58113, "wall": 27777.9} {"step": 24632, "train_loss": 3.1594972610473633, "lr": 7.417002186310737e-05, "tps": 58105, "wall": 27783.0} {"step": 24633, "train_loss": 3.1720073223114014, "lr": 7.41587922741073e-05, "tps": 58097, "wall": 27788.0} {"step": 24634, "train_loss": 3.3597753047943115, "lr": 7.414756433720428e-05, "tps": 58089, "wall": 27793.1} {"step": 24635, "train_loss": 3.1755542755126953, "lr": 7.413633805252558e-05, "tps": 58081, "wall": 27798.1} {"step": 24636, "train_loss": 3.1576735973358154, "lr": 7.412511342019835e-05, "tps": 58072, "wall": 27803.2} {"step": 24637, "train_loss": 3.252922773361206, "lr": 7.411389044034967e-05, "tps": 58064, "wall": 27808.2} {"step": 24638, "train_loss": 3.195549488067627, "lr": 7.410266911310678e-05, "tps": 58056, "wall": 27813.3} {"step": 24639, "train_loss": 3.2177162170410156, "lr": 7.409144943859668e-05, "tps": 58048, "wall": 27818.4} {"step": 24640, "train_loss": 3.2889368534088135, "lr": 7.40802314169466e-05, "tps": 58039, "wall": 27823.5} {"step": 24641, "train_loss": 3.2287797927856445, "lr": 7.406901504828357e-05, "tps": 58031, "wall": 27828.6} {"step": 24642, "train_loss": 3.25472092628479, "lr": 7.405780033273455e-05, "tps": 58023, "wall": 27833.7} {"step": 24643, "train_loss": 3.283151626586914, "lr": 7.404658727042674e-05, "tps": 58015, "wall": 27838.8} {"step": 24644, "train_loss": 3.2917704582214355, "lr": 7.403537586148705e-05, "tps": 58006, "wall": 27843.9} {"step": 24645, "train_loss": 3.245631217956543, "lr": 7.40241661060425e-05, "tps": 57998, "wall": 27848.9} {"step": 24646, "train_loss": 3.2778210639953613, "lr": 7.401295800422015e-05, "tps": 57990, "wall": 27854.0} {"step": 24647, "train_loss": 3.214643955230713, "lr": 7.400175155614688e-05, "tps": 57982, "wall": 27859.0} {"step": 24648, "train_loss": 3.2905683517456055, "lr": 7.399054676194963e-05, "tps": 57974, "wall": 27864.1} {"step": 24649, "train_loss": 3.2839503288269043, "lr": 7.397934362175543e-05, "tps": 57965, "wall": 27869.2} {"step": 24650, "train_loss": 3.2370004653930664, "lr": 7.396814213569112e-05, "tps": 57957, "wall": 27874.3} {"step": 24651, "train_loss": 3.3093533515930176, "lr": 7.395694230388353e-05, "tps": 57949, "wall": 27879.4} {"step": 24652, "train_loss": 3.2016351222991943, "lr": 7.394574412645965e-05, "tps": 57941, "wall": 27884.4} {"step": 24653, "train_loss": 3.192017078399658, "lr": 7.393454760354628e-05, "tps": 57933, "wall": 27889.5} {"step": 24654, "train_loss": 3.228391408920288, "lr": 7.392335273527021e-05, "tps": 57924, "wall": 27894.6} {"step": 24655, "train_loss": 3.3529162406921387, "lr": 7.391215952175837e-05, "tps": 57916, "wall": 27899.7} {"step": 24656, "train_loss": 3.1607179641723633, "lr": 7.390096796313744e-05, "tps": 57908, "wall": 27904.7} {"step": 24657, "train_loss": 3.2460293769836426, "lr": 7.388977805953428e-05, "tps": 57900, "wall": 27909.8} {"step": 24658, "train_loss": 3.2983310222625732, "lr": 7.387858981107563e-05, "tps": 57892, "wall": 27914.8} {"step": 24659, "train_loss": 3.296502113342285, "lr": 7.386740321788816e-05, "tps": 57884, "wall": 27919.9} {"step": 24660, "train_loss": 3.232741355895996, "lr": 7.38562182800987e-05, "tps": 57875, "wall": 27925.0} {"step": 24661, "train_loss": 3.224956750869751, "lr": 7.38450349978339e-05, "tps": 57867, "wall": 27930.0} {"step": 24662, "train_loss": 3.248133420944214, "lr": 7.383385337122042e-05, "tps": 57859, "wall": 27935.1} {"step": 24663, "train_loss": 3.3026952743530273, "lr": 7.382267340038501e-05, "tps": 57851, "wall": 27940.2} {"step": 24664, "train_loss": 3.1535184383392334, "lr": 7.381149508545424e-05, "tps": 57843, "wall": 27945.2} {"step": 24665, "train_loss": 3.2518982887268066, "lr": 7.380031842655474e-05, "tps": 57835, "wall": 27950.3} {"step": 24666, "train_loss": 3.2275795936584473, "lr": 7.378914342381317e-05, "tps": 57827, "wall": 27955.3} {"step": 24667, "train_loss": 3.253763198852539, "lr": 7.37779700773561e-05, "tps": 57819, "wall": 27960.4} {"step": 24668, "train_loss": 3.217313289642334, "lr": 7.376679838731005e-05, "tps": 57810, "wall": 27965.4} {"step": 24669, "train_loss": 3.227933883666992, "lr": 7.375562835380165e-05, "tps": 57802, "wall": 27970.5} {"step": 24670, "train_loss": 3.24092960357666, "lr": 7.374445997695742e-05, "tps": 57794, "wall": 27975.5} {"step": 24671, "train_loss": 3.2700212001800537, "lr": 7.373329325690381e-05, "tps": 57786, "wall": 27980.6} {"step": 24672, "train_loss": 3.2777624130249023, "lr": 7.372212819376742e-05, "tps": 57778, "wall": 27985.6} {"step": 24673, "train_loss": 3.213561773300171, "lr": 7.371096478767468e-05, "tps": 57770, "wall": 27990.7} {"step": 24674, "train_loss": 3.238610029220581, "lr": 7.369980303875199e-05, "tps": 57762, "wall": 27995.8} {"step": 24675, "train_loss": 3.2466559410095215, "lr": 7.368864294712587e-05, "tps": 57754, "wall": 28000.9} {"step": 24676, "train_loss": 3.2247259616851807, "lr": 7.367748451292271e-05, "tps": 57745, "wall": 28006.0} {"step": 24677, "train_loss": 3.2189064025878906, "lr": 7.366632773626893e-05, "tps": 57737, "wall": 28011.0} {"step": 24678, "train_loss": 3.1495563983917236, "lr": 7.365517261729094e-05, "tps": 57729, "wall": 28016.1} {"step": 24679, "train_loss": 3.3045225143432617, "lr": 7.364401915611501e-05, "tps": 57721, "wall": 28021.1} {"step": 24680, "train_loss": 3.2210493087768555, "lr": 7.36328673528676e-05, "tps": 57713, "wall": 28026.2} {"step": 24681, "train_loss": 3.3278074264526367, "lr": 7.362171720767497e-05, "tps": 57705, "wall": 28031.2} {"step": 24682, "train_loss": 3.1755027770996094, "lr": 7.361056872066341e-05, "tps": 57697, "wall": 28036.3} {"step": 24683, "train_loss": 3.3595261573791504, "lr": 7.35994218919593e-05, "tps": 57689, "wall": 28041.3} {"step": 24684, "train_loss": 3.296928882598877, "lr": 7.358827672168886e-05, "tps": 57681, "wall": 28046.4} {"step": 24685, "train_loss": 3.198704719543457, "lr": 7.357713320997828e-05, "tps": 57673, "wall": 28051.4} {"step": 24686, "train_loss": 3.2300620079040527, "lr": 7.356599135695392e-05, "tps": 57665, "wall": 28056.6} {"step": 24687, "train_loss": 3.242924690246582, "lr": 7.355485116274193e-05, "tps": 57657, "wall": 28061.6} {"step": 24688, "train_loss": 3.3426613807678223, "lr": 7.354371262746847e-05, "tps": 57649, "wall": 28066.7} {"step": 24689, "train_loss": 3.130904197692871, "lr": 7.353257575125978e-05, "tps": 57641, "wall": 28071.7} {"step": 24690, "train_loss": 3.158066987991333, "lr": 7.352144053424201e-05, "tps": 57632, "wall": 28076.8} {"step": 24691, "train_loss": 3.3116164207458496, "lr": 7.351030697654124e-05, "tps": 57624, "wall": 28081.9} {"step": 24692, "train_loss": 3.2324023246765137, "lr": 7.349917507828368e-05, "tps": 57616, "wall": 28086.9} {"step": 24693, "train_loss": 3.1286418437957764, "lr": 7.348804483959533e-05, "tps": 57608, "wall": 28092.0} {"step": 24694, "train_loss": 3.298274040222168, "lr": 7.34769162606024e-05, "tps": 57600, "wall": 28097.0} {"step": 24695, "train_loss": 3.244868040084839, "lr": 7.346578934143087e-05, "tps": 57592, "wall": 28102.1} {"step": 24696, "train_loss": 3.219952344894409, "lr": 7.345466408220679e-05, "tps": 57584, "wall": 28107.1} {"step": 24697, "train_loss": 3.1695170402526855, "lr": 7.344354048305621e-05, "tps": 57576, "wall": 28112.2} {"step": 24698, "train_loss": 3.2753422260284424, "lr": 7.343241854410517e-05, "tps": 57568, "wall": 28117.3} {"step": 24699, "train_loss": 3.283540725708008, "lr": 7.342129826547962e-05, "tps": 57560, "wall": 28122.4} {"step": 24700, "train_loss": 3.2881202697753906, "lr": 7.341017964730551e-05, "tps": 57552, "wall": 28127.5} {"step": 24701, "train_loss": 3.1758687496185303, "lr": 7.339906268970878e-05, "tps": 57544, "wall": 28132.6} {"step": 24702, "train_loss": 3.18746018409729, "lr": 7.338794739281545e-05, "tps": 57536, "wall": 28137.6} {"step": 24703, "train_loss": 3.1764543056488037, "lr": 7.337683375675137e-05, "tps": 57528, "wall": 28142.7} {"step": 24704, "train_loss": 3.163407564163208, "lr": 7.336572178164242e-05, "tps": 57520, "wall": 28147.7} {"step": 24705, "train_loss": 3.2099218368530273, "lr": 7.335461146761453e-05, "tps": 57512, "wall": 28152.8} {"step": 24706, "train_loss": 3.1022496223449707, "lr": 7.334350281479356e-05, "tps": 57504, "wall": 28157.8} {"step": 24707, "train_loss": 3.1605329513549805, "lr": 7.333239582330527e-05, "tps": 57496, "wall": 28162.9} {"step": 24708, "train_loss": 3.2172882556915283, "lr": 7.332129049327556e-05, "tps": 57488, "wall": 28168.0} {"step": 24709, "train_loss": 3.1959338188171387, "lr": 7.331018682483022e-05, "tps": 57480, "wall": 28173.0} {"step": 24710, "train_loss": 3.213703155517578, "lr": 7.329908481809498e-05, "tps": 57472, "wall": 28178.1} {"step": 24711, "train_loss": 3.197369337081909, "lr": 7.328798447319569e-05, "tps": 57464, "wall": 28183.2} {"step": 24712, "train_loss": 3.207815647125244, "lr": 7.327688579025805e-05, "tps": 57456, "wall": 28188.3} {"step": 24713, "train_loss": 3.2119603157043457, "lr": 7.326578876940772e-05, "tps": 57448, "wall": 28193.3} {"step": 24714, "train_loss": 3.190772294998169, "lr": 7.325469341077053e-05, "tps": 57440, "wall": 28198.4} {"step": 24715, "train_loss": 3.2514889240264893, "lr": 7.324359971447212e-05, "tps": 57432, "wall": 28203.5} {"step": 24716, "train_loss": 3.197826385498047, "lr": 7.32325076806381e-05, "tps": 57424, "wall": 28208.5} {"step": 24717, "train_loss": 3.2473113536834717, "lr": 7.322141730939423e-05, "tps": 57416, "wall": 28213.7} {"step": 24718, "train_loss": 3.3045196533203125, "lr": 7.321032860086603e-05, "tps": 57408, "wall": 28218.7} {"step": 24719, "train_loss": 3.2236781120300293, "lr": 7.319924155517918e-05, "tps": 57400, "wall": 28223.8} {"step": 24720, "train_loss": 3.20615291595459, "lr": 7.318815617245933e-05, "tps": 57392, "wall": 28228.8} {"step": 24721, "train_loss": 3.3143177032470703, "lr": 7.31770724528319e-05, "tps": 57384, "wall": 28233.9} {"step": 24722, "train_loss": 3.172109603881836, "lr": 7.316599039642258e-05, "tps": 57376, "wall": 28239.0} {"step": 24723, "train_loss": 3.3297038078308105, "lr": 7.315491000335687e-05, "tps": 57368, "wall": 28244.1} {"step": 24724, "train_loss": 3.1778829097747803, "lr": 7.314383127376025e-05, "tps": 57360, "wall": 28249.2} {"step": 24725, "train_loss": 3.1899943351745605, "lr": 7.31327542077583e-05, "tps": 57352, "wall": 28254.2} {"step": 24726, "train_loss": 3.2109460830688477, "lr": 7.312167880547645e-05, "tps": 57344, "wall": 28259.3} {"step": 24727, "train_loss": 3.173917531967163, "lr": 7.311060506704016e-05, "tps": 57336, "wall": 28264.4} {"step": 24728, "train_loss": 3.1373353004455566, "lr": 7.309953299257488e-05, "tps": 57328, "wall": 28269.4} {"step": 24729, "train_loss": 3.295884370803833, "lr": 7.308846258220604e-05, "tps": 57320, "wall": 28274.4} {"step": 24730, "train_loss": 3.2915563583374023, "lr": 7.3077393836059e-05, "tps": 57312, "wall": 28279.5} {"step": 24731, "train_loss": 3.202380657196045, "lr": 7.306632675425924e-05, "tps": 57304, "wall": 28284.5} {"step": 24732, "train_loss": 3.2233643531799316, "lr": 7.305526133693207e-05, "tps": 57296, "wall": 28289.6} {"step": 24733, "train_loss": 3.25665283203125, "lr": 7.304419758420284e-05, "tps": 57288, "wall": 28294.6} {"step": 24734, "train_loss": 3.2524523735046387, "lr": 7.303313549619691e-05, "tps": 57280, "wall": 28299.7} {"step": 24735, "train_loss": 3.2611608505249023, "lr": 7.302207507303952e-05, "tps": 57272, "wall": 28304.8} {"step": 24736, "train_loss": 3.3040566444396973, "lr": 7.301101631485608e-05, "tps": 57265, "wall": 28309.8} {"step": 24737, "train_loss": 3.14388370513916, "lr": 7.299995922177178e-05, "tps": 57257, "wall": 28314.9} {"step": 24738, "train_loss": 3.174677848815918, "lr": 7.298890379391183e-05, "tps": 57249, "wall": 28319.9} {"step": 24739, "train_loss": 3.1811628341674805, "lr": 7.297785003140163e-05, "tps": 57241, "wall": 28325.0} {"step": 24740, "train_loss": 3.2281296253204346, "lr": 7.296679793436626e-05, "tps": 57233, "wall": 28330.0} {"step": 24741, "train_loss": 3.334986686706543, "lr": 7.295574750293093e-05, "tps": 57225, "wall": 28335.1} {"step": 24742, "train_loss": 3.307831287384033, "lr": 7.294469873722089e-05, "tps": 57217, "wall": 28340.1} {"step": 24743, "train_loss": 3.268775463104248, "lr": 7.293365163736126e-05, "tps": 57209, "wall": 28345.2} {"step": 24744, "train_loss": 3.2352075576782227, "lr": 7.292260620347711e-05, "tps": 57201, "wall": 28350.2} {"step": 24745, "train_loss": 3.1646792888641357, "lr": 7.29115624356937e-05, "tps": 57194, "wall": 28355.3} {"step": 24746, "train_loss": 3.2287702560424805, "lr": 7.290052033413609e-05, "tps": 57186, "wall": 28360.4} {"step": 24747, "train_loss": 3.2010490894317627, "lr": 7.288947989892926e-05, "tps": 57178, "wall": 28365.5} {"step": 24748, "train_loss": 3.19693660736084, "lr": 7.287844113019841e-05, "tps": 57170, "wall": 28370.6} {"step": 24749, "train_loss": 3.124310255050659, "lr": 7.286740402806855e-05, "tps": 57162, "wall": 28375.7} {"step": 24750, "train_loss": 3.2726857662200928, "lr": 7.285636859266465e-05, "tps": 57154, "wall": 28380.7} {"step": 24751, "train_loss": 3.1980981826782227, "lr": 7.284533482411182e-05, "tps": 57146, "wall": 28385.8} {"step": 24752, "train_loss": 3.219466209411621, "lr": 7.283430272253495e-05, "tps": 57138, "wall": 28390.8} {"step": 24753, "train_loss": 3.3187437057495117, "lr": 7.28232722880591e-05, "tps": 57130, "wall": 28395.9} {"step": 24754, "train_loss": 3.2421622276306152, "lr": 7.281224352080917e-05, "tps": 57122, "wall": 28400.9} {"step": 24755, "train_loss": 3.1810173988342285, "lr": 7.280121642091009e-05, "tps": 57115, "wall": 28406.0} {"step": 24756, "train_loss": 3.281451463699341, "lr": 7.279019098848681e-05, "tps": 57107, "wall": 28411.0} {"step": 24757, "train_loss": 3.2097177505493164, "lr": 7.277916722366424e-05, "tps": 57099, "wall": 28416.1} {"step": 24758, "train_loss": 3.254371166229248, "lr": 7.276814512656718e-05, "tps": 57091, "wall": 28421.2} {"step": 24759, "train_loss": 3.157506227493286, "lr": 7.275712469732057e-05, "tps": 57083, "wall": 28426.2} {"step": 24760, "train_loss": 3.1629228591918945, "lr": 7.274610593604922e-05, "tps": 57075, "wall": 28431.3} {"step": 24761, "train_loss": 3.250577211380005, "lr": 7.273508884287788e-05, "tps": 57067, "wall": 28436.4} {"step": 24762, "train_loss": 3.1246790885925293, "lr": 7.272407341793149e-05, "tps": 57059, "wall": 28441.5} {"step": 24763, "train_loss": 3.2370476722717285, "lr": 7.271305966133478e-05, "tps": 57052, "wall": 28446.5} {"step": 24764, "train_loss": 3.2282540798187256, "lr": 7.270204757321241e-05, "tps": 57044, "wall": 28451.6} {"step": 24765, "train_loss": 3.11619234085083, "lr": 7.26910371536893e-05, "tps": 57036, "wall": 28456.7} {"step": 24766, "train_loss": 3.322288990020752, "lr": 7.268002840289008e-05, "tps": 57028, "wall": 28461.8} {"step": 24767, "train_loss": 3.180677652359009, "lr": 7.266902132093942e-05, "tps": 57020, "wall": 28466.8} {"step": 24768, "train_loss": 3.22542667388916, "lr": 7.265801590796209e-05, "tps": 57012, "wall": 28471.9} {"step": 24769, "train_loss": 3.1611592769622803, "lr": 7.264701216408274e-05, "tps": 57004, "wall": 28477.0} {"step": 24770, "train_loss": 3.187122106552124, "lr": 7.263601008942596e-05, "tps": 56997, "wall": 28482.0} {"step": 24771, "train_loss": 3.2821078300476074, "lr": 7.262500968411647e-05, "tps": 56989, "wall": 28487.1} {"step": 24772, "train_loss": 3.228430986404419, "lr": 7.26140109482788e-05, "tps": 56981, "wall": 28492.1} {"step": 24773, "train_loss": 3.3167572021484375, "lr": 7.260301388203763e-05, "tps": 56973, "wall": 28497.2} {"step": 24774, "train_loss": 3.262263536453247, "lr": 7.259201848551749e-05, "tps": 56965, "wall": 28502.2} {"step": 24775, "train_loss": 3.130066394805908, "lr": 7.258102475884291e-05, "tps": 56958, "wall": 28507.3} {"step": 24776, "train_loss": 3.2134320735931396, "lr": 7.257003270213849e-05, "tps": 56950, "wall": 28512.4} {"step": 24777, "train_loss": 3.201815128326416, "lr": 7.255904231552872e-05, "tps": 56942, "wall": 28517.4} {"step": 24778, "train_loss": 3.14337420463562, "lr": 7.254805359913805e-05, "tps": 56934, "wall": 28522.5} {"step": 24779, "train_loss": 3.135652542114258, "lr": 7.253706655309105e-05, "tps": 56926, "wall": 28527.6} {"step": 24780, "train_loss": 3.169837236404419, "lr": 7.252608117751214e-05, "tps": 56918, "wall": 28532.7} {"step": 24781, "train_loss": 3.25850248336792, "lr": 7.251509747252572e-05, "tps": 56910, "wall": 28537.8} {"step": 24782, "train_loss": 3.237196683883667, "lr": 7.25041154382563e-05, "tps": 56903, "wall": 28542.9} {"step": 24783, "train_loss": 3.2848124504089355, "lr": 7.24931350748282e-05, "tps": 56895, "wall": 28548.0} {"step": 24784, "train_loss": 3.205902576446533, "lr": 7.248215638236585e-05, "tps": 56887, "wall": 28553.0} {"step": 24785, "train_loss": 3.2827749252319336, "lr": 7.247117936099363e-05, "tps": 56879, "wall": 28558.1} {"step": 24786, "train_loss": 3.1659536361694336, "lr": 7.246020401083589e-05, "tps": 56871, "wall": 28563.2} {"step": 24787, "train_loss": 3.1423304080963135, "lr": 7.24492303320169e-05, "tps": 56864, "wall": 28568.2} {"step": 24788, "train_loss": 3.271848678588867, "lr": 7.243825832466102e-05, "tps": 56856, "wall": 28573.3} {"step": 24789, "train_loss": 3.2005276679992676, "lr": 7.242728798889253e-05, "tps": 56848, "wall": 28578.4} {"step": 24790, "train_loss": 3.2467637062072754, "lr": 7.241631932483573e-05, "tps": 56840, "wall": 28583.4} {"step": 24791, "train_loss": 3.3213958740234375, "lr": 7.240535233261485e-05, "tps": 56833, "wall": 28588.4} {"step": 24792, "train_loss": 3.2109599113464355, "lr": 7.239438701235409e-05, "tps": 56825, "wall": 28593.5} {"step": 24793, "train_loss": 3.103030204772949, "lr": 7.238342336417771e-05, "tps": 56817, "wall": 28598.6} {"step": 24794, "train_loss": 3.2752532958984375, "lr": 7.237246138820992e-05, "tps": 56809, "wall": 28603.7} {"step": 24795, "train_loss": 3.296041488647461, "lr": 7.236150108457483e-05, "tps": 56801, "wall": 28608.7} {"step": 24796, "train_loss": 3.2914557456970215, "lr": 7.235054245339669e-05, "tps": 56794, "wall": 28613.8} {"step": 24797, "train_loss": 3.1714725494384766, "lr": 7.23395854947996e-05, "tps": 56786, "wall": 28618.8} {"step": 24798, "train_loss": 3.2557249069213867, "lr": 7.23286302089076e-05, "tps": 56778, "wall": 28623.9} {"step": 24799, "train_loss": 3.2569808959960938, "lr": 7.231767659584494e-05, "tps": 56770, "wall": 28629.0} {"step": 24800, "train_loss": 3.2404770851135254, "lr": 7.230672465573563e-05, "tps": 56763, "wall": 28634.0} {"step": 24801, "train_loss": 3.239849805831909, "lr": 7.229577438870367e-05, "tps": 56755, "wall": 28639.1} {"step": 24802, "train_loss": 3.293203353881836, "lr": 7.228482579487321e-05, "tps": 56747, "wall": 28644.1} {"step": 24803, "train_loss": 3.197906017303467, "lr": 7.227387887436825e-05, "tps": 56739, "wall": 28649.2} {"step": 24804, "train_loss": 3.2522435188293457, "lr": 7.226293362731273e-05, "tps": 56732, "wall": 28654.3} {"step": 24805, "train_loss": 3.1921067237854004, "lr": 7.225199005383074e-05, "tps": 56724, "wall": 28659.4} {"step": 24806, "train_loss": 3.2560501098632812, "lr": 7.224104815404614e-05, "tps": 56716, "wall": 28664.4} {"step": 24807, "train_loss": 3.1658599376678467, "lr": 7.223010792808299e-05, "tps": 56708, "wall": 28669.5} {"step": 24808, "train_loss": 3.2002615928649902, "lr": 7.221916937606518e-05, "tps": 56701, "wall": 28674.6} {"step": 24809, "train_loss": 3.319654703140259, "lr": 7.220823249811657e-05, "tps": 56693, "wall": 28679.6} {"step": 24810, "train_loss": 3.2354273796081543, "lr": 7.219729729436113e-05, "tps": 56685, "wall": 28684.7} {"step": 24811, "train_loss": 3.321622848510742, "lr": 7.218636376492271e-05, "tps": 56678, "wall": 28689.7} {"step": 24812, "train_loss": 3.296682357788086, "lr": 7.217543190992514e-05, "tps": 56670, "wall": 28694.8} {"step": 24813, "train_loss": 3.27060604095459, "lr": 7.216450172949227e-05, "tps": 56662, "wall": 28699.8} {"step": 24814, "train_loss": 3.2450966835021973, "lr": 7.215357322374797e-05, "tps": 56655, "wall": 28704.8} {"step": 24815, "train_loss": 3.175593376159668, "lr": 7.214264639281592e-05, "tps": 56647, "wall": 28709.9} {"step": 24816, "train_loss": 3.1662309169769287, "lr": 7.213172123681999e-05, "tps": 56639, "wall": 28714.9} {"step": 24817, "train_loss": 3.3018691539764404, "lr": 7.212079775588397e-05, "tps": 56631, "wall": 28720.0} {"step": 24818, "train_loss": 3.185183525085449, "lr": 7.210987595013148e-05, "tps": 56624, "wall": 28725.1} {"step": 24819, "train_loss": 3.2550106048583984, "lr": 7.209895581968638e-05, "tps": 56616, "wall": 28730.2} {"step": 24820, "train_loss": 3.2374320030212402, "lr": 7.208803736467229e-05, "tps": 56608, "wall": 28735.3} {"step": 24821, "train_loss": 3.2900145053863525, "lr": 7.207712058521287e-05, "tps": 56601, "wall": 28740.3} {"step": 24822, "train_loss": 3.184530735015869, "lr": 7.20662054814319e-05, "tps": 56593, "wall": 28745.4} {"step": 24823, "train_loss": 3.2390387058258057, "lr": 7.205529205345294e-05, "tps": 56585, "wall": 28750.5} {"step": 24824, "train_loss": 3.24397611618042, "lr": 7.204438030139957e-05, "tps": 56578, "wall": 28755.5} {"step": 24825, "train_loss": 3.25219988822937, "lr": 7.203347022539553e-05, "tps": 56570, "wall": 28760.6} {"step": 24826, "train_loss": 3.3102567195892334, "lr": 7.202256182556431e-05, "tps": 56562, "wall": 28765.6} {"step": 24827, "train_loss": 3.204716682434082, "lr": 7.201165510202953e-05, "tps": 56555, "wall": 28770.7} {"step": 24828, "train_loss": 3.2585740089416504, "lr": 7.200075005491476e-05, "tps": 56547, "wall": 28775.8} {"step": 24829, "train_loss": 3.227684497833252, "lr": 7.198984668434344e-05, "tps": 56539, "wall": 28780.9} {"step": 24830, "train_loss": 3.2962257862091064, "lr": 7.197894499043919e-05, "tps": 56531, "wall": 28786.0} {"step": 24831, "train_loss": 3.1893906593322754, "lr": 7.196804497332546e-05, "tps": 56524, "wall": 28791.1} {"step": 24832, "train_loss": 3.269437074661255, "lr": 7.195714663312569e-05, "tps": 56516, "wall": 28796.2} {"step": 24833, "train_loss": 3.2737300395965576, "lr": 7.194624996996338e-05, "tps": 56508, "wall": 28801.2} {"step": 24834, "train_loss": 3.159529209136963, "lr": 7.1935354983962e-05, "tps": 56501, "wall": 28806.3} {"step": 24835, "train_loss": 3.2259411811828613, "lr": 7.192446167524487e-05, "tps": 56493, "wall": 28811.3} {"step": 24836, "train_loss": 3.3433260917663574, "lr": 7.191357004393549e-05, "tps": 56485, "wall": 28816.4} {"step": 24837, "train_loss": 3.258005142211914, "lr": 7.190268009015722e-05, "tps": 56478, "wall": 28821.4} {"step": 24838, "train_loss": 3.2279629707336426, "lr": 7.189179181403333e-05, "tps": 56470, "wall": 28826.5} {"step": 24839, "train_loss": 3.294970989227295, "lr": 7.188090521568729e-05, "tps": 56462, "wall": 28831.5} {"step": 24840, "train_loss": 3.231874942779541, "lr": 7.187002029524236e-05, "tps": 56455, "wall": 28836.7} {"step": 24841, "train_loss": 3.217603921890259, "lr": 7.185913705282181e-05, "tps": 56447, "wall": 28841.7} {"step": 24842, "train_loss": 3.183889627456665, "lr": 7.184825548854904e-05, "tps": 56439, "wall": 28846.8} {"step": 24843, "train_loss": 3.1689133644104004, "lr": 7.18373756025472e-05, "tps": 56432, "wall": 28851.9} {"step": 24844, "train_loss": 3.1370081901550293, "lr": 7.182649739493961e-05, "tps": 56424, "wall": 28856.9} {"step": 24845, "train_loss": 3.180325508117676, "lr": 7.181562086584947e-05, "tps": 56416, "wall": 28862.0} {"step": 24846, "train_loss": 3.295146942138672, "lr": 7.180474601539995e-05, "tps": 56409, "wall": 28867.1} {"step": 24847, "train_loss": 3.1671745777130127, "lr": 7.179387284371435e-05, "tps": 56401, "wall": 28872.1} {"step": 24848, "train_loss": 3.2016568183898926, "lr": 7.178300135091576e-05, "tps": 56394, "wall": 28877.2} {"step": 24849, "train_loss": 3.3464674949645996, "lr": 7.177213153712729e-05, "tps": 56386, "wall": 28882.2} {"step": 24850, "train_loss": 3.1953845024108887, "lr": 7.17612634024722e-05, "tps": 56379, "wall": 28887.3} {"step": 24851, "train_loss": 3.153533935546875, "lr": 7.175039694707353e-05, "tps": 56371, "wall": 28892.3} {"step": 24852, "train_loss": 3.1646320819854736, "lr": 7.173953217105435e-05, "tps": 56363, "wall": 28897.4} {"step": 24853, "train_loss": 3.1374826431274414, "lr": 7.172866907453779e-05, "tps": 56356, "wall": 28902.5} {"step": 24854, "train_loss": 3.193295478820801, "lr": 7.17178076576469e-05, "tps": 56348, "wall": 28907.5} {"step": 24855, "train_loss": 3.1689133644104004, "lr": 7.170694792050467e-05, "tps": 56340, "wall": 28912.6} {"step": 24856, "train_loss": 3.304058313369751, "lr": 7.169608986323419e-05, "tps": 56333, "wall": 28917.7} {"step": 24857, "train_loss": 3.313337802886963, "lr": 7.168523348595843e-05, "tps": 56325, "wall": 28922.7} {"step": 24858, "train_loss": 3.175400733947754, "lr": 7.167437878880034e-05, "tps": 56318, "wall": 28927.8} {"step": 24859, "train_loss": 3.2705087661743164, "lr": 7.166352577188293e-05, "tps": 56310, "wall": 28932.9} {"step": 24860, "train_loss": 3.126673698425293, "lr": 7.165267443532912e-05, "tps": 56302, "wall": 28938.0} {"step": 24861, "train_loss": 3.2071080207824707, "lr": 7.164182477926184e-05, "tps": 56295, "wall": 28943.0} {"step": 24862, "train_loss": 3.252455472946167, "lr": 7.163097680380401e-05, "tps": 56287, "wall": 28948.1} {"step": 24863, "train_loss": 3.2071008682250977, "lr": 7.162013050907846e-05, "tps": 56280, "wall": 28953.2} {"step": 24864, "train_loss": 3.1679258346557617, "lr": 7.160928589520815e-05, "tps": 56272, "wall": 28958.4} {"step": 24865, "train_loss": 3.305352210998535, "lr": 7.159844296231586e-05, "tps": 56264, "wall": 28963.5} {"step": 24866, "train_loss": 3.3205602169036865, "lr": 7.158760171052441e-05, "tps": 56257, "wall": 28968.5} {"step": 24867, "train_loss": 3.2359278202056885, "lr": 7.157676213995672e-05, "tps": 56249, "wall": 28973.6} {"step": 24868, "train_loss": 3.173675537109375, "lr": 7.15659242507354e-05, "tps": 56241, "wall": 28978.7} {"step": 24869, "train_loss": 3.198302984237671, "lr": 7.155508804298339e-05, "tps": 56234, "wall": 28983.8} {"step": 24870, "train_loss": 3.1303441524505615, "lr": 7.154425351682334e-05, "tps": 56226, "wall": 28988.9} {"step": 24871, "train_loss": 3.230247974395752, "lr": 7.153342067237798e-05, "tps": 56218, "wall": 28994.1} {"step": 24872, "train_loss": 3.2195162773132324, "lr": 7.152258950977011e-05, "tps": 56211, "wall": 28999.2} {"step": 24873, "train_loss": 3.2427785396575928, "lr": 7.151176002912241e-05, "tps": 56203, "wall": 29004.5} {"step": 24874, "train_loss": 3.1467068195343018, "lr": 7.150093223055745e-05, "tps": 56195, "wall": 29009.8} {"step": 24875, "train_loss": 3.2482187747955322, "lr": 7.1490106114198e-05, "tps": 56187, "wall": 29015.0} {"step": 24876, "train_loss": 3.209554672241211, "lr": 7.147928168016668e-05, "tps": 56179, "wall": 29020.2} {"step": 24877, "train_loss": 3.144805431365967, "lr": 7.146845892858605e-05, "tps": 56171, "wall": 29025.5} {"step": 24878, "train_loss": 3.27917218208313, "lr": 7.14576378595788e-05, "tps": 56163, "wall": 29030.5} {"step": 24879, "train_loss": 3.2881033420562744, "lr": 7.144681847326744e-05, "tps": 56156, "wall": 29035.7} {"step": 24880, "train_loss": 3.2400667667388916, "lr": 7.143600076977453e-05, "tps": 56148, "wall": 29040.9} {"step": 24881, "train_loss": 3.2440521717071533, "lr": 7.142518474922266e-05, "tps": 56140, "wall": 29046.0} {"step": 24882, "train_loss": 3.1613428592681885, "lr": 7.141437041173436e-05, "tps": 56133, "wall": 29051.1} {"step": 24883, "train_loss": 3.230257272720337, "lr": 7.140355775743206e-05, "tps": 56125, "wall": 29056.2} {"step": 24884, "train_loss": 3.2551703453063965, "lr": 7.139274678643835e-05, "tps": 56118, "wall": 29061.3} {"step": 24885, "train_loss": 3.153395175933838, "lr": 7.138193749887558e-05, "tps": 56110, "wall": 29066.4} {"step": 24886, "train_loss": 3.2439751625061035, "lr": 7.137112989486634e-05, "tps": 56102, "wall": 29071.6} {"step": 24887, "train_loss": 3.2195730209350586, "lr": 7.136032397453296e-05, "tps": 56094, "wall": 29076.8} {"step": 24888, "train_loss": 3.218719244003296, "lr": 7.134951973799782e-05, "tps": 56087, "wall": 29081.8} {"step": 24889, "train_loss": 3.1244330406188965, "lr": 7.133871718538341e-05, "tps": 56079, "wall": 29087.0} {"step": 24890, "train_loss": 3.146033763885498, "lr": 7.132791631681206e-05, "tps": 56072, "wall": 29092.1} {"step": 24891, "train_loss": 3.3256397247314453, "lr": 7.131711713240608e-05, "tps": 56064, "wall": 29097.4} {"step": 24892, "train_loss": 3.2941784858703613, "lr": 7.130631963228787e-05, "tps": 56055, "wall": 29103.1} {"step": 24893, "train_loss": 3.2085039615631104, "lr": 7.129552381657973e-05, "tps": 56047, "wall": 29108.5} {"step": 24894, "train_loss": 3.185488700866699, "lr": 7.128472968540387e-05, "tps": 56039, "wall": 29113.6} {"step": 24895, "train_loss": 3.2708911895751953, "lr": 7.127393723888272e-05, "tps": 56032, "wall": 29118.7} {"step": 24896, "train_loss": 3.193702220916748, "lr": 7.126314647713841e-05, "tps": 56024, "wall": 29123.8} {"step": 24897, "train_loss": 3.222843647003174, "lr": 7.125235740029321e-05, "tps": 56017, "wall": 29128.9} {"step": 24898, "train_loss": 3.363466739654541, "lr": 7.124157000846941e-05, "tps": 56009, "wall": 29134.0} {"step": 24899, "train_loss": 3.332890272140503, "lr": 7.123078430178912e-05, "tps": 56001, "wall": 29139.2} {"step": 24900, "train_loss": 3.180607795715332, "lr": 7.122000028037452e-05, "tps": 55994, "wall": 29144.3} {"step": 24901, "train_loss": 3.268655776977539, "lr": 7.120921794434785e-05, "tps": 55986, "wall": 29149.4} {"step": 24902, "train_loss": 3.236528158187866, "lr": 7.119843729383122e-05, "tps": 55978, "wall": 29155.0} {"step": 24903, "train_loss": 3.2234063148498535, "lr": 7.118765832894668e-05, "tps": 55970, "wall": 29160.1} {"step": 24904, "train_loss": 3.181309700012207, "lr": 7.117688104981646e-05, "tps": 55963, "wall": 29165.2} {"step": 24905, "train_loss": 3.186776638031006, "lr": 7.116610545656253e-05, "tps": 55955, "wall": 29170.3} {"step": 24906, "train_loss": 3.225663900375366, "lr": 7.115533154930704e-05, "tps": 55947, "wall": 29175.5} {"step": 24907, "train_loss": 3.201904773712158, "lr": 7.114455932817202e-05, "tps": 55940, "wall": 29180.6} {"step": 24908, "train_loss": 3.2171318531036377, "lr": 7.113378879327944e-05, "tps": 55932, "wall": 29185.7} {"step": 24909, "train_loss": 3.181487560272217, "lr": 7.112301994475139e-05, "tps": 55925, "wall": 29190.7} {"step": 24910, "train_loss": 3.2201383113861084, "lr": 7.111225278270984e-05, "tps": 55917, "wall": 29195.8} {"step": 24911, "train_loss": 3.231933355331421, "lr": 7.110148730727668e-05, "tps": 55910, "wall": 29201.0} {"step": 24912, "train_loss": 3.1422083377838135, "lr": 7.1090723518574e-05, "tps": 55902, "wall": 29206.4} {"step": 24913, "train_loss": 3.3210010528564453, "lr": 7.107996141672363e-05, "tps": 55894, "wall": 29211.6} {"step": 24914, "train_loss": 3.210353374481201, "lr": 7.106920100184747e-05, "tps": 55886, "wall": 29216.8} {"step": 24915, "train_loss": 3.2036752700805664, "lr": 7.105844227406753e-05, "tps": 55879, "wall": 29221.9} {"step": 24916, "train_loss": 3.1719586849212646, "lr": 7.10476852335056e-05, "tps": 55871, "wall": 29227.0} {"step": 24917, "train_loss": 3.260129451751709, "lr": 7.10369298802835e-05, "tps": 55863, "wall": 29232.2} {"step": 24918, "train_loss": 3.157534599304199, "lr": 7.102617621452316e-05, "tps": 55856, "wall": 29237.4} {"step": 24919, "train_loss": 3.1856422424316406, "lr": 7.101542423634637e-05, "tps": 55847, "wall": 29243.1} {"step": 24920, "train_loss": 3.191645383834839, "lr": 7.100467394587484e-05, "tps": 55839, "wall": 29248.3} {"step": 24921, "train_loss": 3.2652904987335205, "lr": 7.099392534323051e-05, "tps": 55832, "wall": 29253.4} {"step": 24922, "train_loss": 3.2756991386413574, "lr": 7.098317842853499e-05, "tps": 55824, "wall": 29258.7} {"step": 24923, "train_loss": 3.2815589904785156, "lr": 7.097243320191012e-05, "tps": 55817, "wall": 29263.8} {"step": 24924, "train_loss": 3.339906930923462, "lr": 7.09616896634776e-05, "tps": 55808, "wall": 29269.3} {"step": 24925, "train_loss": 3.2075600624084473, "lr": 7.095094781335909e-05, "tps": 55800, "wall": 29274.7} {"step": 24926, "train_loss": 3.2274155616760254, "lr": 7.094020765167634e-05, "tps": 55793, "wall": 29279.8} {"step": 24927, "train_loss": 3.2161121368408203, "lr": 7.092946917855096e-05, "tps": 55785, "wall": 29284.9} {"step": 24928, "train_loss": 3.177272081375122, "lr": 7.09187323941046e-05, "tps": 55778, "wall": 29290.0} {"step": 24929, "train_loss": 3.2265398502349854, "lr": 7.090799729845893e-05, "tps": 55770, "wall": 29295.1} {"step": 24930, "train_loss": 3.178089141845703, "lr": 7.089726389173557e-05, "tps": 55763, "wall": 29300.2} {"step": 24931, "train_loss": 3.226362943649292, "lr": 7.088653217405599e-05, "tps": 55755, "wall": 29305.3} {"step": 24932, "train_loss": 3.314281702041626, "lr": 7.087580214554189e-05, "tps": 55748, "wall": 29310.4} {"step": 24933, "train_loss": 3.174671173095703, "lr": 7.08650738063148e-05, "tps": 55741, "wall": 29315.4} {"step": 24934, "train_loss": 3.242177963256836, "lr": 7.085434715649615e-05, "tps": 55733, "wall": 29320.6} {"step": 24935, "train_loss": 3.1404364109039307, "lr": 7.084362219620757e-05, "tps": 55726, "wall": 29325.7} {"step": 24936, "train_loss": 3.078824043273926, "lr": 7.08328989255705e-05, "tps": 55718, "wall": 29330.8} {"step": 24937, "train_loss": 3.2334365844726562, "lr": 7.082217734470639e-05, "tps": 55711, "wall": 29335.8} {"step": 24938, "train_loss": 3.2302772998809814, "lr": 7.081145745373677e-05, "tps": 55703, "wall": 29340.9} {"step": 24939, "train_loss": 3.1485848426818848, "lr": 7.080073925278297e-05, "tps": 55696, "wall": 29346.0} {"step": 24940, "train_loss": 3.25986909866333, "lr": 7.079002274196653e-05, "tps": 55689, "wall": 29351.0} {"step": 24941, "train_loss": 3.321066379547119, "lr": 7.077930792140878e-05, "tps": 55681, "wall": 29356.1} {"step": 24942, "train_loss": 3.2620608806610107, "lr": 7.076859479123104e-05, "tps": 55674, "wall": 29361.2} {"step": 24943, "train_loss": 3.23728609085083, "lr": 7.07578833515548e-05, "tps": 55666, "wall": 29366.3} {"step": 24944, "train_loss": 3.2921078205108643, "lr": 7.074717360250134e-05, "tps": 55659, "wall": 29371.4} {"step": 24945, "train_loss": 3.2313098907470703, "lr": 7.073646554419191e-05, "tps": 55651, "wall": 29376.5} {"step": 24946, "train_loss": 3.274932861328125, "lr": 7.072575917674791e-05, "tps": 55644, "wall": 29381.7} {"step": 24947, "train_loss": 3.3278684616088867, "lr": 7.07150545002906e-05, "tps": 55637, "wall": 29386.7} {"step": 24948, "train_loss": 3.301954746246338, "lr": 7.070435151494117e-05, "tps": 55629, "wall": 29391.8} {"step": 24949, "train_loss": 3.200110912322998, "lr": 7.069365022082097e-05, "tps": 55622, "wall": 29396.9} {"step": 24950, "train_loss": 3.146608352661133, "lr": 7.06829506180512e-05, "tps": 55614, "wall": 29402.0} {"step": 24951, "train_loss": 3.2864644527435303, "lr": 7.067225270675297e-05, "tps": 55607, "wall": 29407.1} {"step": 24952, "train_loss": 3.3635151386260986, "lr": 7.06615564870476e-05, "tps": 55600, "wall": 29412.1} {"step": 24953, "train_loss": 3.1007957458496094, "lr": 7.06508619590562e-05, "tps": 55592, "wall": 29417.2} {"step": 24954, "train_loss": 3.3130431175231934, "lr": 7.064016912289986e-05, "tps": 55585, "wall": 29422.4} {"step": 24955, "train_loss": 3.2103934288024902, "lr": 7.062947797869984e-05, "tps": 55577, "wall": 29427.6} {"step": 24956, "train_loss": 3.1500275135040283, "lr": 7.061878852657713e-05, "tps": 55570, "wall": 29432.8} {"step": 24957, "train_loss": 3.1964712142944336, "lr": 7.060810076665283e-05, "tps": 55562, "wall": 29438.0} {"step": 24958, "train_loss": 3.1169373989105225, "lr": 7.05974146990481e-05, "tps": 55555, "wall": 29443.1} {"step": 24959, "train_loss": 3.1664247512817383, "lr": 7.058673032388389e-05, "tps": 55547, "wall": 29448.2} {"step": 24960, "train_loss": 3.3130016326904297, "lr": 7.057604764128134e-05, "tps": 55540, "wall": 29453.3} {"step": 24961, "train_loss": 3.2650256156921387, "lr": 7.05653666513614e-05, "tps": 55532, "wall": 29458.5} {"step": 24962, "train_loss": 3.1814658641815186, "lr": 7.055468735424502e-05, "tps": 55525, "wall": 29463.6} {"step": 24963, "train_loss": 3.255626678466797, "lr": 7.054400975005326e-05, "tps": 55517, "wall": 29468.7} {"step": 24964, "train_loss": 3.21177339553833, "lr": 7.053333383890705e-05, "tps": 55510, "wall": 29473.8} {"step": 24965, "train_loss": 3.1337623596191406, "lr": 7.05226596209273e-05, "tps": 55503, "wall": 29478.9} {"step": 24966, "train_loss": 3.3034896850585938, "lr": 7.051198709623497e-05, "tps": 55495, "wall": 29484.0} {"step": 24967, "train_loss": 3.186999797821045, "lr": 7.050131626495095e-05, "tps": 55488, "wall": 29489.1} {"step": 24968, "train_loss": 3.1380841732025146, "lr": 7.049064712719604e-05, "tps": 55480, "wall": 29494.2} {"step": 24969, "train_loss": 3.1856539249420166, "lr": 7.047997968309123e-05, "tps": 55473, "wall": 29499.4} {"step": 24970, "train_loss": 3.2804601192474365, "lr": 7.04693139327573e-05, "tps": 55465, "wall": 29504.6} {"step": 24971, "train_loss": 3.147542715072632, "lr": 7.045864987631503e-05, "tps": 55458, "wall": 29509.8} {"step": 24972, "train_loss": 3.1825246810913086, "lr": 7.044798751388529e-05, "tps": 55450, "wall": 29514.9} {"step": 24973, "train_loss": 3.2142603397369385, "lr": 7.043732684558886e-05, "tps": 55443, "wall": 29520.1} {"step": 24974, "train_loss": 3.2637457847595215, "lr": 7.042666787154642e-05, "tps": 55436, "wall": 29525.2} {"step": 24975, "train_loss": 3.203917980194092, "lr": 7.041601059187884e-05, "tps": 55428, "wall": 29530.4} {"step": 24976, "train_loss": 3.2036237716674805, "lr": 7.040535500670673e-05, "tps": 55420, "wall": 29535.6} {"step": 24977, "train_loss": 3.1840038299560547, "lr": 7.03947011161509e-05, "tps": 55413, "wall": 29540.9} {"step": 24978, "train_loss": 3.2603464126586914, "lr": 7.038404892033199e-05, "tps": 55405, "wall": 29546.0} {"step": 24979, "train_loss": 3.3227133750915527, "lr": 7.03733984193706e-05, "tps": 55398, "wall": 29551.1} {"step": 24980, "train_loss": 3.3029720783233643, "lr": 7.036274961338752e-05, "tps": 55391, "wall": 29556.2} {"step": 24981, "train_loss": 3.1768112182617188, "lr": 7.035210250250329e-05, "tps": 55383, "wall": 29561.4} {"step": 24982, "train_loss": 3.0550644397735596, "lr": 7.034145708683851e-05, "tps": 55376, "wall": 29566.5} {"step": 24983, "train_loss": 3.2604517936706543, "lr": 7.033081336651384e-05, "tps": 55369, "wall": 29571.6} {"step": 24984, "train_loss": 3.3477702140808105, "lr": 7.032017134164982e-05, "tps": 55361, "wall": 29576.7} {"step": 24985, "train_loss": 3.2820985317230225, "lr": 7.030953101236695e-05, "tps": 55354, "wall": 29581.7} {"step": 24986, "train_loss": 3.4109838008880615, "lr": 7.029889237878584e-05, "tps": 55347, "wall": 29586.8} {"step": 24987, "train_loss": 3.2364420890808105, "lr": 7.028825544102698e-05, "tps": 55339, "wall": 29591.9} {"step": 24988, "train_loss": 3.2714765071868896, "lr": 7.027762019921083e-05, "tps": 55332, "wall": 29596.9} {"step": 24989, "train_loss": 3.2171151638031006, "lr": 7.026698665345792e-05, "tps": 55325, "wall": 29602.0} {"step": 24990, "train_loss": 3.194431781768799, "lr": 7.02563548038887e-05, "tps": 55318, "wall": 29607.1} {"step": 24991, "train_loss": 3.2190561294555664, "lr": 7.024572465062355e-05, "tps": 55310, "wall": 29612.1} {"step": 24992, "train_loss": 3.262821674346924, "lr": 7.023509619378298e-05, "tps": 55303, "wall": 29617.3} {"step": 24993, "train_loss": 3.1220924854278564, "lr": 7.022446943348728e-05, "tps": 55296, "wall": 29622.3} {"step": 24994, "train_loss": 3.1543030738830566, "lr": 7.021384436985697e-05, "tps": 55289, "wall": 29627.4} {"step": 24995, "train_loss": 3.1458141803741455, "lr": 7.020322100301232e-05, "tps": 55281, "wall": 29632.6} {"step": 24996, "train_loss": 3.2369580268859863, "lr": 7.019259933307363e-05, "tps": 55274, "wall": 29637.6} {"step": 24997, "train_loss": 3.1599087715148926, "lr": 7.018197936016133e-05, "tps": 55267, "wall": 29642.7} {"step": 24998, "train_loss": 3.2656354904174805, "lr": 7.017136108439568e-05, "tps": 55259, "wall": 29647.8} {"step": 24999, "train_loss": 3.25594162940979, "lr": 7.016074450589691e-05, "tps": 55252, "wall": 29652.9} {"step": 25000, "train_loss": 3.2537295818328857, "lr": 7.015012962478538e-05, "tps": 55245, "wall": 29658.0, "val_loss_monitor": 3.310620700324692, "val_loss_full": 3.3284521606895385} {"step": 25001, "train_loss": 3.1257753372192383, "lr": 7.013951644118127e-05, "tps": 54915, "wall": 29837.4} {"step": 25001, "train_loss": 3.051631212234497, "lr": 7.013951644118127e-05, "tps": 337203753, "wall": 4.9} {"step": 25002, "train_loss": 3.06424880027771, "lr": 7.012890495520478e-05, "tps": 179272723, "wall": 9.1} {"step": 25003, "train_loss": 3.069453239440918, "lr": 7.011829516697624e-05, "tps": 121058175, "wall": 13.5} {"step": 25004, "train_loss": 3.135185480117798, "lr": 7.010768707661572e-05, "tps": 90712415, "wall": 18.1} {"step": 25005, "train_loss": 3.0167484283447266, "lr": 7.009708068424342e-05, "tps": 72255740, "wall": 22.7} {"step": 25006, "train_loss": 3.0370044708251953, "lr": 7.008647598997953e-05, "tps": 59834599, "wall": 27.4} {"step": 25007, "train_loss": 3.0378806591033936, "lr": 7.007587299394415e-05, "tps": 51037213, "wall": 32.1} {"step": 25008, "train_loss": 3.134516716003418, "lr": 7.006527169625734e-05, "tps": 44332896, "wall": 37.0} {"step": 25009, "train_loss": 3.113766670227051, "lr": 7.00546720970393e-05, "tps": 39103955, "wall": 41.9} {"step": 25010, "train_loss": 3.1338930130004883, "lr": 7.004407419641004e-05, "tps": 35537307, "wall": 46.1} {"step": 25011, "train_loss": 3.0322039127349854, "lr": 7.003347799448958e-05, "tps": 31884851, "wall": 51.4} {"step": 25012, "train_loss": 3.117138147354126, "lr": 7.002288349139806e-05, "tps": 29062394, "wall": 56.4} {"step": 25013, "train_loss": 2.9998562335968018, "lr": 7.001229068725535e-05, "tps": 26755394, "wall": 61.3} {"step": 25014, "train_loss": 3.0345706939697266, "lr": 7.000169958218157e-05, "tps": 24797303, "wall": 66.1} {"step": 25015, "train_loss": 3.1956894397735596, "lr": 6.999111017629668e-05, "tps": 23136388, "wall": 70.9} {"step": 25016, "train_loss": 3.1036295890808105, "lr": 6.998052246972053e-05, "tps": 21666753, "wall": 75.7} {"step": 25017, "train_loss": 3.036450147628784, "lr": 6.996993646257321e-05, "tps": 20378553, "wall": 80.5} {"step": 25018, "train_loss": 3.1304049491882324, "lr": 6.995935215497456e-05, "tps": 19235666, "wall": 85.2} {"step": 25019, "train_loss": 3.100078582763672, "lr": 6.994876954704443e-05, "tps": 18216344, "wall": 90.0} {"step": 25020, "train_loss": 3.086507797241211, "lr": 6.993818863890279e-05, "tps": 17302471, "wall": 94.8} {"step": 25021, "train_loss": 3.168142080307007, "lr": 6.99276094306695e-05, "tps": 16474024, "wall": 99.5} {"step": 25022, "train_loss": 3.154029130935669, "lr": 6.991703192246431e-05, "tps": 15718281, "wall": 104.3} {"step": 25023, "train_loss": 3.058382272720337, "lr": 6.990645611440713e-05, "tps": 15035457, "wall": 109.1} {"step": 25024, "train_loss": 3.0105812549591064, "lr": 6.989588200661775e-05, "tps": 14408008, "wall": 113.8} {"step": 25025, "train_loss": 3.0619723796844482, "lr": 6.98853095992159e-05, "tps": 13825145, "wall": 118.6} {"step": 25026, "train_loss": 2.92073917388916, "lr": 6.987473889232142e-05, "tps": 13281920, "wall": 123.5} {"step": 25027, "train_loss": 3.0550076961517334, "lr": 6.986416988605403e-05, "tps": 12792284, "wall": 128.2} {"step": 25028, "train_loss": 3.1654224395751953, "lr": 6.98536025805334e-05, "tps": 12335012, "wall": 133.0} {"step": 25029, "train_loss": 3.0569164752960205, "lr": 6.984303697587931e-05, "tps": 11899793, "wall": 137.8} {"step": 25030, "train_loss": 3.089665174484253, "lr": 6.98324730722114e-05, "tps": 11500121, "wall": 142.6} {"step": 25031, "train_loss": 3.0578126907348633, "lr": 6.98219108696494e-05, "tps": 11123126, "wall": 147.5} {"step": 25032, "train_loss": 3.113044500350952, "lr": 6.98113503683129e-05, "tps": 10768203, "wall": 152.4} {"step": 25033, "train_loss": 3.089240550994873, "lr": 6.980079156832151e-05, "tps": 10441069, "wall": 157.1} {"step": 25034, "train_loss": 2.9658145904541016, "lr": 6.979023446979492e-05, "tps": 10122505, "wall": 162.1} {"step": 25035, "train_loss": 3.1219139099121094, "lr": 6.977967907285267e-05, "tps": 9826457, "wall": 167.0} {"step": 25036, "train_loss": 3.0738167762756348, "lr": 6.976912537761438e-05, "tps": 9552184, "wall": 171.8} {"step": 25037, "train_loss": 3.1034045219421387, "lr": 6.975857338419953e-05, "tps": 9294963, "wall": 176.5} {"step": 25038, "train_loss": 3.0590901374816895, "lr": 6.974802309272768e-05, "tps": 9050756, "wall": 181.3} {"step": 25039, "train_loss": 3.028123378753662, "lr": 6.973747450331838e-05, "tps": 8812243, "wall": 186.2} {"step": 25040, "train_loss": 3.0426347255706787, "lr": 6.972692761609108e-05, "tps": 8592462, "wall": 191.0} {"step": 25041, "train_loss": 3.0500030517578125, "lr": 6.971638243116522e-05, "tps": 8382055, "wall": 195.8} {"step": 25042, "train_loss": 3.150172233581543, "lr": 6.97058389486604e-05, "tps": 8182293, "wall": 200.6} {"step": 25043, "train_loss": 2.9545607566833496, "lr": 6.969529716869594e-05, "tps": 7990473, "wall": 205.4} {"step": 25044, "train_loss": 3.1364941596984863, "lr": 6.968475709139124e-05, "tps": 7809629, "wall": 210.2} {"step": 25045, "train_loss": 2.99060320854187, "lr": 6.96742187168658e-05, "tps": 7635257, "wall": 215.0} {"step": 25046, "train_loss": 3.161797046661377, "lr": 6.966368204523894e-05, "tps": 7468333, "wall": 219.8} {"step": 25047, "train_loss": 2.92793869972229, "lr": 6.965314707662997e-05, "tps": 7309568, "wall": 224.6} {"step": 25048, "train_loss": 3.0938198566436768, "lr": 6.964261381115834e-05, "tps": 7156290, "wall": 229.4} {"step": 25049, "train_loss": 3.160306692123413, "lr": 6.96320822489433e-05, "tps": 7008633, "wall": 234.2} {"step": 25050, "train_loss": 3.0759530067443848, "lr": 6.962155239010413e-05, "tps": 6867234, "wall": 239.1} {"step": 25051, "train_loss": 2.9681437015533447, "lr": 6.961102423476018e-05, "tps": 6724584, "wall": 244.2} {"step": 25052, "train_loss": 3.103644847869873, "lr": 6.960049778303071e-05, "tps": 6587933, "wall": 249.2} {"step": 25053, "train_loss": 3.1223573684692383, "lr": 6.958997303503487e-05, "tps": 6459055, "wall": 254.2} {"step": 25054, "train_loss": 3.070856809616089, "lr": 6.957944999089201e-05, "tps": 6337301, "wall": 259.1} {"step": 25055, "train_loss": 3.0346391201019287, "lr": 6.956892865072122e-05, "tps": 6220633, "wall": 264.0} {"step": 25056, "train_loss": 3.008291482925415, "lr": 6.955840901464182e-05, "tps": 6107547, "wall": 268.9} {"step": 25057, "train_loss": 3.0955936908721924, "lr": 6.954789108277288e-05, "tps": 5998907, "wall": 273.8} {"step": 25058, "train_loss": 3.0991663932800293, "lr": 6.953737485523352e-05, "tps": 5892606, "wall": 278.7} {"step": 25059, "train_loss": 3.070774793624878, "lr": 6.952686033214297e-05, "tps": 5786675, "wall": 283.8} {"step": 25060, "train_loss": 3.186978816986084, "lr": 6.951634751362029e-05, "tps": 5686649, "wall": 288.8} {"step": 25061, "train_loss": 3.1104578971862793, "lr": 6.950583639978451e-05, "tps": 5590673, "wall": 293.8} {"step": 25062, "train_loss": 3.0665383338928223, "lr": 6.949532699075481e-05, "tps": 5496159, "wall": 298.9} {"step": 25063, "train_loss": 3.1302971839904785, "lr": 6.948481928665019e-05, "tps": 5405679, "wall": 303.9} {"step": 25064, "train_loss": 3.06844425201416, "lr": 6.947431328758962e-05, "tps": 5318038, "wall": 308.9} {"step": 25065, "train_loss": 3.085980176925659, "lr": 6.946380899369224e-05, "tps": 5233762, "wall": 313.9} {"step": 25066, "train_loss": 3.1334900856018066, "lr": 6.945330640507697e-05, "tps": 5156472, "wall": 318.6} {"step": 25067, "train_loss": 3.166726589202881, "lr": 6.944280552186273e-05, "tps": 5081643, "wall": 323.3} {"step": 25068, "train_loss": 3.048798084259033, "lr": 6.94323063441686e-05, "tps": 5008819, "wall": 328.0} {"step": 25069, "train_loss": 2.9668099880218506, "lr": 6.942180887211341e-05, "tps": 4938097, "wall": 332.7} {"step": 25070, "train_loss": 3.1712000370025635, "lr": 6.941131310581611e-05, "tps": 4869272, "wall": 337.4} {"step": 25071, "train_loss": 3.0891048908233643, "lr": 6.940081904539564e-05, "tps": 4802134, "wall": 342.2} {"step": 25072, "train_loss": 3.045480728149414, "lr": 6.939032669097077e-05, "tps": 4737065, "wall": 346.9} {"step": 25073, "train_loss": 3.0913896560668945, "lr": 6.937983604266049e-05, "tps": 4673696, "wall": 351.6} {"step": 25074, "train_loss": 3.008897304534912, "lr": 6.936934710058358e-05, "tps": 4612019, "wall": 356.3} {"step": 25075, "train_loss": 3.0736093521118164, "lr": 6.935885986485881e-05, "tps": 4551829, "wall": 361.0} {"step": 25076, "train_loss": 3.1193466186523438, "lr": 6.934837433560506e-05, "tps": 4492487, "wall": 365.8} {"step": 25077, "train_loss": 3.0973217487335205, "lr": 6.933789051294109e-05, "tps": 4435635, "wall": 370.5} {"step": 25078, "train_loss": 3.0873045921325684, "lr": 6.932740839698558e-05, "tps": 4379999, "wall": 375.2} {"step": 25079, "train_loss": 3.1939961910247803, "lr": 6.93169279878574e-05, "tps": 4325628, "wall": 380.0} {"step": 25080, "train_loss": 3.0255465507507324, "lr": 6.930644928567521e-05, "tps": 4272654, "wall": 384.7} {"step": 25081, "train_loss": 3.1071629524230957, "lr": 6.929597229055767e-05, "tps": 4220955, "wall": 389.4} {"step": 25082, "train_loss": 3.067563056945801, "lr": 6.928549700262354e-05, "tps": 4170504, "wall": 394.2} {"step": 25083, "train_loss": 3.040358781814575, "lr": 6.927502342199148e-05, "tps": 4121300, "wall": 398.9} {"step": 25084, "train_loss": 3.0575942993164062, "lr": 6.926455154878004e-05, "tps": 4073088, "wall": 403.6} {"step": 25085, "train_loss": 3.1270251274108887, "lr": 6.925408138310799e-05, "tps": 4025016, "wall": 408.5} {"step": 25086, "train_loss": 3.084686279296875, "lr": 6.924361292509382e-05, "tps": 3979013, "wall": 413.2} {"step": 25087, "train_loss": 3.0575063228607178, "lr": 6.923314617485612e-05, "tps": 3933975, "wall": 417.9} {"step": 25088, "train_loss": 3.0857901573181152, "lr": 6.922268113251357e-05, "tps": 3889837, "wall": 422.7} {"step": 25089, "train_loss": 3.084001064300537, "lr": 6.921221779818464e-05, "tps": 3846065, "wall": 427.5} {"step": 25090, "train_loss": 3.0541396141052246, "lr": 6.920175617198781e-05, "tps": 3803290, "wall": 432.4} {"step": 25091, "train_loss": 2.9976677894592285, "lr": 6.919129625404169e-05, "tps": 3761461, "wall": 437.2} {"step": 25092, "train_loss": 3.1208770275115967, "lr": 6.918083804446467e-05, "tps": 3720624, "wall": 442.0} {"step": 25093, "train_loss": 3.0944721698760986, "lr": 6.917038154337533e-05, "tps": 3681046, "wall": 446.8} {"step": 25094, "train_loss": 3.109039545059204, "lr": 6.915992675089207e-05, "tps": 3642905, "wall": 451.5} {"step": 25095, "train_loss": 3.0204923152923584, "lr": 6.914947366713326e-05, "tps": 3604820, "wall": 456.2} {"step": 25096, "train_loss": 3.0707311630249023, "lr": 6.913902229221745e-05, "tps": 3567574, "wall": 461.0} {"step": 25097, "train_loss": 3.0768637657165527, "lr": 6.912857262626293e-05, "tps": 3531117, "wall": 465.8} {"step": 25098, "train_loss": 3.1322438716888428, "lr": 6.911812466938808e-05, "tps": 3495464, "wall": 470.6} {"step": 25099, "train_loss": 3.141396999359131, "lr": 6.910767842171129e-05, "tps": 3460772, "wall": 475.3} {"step": 25100, "train_loss": 3.0627810955047607, "lr": 6.909723388335088e-05, "tps": 3426969, "wall": 480.0} {"step": 25101, "train_loss": 2.945746421813965, "lr": 6.908679105442515e-05, "tps": 3393395, "wall": 484.8} {"step": 25102, "train_loss": 3.004844903945923, "lr": 6.907634993505245e-05, "tps": 3360703, "wall": 489.5} {"step": 25103, "train_loss": 3.023461103439331, "lr": 6.906591052535103e-05, "tps": 3328699, "wall": 494.3} {"step": 25104, "train_loss": 2.988201856613159, "lr": 6.905547282543909e-05, "tps": 3297209, "wall": 499.0} {"step": 25105, "train_loss": 3.02331280708313, "lr": 6.904503683543496e-05, "tps": 3266062, "wall": 503.8} {"step": 25106, "train_loss": 3.110567808151245, "lr": 6.903460255545681e-05, "tps": 3235929, "wall": 508.5} {"step": 25107, "train_loss": 2.9796717166900635, "lr": 6.902416998562282e-05, "tps": 3206240, "wall": 513.2} {"step": 25108, "train_loss": 3.16320538520813, "lr": 6.901373912605124e-05, "tps": 3176990, "wall": 518.0} {"step": 25109, "train_loss": 3.0366694927215576, "lr": 6.900330997686017e-05, "tps": 3148373, "wall": 522.7} {"step": 25110, "train_loss": 3.0374596118927, "lr": 6.899288253816778e-05, "tps": 3120317, "wall": 527.4} {"step": 25111, "train_loss": 3.019996404647827, "lr": 6.89824568100922e-05, "tps": 3092550, "wall": 532.2} {"step": 25112, "train_loss": 3.039121389389038, "lr": 6.89720327927515e-05, "tps": 3065271, "wall": 536.9} {"step": 25113, "train_loss": 3.056792974472046, "lr": 6.896161048626379e-05, "tps": 3038399, "wall": 541.7} {"step": 25114, "train_loss": 3.049159049987793, "lr": 6.895118989074715e-05, "tps": 3011928, "wall": 546.5} {"step": 25115, "train_loss": 3.073882818222046, "lr": 6.894077100631954e-05, "tps": 2986143, "wall": 551.2} {"step": 25116, "train_loss": 3.0728507041931152, "lr": 6.89303538330991e-05, "tps": 2960582, "wall": 556.0} {"step": 25117, "train_loss": 3.064059257507324, "lr": 6.891993837120379e-05, "tps": 2935170, "wall": 560.8} {"step": 25118, "train_loss": 3.000065565109253, "lr": 6.890952462075156e-05, "tps": 2909706, "wall": 565.8} {"step": 25119, "train_loss": 3.133659839630127, "lr": 6.889911258186041e-05, "tps": 2885296, "wall": 570.6} {"step": 25120, "train_loss": 3.1271560192108154, "lr": 6.888870225464832e-05, "tps": 2861636, "wall": 575.3} {"step": 25121, "train_loss": 3.049471378326416, "lr": 6.887829363923315e-05, "tps": 2838378, "wall": 580.0} {"step": 25122, "train_loss": 3.1050355434417725, "lr": 6.886788673573287e-05, "tps": 2815446, "wall": 584.8} {"step": 25123, "train_loss": 3.058985710144043, "lr": 6.885748154426534e-05, "tps": 2792939, "wall": 589.5} {"step": 25124, "train_loss": 3.042649507522583, "lr": 6.884707806494844e-05, "tps": 2770784, "wall": 594.3} {"step": 25125, "train_loss": 3.057232141494751, "lr": 6.883667629790001e-05, "tps": 2748983, "wall": 599.0} {"step": 25126, "train_loss": 2.994152069091797, "lr": 6.882627624323785e-05, "tps": 2726979, "wall": 603.9} {"step": 25127, "train_loss": 3.111875295639038, "lr": 6.881587790107986e-05, "tps": 2705835, "wall": 608.6} {"step": 25128, "train_loss": 3.078303098678589, "lr": 6.880548127154378e-05, "tps": 2685058, "wall": 613.3} {"step": 25129, "train_loss": 3.0623250007629395, "lr": 6.879508635474738e-05, "tps": 2664614, "wall": 618.1} {"step": 25130, "train_loss": 3.0810675621032715, "lr": 6.878469315080842e-05, "tps": 2644467, "wall": 622.8} {"step": 25131, "train_loss": 3.0459799766540527, "lr": 6.877430165984465e-05, "tps": 2624610, "wall": 627.5} {"step": 25132, "train_loss": 3.146461248397827, "lr": 6.876391188197374e-05, "tps": 2605074, "wall": 632.3} {"step": 25133, "train_loss": 2.965791940689087, "lr": 6.875352381731344e-05, "tps": 2585822, "wall": 637.0} {"step": 25134, "train_loss": 2.9656200408935547, "lr": 6.874313746598142e-05, "tps": 2566825, "wall": 641.7} {"step": 25135, "train_loss": 2.9524729251861572, "lr": 6.873275282809528e-05, "tps": 2548150, "wall": 646.5} {"step": 25136, "train_loss": 3.186056613922119, "lr": 6.872236990377273e-05, "tps": 2529746, "wall": 651.2} {"step": 25137, "train_loss": 3.0792150497436523, "lr": 6.871198869313138e-05, "tps": 2511596, "wall": 655.9} {"step": 25138, "train_loss": 2.978832483291626, "lr": 6.870160919628876e-05, "tps": 2493691, "wall": 660.7} {"step": 25139, "train_loss": 3.186760663986206, "lr": 6.869123141336251e-05, "tps": 2475794, "wall": 665.5} {"step": 25140, "train_loss": 2.973386287689209, "lr": 6.868085534447019e-05, "tps": 2458393, "wall": 670.2} {"step": 25141, "train_loss": 3.083817958831787, "lr": 6.86704809897293e-05, "tps": 2441253, "wall": 674.9} {"step": 25142, "train_loss": 3.0404515266418457, "lr": 6.866010834925742e-05, "tps": 2424382, "wall": 679.7} {"step": 25143, "train_loss": 3.113703966140747, "lr": 6.864973742317202e-05, "tps": 2407734, "wall": 684.4} {"step": 25144, "train_loss": 3.181278705596924, "lr": 6.863936821159054e-05, "tps": 2391200, "wall": 689.2} {"step": 25145, "train_loss": 3.07961368560791, "lr": 6.862900071463053e-05, "tps": 2374944, "wall": 693.9} {"step": 25146, "train_loss": 2.989957809448242, "lr": 6.861863493240934e-05, "tps": 2358921, "wall": 698.6} {"step": 25147, "train_loss": 3.054617166519165, "lr": 6.860827086504448e-05, "tps": 2343148, "wall": 703.4} {"step": 25148, "train_loss": 3.0920090675354004, "lr": 6.859790851265335e-05, "tps": 2327582, "wall": 708.1} {"step": 25149, "train_loss": 3.0886764526367188, "lr": 6.858754787535324e-05, "tps": 2312221, "wall": 712.8} {"step": 25150, "train_loss": 2.9406135082244873, "lr": 6.857718895326161e-05, "tps": 2297027, "wall": 717.6} {"step": 25151, "train_loss": 3.0359954833984375, "lr": 6.856683174649577e-05, "tps": 2282072, "wall": 722.3} {"step": 25152, "train_loss": 3.07197642326355, "lr": 6.855647625517303e-05, "tps": 2267092, "wall": 727.1} {"step": 25153, "train_loss": 3.1184253692626953, "lr": 6.854612247941077e-05, "tps": 2252525, "wall": 731.8} {"step": 25154, "train_loss": 3.05381178855896, "lr": 6.853577041932622e-05, "tps": 2238122, "wall": 736.6} {"step": 25155, "train_loss": 2.996117115020752, "lr": 6.85254200750366e-05, "tps": 2223846, "wall": 741.3} {"step": 25156, "train_loss": 3.0516419410705566, "lr": 6.851507144665928e-05, "tps": 2209838, "wall": 746.1} {"step": 25157, "train_loss": 3.0385398864746094, "lr": 6.85047245343114e-05, "tps": 2195928, "wall": 750.8} {"step": 25158, "train_loss": 3.103001117706299, "lr": 6.849437933811017e-05, "tps": 2182211, "wall": 755.6} {"step": 25159, "train_loss": 3.0133726596832275, "lr": 6.848403585817284e-05, "tps": 2168688, "wall": 760.3} {"step": 25160, "train_loss": 3.0769753456115723, "lr": 6.847369409461657e-05, "tps": 2155341, "wall": 765.1} {"step": 25161, "train_loss": 3.195312261581421, "lr": 6.846335404755844e-05, "tps": 2142168, "wall": 769.8} {"step": 25162, "train_loss": 2.9651105403900146, "lr": 6.845301571711567e-05, "tps": 2129171, "wall": 774.5} {"step": 25163, "train_loss": 3.090414047241211, "lr": 6.844267910340527e-05, "tps": 2116299, "wall": 779.3} {"step": 25164, "train_loss": 3.006957530975342, "lr": 6.843234420654449e-05, "tps": 2103384, "wall": 784.1} {"step": 25165, "train_loss": 3.0565876960754395, "lr": 6.842201102665029e-05, "tps": 2090852, "wall": 788.8} {"step": 25166, "train_loss": 3.169420003890991, "lr": 6.841167956383971e-05, "tps": 2078451, "wall": 793.5} {"step": 25167, "train_loss": 2.941768169403076, "lr": 6.840134981822986e-05, "tps": 2066149, "wall": 798.3} {"step": 25168, "train_loss": 2.944395065307617, "lr": 6.839102178993772e-05, "tps": 2053979, "wall": 803.1} {"step": 25169, "train_loss": 2.992830276489258, "lr": 6.838069547908026e-05, "tps": 2041966, "wall": 807.8} {"step": 25170, "train_loss": 3.0748186111450195, "lr": 6.837037088577451e-05, "tps": 2030192, "wall": 812.5} {"step": 25171, "train_loss": 3.0853424072265625, "lr": 6.836004801013741e-05, "tps": 2018507, "wall": 817.3} {"step": 25172, "train_loss": 3.1417436599731445, "lr": 6.834972685228583e-05, "tps": 2006949, "wall": 822.0} {"step": 25173, "train_loss": 2.965609550476074, "lr": 6.833940741233682e-05, "tps": 1995325, "wall": 826.8} {"step": 25174, "train_loss": 3.0666918754577637, "lr": 6.832908969040719e-05, "tps": 1984003, "wall": 831.6} {"step": 25175, "train_loss": 3.182011604309082, "lr": 6.831877368661382e-05, "tps": 1972846, "wall": 836.3} {"step": 25176, "train_loss": 3.0482044219970703, "lr": 6.830845940107359e-05, "tps": 1961799, "wall": 841.1} {"step": 25177, "train_loss": 3.0757412910461426, "lr": 6.829814683390337e-05, "tps": 1950762, "wall": 845.9} {"step": 25178, "train_loss": 3.056798219680786, "lr": 6.828783598521988e-05, "tps": 1939950, "wall": 850.6} {"step": 25179, "train_loss": 3.0380778312683105, "lr": 6.827752685514006e-05, "tps": 1929265, "wall": 855.3} {"step": 25180, "train_loss": 2.9866843223571777, "lr": 6.826721944378056e-05, "tps": 1918740, "wall": 860.1} {"step": 25181, "train_loss": 3.145754337310791, "lr": 6.825691375125827e-05, "tps": 1908318, "wall": 864.8} {"step": 25182, "train_loss": 2.9780380725860596, "lr": 6.824660977768985e-05, "tps": 1898011, "wall": 869.5} {"step": 25183, "train_loss": 3.1264798641204834, "lr": 6.823630752319201e-05, "tps": 1887804, "wall": 874.3} {"step": 25184, "train_loss": 3.0598530769348145, "lr": 6.822600698788154e-05, "tps": 1877713, "wall": 879.0} {"step": 25185, "train_loss": 3.096553325653076, "lr": 6.821570817187506e-05, "tps": 1867704, "wall": 883.8} {"step": 25186, "train_loss": 3.1216511726379395, "lr": 6.820541107528922e-05, "tps": 1857801, "wall": 888.5} {"step": 25187, "train_loss": 3.116339683532715, "lr": 6.819511569824074e-05, "tps": 1848023, "wall": 893.2} {"step": 25188, "train_loss": 3.1256043910980225, "lr": 6.818482204084617e-05, "tps": 1838353, "wall": 898.0} {"step": 25189, "train_loss": 3.063476085662842, "lr": 6.817453010322212e-05, "tps": 1828760, "wall": 902.7} {"step": 25190, "train_loss": 2.9394688606262207, "lr": 6.816423988548528e-05, "tps": 1819213, "wall": 907.5} {"step": 25191, "train_loss": 3.168572425842285, "lr": 6.815395138775212e-05, "tps": 1809866, "wall": 912.2} {"step": 25192, "train_loss": 2.982708692550659, "lr": 6.814366461013917e-05, "tps": 1800606, "wall": 916.9} {"step": 25193, "train_loss": 2.9355013370513916, "lr": 6.813337955276305e-05, "tps": 1791439, "wall": 921.7} {"step": 25194, "train_loss": 3.0300886631011963, "lr": 6.812309621574021e-05, "tps": 1782354, "wall": 926.4} {"step": 25195, "train_loss": 3.049360752105713, "lr": 6.811281459918712e-05, "tps": 1773356, "wall": 931.1} {"step": 25196, "train_loss": 3.1055750846862793, "lr": 6.810253470322035e-05, "tps": 1764446, "wall": 935.9} {"step": 25197, "train_loss": 2.9662206172943115, "lr": 6.809225652795625e-05, "tps": 1755650, "wall": 940.6} {"step": 25198, "train_loss": 3.035776138305664, "lr": 6.808198007351125e-05, "tps": 1746909, "wall": 945.4} {"step": 25199, "train_loss": 3.1103968620300293, "lr": 6.807170534000185e-05, "tps": 1738265, "wall": 950.1} {"step": 25200, "train_loss": 3.113583564758301, "lr": 6.806143232754434e-05, "tps": 1729606, "wall": 954.9} {"step": 25201, "train_loss": 3.1339054107666016, "lr": 6.80511610362552e-05, "tps": 1721002, "wall": 959.7} {"step": 25202, "train_loss": 3.0621986389160156, "lr": 6.80408914662507e-05, "tps": 1712286, "wall": 964.6} {"step": 25203, "train_loss": 3.060598373413086, "lr": 6.803062361764718e-05, "tps": 1703979, "wall": 969.4} {"step": 25204, "train_loss": 2.9807631969451904, "lr": 6.802035749056107e-05, "tps": 1695737, "wall": 974.1} {"step": 25205, "train_loss": 2.9957780838012695, "lr": 6.801009308510848e-05, "tps": 1687520, "wall": 978.9} {"step": 25206, "train_loss": 3.0764455795288086, "lr": 6.799983040140581e-05, "tps": 1679446, "wall": 983.6} {"step": 25207, "train_loss": 3.016633987426758, "lr": 6.798956943956929e-05, "tps": 1671453, "wall": 988.4} {"step": 25208, "train_loss": 2.9491896629333496, "lr": 6.797931019971512e-05, "tps": 1663536, "wall": 993.1} {"step": 25209, "train_loss": 3.0530173778533936, "lr": 6.796905268195958e-05, "tps": 1655548, "wall": 998.0} {"step": 25210, "train_loss": 2.9780945777893066, "lr": 6.795879688641882e-05, "tps": 1647659, "wall": 1002.8} {"step": 25211, "train_loss": 3.003575325012207, "lr": 6.794854281320902e-05, "tps": 1639838, "wall": 1007.6} {"step": 25212, "train_loss": 2.9858293533325195, "lr": 6.79382904624464e-05, "tps": 1632021, "wall": 1012.5} {"step": 25213, "train_loss": 3.0672779083251953, "lr": 6.792803983424702e-05, "tps": 1624331, "wall": 1017.3} {"step": 25214, "train_loss": 3.044867992401123, "lr": 6.7917790928727e-05, "tps": 1616757, "wall": 1022.1} {"step": 25215, "train_loss": 3.1129467487335205, "lr": 6.790754374600254e-05, "tps": 1608969, "wall": 1027.1} {"step": 25216, "train_loss": 3.0763893127441406, "lr": 6.789729828618963e-05, "tps": 1601509, "wall": 1031.9} {"step": 25217, "train_loss": 3.032412052154541, "lr": 6.78870545494043e-05, "tps": 1594151, "wall": 1036.7} {"step": 25218, "train_loss": 3.020155191421509, "lr": 6.78768125357627e-05, "tps": 1585211, "wall": 1042.6} {"step": 25219, "train_loss": 3.007349729537964, "lr": 6.78665722453808e-05, "tps": 1577787, "wall": 1047.6} {"step": 25220, "train_loss": 3.1049482822418213, "lr": 6.785633367837456e-05, "tps": 1570668, "wall": 1052.3} {"step": 25221, "train_loss": 3.0749778747558594, "lr": 6.784609683486005e-05, "tps": 1563660, "wall": 1057.1} {"step": 25222, "train_loss": 3.1226401329040527, "lr": 6.783586171495313e-05, "tps": 1556553, "wall": 1062.0} {"step": 25223, "train_loss": 3.0483014583587646, "lr": 6.782562831876985e-05, "tps": 1549798, "wall": 1066.6} {"step": 25224, "train_loss": 3.0741546154022217, "lr": 6.781539664642607e-05, "tps": 1543042, "wall": 1071.4} {"step": 25225, "train_loss": 3.1496455669403076, "lr": 6.78051666980377e-05, "tps": 1536321, "wall": 1076.1} {"step": 25226, "train_loss": 3.0373966693878174, "lr": 6.779493847372065e-05, "tps": 1529679, "wall": 1080.8} {"step": 25227, "train_loss": 2.9363651275634766, "lr": 6.77847119735908e-05, "tps": 1523009, "wall": 1085.6} {"step": 25228, "train_loss": 3.0745224952697754, "lr": 6.77744871977639e-05, "tps": 1516493, "wall": 1090.3} {"step": 25229, "train_loss": 3.123560905456543, "lr": 6.776426414635588e-05, "tps": 1510024, "wall": 1095.0} {"step": 25230, "train_loss": 2.9817512035369873, "lr": 6.775404281948253e-05, "tps": 1503617, "wall": 1099.7} {"step": 25231, "train_loss": 3.0308356285095215, "lr": 6.774382321725956e-05, "tps": 1497061, "wall": 1104.6} {"step": 25232, "train_loss": 2.9944636821746826, "lr": 6.773360533980286e-05, "tps": 1490760, "wall": 1109.3} {"step": 25233, "train_loss": 3.0435292720794678, "lr": 6.772338918722809e-05, "tps": 1484300, "wall": 1114.2} {"step": 25234, "train_loss": 3.13053560256958, "lr": 6.7713174759651e-05, "tps": 1477704, "wall": 1119.2} {"step": 25235, "train_loss": 3.0192103385925293, "lr": 6.770296205718732e-05, "tps": 1471108, "wall": 1124.2} {"step": 25236, "train_loss": 3.024169683456421, "lr": 6.769275107995272e-05, "tps": 1464613, "wall": 1129.3} {"step": 25237, "train_loss": 3.094381093978882, "lr": 6.768254182806287e-05, "tps": 1458220, "wall": 1134.3} {"step": 25238, "train_loss": 3.110180377960205, "lr": 6.767233430163344e-05, "tps": 1451869, "wall": 1139.3} {"step": 25239, "train_loss": 3.0051870346069336, "lr": 6.766212850078002e-05, "tps": 1445507, "wall": 1144.3} {"step": 25240, "train_loss": 3.09193754196167, "lr": 6.765192442561825e-05, "tps": 1439261, "wall": 1149.3} {"step": 25241, "train_loss": 3.0116591453552246, "lr": 6.764172207626376e-05, "tps": 1433129, "wall": 1154.3} {"step": 25242, "train_loss": 3.0373482704162598, "lr": 6.763152145283202e-05, "tps": 1427034, "wall": 1159.3} {"step": 25243, "train_loss": 3.0600600242614746, "lr": 6.762132255543872e-05, "tps": 1420986, "wall": 1164.3} {"step": 25244, "train_loss": 3.042457103729248, "lr": 6.76111253841993e-05, "tps": 1414958, "wall": 1169.3} {"step": 25245, "train_loss": 3.0939443111419678, "lr": 6.760092993922926e-05, "tps": 1408977, "wall": 1174.3} {"step": 25246, "train_loss": 3.06276273727417, "lr": 6.759073622064416e-05, "tps": 1403060, "wall": 1179.3} {"step": 25247, "train_loss": 3.0891480445861816, "lr": 6.758054422855948e-05, "tps": 1397184, "wall": 1184.3} {"step": 25248, "train_loss": 2.997675657272339, "lr": 6.757035396309057e-05, "tps": 1391364, "wall": 1189.3} {"step": 25249, "train_loss": 3.1093807220458984, "lr": 6.756016542435298e-05, "tps": 1385629, "wall": 1194.2} {"step": 25250, "train_loss": 3.0859317779541016, "lr": 6.754997861246209e-05, "tps": 1379947, "wall": 1199.2} {"step": 25251, "train_loss": 2.9952895641326904, "lr": 6.753979352753325e-05, "tps": 1374212, "wall": 1204.3} {"step": 25252, "train_loss": 2.9740195274353027, "lr": 6.752961016968191e-05, "tps": 1368646, "wall": 1209.2} {"step": 25253, "train_loss": 3.0550427436828613, "lr": 6.75194285390234e-05, "tps": 1363105, "wall": 1214.2} {"step": 25254, "train_loss": 3.1070003509521484, "lr": 6.750924863567301e-05, "tps": 1357581, "wall": 1219.2} {"step": 25255, "train_loss": 3.095235586166382, "lr": 6.749907045974614e-05, "tps": 1352117, "wall": 1224.1} {"step": 25256, "train_loss": 3.1256864070892334, "lr": 6.748889401135806e-05, "tps": 1346689, "wall": 1229.1} {"step": 25257, "train_loss": 3.004830837249756, "lr": 6.747871929062399e-05, "tps": 1341333, "wall": 1234.1} {"step": 25258, "train_loss": 3.058131694793701, "lr": 6.746854629765929e-05, "tps": 1336007, "wall": 1239.0} {"step": 25259, "train_loss": 3.099970817565918, "lr": 6.745837503257908e-05, "tps": 1330718, "wall": 1244.0} {"step": 25260, "train_loss": 2.9173364639282227, "lr": 6.744820549549873e-05, "tps": 1325481, "wall": 1249.0} {"step": 25261, "train_loss": 3.014860153198242, "lr": 6.743803768653334e-05, "tps": 1320261, "wall": 1254.0} {"step": 25262, "train_loss": 3.0817041397094727, "lr": 6.742787160579806e-05, "tps": 1315054, "wall": 1259.0} {"step": 25263, "train_loss": 3.161289930343628, "lr": 6.741770725340816e-05, "tps": 1309900, "wall": 1264.0} {"step": 25264, "train_loss": 3.0893592834472656, "lr": 6.740754462947874e-05, "tps": 1304835, "wall": 1268.9} {"step": 25265, "train_loss": 2.9171242713928223, "lr": 6.739738373412486e-05, "tps": 1299754, "wall": 1274.0} {"step": 25266, "train_loss": 2.9606080055236816, "lr": 6.73872245674617e-05, "tps": 1294791, "wall": 1278.9} {"step": 25267, "train_loss": 3.0258238315582275, "lr": 6.737706712960433e-05, "tps": 1289875, "wall": 1283.8} {"step": 25268, "train_loss": 3.095177173614502, "lr": 6.736691142066776e-05, "tps": 1284971, "wall": 1288.8} {"step": 25269, "train_loss": 3.015322685241699, "lr": 6.735675744076709e-05, "tps": 1280123, "wall": 1293.7} {"step": 25270, "train_loss": 3.070362091064453, "lr": 6.734660519001736e-05, "tps": 1275331, "wall": 1298.6} {"step": 25271, "train_loss": 3.05094575881958, "lr": 6.733645466853348e-05, "tps": 1270538, "wall": 1303.6} {"step": 25272, "train_loss": 3.083281993865967, "lr": 6.732630587643055e-05, "tps": 1265836, "wall": 1308.5} {"step": 25273, "train_loss": 3.0149827003479004, "lr": 6.731615881382349e-05, "tps": 1261131, "wall": 1313.4} {"step": 25274, "train_loss": 3.1741673946380615, "lr": 6.730601348082721e-05, "tps": 1256471, "wall": 1318.3} {"step": 25275, "train_loss": 3.025869131088257, "lr": 6.729586987755672e-05, "tps": 1251785, "wall": 1323.3} {"step": 25276, "train_loss": 3.042752981185913, "lr": 6.728572800412685e-05, "tps": 1247181, "wall": 1328.2} {"step": 25277, "train_loss": 3.0661568641662598, "lr": 6.727558786065247e-05, "tps": 1242597, "wall": 1333.2} {"step": 25278, "train_loss": 3.067805767059326, "lr": 6.726544944724856e-05, "tps": 1238046, "wall": 1338.1} {"step": 25279, "train_loss": 3.092390298843384, "lr": 6.725531276402984e-05, "tps": 1233568, "wall": 1343.1} {"step": 25280, "train_loss": 3.1282010078430176, "lr": 6.724517781111126e-05, "tps": 1229120, "wall": 1348.0} {"step": 25281, "train_loss": 3.0186259746551514, "lr": 6.723504458860756e-05, "tps": 1224700, "wall": 1352.9} {"step": 25282, "train_loss": 3.0643515586853027, "lr": 6.722491309663348e-05, "tps": 1220312, "wall": 1357.8} {"step": 25283, "train_loss": 3.0006041526794434, "lr": 6.721478333530391e-05, "tps": 1215947, "wall": 1362.7} {"step": 25284, "train_loss": 3.0851330757141113, "lr": 6.720465530473355e-05, "tps": 1211594, "wall": 1367.7} {"step": 25285, "train_loss": 3.051881790161133, "lr": 6.719452900503706e-05, "tps": 1207307, "wall": 1372.6} {"step": 25286, "train_loss": 3.110478639602661, "lr": 6.718440443632926e-05, "tps": 1203033, "wall": 1377.5} {"step": 25287, "train_loss": 3.0490148067474365, "lr": 6.717428159872478e-05, "tps": 1198803, "wall": 1382.4} {"step": 25288, "train_loss": 3.056558609008789, "lr": 6.716416049233831e-05, "tps": 1194526, "wall": 1387.4} {"step": 25289, "train_loss": 2.979440689086914, "lr": 6.715404111728449e-05, "tps": 1190304, "wall": 1392.4} {"step": 25290, "train_loss": 3.0837643146514893, "lr": 6.7143923473678e-05, "tps": 1186148, "wall": 1397.4} {"step": 25291, "train_loss": 3.155879020690918, "lr": 6.713380756163334e-05, "tps": 1182019, "wall": 1402.3} {"step": 25292, "train_loss": 3.028991222381592, "lr": 6.712369338126523e-05, "tps": 1177913, "wall": 1407.2} {"step": 25293, "train_loss": 3.075472116470337, "lr": 6.71135809326882e-05, "tps": 1173864, "wall": 1412.1} {"step": 25294, "train_loss": 3.0485615730285645, "lr": 6.710347021601676e-05, "tps": 1169820, "wall": 1417.1} {"step": 25295, "train_loss": 3.0508437156677246, "lr": 6.709336123136549e-05, "tps": 1165832, "wall": 1422.0} {"step": 25296, "train_loss": 3.0581469535827637, "lr": 6.708325397884889e-05, "tps": 1161841, "wall": 1426.9} {"step": 25297, "train_loss": 3.0874226093292236, "lr": 6.707314845858149e-05, "tps": 1157879, "wall": 1431.9} {"step": 25298, "train_loss": 3.1392788887023926, "lr": 6.706304467067774e-05, "tps": 1153960, "wall": 1436.8} {"step": 25299, "train_loss": 3.130012035369873, "lr": 6.705294261525204e-05, "tps": 1150023, "wall": 1441.8} {"step": 25300, "train_loss": 2.9675371646881104, "lr": 6.704284229241892e-05, "tps": 1146098, "wall": 1446.8} {"step": 25301, "train_loss": 3.1261329650878906, "lr": 6.703274370229277e-05, "tps": 1142230, "wall": 1451.7} {"step": 25302, "train_loss": 3.048204183578491, "lr": 6.702264684498794e-05, "tps": 1138434, "wall": 1456.6} {"step": 25303, "train_loss": 3.0496349334716797, "lr": 6.701255172061889e-05, "tps": 1134635, "wall": 1461.5} {"step": 25304, "train_loss": 3.005364418029785, "lr": 6.70024583292999e-05, "tps": 1130817, "wall": 1466.5} {"step": 25305, "train_loss": 3.004897356033325, "lr": 6.69923666711453e-05, "tps": 1127048, "wall": 1471.5} {"step": 25306, "train_loss": 3.0179433822631836, "lr": 6.698227674626951e-05, "tps": 1123317, "wall": 1476.4} {"step": 25307, "train_loss": 3.0188088417053223, "lr": 6.697218855478677e-05, "tps": 1119597, "wall": 1481.4} {"step": 25308, "train_loss": 3.038416862487793, "lr": 6.696210209681131e-05, "tps": 1115914, "wall": 1486.4} {"step": 25309, "train_loss": 2.9967308044433594, "lr": 6.695201737245747e-05, "tps": 1112262, "wall": 1491.3} {"step": 25310, "train_loss": 2.9590976238250732, "lr": 6.694193438183945e-05, "tps": 1108690, "wall": 1496.2} {"step": 25311, "train_loss": 3.0615787506103516, "lr": 6.693185312507144e-05, "tps": 1105089, "wall": 1501.1} {"step": 25312, "train_loss": 3.0861687660217285, "lr": 6.692177360226774e-05, "tps": 1101503, "wall": 1506.0} {"step": 25313, "train_loss": 3.1221063137054443, "lr": 6.691169581354241e-05, "tps": 1097943, "wall": 1511.0} {"step": 25314, "train_loss": 3.13682222366333, "lr": 6.690161975900971e-05, "tps": 1094429, "wall": 1515.9} {"step": 25315, "train_loss": 3.081951856613159, "lr": 6.689154543878376e-05, "tps": 1090928, "wall": 1520.8} {"step": 25316, "train_loss": 2.9834465980529785, "lr": 6.688147285297863e-05, "tps": 1087467, "wall": 1525.7} {"step": 25317, "train_loss": 3.030946969985962, "lr": 6.687140200170847e-05, "tps": 1083985, "wall": 1530.7} {"step": 25318, "train_loss": 3.0068845748901367, "lr": 6.686133288508738e-05, "tps": 1080551, "wall": 1535.6} {"step": 25319, "train_loss": 3.038978099822998, "lr": 6.685126550322933e-05, "tps": 1077112, "wall": 1540.6} {"step": 25320, "train_loss": 2.9782023429870605, "lr": 6.68411998562485e-05, "tps": 1073731, "wall": 1545.5} {"step": 25321, "train_loss": 3.105894088745117, "lr": 6.68311359442588e-05, "tps": 1070397, "wall": 1550.4} {"step": 25322, "train_loss": 3.0566515922546387, "lr": 6.682107376737429e-05, "tps": 1067034, "wall": 1555.3} {"step": 25323, "train_loss": 3.007108449935913, "lr": 6.681101332570895e-05, "tps": 1063568, "wall": 1560.4} {"step": 25324, "train_loss": 2.959843635559082, "lr": 6.680095461937676e-05, "tps": 1060279, "wall": 1565.3} {"step": 25325, "train_loss": 3.0235252380371094, "lr": 6.679089764849159e-05, "tps": 1057059, "wall": 1570.2} {"step": 25326, "train_loss": 3.0891449451446533, "lr": 6.678084241316744e-05, "tps": 1053866, "wall": 1575.0} {"step": 25327, "train_loss": 3.173182964324951, "lr": 6.677078891351824e-05, "tps": 1050683, "wall": 1579.8} {"step": 25328, "train_loss": 3.0193889141082764, "lr": 6.676073714965777e-05, "tps": 1047534, "wall": 1584.6} {"step": 25329, "train_loss": 2.987285614013672, "lr": 6.67506871217e-05, "tps": 1044384, "wall": 1589.5} {"step": 25330, "train_loss": 3.0125906467437744, "lr": 6.674063882975873e-05, "tps": 1041234, "wall": 1594.4} {"step": 25331, "train_loss": 3.1357202529907227, "lr": 6.673059227394776e-05, "tps": 1038136, "wall": 1599.2} {"step": 25332, "train_loss": 3.002023220062256, "lr": 6.6720547454381e-05, "tps": 1034911, "wall": 1604.2} {"step": 25333, "train_loss": 3.028911828994751, "lr": 6.671050437117208e-05, "tps": 1031816, "wall": 1609.1} {"step": 25334, "train_loss": 2.9804177284240723, "lr": 6.670046302443494e-05, "tps": 1028771, "wall": 1613.9} {"step": 25335, "train_loss": 3.1370882987976074, "lr": 6.669042341428324e-05, "tps": 1025745, "wall": 1618.7} {"step": 25336, "train_loss": 3.045279026031494, "lr": 6.668038554083064e-05, "tps": 1022695, "wall": 1623.6} {"step": 25337, "train_loss": 3.0788230895996094, "lr": 6.667034940419102e-05, "tps": 1019587, "wall": 1628.7} {"step": 25338, "train_loss": 3.0831422805786133, "lr": 6.666031500447793e-05, "tps": 1016532, "wall": 1633.6} {"step": 25339, "train_loss": 2.998988151550293, "lr": 6.66502823418051e-05, "tps": 1013437, "wall": 1638.7} {"step": 25340, "train_loss": 3.007298231124878, "lr": 6.664025141628616e-05, "tps": 1010343, "wall": 1643.7} {"step": 25341, "train_loss": 3.028980255126953, "lr": 6.663022222803478e-05, "tps": 1007432, "wall": 1648.6} {"step": 25342, "train_loss": 3.2841415405273438, "lr": 6.662019477716449e-05, "tps": 1004574, "wall": 1653.3} {"step": 25343, "train_loss": 3.0480217933654785, "lr": 6.661016906378896e-05, "tps": 1001626, "wall": 1658.2} {"step": 25344, "train_loss": 3.0528852939605713, "lr": 6.660014508802175e-05, "tps": 998697, "wall": 1663.2} {"step": 25345, "train_loss": 3.0168986320495605, "lr": 6.659012284997634e-05, "tps": 995849, "wall": 1668.0} {"step": 25346, "train_loss": 3.042628049850464, "lr": 6.658010234976636e-05, "tps": 993031, "wall": 1672.8} {"step": 25347, "train_loss": 3.0941739082336426, "lr": 6.657008358750529e-05, "tps": 990274, "wall": 1677.5} {"step": 25348, "train_loss": 2.994499444961548, "lr": 6.656006656330658e-05, "tps": 987535, "wall": 1682.2} {"step": 25349, "train_loss": 3.0469865798950195, "lr": 6.655005127728375e-05, "tps": 984756, "wall": 1687.1} {"step": 25350, "train_loss": 2.982553482055664, "lr": 6.654003772955022e-05, "tps": 982018, "wall": 1691.8} {"step": 25351, "train_loss": 3.135127544403076, "lr": 6.653002592021949e-05, "tps": 979294, "wall": 1696.6} {"step": 25352, "train_loss": 3.02510666847229, "lr": 6.65200158494049e-05, "tps": 976567, "wall": 1701.4} {"step": 25353, "train_loss": 3.1119019985198975, "lr": 6.651000751721986e-05, "tps": 973797, "wall": 1706.3} {"step": 25354, "train_loss": 3.0666983127593994, "lr": 6.65000009237778e-05, "tps": 971127, "wall": 1711.1} {"step": 25355, "train_loss": 3.1210098266601562, "lr": 6.648999606919203e-05, "tps": 968477, "wall": 1715.8} {"step": 25356, "train_loss": 2.9847397804260254, "lr": 6.647999295357583e-05, "tps": 965843, "wall": 1720.6} {"step": 25357, "train_loss": 3.0424251556396484, "lr": 6.646999157704265e-05, "tps": 963175, "wall": 1725.4} {"step": 25358, "train_loss": 3.061969041824341, "lr": 6.645999193970568e-05, "tps": 960493, "wall": 1730.3} {"step": 25359, "train_loss": 3.031525135040283, "lr": 6.644999404167818e-05, "tps": 957831, "wall": 1735.2} {"step": 25360, "train_loss": 3.0347084999084473, "lr": 6.643999788307353e-05, "tps": 955187, "wall": 1740.0} {"step": 25361, "train_loss": 3.0234503746032715, "lr": 6.643000346400488e-05, "tps": 952494, "wall": 1745.0} {"step": 25362, "train_loss": 3.09999942779541, "lr": 6.642001078458541e-05, "tps": 949910, "wall": 1749.8} {"step": 25363, "train_loss": 2.9719605445861816, "lr": 6.64100198449284e-05, "tps": 947361, "wall": 1754.6} {"step": 25364, "train_loss": 3.0018973350524902, "lr": 6.640003064514701e-05, "tps": 944787, "wall": 1759.5} {"step": 25365, "train_loss": 3.0806808471679688, "lr": 6.639004318535435e-05, "tps": 942133, "wall": 1764.5} {"step": 25366, "train_loss": 3.006625175476074, "lr": 6.638005746566359e-05, "tps": 939487, "wall": 1769.5} {"step": 25367, "train_loss": 3.161809206008911, "lr": 6.637007348618785e-05, "tps": 936807, "wall": 1774.7} {"step": 25368, "train_loss": 2.878389358520508, "lr": 6.636009124704026e-05, "tps": 934257, "wall": 1779.6} {"step": 25369, "train_loss": 2.981102705001831, "lr": 6.635011074833386e-05, "tps": 931704, "wall": 1784.5} {"step": 25370, "train_loss": 2.9111011028289795, "lr": 6.634013199018169e-05, "tps": 929066, "wall": 1789.7} {"step": 25371, "train_loss": 3.0230727195739746, "lr": 6.633015497269684e-05, "tps": 926589, "wall": 1794.5} {"step": 25372, "train_loss": 2.91872501373291, "lr": 6.632017969599231e-05, "tps": 923992, "wall": 1799.6} {"step": 25373, "train_loss": 3.064972400665283, "lr": 6.631020616018111e-05, "tps": 921358, "wall": 1804.8} {"step": 25374, "train_loss": 2.944521427154541, "lr": 6.63002343653762e-05, "tps": 918798, "wall": 1809.9} {"step": 25375, "train_loss": 2.9630699157714844, "lr": 6.629026431169053e-05, "tps": 916278, "wall": 1815.0} {"step": 25376, "train_loss": 3.1057536602020264, "lr": 6.628029599923708e-05, "tps": 913777, "wall": 1820.0} {"step": 25377, "train_loss": 3.0788896083831787, "lr": 6.627032942812877e-05, "tps": 911279, "wall": 1825.1} {"step": 25378, "train_loss": 3.1268718242645264, "lr": 6.626036459847842e-05, "tps": 908838, "wall": 1830.1} {"step": 25379, "train_loss": 3.067092180252075, "lr": 6.625040151039904e-05, "tps": 906422, "wall": 1835.0} {"step": 25380, "train_loss": 3.142324924468994, "lr": 6.624044016400342e-05, "tps": 903971, "wall": 1840.1} {"step": 25381, "train_loss": 2.9511611461639404, "lr": 6.623048055940437e-05, "tps": 901518, "wall": 1845.1} {"step": 25382, "train_loss": 3.0474069118499756, "lr": 6.622052269671481e-05, "tps": 898985, "wall": 1850.4} {"step": 25383, "train_loss": 3.0851497650146484, "lr": 6.621056657604748e-05, "tps": 896456, "wall": 1855.7} {"step": 25384, "train_loss": 3.0811798572540283, "lr": 6.62006121975151e-05, "tps": 894131, "wall": 1860.6} {"step": 25385, "train_loss": 2.979156494140625, "lr": 6.619065956123058e-05, "tps": 891752, "wall": 1865.6} {"step": 25386, "train_loss": 3.051069736480713, "lr": 6.618070866730659e-05, "tps": 889430, "wall": 1870.6} {"step": 25387, "train_loss": 3.0304946899414062, "lr": 6.617075951585579e-05, "tps": 887066, "wall": 1875.7} {"step": 25388, "train_loss": 3.040377616882324, "lr": 6.6160812106991e-05, "tps": 884693, "wall": 1880.8} {"step": 25389, "train_loss": 2.9747426509857178, "lr": 6.615086644082488e-05, "tps": 882359, "wall": 1885.8} {"step": 25390, "train_loss": 3.1034741401672363, "lr": 6.614092251747001e-05, "tps": 880056, "wall": 1890.8} {"step": 25391, "train_loss": 3.124962091445923, "lr": 6.61309803370391e-05, "tps": 877772, "wall": 1895.8} {"step": 25392, "train_loss": 3.065551280975342, "lr": 6.612103989964477e-05, "tps": 875484, "wall": 1900.8} {"step": 25393, "train_loss": 2.985971212387085, "lr": 6.611110120539966e-05, "tps": 873196, "wall": 1905.9} {"step": 25394, "train_loss": 3.052602529525757, "lr": 6.61011642544163e-05, "tps": 870907, "wall": 1911.0} {"step": 25395, "train_loss": 3.0987188816070557, "lr": 6.609122904680727e-05, "tps": 868666, "wall": 1916.0} {"step": 25396, "train_loss": 3.017796277999878, "lr": 6.608129558268514e-05, "tps": 866420, "wall": 1921.0} {"step": 25397, "train_loss": 3.0743160247802734, "lr": 6.607136386216242e-05, "tps": 864179, "wall": 1926.1} {"step": 25398, "train_loss": 3.07462215423584, "lr": 6.606143388535157e-05, "tps": 861985, "wall": 1931.1} {"step": 25399, "train_loss": 3.0906906127929688, "lr": 6.605150565236519e-05, "tps": 859773, "wall": 1936.1} {"step": 25400, "train_loss": 2.9762330055236816, "lr": 6.604157916331567e-05, "tps": 857576, "wall": 1941.1} {"step": 25401, "train_loss": 3.0383405685424805, "lr": 6.603165441831544e-05, "tps": 855390, "wall": 1946.2} {"step": 25402, "train_loss": 3.052255630493164, "lr": 6.602173141747698e-05, "tps": 853222, "wall": 1951.2} {"step": 25403, "train_loss": 3.1039462089538574, "lr": 6.60118101609127e-05, "tps": 851045, "wall": 1956.3} {"step": 25404, "train_loss": 3.111814260482788, "lr": 6.600189064873488e-05, "tps": 848895, "wall": 1961.3} {"step": 25405, "train_loss": 3.021219491958618, "lr": 6.599197288105606e-05, "tps": 846760, "wall": 1966.3} {"step": 25406, "train_loss": 3.1207921504974365, "lr": 6.598205685798847e-05, "tps": 844633, "wall": 1971.4} {"step": 25407, "train_loss": 3.0102274417877197, "lr": 6.597214257964446e-05, "tps": 842517, "wall": 1976.4} {"step": 25408, "train_loss": 3.0761563777923584, "lr": 6.596223004613639e-05, "tps": 840416, "wall": 1981.4} {"step": 25409, "train_loss": 3.0880603790283203, "lr": 6.595231925757645e-05, "tps": 838283, "wall": 1986.5} {"step": 25410, "train_loss": 3.038443088531494, "lr": 6.594241021407702e-05, "tps": 836207, "wall": 1991.5} {"step": 25411, "train_loss": 3.018204927444458, "lr": 6.593250291575031e-05, "tps": 834138, "wall": 1996.6} {"step": 25412, "train_loss": 2.9613921642303467, "lr": 6.592259736270849e-05, "tps": 832079, "wall": 2001.6} {"step": 25413, "train_loss": 3.0289671421051025, "lr": 6.591269355506387e-05, "tps": 830040, "wall": 2006.6} {"step": 25414, "train_loss": 3.0362110137939453, "lr": 6.590279149292859e-05, "tps": 827992, "wall": 2011.6} {"step": 25415, "train_loss": 3.15203595161438, "lr": 6.58928911764148e-05, "tps": 825977, "wall": 2016.6} {"step": 25416, "train_loss": 3.0949249267578125, "lr": 6.588299260563468e-05, "tps": 823974, "wall": 2021.6} {"step": 25417, "train_loss": 2.9695863723754883, "lr": 6.58730957807004e-05, "tps": 821964, "wall": 2026.6} {"step": 25418, "train_loss": 2.958104133605957, "lr": 6.586320070172396e-05, "tps": 819972, "wall": 2031.6} {"step": 25419, "train_loss": 3.076676845550537, "lr": 6.585330736881757e-05, "tps": 817952, "wall": 2036.7} {"step": 25420, "train_loss": 3.0132453441619873, "lr": 6.584341578209326e-05, "tps": 815993, "wall": 2041.7} {"step": 25421, "train_loss": 3.026785135269165, "lr": 6.583352594166301e-05, "tps": 814013, "wall": 2046.7} {"step": 25422, "train_loss": 3.056203842163086, "lr": 6.5823637847639e-05, "tps": 812074, "wall": 2051.7} {"step": 25423, "train_loss": 3.0307366847991943, "lr": 6.581375150013313e-05, "tps": 810119, "wall": 2056.7} {"step": 25424, "train_loss": 3.09212589263916, "lr": 6.58038668992574e-05, "tps": 808190, "wall": 2061.7} {"step": 25425, "train_loss": 2.9319229125976562, "lr": 6.579398404512384e-05, "tps": 806231, "wall": 2066.8} {"step": 25426, "train_loss": 3.0399186611175537, "lr": 6.578410293784436e-05, "tps": 804302, "wall": 2071.8} {"step": 25427, "train_loss": 3.1330819129943848, "lr": 6.577422357753088e-05, "tps": 802329, "wall": 2077.0} {"step": 25428, "train_loss": 3.0843889713287354, "lr": 6.576434596429537e-05, "tps": 800391, "wall": 2082.1} {"step": 25429, "train_loss": 3.087202787399292, "lr": 6.575447009824967e-05, "tps": 798476, "wall": 2087.2} {"step": 25430, "train_loss": 3.0747756958007812, "lr": 6.574459597950571e-05, "tps": 796603, "wall": 2092.2} {"step": 25431, "train_loss": 3.0362181663513184, "lr": 6.57347236081753e-05, "tps": 794697, "wall": 2097.3} {"step": 25432, "train_loss": 3.0233542919158936, "lr": 6.572485298437025e-05, "tps": 792823, "wall": 2102.3} {"step": 25433, "train_loss": 3.0784668922424316, "lr": 6.571498410820247e-05, "tps": 790911, "wall": 2107.5} {"step": 25434, "train_loss": 3.1355578899383545, "lr": 6.570511697978367e-05, "tps": 789113, "wall": 2112.4} {"step": 25435, "train_loss": 3.133777618408203, "lr": 6.569525159922563e-05, "tps": 787285, "wall": 2117.4} {"step": 25436, "train_loss": 3.0764927864074707, "lr": 6.568538796664017e-05, "tps": 785477, "wall": 2122.3} {"step": 25437, "train_loss": 3.1062941551208496, "lr": 6.567552608213896e-05, "tps": 783659, "wall": 2127.3} {"step": 25438, "train_loss": 3.095001220703125, "lr": 6.566566594583372e-05, "tps": 781786, "wall": 2132.5} {"step": 25439, "train_loss": 3.0385868549346924, "lr": 6.56558075578362e-05, "tps": 779957, "wall": 2137.6} {"step": 25440, "train_loss": 2.984762668609619, "lr": 6.564595091825805e-05, "tps": 778148, "wall": 2142.7} {"step": 25441, "train_loss": 3.070676326751709, "lr": 6.563609602721086e-05, "tps": 776318, "wall": 2147.8} {"step": 25442, "train_loss": 2.9549307823181152, "lr": 6.562624288480637e-05, "tps": 774502, "wall": 2152.9} {"step": 25443, "train_loss": 3.0541017055511475, "lr": 6.561639149115617e-05, "tps": 772722, "wall": 2158.0} {"step": 25444, "train_loss": 3.058432102203369, "lr": 6.560654184637179e-05, "tps": 770973, "wall": 2162.9} {"step": 25445, "train_loss": 3.0049850940704346, "lr": 6.559669395056487e-05, "tps": 769216, "wall": 2168.0} {"step": 25446, "train_loss": 3.042970657348633, "lr": 6.558684780384693e-05, "tps": 767457, "wall": 2173.0} {"step": 25447, "train_loss": 3.0714175701141357, "lr": 6.557700340632959e-05, "tps": 765733, "wall": 2178.0} {"step": 25448, "train_loss": 3.116114377975464, "lr": 6.55671607581243e-05, "tps": 764017, "wall": 2183.0} {"step": 25449, "train_loss": 3.0923595428466797, "lr": 6.555731985934255e-05, "tps": 762298, "wall": 2188.0} {"step": 25450, "train_loss": 3.0302529335021973, "lr": 6.554748071009584e-05, "tps": 760576, "wall": 2193.0} {"step": 25451, "train_loss": 3.153210163116455, "lr": 6.553764331049563e-05, "tps": 758870, "wall": 2198.0} {"step": 25452, "train_loss": 3.1001601219177246, "lr": 6.552780766065333e-05, "tps": 757164, "wall": 2203.1} {"step": 25453, "train_loss": 3.0736570358276367, "lr": 6.55179737606804e-05, "tps": 755474, "wall": 2208.1} {"step": 25454, "train_loss": 3.0672807693481445, "lr": 6.550814161068822e-05, "tps": 753782, "wall": 2213.1} {"step": 25455, "train_loss": 3.1816940307617188, "lr": 6.549831121078815e-05, "tps": 752118, "wall": 2218.1} {"step": 25456, "train_loss": 3.0858192443847656, "lr": 6.54884825610916e-05, "tps": 750498, "wall": 2223.0} {"step": 25457, "train_loss": 3.0757455825805664, "lr": 6.547865566170987e-05, "tps": 748858, "wall": 2227.9} {"step": 25458, "train_loss": 2.9884934425354004, "lr": 6.546883051275428e-05, "tps": 747241, "wall": 2232.9} {"step": 25459, "train_loss": 2.9847662448883057, "lr": 6.545900711433615e-05, "tps": 745577, "wall": 2237.9} {"step": 25460, "train_loss": 2.993365526199341, "lr": 6.544918546656675e-05, "tps": 743911, "wall": 2243.0} {"step": 25461, "train_loss": 2.9877302646636963, "lr": 6.54393655695573e-05, "tps": 742279, "wall": 2248.0} {"step": 25462, "train_loss": 2.9871134757995605, "lr": 6.542954742341912e-05, "tps": 740621, "wall": 2253.2} {"step": 25463, "train_loss": 3.0016510486602783, "lr": 6.541973102826336e-05, "tps": 739014, "wall": 2258.2} {"step": 25464, "train_loss": 2.9398856163024902, "lr": 6.540991638420127e-05, "tps": 737313, "wall": 2263.5} {"step": 25465, "train_loss": 3.0431928634643555, "lr": 6.540010349134403e-05, "tps": 735654, "wall": 2268.6} {"step": 25466, "train_loss": 3.0594472885131836, "lr": 6.53902923498027e-05, "tps": 734033, "wall": 2273.7} {"step": 25467, "train_loss": 3.011247158050537, "lr": 6.538048295968857e-05, "tps": 732252, "wall": 2279.4} {"step": 25468, "train_loss": 3.0773849487304688, "lr": 6.537067532111269e-05, "tps": 730627, "wall": 2284.5} {"step": 25469, "train_loss": 3.0346879959106445, "lr": 6.536086943418614e-05, "tps": 729023, "wall": 2289.6} {"step": 25470, "train_loss": 3.0322394371032715, "lr": 6.535106529902006e-05, "tps": 727446, "wall": 2294.7} {"step": 25471, "train_loss": 3.007051944732666, "lr": 6.534126291572548e-05, "tps": 725859, "wall": 2299.8} {"step": 25472, "train_loss": 3.0899546146392822, "lr": 6.53314622844134e-05, "tps": 724245, "wall": 2305.0} {"step": 25473, "train_loss": 3.040469169616699, "lr": 6.532166340519492e-05, "tps": 722685, "wall": 2310.1} {"step": 25474, "train_loss": 3.0518245697021484, "lr": 6.5311866278181e-05, "tps": 721137, "wall": 2315.1} {"step": 25475, "train_loss": 3.0367531776428223, "lr": 6.530207090348258e-05, "tps": 719605, "wall": 2320.2} {"step": 25476, "train_loss": 3.098878860473633, "lr": 6.529227728121073e-05, "tps": 718084, "wall": 2325.2} {"step": 25477, "train_loss": 3.089409828186035, "lr": 6.528248541147633e-05, "tps": 716543, "wall": 2330.3} {"step": 25478, "train_loss": 3.0015788078308105, "lr": 6.527269529439027e-05, "tps": 714996, "wall": 2335.4} {"step": 25479, "train_loss": 3.104511260986328, "lr": 6.52629069300635e-05, "tps": 713445, "wall": 2340.6} {"step": 25480, "train_loss": 3.0467512607574463, "lr": 6.52531203186069e-05, "tps": 711905, "wall": 2345.7} {"step": 25481, "train_loss": 3.021075963973999, "lr": 6.524333546013131e-05, "tps": 710387, "wall": 2350.8} {"step": 25482, "train_loss": 2.9754810333251953, "lr": 6.523355235474761e-05, "tps": 708888, "wall": 2355.9} {"step": 25483, "train_loss": 3.1594791412353516, "lr": 6.522377100256656e-05, "tps": 707370, "wall": 2361.0} {"step": 25484, "train_loss": 3.0390119552612305, "lr": 6.521399140369904e-05, "tps": 705865, "wall": 2366.2} {"step": 25485, "train_loss": 2.932793140411377, "lr": 6.520421355825582e-05, "tps": 704372, "wall": 2371.3} {"step": 25486, "train_loss": 3.0288262367248535, "lr": 6.51944374663476e-05, "tps": 702881, "wall": 2376.4} {"step": 25487, "train_loss": 3.075786590576172, "lr": 6.518466312808519e-05, "tps": 701412, "wall": 2381.5} {"step": 25488, "train_loss": 3.0831961631774902, "lr": 6.51748905435793e-05, "tps": 699927, "wall": 2386.6} {"step": 25489, "train_loss": 3.1258480548858643, "lr": 6.516511971294059e-05, "tps": 698456, "wall": 2391.7} {"step": 25490, "train_loss": 3.0445034503936768, "lr": 6.51553506362798e-05, "tps": 697022, "wall": 2396.7} {"step": 25491, "train_loss": 3.104623317718506, "lr": 6.51455833137076e-05, "tps": 695616, "wall": 2401.7} {"step": 25492, "train_loss": 3.031643867492676, "lr": 6.513581774533457e-05, "tps": 694179, "wall": 2406.7} {"step": 25493, "train_loss": 3.032874584197998, "lr": 6.51260539312714e-05, "tps": 692791, "wall": 2411.7} {"step": 25494, "train_loss": 3.089038372039795, "lr": 6.511629187162866e-05, "tps": 691410, "wall": 2416.6} {"step": 25495, "train_loss": 3.0341429710388184, "lr": 6.510653156651694e-05, "tps": 690039, "wall": 2421.5} {"step": 25496, "train_loss": 3.071148633956909, "lr": 6.509677301604682e-05, "tps": 688665, "wall": 2426.4} {"step": 25497, "train_loss": 3.0483975410461426, "lr": 6.508701622032884e-05, "tps": 687293, "wall": 2431.3} {"step": 25498, "train_loss": 2.9859869480133057, "lr": 6.507726117947349e-05, "tps": 685927, "wall": 2436.3} {"step": 25499, "train_loss": 3.0403952598571777, "lr": 6.506750789359134e-05, "tps": 684594, "wall": 2441.1} {"step": 25500, "train_loss": 3.0517373085021973, "lr": 6.505775636279282e-05, "tps": 683257, "wall": 2446.0} {"step": 25501, "train_loss": 3.119117021560669, "lr": 6.504800658718843e-05, "tps": 681879, "wall": 2451.0} {"step": 25502, "train_loss": 3.0263423919677734, "lr": 6.503825856688861e-05, "tps": 680554, "wall": 2455.9} {"step": 25503, "train_loss": 2.939267635345459, "lr": 6.502851230200376e-05, "tps": 679216, "wall": 2460.8} {"step": 25504, "train_loss": 3.041999578475952, "lr": 6.501876779264432e-05, "tps": 677838, "wall": 2465.9} {"step": 25505, "train_loss": 3.0887231826782227, "lr": 6.500902503892069e-05, "tps": 676490, "wall": 2470.9} {"step": 25506, "train_loss": 2.980517625808716, "lr": 6.499928404094316e-05, "tps": 675154, "wall": 2475.9} {"step": 25507, "train_loss": 2.9602437019348145, "lr": 6.498954479882214e-05, "tps": 673838, "wall": 2480.9} {"step": 25508, "train_loss": 2.8600640296936035, "lr": 6.497980731266797e-05, "tps": 672474, "wall": 2486.0} {"step": 25509, "train_loss": 3.0840415954589844, "lr": 6.49700715825909e-05, "tps": 671177, "wall": 2490.9} {"step": 25510, "train_loss": 3.079362630844116, "lr": 6.496033760870125e-05, "tps": 669888, "wall": 2495.8} {"step": 25511, "train_loss": 2.9502742290496826, "lr": 6.49506053911093e-05, "tps": 668624, "wall": 2500.6} {"step": 25512, "train_loss": 3.0062029361724854, "lr": 6.494087492992526e-05, "tps": 667355, "wall": 2505.4} {"step": 25513, "train_loss": 3.1796905994415283, "lr": 6.493114622525939e-05, "tps": 666092, "wall": 2510.3} {"step": 25514, "train_loss": 3.0277678966522217, "lr": 6.49214192772219e-05, "tps": 664833, "wall": 2515.1} {"step": 25515, "train_loss": 3.062798500061035, "lr": 6.491169408592291e-05, "tps": 663537, "wall": 2520.2} {"step": 25516, "train_loss": 3.166796922683716, "lr": 6.490197065147269e-05, "tps": 662250, "wall": 2525.1} {"step": 25517, "train_loss": 3.0599496364593506, "lr": 6.489224897398128e-05, "tps": 660995, "wall": 2530.0} {"step": 25518, "train_loss": 3.0799801349639893, "lr": 6.488252905355893e-05, "tps": 659744, "wall": 2534.9} {"step": 25519, "train_loss": 3.0434868335723877, "lr": 6.487281089031567e-05, "tps": 658497, "wall": 2539.8} {"step": 25520, "train_loss": 3.0044667720794678, "lr": 6.486309448436156e-05, "tps": 657264, "wall": 2544.7} {"step": 25521, "train_loss": 3.0526528358459473, "lr": 6.485337983580674e-05, "tps": 655968, "wall": 2549.8} {"step": 25522, "train_loss": 3.015800952911377, "lr": 6.484366694476125e-05, "tps": 654690, "wall": 2554.9} {"step": 25523, "train_loss": 3.1023054122924805, "lr": 6.483395581133505e-05, "tps": 653473, "wall": 2559.8} {"step": 25524, "train_loss": 3.0578367710113525, "lr": 6.48242464356382e-05, "tps": 652252, "wall": 2564.7} {"step": 25525, "train_loss": 2.9701285362243652, "lr": 6.481453881778071e-05, "tps": 651039, "wall": 2569.5} {"step": 25526, "train_loss": 2.9622645378112793, "lr": 6.480483295787247e-05, "tps": 649830, "wall": 2574.4} {"step": 25527, "train_loss": 3.0643441677093506, "lr": 6.479512885602353e-05, "tps": 648624, "wall": 2579.3} {"step": 25528, "train_loss": 2.9480245113372803, "lr": 6.478542651234375e-05, "tps": 647388, "wall": 2584.3} {"step": 25529, "train_loss": 2.9529216289520264, "lr": 6.477572592694304e-05, "tps": 646184, "wall": 2589.2} {"step": 25530, "train_loss": 3.0833630561828613, "lr": 6.476602709993133e-05, "tps": 644969, "wall": 2594.2} {"step": 25531, "train_loss": 3.0006747245788574, "lr": 6.475633003141846e-05, "tps": 643769, "wall": 2599.2} {"step": 25532, "train_loss": 3.0496816635131836, "lr": 6.474663472151425e-05, "tps": 642551, "wall": 2604.2} {"step": 25533, "train_loss": 3.1117606163024902, "lr": 6.473694117032857e-05, "tps": 641344, "wall": 2609.2} {"step": 25534, "train_loss": 3.024279832839966, "lr": 6.472724937797125e-05, "tps": 640092, "wall": 2614.4} {"step": 25535, "train_loss": 3.0812554359436035, "lr": 6.471755934455201e-05, "tps": 638861, "wall": 2619.5} {"step": 25536, "train_loss": 3.0575902462005615, "lr": 6.470787107018068e-05, "tps": 637606, "wall": 2624.8} {"step": 25537, "train_loss": 3.0975241661071777, "lr": 6.469818455496697e-05, "tps": 636415, "wall": 2629.8} {"step": 25538, "train_loss": 2.973092555999756, "lr": 6.468849979902067e-05, "tps": 635245, "wall": 2634.8} {"step": 25539, "train_loss": 3.096587657928467, "lr": 6.467881680245142e-05, "tps": 634062, "wall": 2639.8} {"step": 25540, "train_loss": 3.113701343536377, "lr": 6.466913556536892e-05, "tps": 632854, "wall": 2644.9} {"step": 25541, "train_loss": 2.9552760124206543, "lr": 6.465945608788288e-05, "tps": 631653, "wall": 2650.1} {"step": 25542, "train_loss": 3.016108512878418, "lr": 6.464977837010293e-05, "tps": 630510, "wall": 2655.0} {"step": 25543, "train_loss": 3.082641124725342, "lr": 6.46401024121387e-05, "tps": 629356, "wall": 2659.9} {"step": 25544, "train_loss": 3.011676073074341, "lr": 6.463042821409977e-05, "tps": 628221, "wall": 2664.9} {"step": 25545, "train_loss": 3.0830955505371094, "lr": 6.462075577609573e-05, "tps": 627083, "wall": 2669.8} {"step": 25546, "train_loss": 3.13765811920166, "lr": 6.461108509823622e-05, "tps": 625923, "wall": 2674.8} {"step": 25547, "train_loss": 3.056809902191162, "lr": 6.460141618063076e-05, "tps": 624714, "wall": 2680.1} {"step": 25548, "train_loss": 3.0214555263519287, "lr": 6.459174902338881e-05, "tps": 623593, "wall": 2685.0} {"step": 25549, "train_loss": 2.9317057132720947, "lr": 6.458208362661996e-05, "tps": 622476, "wall": 2690.0} {"step": 25550, "train_loss": 2.9888880252838135, "lr": 6.457241999043371e-05, "tps": 621372, "wall": 2694.9} {"step": 25551, "train_loss": 3.0148870944976807, "lr": 6.456275811493942e-05, "tps": 620258, "wall": 2699.8} {"step": 25552, "train_loss": 3.080841302871704, "lr": 6.455309800024667e-05, "tps": 619135, "wall": 2704.8} {"step": 25553, "train_loss": 3.0325052738189697, "lr": 6.45434396464648e-05, "tps": 618037, "wall": 2709.7} {"step": 25554, "train_loss": 2.9810404777526855, "lr": 6.453378305370327e-05, "tps": 616920, "wall": 2714.7} {"step": 25555, "train_loss": 3.033313274383545, "lr": 6.452412822207148e-05, "tps": 615818, "wall": 2719.7} {"step": 25556, "train_loss": 3.0934157371520996, "lr": 6.451447515167876e-05, "tps": 614731, "wall": 2724.6} {"step": 25557, "train_loss": 2.9566519260406494, "lr": 6.450482384263446e-05, "tps": 613626, "wall": 2729.6} {"step": 25558, "train_loss": 2.8980791568756104, "lr": 6.449517429504794e-05, "tps": 612528, "wall": 2734.6} {"step": 25559, "train_loss": 3.0529491901397705, "lr": 6.448552650902852e-05, "tps": 611318, "wall": 2740.1} {"step": 25560, "train_loss": 2.94659161567688, "lr": 6.447588048468541e-05, "tps": 610222, "wall": 2745.2} {"step": 25561, "train_loss": 3.0617523193359375, "lr": 6.446623622212802e-05, "tps": 609153, "wall": 2750.1} {"step": 25562, "train_loss": 3.0248870849609375, "lr": 6.445659372146545e-05, "tps": 608103, "wall": 2755.0} {"step": 25563, "train_loss": 2.991497039794922, "lr": 6.444695298280703e-05, "tps": 607042, "wall": 2759.9} {"step": 25564, "train_loss": 3.070585012435913, "lr": 6.443731400626196e-05, "tps": 605964, "wall": 2764.9} {"step": 25565, "train_loss": 3.040480613708496, "lr": 6.442767679193937e-05, "tps": 604909, "wall": 2769.8} {"step": 25566, "train_loss": 2.9350247383117676, "lr": 6.44180413399485e-05, "tps": 603850, "wall": 2774.8} {"step": 25567, "train_loss": 2.9126129150390625, "lr": 6.44084076503985e-05, "tps": 602781, "wall": 2779.8} {"step": 25568, "train_loss": 3.150724172592163, "lr": 6.43987757233984e-05, "tps": 601691, "wall": 2785.0} {"step": 25569, "train_loss": 2.977398157119751, "lr": 6.438914555905747e-05, "tps": 600595, "wall": 2790.2} {"step": 25570, "train_loss": 3.115135908126831, "lr": 6.437951715748468e-05, "tps": 599543, "wall": 2795.2} {"step": 25571, "train_loss": 2.9310178756713867, "lr": 6.436989051878911e-05, "tps": 598474, "wall": 2800.3} {"step": 25572, "train_loss": 2.94903564453125, "lr": 6.43602656430799e-05, "tps": 597376, "wall": 2805.5} {"step": 25573, "train_loss": 2.918940782546997, "lr": 6.435064253046601e-05, "tps": 596352, "wall": 2810.4} {"step": 25574, "train_loss": 3.13360595703125, "lr": 6.43410211810564e-05, "tps": 595319, "wall": 2815.4} {"step": 25575, "train_loss": 3.0398409366607666, "lr": 6.433140159496019e-05, "tps": 594275, "wall": 2820.5} {"step": 25576, "train_loss": 3.0133285522460938, "lr": 6.432178377228629e-05, "tps": 593173, "wall": 2825.8} {"step": 25577, "train_loss": 3.098011016845703, "lr": 6.431216771314357e-05, "tps": 592110, "wall": 2831.0} {"step": 25578, "train_loss": 2.9509084224700928, "lr": 6.43025534176411e-05, "tps": 591040, "wall": 2836.3} {"step": 25579, "train_loss": 3.0402262210845947, "lr": 6.429294088588768e-05, "tps": 589977, "wall": 2841.5} {"step": 25580, "train_loss": 3.084625482559204, "lr": 6.42833301179923e-05, "tps": 588892, "wall": 2846.8} {"step": 25581, "train_loss": 3.059166669845581, "lr": 6.427372111406375e-05, "tps": 587856, "wall": 2852.0} {"step": 25582, "train_loss": 3.1700985431671143, "lr": 6.426411387421092e-05, "tps": 586819, "wall": 2857.1} {"step": 25583, "train_loss": 3.026401996612549, "lr": 6.425450839854264e-05, "tps": 585788, "wall": 2862.3} {"step": 25584, "train_loss": 3.129896402359009, "lr": 6.424490468716771e-05, "tps": 584739, "wall": 2867.5} {"step": 25585, "train_loss": 3.003969192504883, "lr": 6.423530274019492e-05, "tps": 583680, "wall": 2872.8} {"step": 25586, "train_loss": 3.007533550262451, "lr": 6.422570255773308e-05, "tps": 582662, "wall": 2877.9} {"step": 25587, "train_loss": 3.0926427841186523, "lr": 6.421610413989087e-05, "tps": 581649, "wall": 2883.1} {"step": 25588, "train_loss": 2.926145076751709, "lr": 6.420650748677706e-05, "tps": 580636, "wall": 2888.2} {"step": 25589, "train_loss": 3.012470245361328, "lr": 6.419691259850038e-05, "tps": 579632, "wall": 2893.3} {"step": 25590, "train_loss": 3.021024703979492, "lr": 6.41873194751695e-05, "tps": 578633, "wall": 2898.4} {"step": 25591, "train_loss": 2.9256436824798584, "lr": 6.417772811689306e-05, "tps": 577672, "wall": 2903.4} {"step": 25592, "train_loss": 3.0418224334716797, "lr": 6.416813852377978e-05, "tps": 576692, "wall": 2908.4} {"step": 25593, "train_loss": 2.930586576461792, "lr": 6.415855069593829e-05, "tps": 575732, "wall": 2913.4} {"step": 25594, "train_loss": 3.1340460777282715, "lr": 6.414896463347711e-05, "tps": 574758, "wall": 2918.4} {"step": 25595, "train_loss": 3.0568337440490723, "lr": 6.413938033650493e-05, "tps": 573769, "wall": 2923.6} {"step": 25596, "train_loss": 3.0084540843963623, "lr": 6.412979780513022e-05, "tps": 572810, "wall": 2928.6} {"step": 25597, "train_loss": 2.9565060138702393, "lr": 6.412021703946166e-05, "tps": 571856, "wall": 2933.6} {"step": 25598, "train_loss": 3.073367118835449, "lr": 6.411063803960769e-05, "tps": 570903, "wall": 2938.6} {"step": 25599, "train_loss": 3.107318639755249, "lr": 6.410106080567682e-05, "tps": 569934, "wall": 2943.7} {"step": 25600, "train_loss": 2.9146950244903564, "lr": 6.409148533777762e-05, "tps": 568978, "wall": 2948.8} {"step": 25601, "train_loss": 3.139073371887207, "lr": 6.408191163601849e-05, "tps": 568036, "wall": 2953.8} {"step": 25602, "train_loss": 3.0725245475769043, "lr": 6.407233970050785e-05, "tps": 567094, "wall": 2958.8} {"step": 25603, "train_loss": 3.102590799331665, "lr": 6.406276953135425e-05, "tps": 566160, "wall": 2963.8} {"step": 25604, "train_loss": 2.931903839111328, "lr": 6.405320112866603e-05, "tps": 565231, "wall": 2968.8} {"step": 25605, "train_loss": 3.019021511077881, "lr": 6.404363449255151e-05, "tps": 564265, "wall": 2974.0} {"step": 25606, "train_loss": 3.040036678314209, "lr": 6.403406962311922e-05, "tps": 563299, "wall": 2979.2} {"step": 25607, "train_loss": 3.0270936489105225, "lr": 6.40245065204774e-05, "tps": 562329, "wall": 2984.5} {"step": 25608, "train_loss": 2.9947142601013184, "lr": 6.401494518473438e-05, "tps": 561365, "wall": 2989.7} {"step": 25609, "train_loss": 3.1339306831359863, "lr": 6.400538561599853e-05, "tps": 560448, "wall": 2994.7} {"step": 25610, "train_loss": 2.888350248336792, "lr": 6.399582781437812e-05, "tps": 559529, "wall": 2999.7} {"step": 25611, "train_loss": 2.972855567932129, "lr": 6.398627177998137e-05, "tps": 558600, "wall": 3004.8} {"step": 25612, "train_loss": 3.0224006175994873, "lr": 6.39767175129166e-05, "tps": 557694, "wall": 3009.8} {"step": 25613, "train_loss": 3.0592703819274902, "lr": 6.396716501329203e-05, "tps": 556784, "wall": 3014.9} {"step": 25614, "train_loss": 3.0864272117614746, "lr": 6.395761428121582e-05, "tps": 555887, "wall": 3019.9} {"step": 25615, "train_loss": 3.0011847019195557, "lr": 6.394806531679621e-05, "tps": 554953, "wall": 3025.1} {"step": 25616, "train_loss": 3.1165027618408203, "lr": 6.393851812014134e-05, "tps": 554031, "wall": 3030.2} {"step": 25617, "train_loss": 3.07059383392334, "lr": 6.392897269135943e-05, "tps": 553142, "wall": 3035.2} {"step": 25618, "train_loss": 3.0298614501953125, "lr": 6.391942903055855e-05, "tps": 552255, "wall": 3040.2} {"step": 25619, "train_loss": 3.0615830421447754, "lr": 6.390988713784677e-05, "tps": 551365, "wall": 3045.2} {"step": 25620, "train_loss": 3.0557751655578613, "lr": 6.390034701333228e-05, "tps": 550484, "wall": 3050.2} {"step": 25621, "train_loss": 3.094024181365967, "lr": 6.38908086571231e-05, "tps": 549604, "wall": 3055.2} {"step": 25622, "train_loss": 3.057009220123291, "lr": 6.388127206932727e-05, "tps": 548725, "wall": 3060.2} {"step": 25623, "train_loss": 3.007437229156494, "lr": 6.387173725005285e-05, "tps": 547843, "wall": 3065.3} {"step": 25624, "train_loss": 2.9973838329315186, "lr": 6.386220419940784e-05, "tps": 546974, "wall": 3070.3} {"step": 25625, "train_loss": 3.006972551345825, "lr": 6.385267291750019e-05, "tps": 546107, "wall": 3075.3} {"step": 25626, "train_loss": 3.074693202972412, "lr": 6.384314340443796e-05, "tps": 545236, "wall": 3080.3} {"step": 25627, "train_loss": 2.9426095485687256, "lr": 6.383361566032903e-05, "tps": 544345, "wall": 3085.5} {"step": 25628, "train_loss": 3.115682601928711, "lr": 6.382408968528133e-05, "tps": 543485, "wall": 3090.5} {"step": 25629, "train_loss": 3.0197300910949707, "lr": 6.381456547940281e-05, "tps": 542621, "wall": 3095.5} {"step": 25630, "train_loss": 3.0644545555114746, "lr": 6.380504304280135e-05, "tps": 541769, "wall": 3100.5} {"step": 25631, "train_loss": 3.08840274810791, "lr": 6.379552237558477e-05, "tps": 540898, "wall": 3105.6} {"step": 25632, "train_loss": 3.0396857261657715, "lr": 6.378600347786101e-05, "tps": 540039, "wall": 3110.7} {"step": 25633, "train_loss": 2.993128538131714, "lr": 6.377648634973782e-05, "tps": 539194, "wall": 3115.7} {"step": 25634, "train_loss": 3.012892723083496, "lr": 6.376697099132307e-05, "tps": 538339, "wall": 3120.7} {"step": 25635, "train_loss": 3.031686544418335, "lr": 6.375745740272452e-05, "tps": 537480, "wall": 3125.8} {"step": 25636, "train_loss": 3.115063428878784, "lr": 6.374794558404993e-05, "tps": 536639, "wall": 3130.9} {"step": 25637, "train_loss": 3.0493452548980713, "lr": 6.373843553540709e-05, "tps": 535770, "wall": 3136.1} {"step": 25638, "train_loss": 3.072878837585449, "lr": 6.372892725690369e-05, "tps": 534891, "wall": 3141.3} {"step": 25639, "train_loss": 2.993680477142334, "lr": 6.371942074864743e-05, "tps": 534051, "wall": 3146.4} {"step": 25640, "train_loss": 3.1787960529327393, "lr": 6.370991601074608e-05, "tps": 533223, "wall": 3151.4} {"step": 25641, "train_loss": 2.967278480529785, "lr": 6.370041304330726e-05, "tps": 532397, "wall": 3156.4} {"step": 25642, "train_loss": 2.913102626800537, "lr": 6.369091184643853e-05, "tps": 531576, "wall": 3161.4} {"step": 25643, "train_loss": 3.0552732944488525, "lr": 6.36814124202477e-05, "tps": 530760, "wall": 3166.4} {"step": 25644, "train_loss": 3.075779676437378, "lr": 6.367191476484228e-05, "tps": 529948, "wall": 3171.4} {"step": 25645, "train_loss": 3.0073368549346924, "lr": 6.366241888032981e-05, "tps": 529141, "wall": 3176.3} {"step": 25646, "train_loss": 3.017728328704834, "lr": 6.365292476681794e-05, "tps": 528335, "wall": 3181.3} {"step": 25647, "train_loss": 2.9957098960876465, "lr": 6.364343242441422e-05, "tps": 527504, "wall": 3186.5} {"step": 25648, "train_loss": 3.1187705993652344, "lr": 6.363394185322613e-05, "tps": 526660, "wall": 3191.7} {"step": 25649, "train_loss": 3.0549662113189697, "lr": 6.362445305336122e-05, "tps": 525836, "wall": 3196.8} {"step": 25650, "train_loss": 2.957768678665161, "lr": 6.361496602492693e-05, "tps": 525042, "wall": 3201.8} {"step": 25651, "train_loss": 3.0740742683410645, "lr": 6.360548076803081e-05, "tps": 524247, "wall": 3206.7} {"step": 25652, "train_loss": 3.029975175857544, "lr": 6.359599728278026e-05, "tps": 523453, "wall": 3211.7} {"step": 25653, "train_loss": 3.084683895111084, "lr": 6.358651556928268e-05, "tps": 522656, "wall": 3216.8} {"step": 25654, "train_loss": 3.106424570083618, "lr": 6.357703562764555e-05, "tps": 521867, "wall": 3221.7} {"step": 25655, "train_loss": 3.0842437744140625, "lr": 6.356755745797622e-05, "tps": 521081, "wall": 3226.7} {"step": 25656, "train_loss": 3.089658498764038, "lr": 6.355808106038203e-05, "tps": 520298, "wall": 3231.7} {"step": 25657, "train_loss": 3.0803799629211426, "lr": 6.35486064349704e-05, "tps": 519515, "wall": 3236.7} {"step": 25658, "train_loss": 2.978814125061035, "lr": 6.353913358184862e-05, "tps": 518739, "wall": 3241.7} {"step": 25659, "train_loss": 3.053278684616089, "lr": 6.352966250112396e-05, "tps": 517954, "wall": 3246.7} {"step": 25660, "train_loss": 2.96968674659729, "lr": 6.352019319290376e-05, "tps": 517165, "wall": 3251.8} {"step": 25661, "train_loss": 3.013589382171631, "lr": 6.351072565729533e-05, "tps": 516370, "wall": 3256.9} {"step": 25662, "train_loss": 3.0388131141662598, "lr": 6.350125989440579e-05, "tps": 515549, "wall": 3262.3} {"step": 25663, "train_loss": 2.9912233352661133, "lr": 6.349179590434248e-05, "tps": 514752, "wall": 3267.4} {"step": 25664, "train_loss": 3.0184707641601562, "lr": 6.348233368721259e-05, "tps": 513986, "wall": 3272.4} {"step": 25665, "train_loss": 3.0219149589538574, "lr": 6.347287324312326e-05, "tps": 513225, "wall": 3277.4} {"step": 25666, "train_loss": 3.007356882095337, "lr": 6.34634145721817e-05, "tps": 512417, "wall": 3282.7} {"step": 25667, "train_loss": 3.078319549560547, "lr": 6.345395767449506e-05, "tps": 511665, "wall": 3287.6} {"step": 25668, "train_loss": 3.1381237506866455, "lr": 6.344450255017042e-05, "tps": 510912, "wall": 3292.6} {"step": 25669, "train_loss": 3.0003981590270996, "lr": 6.343504919931496e-05, "tps": 510165, "wall": 3297.6} {"step": 25670, "train_loss": 2.9804606437683105, "lr": 6.34255976220357e-05, "tps": 509416, "wall": 3302.6} {"step": 25671, "train_loss": 3.0668370723724365, "lr": 6.341614781843978e-05, "tps": 508663, "wall": 3307.6} {"step": 25672, "train_loss": 3.0251822471618652, "lr": 6.340669978863421e-05, "tps": 507915, "wall": 3312.6} {"step": 25673, "train_loss": 3.0081310272216797, "lr": 6.339725353272599e-05, "tps": 507174, "wall": 3317.5} {"step": 25674, "train_loss": 3.0670082569122314, "lr": 6.338780905082215e-05, "tps": 506421, "wall": 3322.6} {"step": 25675, "train_loss": 3.034425973892212, "lr": 6.337836634302971e-05, "tps": 505665, "wall": 3327.7} {"step": 25676, "train_loss": 3.024357557296753, "lr": 6.336892540945558e-05, "tps": 504878, "wall": 3333.0} {"step": 25677, "train_loss": 2.9597744941711426, "lr": 6.335948625020675e-05, "tps": 504119, "wall": 3338.2} {"step": 25678, "train_loss": 3.007652997970581, "lr": 6.335004886539015e-05, "tps": 503363, "wall": 3343.3} {"step": 25679, "train_loss": 3.097186326980591, "lr": 6.334061325511265e-05, "tps": 502636, "wall": 3348.3} {"step": 25680, "train_loss": 3.010908842086792, "lr": 6.333117941948116e-05, "tps": 501912, "wall": 3353.2} {"step": 25681, "train_loss": 3.1550045013427734, "lr": 6.332174735860256e-05, "tps": 501183, "wall": 3358.2} {"step": 25682, "train_loss": 3.0843849182128906, "lr": 6.331231707258366e-05, "tps": 500485, "wall": 3363.1} {"step": 25683, "train_loss": 2.9615440368652344, "lr": 6.330288856153132e-05, "tps": 499788, "wall": 3367.9} {"step": 25684, "train_loss": 2.9260501861572266, "lr": 6.329346182555235e-05, "tps": 499089, "wall": 3372.7} {"step": 25685, "train_loss": 3.046015739440918, "lr": 6.328403686475348e-05, "tps": 498384, "wall": 3377.6} {"step": 25686, "train_loss": 3.0708298683166504, "lr": 6.327461367924157e-05, "tps": 497674, "wall": 3382.6} {"step": 25687, "train_loss": 3.102313995361328, "lr": 6.326519226912327e-05, "tps": 496959, "wall": 3387.6} {"step": 25688, "train_loss": 3.076213836669922, "lr": 6.325577263450537e-05, "tps": 496250, "wall": 3392.6} {"step": 25689, "train_loss": 2.9600257873535156, "lr": 6.324635477549457e-05, "tps": 495546, "wall": 3397.5} {"step": 25690, "train_loss": 3.0676302909851074, "lr": 6.323693869219753e-05, "tps": 494846, "wall": 3402.4} {"step": 25691, "train_loss": 2.946882486343384, "lr": 6.322752438472093e-05, "tps": 494154, "wall": 3407.3} {"step": 25692, "train_loss": 3.092393398284912, "lr": 6.321811185317144e-05, "tps": 493444, "wall": 3412.4} {"step": 25693, "train_loss": 3.017578601837158, "lr": 6.32087010976556e-05, "tps": 492738, "wall": 3417.4} {"step": 25694, "train_loss": 3.044973611831665, "lr": 6.319929211828013e-05, "tps": 492034, "wall": 3422.4} {"step": 25695, "train_loss": 3.027386426925659, "lr": 6.318988491515157e-05, "tps": 491328, "wall": 3427.5} {"step": 25696, "train_loss": 3.076333999633789, "lr": 6.318047948837641e-05, "tps": 490631, "wall": 3432.5} {"step": 25697, "train_loss": 2.999345064163208, "lr": 6.317107583806132e-05, "tps": 489933, "wall": 3437.5} {"step": 25698, "train_loss": 2.9568209648132324, "lr": 6.316167396431279e-05, "tps": 489232, "wall": 3442.6} {"step": 25699, "train_loss": 3.074205160140991, "lr": 6.31522738672372e-05, "tps": 488529, "wall": 3447.6} {"step": 25700, "train_loss": 3.068946599960327, "lr": 6.314287554694125e-05, "tps": 487836, "wall": 3452.7} {"step": 25701, "train_loss": 3.065431594848633, "lr": 6.313347900353124e-05, "tps": 487141, "wall": 3457.7} {"step": 25702, "train_loss": 3.071432590484619, "lr": 6.312408423711365e-05, "tps": 486453, "wall": 3462.8} {"step": 25703, "train_loss": 3.0955610275268555, "lr": 6.311469124779493e-05, "tps": 485770, "wall": 3467.8} {"step": 25704, "train_loss": 3.015052318572998, "lr": 6.310530003568147e-05, "tps": 485093, "wall": 3472.7} {"step": 25705, "train_loss": 3.022481918334961, "lr": 6.30959106008797e-05, "tps": 484415, "wall": 3477.7} {"step": 25706, "train_loss": 3.1273491382598877, "lr": 6.308652294349592e-05, "tps": 483737, "wall": 3482.7} {"step": 25707, "train_loss": 2.9998459815979004, "lr": 6.307713706363647e-05, "tps": 483027, "wall": 3488.0} {"step": 25708, "train_loss": 3.08243727684021, "lr": 6.306775296140773e-05, "tps": 482320, "wall": 3493.2} {"step": 25709, "train_loss": 2.937838554382324, "lr": 6.305837063691599e-05, "tps": 481616, "wall": 3498.5} {"step": 25710, "train_loss": 3.0522472858428955, "lr": 6.304899009026751e-05, "tps": 480920, "wall": 3503.7} {"step": 25711, "train_loss": 3.0550620555877686, "lr": 6.303961132156857e-05, "tps": 480216, "wall": 3509.0} {"step": 25712, "train_loss": 3.0557618141174316, "lr": 6.303023433092534e-05, "tps": 479515, "wall": 3514.2} {"step": 25713, "train_loss": 2.983670473098755, "lr": 6.302085911844417e-05, "tps": 478826, "wall": 3519.4} {"step": 25714, "train_loss": 3.059634208679199, "lr": 6.301148568423119e-05, "tps": 478133, "wall": 3524.7} {"step": 25715, "train_loss": 3.1387462615966797, "lr": 6.300211402839257e-05, "tps": 477444, "wall": 3529.9} {"step": 25716, "train_loss": 3.1164114475250244, "lr": 6.299274415103452e-05, "tps": 476757, "wall": 3535.1} {"step": 25717, "train_loss": 2.976623773574829, "lr": 6.298337605226314e-05, "tps": 476074, "wall": 3540.3} {"step": 25718, "train_loss": 3.066249132156372, "lr": 6.297400973218456e-05, "tps": 475419, "wall": 3545.3} {"step": 25719, "train_loss": 2.9710254669189453, "lr": 6.296464519090492e-05, "tps": 474770, "wall": 3550.3} {"step": 25720, "train_loss": 3.0340285301208496, "lr": 6.295528242853027e-05, "tps": 474106, "wall": 3555.4} {"step": 25721, "train_loss": 3.0601096153259277, "lr": 6.294592144516666e-05, "tps": 473460, "wall": 3560.4} {"step": 25722, "train_loss": 3.060141086578369, "lr": 6.293656224092017e-05, "tps": 472819, "wall": 3565.4} {"step": 25723, "train_loss": 3.018972873687744, "lr": 6.292720481589682e-05, "tps": 472145, "wall": 3570.6} {"step": 25724, "train_loss": 3.0779457092285156, "lr": 6.291784917020252e-05, "tps": 471488, "wall": 3575.7} {"step": 25725, "train_loss": 3.014315605163574, "lr": 6.290849530394338e-05, "tps": 470850, "wall": 3580.7} {"step": 25726, "train_loss": 3.0783724784851074, "lr": 6.289914321722529e-05, "tps": 470215, "wall": 3585.7} {"step": 25727, "train_loss": 3.0701143741607666, "lr": 6.288979291015417e-05, "tps": 469576, "wall": 3590.7} {"step": 25728, "train_loss": 3.028977870941162, "lr": 6.288044438283602e-05, "tps": 468936, "wall": 3595.7} {"step": 25729, "train_loss": 3.08597993850708, "lr": 6.287109763537666e-05, "tps": 468305, "wall": 3600.7} {"step": 25730, "train_loss": 3.040971279144287, "lr": 6.286175266788206e-05, "tps": 467665, "wall": 3605.8} {"step": 25731, "train_loss": 2.9639711380004883, "lr": 6.285240948045799e-05, "tps": 467036, "wall": 3610.8} {"step": 25732, "train_loss": 3.0442214012145996, "lr": 6.284306807321033e-05, "tps": 466410, "wall": 3615.8} {"step": 25733, "train_loss": 2.994847297668457, "lr": 6.283372844624489e-05, "tps": 465786, "wall": 3620.8} {"step": 25734, "train_loss": 3.0594048500061035, "lr": 6.282439059966751e-05, "tps": 465162, "wall": 3625.8} {"step": 25735, "train_loss": 3.0468533039093018, "lr": 6.28150545335839e-05, "tps": 464540, "wall": 3630.8} {"step": 25736, "train_loss": 3.091153144836426, "lr": 6.280572024809987e-05, "tps": 463915, "wall": 3635.8} {"step": 25737, "train_loss": 3.0443530082702637, "lr": 6.279638774332116e-05, "tps": 463295, "wall": 3640.8} {"step": 25738, "train_loss": 3.0099363327026367, "lr": 6.278705701935343e-05, "tps": 462677, "wall": 3645.8} {"step": 25739, "train_loss": 3.025282859802246, "lr": 6.277772807630247e-05, "tps": 462062, "wall": 3650.8} {"step": 25740, "train_loss": 3.0629427433013916, "lr": 6.276840091427391e-05, "tps": 461451, "wall": 3655.8} {"step": 25741, "train_loss": 2.9004108905792236, "lr": 6.275907553337335e-05, "tps": 460837, "wall": 3660.8} {"step": 25742, "train_loss": 3.0165646076202393, "lr": 6.274975193370656e-05, "tps": 460224, "wall": 3665.8} {"step": 25743, "train_loss": 3.0700840950012207, "lr": 6.274043011537906e-05, "tps": 459624, "wall": 3670.7} {"step": 25744, "train_loss": 3.0283477306365967, "lr": 6.273111007849645e-05, "tps": 459023, "wall": 3675.7} {"step": 25745, "train_loss": 3.100862503051758, "lr": 6.27217918231644e-05, "tps": 458420, "wall": 3680.7} {"step": 25746, "train_loss": 2.9428977966308594, "lr": 6.271247534948836e-05, "tps": 457822, "wall": 3685.6} {"step": 25747, "train_loss": 3.025820016860962, "lr": 6.270316065757387e-05, "tps": 457225, "wall": 3690.6} {"step": 25748, "train_loss": 3.170116901397705, "lr": 6.269384774752655e-05, "tps": 456624, "wall": 3695.6} {"step": 25749, "train_loss": 3.0286474227905273, "lr": 6.268453661945178e-05, "tps": 456026, "wall": 3700.6} {"step": 25750, "train_loss": 3.0062832832336426, "lr": 6.267522727345513e-05, "tps": 455431, "wall": 3705.5} {"step": 25751, "train_loss": 3.0710043907165527, "lr": 6.266591970964202e-05, "tps": 454840, "wall": 3710.5} {"step": 25752, "train_loss": 2.958300828933716, "lr": 6.265661392811783e-05, "tps": 454251, "wall": 3715.4} {"step": 25753, "train_loss": 2.979353189468384, "lr": 6.264730992898808e-05, "tps": 453631, "wall": 3720.7} {"step": 25754, "train_loss": 2.985631227493286, "lr": 6.263800771235813e-05, "tps": 453056, "wall": 3725.5} {"step": 25755, "train_loss": 2.9104788303375244, "lr": 6.262870727833327e-05, "tps": 452500, "wall": 3730.3} {"step": 25756, "train_loss": 3.1439459323883057, "lr": 6.261940862701899e-05, "tps": 451945, "wall": 3735.0} {"step": 25757, "train_loss": 3.010692834854126, "lr": 6.261011175852057e-05, "tps": 451392, "wall": 3739.7} {"step": 25758, "train_loss": 3.004565715789795, "lr": 6.260081667294325e-05, "tps": 450843, "wall": 3744.4} {"step": 25759, "train_loss": 3.0812721252441406, "lr": 6.259152337039245e-05, "tps": 450295, "wall": 3749.1} {"step": 25760, "train_loss": 3.0025582313537598, "lr": 6.25822318509734e-05, "tps": 449745, "wall": 3753.8} {"step": 25761, "train_loss": 3.028794527053833, "lr": 6.257294211479127e-05, "tps": 449198, "wall": 3758.6} {"step": 25762, "train_loss": 3.1012744903564453, "lr": 6.256365416195145e-05, "tps": 448645, "wall": 3763.3} {"step": 25763, "train_loss": 3.0855536460876465, "lr": 6.255436799255904e-05, "tps": 448101, "wall": 3768.1} {"step": 25764, "train_loss": 2.9168813228607178, "lr": 6.254508360671925e-05, "tps": 447553, "wall": 3772.8} {"step": 25765, "train_loss": 2.964242935180664, "lr": 6.25358010045373e-05, "tps": 447010, "wall": 3777.5} {"step": 25766, "train_loss": 3.0362794399261475, "lr": 6.252652018611828e-05, "tps": 446468, "wall": 3782.3} {"step": 25767, "train_loss": 3.0174179077148438, "lr": 6.25172411515674e-05, "tps": 445920, "wall": 3787.1} {"step": 25768, "train_loss": 3.0100250244140625, "lr": 6.250796390098972e-05, "tps": 445380, "wall": 3791.8} {"step": 25769, "train_loss": 3.066242218017578, "lr": 6.24986884344903e-05, "tps": 444844, "wall": 3796.5} {"step": 25770, "train_loss": 2.985320568084717, "lr": 6.248941475217431e-05, "tps": 444310, "wall": 3801.2} {"step": 25771, "train_loss": 3.030193328857422, "lr": 6.248014285414676e-05, "tps": 443775, "wall": 3806.0} {"step": 25772, "train_loss": 3.0892863273620605, "lr": 6.247087274051263e-05, "tps": 443238, "wall": 3810.7} {"step": 25773, "train_loss": 3.0373497009277344, "lr": 6.246160441137702e-05, "tps": 442703, "wall": 3815.5} {"step": 25774, "train_loss": 2.942379951477051, "lr": 6.245233786684486e-05, "tps": 442174, "wall": 3820.2} {"step": 25775, "train_loss": 3.069185256958008, "lr": 6.244307310702111e-05, "tps": 441646, "wall": 3824.9} {"step": 25776, "train_loss": 3.1326894760131836, "lr": 6.243381013201078e-05, "tps": 441116, "wall": 3829.6} {"step": 25777, "train_loss": 3.0726871490478516, "lr": 6.242454894191879e-05, "tps": 440591, "wall": 3834.4} {"step": 25778, "train_loss": 3.1026597023010254, "lr": 6.241528953684999e-05, "tps": 440064, "wall": 3839.1} {"step": 25779, "train_loss": 2.960223913192749, "lr": 6.240603191690934e-05, "tps": 439525, "wall": 3844.0} {"step": 25780, "train_loss": 2.946350336074829, "lr": 6.239677608220171e-05, "tps": 439005, "wall": 3848.7} {"step": 25781, "train_loss": 3.0043911933898926, "lr": 6.238752203283186e-05, "tps": 438484, "wall": 3853.4} {"step": 25782, "train_loss": 3.0670509338378906, "lr": 6.237826976890476e-05, "tps": 437963, "wall": 3858.1} {"step": 25783, "train_loss": 2.957942008972168, "lr": 6.236901929052508e-05, "tps": 437445, "wall": 3862.8} {"step": 25784, "train_loss": 3.0685644149780273, "lr": 6.235977059779773e-05, "tps": 436926, "wall": 3867.6} {"step": 25785, "train_loss": 2.979252338409424, "lr": 6.235052369082742e-05, "tps": 436405, "wall": 3872.3} {"step": 25786, "train_loss": 3.1961920261383057, "lr": 6.234127856971888e-05, "tps": 435893, "wall": 3877.0} {"step": 25787, "train_loss": 2.998955726623535, "lr": 6.23320352345769e-05, "tps": 435380, "wall": 3881.8} {"step": 25788, "train_loss": 3.106393575668335, "lr": 6.232279368550613e-05, "tps": 434867, "wall": 3886.5} {"step": 25789, "train_loss": 3.0722060203552246, "lr": 6.231355392261128e-05, "tps": 434356, "wall": 3891.2} {"step": 25790, "train_loss": 3.060112237930298, "lr": 6.230431594599704e-05, "tps": 433847, "wall": 3895.9} {"step": 25791, "train_loss": 3.092332363128662, "lr": 6.229507975576804e-05, "tps": 433332, "wall": 3900.7} {"step": 25792, "train_loss": 3.091453790664673, "lr": 6.228584535202887e-05, "tps": 432819, "wall": 3905.5} {"step": 25793, "train_loss": 3.0420234203338623, "lr": 6.227661273488423e-05, "tps": 432312, "wall": 3910.2} {"step": 25794, "train_loss": 3.0753908157348633, "lr": 6.226738190443863e-05, "tps": 431806, "wall": 3915.0} {"step": 25795, "train_loss": 3.0827345848083496, "lr": 6.225815286079664e-05, "tps": 431303, "wall": 3919.7} {"step": 25796, "train_loss": 2.9843153953552246, "lr": 6.224892560406287e-05, "tps": 430799, "wall": 3924.4} {"step": 25797, "train_loss": 3.1413540840148926, "lr": 6.223970013434179e-05, "tps": 430297, "wall": 3929.1} {"step": 25798, "train_loss": 3.0150680541992188, "lr": 6.223047645173789e-05, "tps": 429796, "wall": 3933.9} {"step": 25799, "train_loss": 3.090864896774292, "lr": 6.222125455635573e-05, "tps": 429297, "wall": 3938.6} {"step": 25800, "train_loss": 2.949186325073242, "lr": 6.221203444829973e-05, "tps": 428793, "wall": 3943.4} {"step": 25801, "train_loss": 3.0997939109802246, "lr": 6.22028161276743e-05, "tps": 428296, "wall": 3948.1} {"step": 25802, "train_loss": 3.0379881858825684, "lr": 6.219359959458394e-05, "tps": 427798, "wall": 3952.9} {"step": 25803, "train_loss": 3.0951433181762695, "lr": 6.218438484913299e-05, "tps": 427300, "wall": 3957.6} {"step": 25804, "train_loss": 3.101234197616577, "lr": 6.21751718914259e-05, "tps": 426806, "wall": 3962.3} {"step": 25805, "train_loss": 3.004164695739746, "lr": 6.216596072156701e-05, "tps": 426306, "wall": 3967.2} {"step": 25806, "train_loss": 3.0650577545166016, "lr": 6.215675133966062e-05, "tps": 425814, "wall": 3971.9} {"step": 25807, "train_loss": 2.9973459243774414, "lr": 6.214754374581111e-05, "tps": 425326, "wall": 3976.6} {"step": 25808, "train_loss": 3.0172524452209473, "lr": 6.213833794012278e-05, "tps": 424835, "wall": 3981.3} {"step": 25809, "train_loss": 3.02335262298584, "lr": 6.212913392269985e-05, "tps": 424350, "wall": 3986.1} {"step": 25810, "train_loss": 3.082317352294922, "lr": 6.211993169364666e-05, "tps": 423862, "wall": 3990.8} {"step": 25811, "train_loss": 3.0096259117126465, "lr": 6.211073125306744e-05, "tps": 423373, "wall": 3995.6} {"step": 25812, "train_loss": 2.9704227447509766, "lr": 6.210153260106635e-05, "tps": 422885, "wall": 4000.3} {"step": 25813, "train_loss": 2.924593925476074, "lr": 6.20923357377477e-05, "tps": 422399, "wall": 4005.1} {"step": 25814, "train_loss": 3.009699821472168, "lr": 6.208314066321561e-05, "tps": 421915, "wall": 4009.8} {"step": 25815, "train_loss": 3.0464682579040527, "lr": 6.207394737757419e-05, "tps": 421432, "wall": 4014.6} {"step": 25816, "train_loss": 3.0293216705322266, "lr": 6.206475588092768e-05, "tps": 420948, "wall": 4019.4} {"step": 25817, "train_loss": 3.0578701496124268, "lr": 6.205556617338017e-05, "tps": 420461, "wall": 4024.2} {"step": 25818, "train_loss": 3.0278449058532715, "lr": 6.20463782550357e-05, "tps": 419983, "wall": 4028.9} {"step": 25819, "train_loss": 3.0895636081695557, "lr": 6.203719212599845e-05, "tps": 419503, "wall": 4033.7} {"step": 25820, "train_loss": 3.0432629585266113, "lr": 6.20280077863724e-05, "tps": 419029, "wall": 4038.4} {"step": 25821, "train_loss": 3.0822250843048096, "lr": 6.201882523626165e-05, "tps": 418549, "wall": 4043.2} {"step": 25822, "train_loss": 3.1082983016967773, "lr": 6.20096444757702e-05, "tps": 418076, "wall": 4047.9} {"step": 25823, "train_loss": 3.075741767883301, "lr": 6.200046550500199e-05, "tps": 417601, "wall": 4052.7} {"step": 25824, "train_loss": 3.184251308441162, "lr": 6.199128832406112e-05, "tps": 417128, "wall": 4057.4} {"step": 25825, "train_loss": 3.0790748596191406, "lr": 6.198211293305146e-05, "tps": 416656, "wall": 4062.2} {"step": 25826, "train_loss": 2.950833320617676, "lr": 6.197293933207695e-05, "tps": 416187, "wall": 4066.9} {"step": 25827, "train_loss": 2.946693181991577, "lr": 6.196376752124157e-05, "tps": 415720, "wall": 4071.6} {"step": 25828, "train_loss": 3.0730788707733154, "lr": 6.195459750064916e-05, "tps": 415251, "wall": 4076.4} {"step": 25829, "train_loss": 3.1388003826141357, "lr": 6.194542927040361e-05, "tps": 414786, "wall": 4081.1} {"step": 25830, "train_loss": 3.0709166526794434, "lr": 6.193626283060882e-05, "tps": 414311, "wall": 4086.0} {"step": 25831, "train_loss": 3.0848162174224854, "lr": 6.192709818136859e-05, "tps": 413846, "wall": 4090.7} {"step": 25832, "train_loss": 2.979961395263672, "lr": 6.191793532278671e-05, "tps": 413386, "wall": 4095.4} {"step": 25833, "train_loss": 3.034794330596924, "lr": 6.190877425496704e-05, "tps": 412922, "wall": 4100.2} {"step": 25834, "train_loss": 3.116319179534912, "lr": 6.189961497801335e-05, "tps": 412462, "wall": 4104.9} {"step": 25835, "train_loss": 3.027411460876465, "lr": 6.18904574920293e-05, "tps": 411998, "wall": 4109.7} {"step": 25836, "train_loss": 3.0382895469665527, "lr": 6.188130179711876e-05, "tps": 411538, "wall": 4114.4} {"step": 25837, "train_loss": 3.00077748298645, "lr": 6.187214789338534e-05, "tps": 411080, "wall": 4119.2} {"step": 25838, "train_loss": 3.026381492614746, "lr": 6.186299578093283e-05, "tps": 410623, "wall": 4123.9} {"step": 25839, "train_loss": 3.1818463802337646, "lr": 6.185384545986486e-05, "tps": 410168, "wall": 4128.7} {"step": 25840, "train_loss": 3.0644068717956543, "lr": 6.184469693028505e-05, "tps": 409712, "wall": 4133.4} {"step": 25841, "train_loss": 3.1042160987854004, "lr": 6.183555019229711e-05, "tps": 409261, "wall": 4138.1} {"step": 25842, "train_loss": 2.9553518295288086, "lr": 6.18264052460046e-05, "tps": 408806, "wall": 4142.9} {"step": 25843, "train_loss": 2.9344866275787354, "lr": 6.181726209151109e-05, "tps": 408351, "wall": 4147.7} {"step": 25844, "train_loss": 3.0233068466186523, "lr": 6.180812072892023e-05, "tps": 407900, "wall": 4152.4} {"step": 25845, "train_loss": 2.9649500846862793, "lr": 6.179898115833556e-05, "tps": 407452, "wall": 4157.2} {"step": 25846, "train_loss": 2.9687981605529785, "lr": 6.178984337986054e-05, "tps": 407004, "wall": 4161.9} {"step": 25847, "train_loss": 3.0714359283447266, "lr": 6.178070739359874e-05, "tps": 406558, "wall": 4166.6} {"step": 25848, "train_loss": 3.0582666397094727, "lr": 6.177157319965369e-05, "tps": 406113, "wall": 4171.3} {"step": 25849, "train_loss": 3.036659002304077, "lr": 6.176244079812873e-05, "tps": 405667, "wall": 4176.1} {"step": 25850, "train_loss": 3.073096752166748, "lr": 6.175331018912749e-05, "tps": 405223, "wall": 4180.8} {"step": 25851, "train_loss": 2.961217164993286, "lr": 6.174418137275331e-05, "tps": 404780, "wall": 4185.6} {"step": 25852, "train_loss": 3.0322256088256836, "lr": 6.173505434910954e-05, "tps": 404339, "wall": 4190.3} {"step": 25853, "train_loss": 3.116678237915039, "lr": 6.172592911829968e-05, "tps": 403899, "wall": 4195.0} {"step": 25854, "train_loss": 3.135807514190674, "lr": 6.171680568042708e-05, "tps": 403459, "wall": 4199.8} {"step": 25855, "train_loss": 3.0547428131103516, "lr": 6.170768403559501e-05, "tps": 403012, "wall": 4204.6} {"step": 25856, "train_loss": 3.0353784561157227, "lr": 6.16985641839069e-05, "tps": 402577, "wall": 4209.3} {"step": 25857, "train_loss": 3.1340880393981934, "lr": 6.168944612546598e-05, "tps": 402138, "wall": 4214.0} {"step": 25858, "train_loss": 3.097388744354248, "lr": 6.168032986037562e-05, "tps": 401700, "wall": 4218.8} {"step": 25859, "train_loss": 3.121452808380127, "lr": 6.167121538873906e-05, "tps": 401267, "wall": 4223.5} {"step": 25860, "train_loss": 3.08542799949646, "lr": 6.166210271065947e-05, "tps": 400832, "wall": 4228.3} {"step": 25861, "train_loss": 3.0427699089050293, "lr": 6.165299182624021e-05, "tps": 400392, "wall": 4233.1} {"step": 25862, "train_loss": 2.978055477142334, "lr": 6.164388273558441e-05, "tps": 399963, "wall": 4237.8} {"step": 25863, "train_loss": 3.0633485317230225, "lr": 6.163477543879525e-05, "tps": 399531, "wall": 4242.5} {"step": 25864, "train_loss": 3.110823154449463, "lr": 6.162566993597594e-05, "tps": 399100, "wall": 4247.3} {"step": 25865, "train_loss": 3.0063557624816895, "lr": 6.161656622722961e-05, "tps": 398663, "wall": 4252.1} {"step": 25866, "train_loss": 3.138428211212158, "lr": 6.160746431265937e-05, "tps": 398236, "wall": 4256.8} {"step": 25867, "train_loss": 2.995544910430908, "lr": 6.159836419236835e-05, "tps": 397804, "wall": 4261.6} {"step": 25868, "train_loss": 3.0411224365234375, "lr": 6.158926586645965e-05, "tps": 397375, "wall": 4266.4} {"step": 25869, "train_loss": 3.06264066696167, "lr": 6.158016933503628e-05, "tps": 396949, "wall": 4271.1} {"step": 25870, "train_loss": 3.0327401161193848, "lr": 6.157107459820138e-05, "tps": 396523, "wall": 4275.9} {"step": 25871, "train_loss": 3.0415115356445312, "lr": 6.156198165605786e-05, "tps": 396101, "wall": 4280.6} {"step": 25872, "train_loss": 3.0465939044952393, "lr": 6.15528905087088e-05, "tps": 395676, "wall": 4285.4} {"step": 25873, "train_loss": 3.0063271522521973, "lr": 6.154380115625718e-05, "tps": 395252, "wall": 4290.1} {"step": 25874, "train_loss": 3.1129884719848633, "lr": 6.153471359880591e-05, "tps": 394829, "wall": 4294.9} {"step": 25875, "train_loss": 3.0419464111328125, "lr": 6.152562783645804e-05, "tps": 394405, "wall": 4299.7} {"step": 25876, "train_loss": 3.0802736282348633, "lr": 6.151654386931643e-05, "tps": 393985, "wall": 4304.4} {"step": 25877, "train_loss": 3.005842447280884, "lr": 6.150746169748392e-05, "tps": 393567, "wall": 4309.1} {"step": 25878, "train_loss": 3.0503969192504883, "lr": 6.14983813210635e-05, "tps": 393149, "wall": 4313.9} {"step": 25879, "train_loss": 2.9028968811035156, "lr": 6.148930274015802e-05, "tps": 392731, "wall": 4318.7} {"step": 25880, "train_loss": 2.9815850257873535, "lr": 6.148022595487028e-05, "tps": 392310, "wall": 4323.5} {"step": 25881, "train_loss": 3.06524658203125, "lr": 6.147115096530309e-05, "tps": 391892, "wall": 4328.2} {"step": 25882, "train_loss": 2.939509868621826, "lr": 6.146207777155928e-05, "tps": 391480, "wall": 4333.0} {"step": 25883, "train_loss": 3.0817859172821045, "lr": 6.145300637374165e-05, "tps": 391065, "wall": 4337.7} {"step": 25884, "train_loss": 3.0593090057373047, "lr": 6.144393677195292e-05, "tps": 390652, "wall": 4342.5} {"step": 25885, "train_loss": 3.0567667484283447, "lr": 6.143486896629583e-05, "tps": 390241, "wall": 4347.2} {"step": 25886, "train_loss": 3.0279579162597656, "lr": 6.142580295687317e-05, "tps": 389832, "wall": 4352.0} {"step": 25887, "train_loss": 3.0947554111480713, "lr": 6.141673874378759e-05, "tps": 389422, "wall": 4356.7} {"step": 25888, "train_loss": 2.966284990310669, "lr": 6.140767632714173e-05, "tps": 389014, "wall": 4361.4} {"step": 25889, "train_loss": 2.967766046524048, "lr": 6.139861570703833e-05, "tps": 388607, "wall": 4366.2} {"step": 25890, "train_loss": 3.040773868560791, "lr": 6.138955688357999e-05, "tps": 388200, "wall": 4370.9} {"step": 25891, "train_loss": 3.21567440032959, "lr": 6.13804998568693e-05, "tps": 387790, "wall": 4375.7} {"step": 25892, "train_loss": 2.9825892448425293, "lr": 6.137144462700894e-05, "tps": 387388, "wall": 4380.4} {"step": 25893, "train_loss": 3.002228260040283, "lr": 6.13623911941014e-05, "tps": 386980, "wall": 4385.2} {"step": 25894, "train_loss": 3.0603389739990234, "lr": 6.135333955824927e-05, "tps": 386578, "wall": 4389.9} {"step": 25895, "train_loss": 2.9913039207458496, "lr": 6.134428971955511e-05, "tps": 386176, "wall": 4394.7} {"step": 25896, "train_loss": 3.1238162517547607, "lr": 6.133524167812143e-05, "tps": 385775, "wall": 4399.4} {"step": 25897, "train_loss": 3.161985158920288, "lr": 6.132619543405067e-05, "tps": 385375, "wall": 4404.2} {"step": 25898, "train_loss": 3.0302395820617676, "lr": 6.131715098744539e-05, "tps": 384976, "wall": 4408.9} {"step": 25899, "train_loss": 3.048278331756592, "lr": 6.130810833840798e-05, "tps": 384575, "wall": 4413.7} {"step": 25900, "train_loss": 3.068589210510254, "lr": 6.129906748704092e-05, "tps": 384180, "wall": 4418.4} {"step": 25901, "train_loss": 3.069448947906494, "lr": 6.129002843344663e-05, "tps": 383785, "wall": 4423.1} {"step": 25902, "train_loss": 3.0971813201904297, "lr": 6.128099117772744e-05, "tps": 383389, "wall": 4427.8} {"step": 25903, "train_loss": 3.087282657623291, "lr": 6.127195571998582e-05, "tps": 382994, "wall": 4432.6} {"step": 25904, "train_loss": 3.093858480453491, "lr": 6.126292206032407e-05, "tps": 382601, "wall": 4437.3} {"step": 25905, "train_loss": 3.0489232540130615, "lr": 6.125389019884447e-05, "tps": 382207, "wall": 4442.0} {"step": 25906, "train_loss": 3.021583080291748, "lr": 6.124486013564944e-05, "tps": 381809, "wall": 4446.8} {"step": 25907, "train_loss": 2.9733595848083496, "lr": 6.12358318708412e-05, "tps": 381418, "wall": 4451.6} {"step": 25908, "train_loss": 3.0037484169006348, "lr": 6.122680540452202e-05, "tps": 381027, "wall": 4456.3} {"step": 25909, "train_loss": 3.043459177017212, "lr": 6.121778073679425e-05, "tps": 380638, "wall": 4461.0} {"step": 25910, "train_loss": 3.0172481536865234, "lr": 6.120875786776e-05, "tps": 380248, "wall": 4465.8} {"step": 25911, "train_loss": 2.9813857078552246, "lr": 6.119973679752154e-05, "tps": 379860, "wall": 4470.5} {"step": 25912, "train_loss": 3.0038602352142334, "lr": 6.119071752618105e-05, "tps": 379473, "wall": 4475.2} {"step": 25913, "train_loss": 3.059675931930542, "lr": 6.118170005384071e-05, "tps": 379086, "wall": 4480.0} {"step": 25914, "train_loss": 3.071077346801758, "lr": 6.117268438060265e-05, "tps": 378700, "wall": 4484.7} {"step": 25915, "train_loss": 3.008151054382324, "lr": 6.116367050656902e-05, "tps": 378315, "wall": 4489.5} {"step": 25916, "train_loss": 3.0255513191223145, "lr": 6.115465843184192e-05, "tps": 377931, "wall": 4494.2} {"step": 25917, "train_loss": 3.0077340602874756, "lr": 6.114564815652346e-05, "tps": 377546, "wall": 4498.9} {"step": 25918, "train_loss": 3.0911240577697754, "lr": 6.11366396807157e-05, "tps": 377156, "wall": 4503.8} {"step": 25919, "train_loss": 2.945693016052246, "lr": 6.112763300452063e-05, "tps": 376778, "wall": 4508.5} {"step": 25920, "train_loss": 3.0096192359924316, "lr": 6.111862812804036e-05, "tps": 376397, "wall": 4513.2} {"step": 25921, "train_loss": 3.024336099624634, "lr": 6.110962505137691e-05, "tps": 376015, "wall": 4518.0} {"step": 25922, "train_loss": 2.9778714179992676, "lr": 6.110062377463213e-05, "tps": 375635, "wall": 4522.7} {"step": 25923, "train_loss": 3.0036520957946777, "lr": 6.109162429790813e-05, "tps": 375256, "wall": 4527.5} {"step": 25924, "train_loss": 3.061077117919922, "lr": 6.108262662130684e-05, "tps": 374877, "wall": 4532.2} {"step": 25925, "train_loss": 3.11074161529541, "lr": 6.10736307449301e-05, "tps": 374496, "wall": 4537.0} {"step": 25926, "train_loss": 3.030280113220215, "lr": 6.10646366688799e-05, "tps": 374120, "wall": 4541.7} {"step": 25927, "train_loss": 3.112316608428955, "lr": 6.105564439325808e-05, "tps": 373744, "wall": 4546.5} {"step": 25928, "train_loss": 2.927949905395508, "lr": 6.104665391816651e-05, "tps": 373369, "wall": 4551.2} {"step": 25929, "train_loss": 3.0505142211914062, "lr": 6.103766524370705e-05, "tps": 372995, "wall": 4555.9} {"step": 25930, "train_loss": 3.0516862869262695, "lr": 6.102867836998154e-05, "tps": 372619, "wall": 4560.7} {"step": 25931, "train_loss": 2.98483943939209, "lr": 6.101969329709172e-05, "tps": 372237, "wall": 4565.6} {"step": 25932, "train_loss": 3.0112462043762207, "lr": 6.101071002513946e-05, "tps": 371865, "wall": 4570.3} {"step": 25933, "train_loss": 3.067352056503296, "lr": 6.100172855422647e-05, "tps": 371494, "wall": 4575.1} {"step": 25934, "train_loss": 2.9984068870544434, "lr": 6.099274888445445e-05, "tps": 371119, "wall": 4579.9} {"step": 25935, "train_loss": 2.9692134857177734, "lr": 6.098377101592523e-05, "tps": 370749, "wall": 4584.6} {"step": 25936, "train_loss": 3.102278709411621, "lr": 6.097479494874041e-05, "tps": 370381, "wall": 4589.3} {"step": 25937, "train_loss": 3.1051177978515625, "lr": 6.0965820683001764e-05, "tps": 370010, "wall": 4594.1} {"step": 25938, "train_loss": 2.967376708984375, "lr": 6.095684821881087e-05, "tps": 369644, "wall": 4598.8} {"step": 25939, "train_loss": 3.1856746673583984, "lr": 6.0947877556269396e-05, "tps": 369277, "wall": 4603.6} {"step": 25940, "train_loss": 3.075033664703369, "lr": 6.0938908695479e-05, "tps": 368912, "wall": 4608.3} {"step": 25941, "train_loss": 3.0051779747009277, "lr": 6.092994163654127e-05, "tps": 368547, "wall": 4613.1} {"step": 25942, "train_loss": 3.0217933654785156, "lr": 6.0920976379557716e-05, "tps": 368183, "wall": 4617.8} {"step": 25943, "train_loss": 3.0055036544799805, "lr": 6.0912012924629956e-05, "tps": 367819, "wall": 4622.6} {"step": 25944, "train_loss": 3.0742547512054443, "lr": 6.090305127185956e-05, "tps": 367454, "wall": 4627.3} {"step": 25945, "train_loss": 3.0846610069274902, "lr": 6.0894091421347946e-05, "tps": 367091, "wall": 4632.1} {"step": 25946, "train_loss": 3.0786566734313965, "lr": 6.088513337319672e-05, "tps": 366729, "wall": 4636.8} {"step": 25947, "train_loss": 2.998608112335205, "lr": 6.087617712750731e-05, "tps": 366369, "wall": 4641.6} {"step": 25948, "train_loss": 3.1389577388763428, "lr": 6.086722268438113e-05, "tps": 366010, "wall": 4646.3} {"step": 25949, "train_loss": 3.05450177192688, "lr": 6.0858270043919706e-05, "tps": 365649, "wall": 4651.1} {"step": 25950, "train_loss": 3.0478365421295166, "lr": 6.08493192062244e-05, "tps": 365285, "wall": 4655.9} {"step": 25951, "train_loss": 3.069702625274658, "lr": 6.08403701713966e-05, "tps": 364927, "wall": 4660.6} {"step": 25952, "train_loss": 2.989819288253784, "lr": 6.0831422939537695e-05, "tps": 364564, "wall": 4665.4} {"step": 25953, "train_loss": 3.0497257709503174, "lr": 6.082247751074904e-05, "tps": 364206, "wall": 4670.2} {"step": 25954, "train_loss": 3.0363576412200928, "lr": 6.081353388513199e-05, "tps": 363851, "wall": 4674.9} {"step": 25955, "train_loss": 2.9540517330169678, "lr": 6.0804592062787844e-05, "tps": 363497, "wall": 4679.7} {"step": 25956, "train_loss": 2.9680018424987793, "lr": 6.079565204381786e-05, "tps": 363136, "wall": 4684.5} {"step": 25957, "train_loss": 2.973557472229004, "lr": 6.078671382832338e-05, "tps": 362784, "wall": 4689.2} {"step": 25958, "train_loss": 3.100710391998291, "lr": 6.077777741640562e-05, "tps": 362432, "wall": 4694.0} {"step": 25959, "train_loss": 2.9391238689422607, "lr": 6.076884280816577e-05, "tps": 362080, "wall": 4698.7} {"step": 25960, "train_loss": 3.00352144241333, "lr": 6.07599100037051e-05, "tps": 361728, "wall": 4703.5} {"step": 25961, "train_loss": 2.9204916954040527, "lr": 6.075097900312482e-05, "tps": 361378, "wall": 4708.2} {"step": 25962, "train_loss": 2.968581199645996, "lr": 6.0742049806526005e-05, "tps": 361028, "wall": 4713.0} {"step": 25963, "train_loss": 3.003225326538086, "lr": 6.0733122414009914e-05, "tps": 360679, "wall": 4717.7} {"step": 25964, "train_loss": 2.9678149223327637, "lr": 6.072419682567761e-05, "tps": 360330, "wall": 4722.4} {"step": 25965, "train_loss": 3.042635440826416, "lr": 6.07152730416302e-05, "tps": 359981, "wall": 4727.2} {"step": 25966, "train_loss": 3.0465798377990723, "lr": 6.0706351061968834e-05, "tps": 359634, "wall": 4731.9} {"step": 25967, "train_loss": 3.0523159503936768, "lr": 6.0697430886794525e-05, "tps": 359288, "wall": 4736.7} {"step": 25968, "train_loss": 3.0264813899993896, "lr": 6.068851251620832e-05, "tps": 358943, "wall": 4741.4} {"step": 25969, "train_loss": 3.0540454387664795, "lr": 6.067959595031128e-05, "tps": 358594, "wall": 4746.2} {"step": 25970, "train_loss": 2.9952340126037598, "lr": 6.067068118920437e-05, "tps": 358251, "wall": 4751.0} {"step": 25971, "train_loss": 3.0955543518066406, "lr": 6.066176823298866e-05, "tps": 357904, "wall": 4755.7} {"step": 25972, "train_loss": 2.966747760772705, "lr": 6.0652857081765025e-05, "tps": 357561, "wall": 4760.5} {"step": 25973, "train_loss": 3.0692086219787598, "lr": 6.064394773563442e-05, "tps": 357219, "wall": 4765.2} {"step": 25974, "train_loss": 3.0261902809143066, "lr": 6.063504019469784e-05, "tps": 356877, "wall": 4770.0} {"step": 25975, "train_loss": 3.01115083694458, "lr": 6.062613445905615e-05, "tps": 356534, "wall": 4774.7} {"step": 25976, "train_loss": 2.9955453872680664, "lr": 6.0617230528810186e-05, "tps": 356195, "wall": 4779.5} {"step": 25977, "train_loss": 3.0680034160614014, "lr": 6.060832840406089e-05, "tps": 355854, "wall": 4784.2} {"step": 25978, "train_loss": 2.9809000492095947, "lr": 6.059942808490906e-05, "tps": 355513, "wall": 4789.0} {"step": 25979, "train_loss": 3.062105178833008, "lr": 6.0590529571455536e-05, "tps": 355175, "wall": 4793.8} {"step": 25980, "train_loss": 2.9885494709014893, "lr": 6.0581632863801107e-05, "tps": 354838, "wall": 4798.5} {"step": 25981, "train_loss": 3.053541660308838, "lr": 6.05727379620466e-05, "tps": 354500, "wall": 4803.2} {"step": 25982, "train_loss": 2.9506356716156006, "lr": 6.05638448662927e-05, "tps": 354161, "wall": 4808.0} {"step": 25983, "train_loss": 3.037595748901367, "lr": 6.0554953576640214e-05, "tps": 353826, "wall": 4812.8} {"step": 25984, "train_loss": 3.0617663860321045, "lr": 6.054606409318985e-05, "tps": 353491, "wall": 4817.5} {"step": 25985, "train_loss": 3.0507659912109375, "lr": 6.053717641604225e-05, "tps": 353156, "wall": 4822.3} {"step": 25986, "train_loss": 2.928206443786621, "lr": 6.0528290545298196e-05, "tps": 352822, "wall": 4827.0} {"step": 25987, "train_loss": 2.884302854537964, "lr": 6.051940648105829e-05, "tps": 352489, "wall": 4831.8} {"step": 25988, "train_loss": 3.030505895614624, "lr": 6.051052422342313e-05, "tps": 352156, "wall": 4836.5} {"step": 25989, "train_loss": 3.105510711669922, "lr": 6.050164377249341e-05, "tps": 351825, "wall": 4841.3} {"step": 25990, "train_loss": 3.0131030082702637, "lr": 6.0492765128369675e-05, "tps": 351492, "wall": 4846.0} {"step": 25991, "train_loss": 3.0338733196258545, "lr": 6.048388829115256e-05, "tps": 351161, "wall": 4850.8} {"step": 25992, "train_loss": 3.053975820541382, "lr": 6.047501326094259e-05, "tps": 350832, "wall": 4855.5} {"step": 25993, "train_loss": 3.0419974327087402, "lr": 6.046614003784026e-05, "tps": 350503, "wall": 4860.3} {"step": 25994, "train_loss": 3.043701171875, "lr": 6.045726862194616e-05, "tps": 350170, "wall": 4865.1} {"step": 25995, "train_loss": 3.0282983779907227, "lr": 6.0448399013360765e-05, "tps": 349842, "wall": 4869.8} {"step": 25996, "train_loss": 2.9674789905548096, "lr": 6.04395312121845e-05, "tps": 349512, "wall": 4874.6} {"step": 25997, "train_loss": 3.027132511138916, "lr": 6.0430665218517866e-05, "tps": 349186, "wall": 4879.3} {"step": 25998, "train_loss": 2.953913450241089, "lr": 6.042180103246131e-05, "tps": 348860, "wall": 4884.1} {"step": 25999, "train_loss": 2.970331907272339, "lr": 6.041293865411519e-05, "tps": 348534, "wall": 4888.9} {"step": 26000, "train_loss": 3.022280693054199, "lr": 6.040407808357996e-05, "tps": 348210, "wall": 4893.6, "val_loss_monitor": 3.344622334779956} {"step": 26001, "train_loss": 3.052427291870117, "lr": 6.0395219320955975e-05, "tps": 344576, "wall": 4945.4} {"step": 26002, "train_loss": 3.157419204711914, "lr": 6.0386362366343563e-05, "tps": 344256, "wall": 4950.2} {"step": 26003, "train_loss": 3.103299617767334, "lr": 6.037750721984308e-05, "tps": 343935, "wall": 4955.0} {"step": 26004, "train_loss": 3.0985467433929443, "lr": 6.036865388155485e-05, "tps": 343620, "wall": 4959.7} {"step": 26005, "train_loss": 2.950636863708496, "lr": 6.035980235157909e-05, "tps": 343302, "wall": 4964.5} {"step": 26006, "train_loss": 3.0789387226104736, "lr": 6.0350952630016154e-05, "tps": 342987, "wall": 4969.3} {"step": 26007, "train_loss": 3.156466484069824, "lr": 6.034210471696625e-05, "tps": 342673, "wall": 4974.0} {"step": 26008, "train_loss": 3.2525739669799805, "lr": 6.033325861252967e-05, "tps": 342359, "wall": 4978.8} {"step": 26009, "train_loss": 3.0604188442230225, "lr": 6.0324414316806544e-05, "tps": 342043, "wall": 4983.6} {"step": 26010, "train_loss": 3.103801727294922, "lr": 6.0315571829897074e-05, "tps": 341723, "wall": 4988.4} {"step": 26011, "train_loss": 3.191732883453369, "lr": 6.030673115190146e-05, "tps": 341409, "wall": 4993.2} {"step": 26012, "train_loss": 3.120847702026367, "lr": 6.0297892282919855e-05, "tps": 341098, "wall": 4997.9} {"step": 26013, "train_loss": 3.0580995082855225, "lr": 6.0289055223052326e-05, "tps": 340787, "wall": 5002.7} {"step": 26014, "train_loss": 3.1459314823150635, "lr": 6.0280219972399046e-05, "tps": 340477, "wall": 5007.4} {"step": 26015, "train_loss": 3.1668272018432617, "lr": 6.0271386531060095e-05, "tps": 340167, "wall": 5012.2} {"step": 26016, "train_loss": 3.1325902938842773, "lr": 6.026255489913547e-05, "tps": 339858, "wall": 5016.9} {"step": 26017, "train_loss": 3.1530675888061523, "lr": 6.02537250767253e-05, "tps": 339549, "wall": 5021.7} {"step": 26018, "train_loss": 3.074235200881958, "lr": 6.0244897063929576e-05, "tps": 339239, "wall": 5026.5} {"step": 26019, "train_loss": 3.106738328933716, "lr": 6.0236070860848246e-05, "tps": 338932, "wall": 5031.2} {"step": 26020, "train_loss": 3.151651382446289, "lr": 6.022724646758141e-05, "tps": 338625, "wall": 5036.0} {"step": 26021, "train_loss": 3.160313606262207, "lr": 6.021842388422896e-05, "tps": 338318, "wall": 5040.7} {"step": 26022, "train_loss": 3.195065975189209, "lr": 6.020960311089081e-05, "tps": 338008, "wall": 5045.6} {"step": 26023, "train_loss": 3.030768394470215, "lr": 6.0200784147666965e-05, "tps": 337703, "wall": 5050.3} {"step": 26024, "train_loss": 3.1908178329467773, "lr": 6.0191966994657254e-05, "tps": 337397, "wall": 5055.1} {"step": 26025, "train_loss": 2.981877088546753, "lr": 6.01831516519616e-05, "tps": 337092, "wall": 5059.9} {"step": 26026, "train_loss": 3.133970022201538, "lr": 6.0174338119679855e-05, "tps": 336788, "wall": 5064.6} {"step": 26027, "train_loss": 3.0938005447387695, "lr": 6.016552639791184e-05, "tps": 336484, "wall": 5069.4} {"step": 26028, "train_loss": 3.1127219200134277, "lr": 6.01567164867574e-05, "tps": 336181, "wall": 5074.2} {"step": 26029, "train_loss": 3.1421868801116943, "lr": 6.014790838631632e-05, "tps": 335878, "wall": 5078.9} {"step": 26030, "train_loss": 3.2100088596343994, "lr": 6.013910209668837e-05, "tps": 335575, "wall": 5083.7} {"step": 26031, "train_loss": 3.072474956512451, "lr": 6.013029761797333e-05, "tps": 335273, "wall": 5088.5} {"step": 26032, "train_loss": 3.1276063919067383, "lr": 6.012149495027094e-05, "tps": 334972, "wall": 5093.3} {"step": 26033, "train_loss": 3.213675022125244, "lr": 6.0112694093680877e-05, "tps": 334670, "wall": 5098.0} {"step": 26034, "train_loss": 3.058946132659912, "lr": 6.0103895048302886e-05, "tps": 334370, "wall": 5102.8} {"step": 26035, "train_loss": 3.151338577270508, "lr": 6.0095097814236636e-05, "tps": 334068, "wall": 5107.6} {"step": 26036, "train_loss": 3.1587061882019043, "lr": 6.008630239158172e-05, "tps": 333768, "wall": 5112.4} {"step": 26037, "train_loss": 3.130577564239502, "lr": 6.0077508780437866e-05, "tps": 333464, "wall": 5117.3} {"step": 26038, "train_loss": 3.1679368019104004, "lr": 6.006871698090463e-05, "tps": 333162, "wall": 5122.1} {"step": 26039, "train_loss": 3.0754847526550293, "lr": 6.0059926993081595e-05, "tps": 332861, "wall": 5126.9} {"step": 26040, "train_loss": 3.0517523288726807, "lr": 6.005113881706841e-05, "tps": 332562, "wall": 5131.7} {"step": 26041, "train_loss": 3.0807957649230957, "lr": 6.0042352452964545e-05, "tps": 332263, "wall": 5136.6} {"step": 26042, "train_loss": 3.0320510864257812, "lr": 6.003356790086956e-05, "tps": 331965, "wall": 5141.4} {"step": 26043, "train_loss": 3.130983591079712, "lr": 6.0024785160883e-05, "tps": 331668, "wall": 5146.2} {"step": 26044, "train_loss": 3.0368542671203613, "lr": 6.001600423310428e-05, "tps": 331371, "wall": 5151.0} {"step": 26045, "train_loss": 3.0851149559020996, "lr": 6.000722511763296e-05, "tps": 331072, "wall": 5155.8} {"step": 26046, "train_loss": 2.977261543273926, "lr": 5.999844781456845e-05, "tps": 330778, "wall": 5160.6} {"step": 26047, "train_loss": 3.1527152061462402, "lr": 5.998967232401015e-05, "tps": 330479, "wall": 5165.5} {"step": 26048, "train_loss": 3.074972152709961, "lr": 5.998089864605755e-05, "tps": 330185, "wall": 5170.3} {"step": 26049, "train_loss": 3.097358226776123, "lr": 5.9972126780809945e-05, "tps": 329886, "wall": 5175.2} {"step": 26050, "train_loss": 3.1154165267944336, "lr": 5.996335672836676e-05, "tps": 329590, "wall": 5180.0} {"step": 26051, "train_loss": 3.134620189666748, "lr": 5.9954588488827346e-05, "tps": 329295, "wall": 5184.8} {"step": 26052, "train_loss": 3.1003224849700928, "lr": 5.994582206229096e-05, "tps": 329003, "wall": 5189.6} {"step": 26053, "train_loss": 3.1528589725494385, "lr": 5.993705744885699e-05, "tps": 328712, "wall": 5194.4} {"step": 26054, "train_loss": 3.196732521057129, "lr": 5.9928294648624706e-05, "tps": 328421, "wall": 5199.2} {"step": 26055, "train_loss": 3.0832290649414062, "lr": 5.9919533661693314e-05, "tps": 328132, "wall": 5204.0} {"step": 26056, "train_loss": 3.139172077178955, "lr": 5.991077448816215e-05, "tps": 327841, "wall": 5208.8} {"step": 26057, "train_loss": 3.1125407218933105, "lr": 5.9902017128130386e-05, "tps": 327553, "wall": 5213.6} {"step": 26058, "train_loss": 3.1772654056549072, "lr": 5.989326158169721e-05, "tps": 327264, "wall": 5218.4} {"step": 26059, "train_loss": 3.138829231262207, "lr": 5.9884507848961856e-05, "tps": 326977, "wall": 5223.2} {"step": 26060, "train_loss": 3.092496871948242, "lr": 5.987575593002346e-05, "tps": 326687, "wall": 5228.0} {"step": 26061, "train_loss": 3.021515130996704, "lr": 5.9867005824981124e-05, "tps": 326400, "wall": 5232.8} {"step": 26062, "train_loss": 3.1008291244506836, "lr": 5.985825753393406e-05, "tps": 326114, "wall": 5237.6} {"step": 26063, "train_loss": 2.9793906211853027, "lr": 5.98495110569813e-05, "tps": 325829, "wall": 5242.4} {"step": 26064, "train_loss": 3.052854299545288, "lr": 5.984076639422191e-05, "tps": 325544, "wall": 5247.2} {"step": 26065, "train_loss": 3.1154210567474365, "lr": 5.9832023545755026e-05, "tps": 325260, "wall": 5252.0} {"step": 26066, "train_loss": 3.0945210456848145, "lr": 5.9823282511679604e-05, "tps": 324975, "wall": 5256.8} {"step": 26067, "train_loss": 3.061561107635498, "lr": 5.981454329209473e-05, "tps": 324692, "wall": 5261.6} {"step": 26068, "train_loss": 3.172389030456543, "lr": 5.9805805887099384e-05, "tps": 324408, "wall": 5266.4} {"step": 26069, "train_loss": 3.0980095863342285, "lr": 5.979707029679251e-05, "tps": 324126, "wall": 5271.2} {"step": 26070, "train_loss": 3.0544791221618652, "lr": 5.978833652127311e-05, "tps": 323845, "wall": 5275.9} {"step": 26071, "train_loss": 3.1027841567993164, "lr": 5.9779604560640114e-05, "tps": 323563, "wall": 5280.7} {"step": 26072, "train_loss": 3.0860719680786133, "lr": 5.9770874414992384e-05, "tps": 323278, "wall": 5285.6} {"step": 26073, "train_loss": 3.072578191757202, "lr": 5.976214608442889e-05, "tps": 322999, "wall": 5290.4} {"step": 26074, "train_loss": 3.094374179840088, "lr": 5.975341956904847e-05, "tps": 322719, "wall": 5295.2} {"step": 26075, "train_loss": 3.110776424407959, "lr": 5.974469486894996e-05, "tps": 322439, "wall": 5300.0} {"step": 26076, "train_loss": 3.07496976852417, "lr": 5.973597198423224e-05, "tps": 322160, "wall": 5304.7} {"step": 26077, "train_loss": 3.1558938026428223, "lr": 5.9727250914994104e-05, "tps": 321877, "wall": 5309.6} {"step": 26078, "train_loss": 3.122488260269165, "lr": 5.97185316613343e-05, "tps": 321597, "wall": 5314.4} {"step": 26079, "train_loss": 3.1017191410064697, "lr": 5.970981422335169e-05, "tps": 321319, "wall": 5319.2} {"step": 26080, "train_loss": 3.040336847305298, "lr": 5.9701098601144966e-05, "tps": 321041, "wall": 5324.1} {"step": 26081, "train_loss": 3.0419106483459473, "lr": 5.9692384794812825e-05, "tps": 320766, "wall": 5328.8} {"step": 26082, "train_loss": 2.9662270545959473, "lr": 5.968367280445406e-05, "tps": 320489, "wall": 5333.6} {"step": 26083, "train_loss": 3.135133743286133, "lr": 5.967496263016734e-05, "tps": 320214, "wall": 5338.4} {"step": 26084, "train_loss": 3.137936592102051, "lr": 5.966625427205126e-05, "tps": 319939, "wall": 5343.2} {"step": 26085, "train_loss": 3.043638229370117, "lr": 5.965754773020458e-05, "tps": 319661, "wall": 5348.1} {"step": 26086, "train_loss": 3.136896848678589, "lr": 5.9648843004725815e-05, "tps": 319387, "wall": 5352.9} {"step": 26087, "train_loss": 3.174586772918701, "lr": 5.964014009571368e-05, "tps": 319113, "wall": 5357.7} {"step": 26088, "train_loss": 3.055731773376465, "lr": 5.963143900326671e-05, "tps": 318841, "wall": 5362.4} {"step": 26089, "train_loss": 3.1166276931762695, "lr": 5.962273972748344e-05, "tps": 318567, "wall": 5367.3} {"step": 26090, "train_loss": 3.2132954597473145, "lr": 5.96140422684625e-05, "tps": 318292, "wall": 5372.1} {"step": 26091, "train_loss": 3.0947113037109375, "lr": 5.960534662630237e-05, "tps": 318013, "wall": 5377.0} {"step": 26092, "train_loss": 3.1782593727111816, "lr": 5.959665280110148e-05, "tps": 317732, "wall": 5382.0} {"step": 26093, "train_loss": 3.1087725162506104, "lr": 5.958796079295844e-05, "tps": 317452, "wall": 5386.9} {"step": 26094, "train_loss": 3.1523666381835938, "lr": 5.957927060197166e-05, "tps": 317174, "wall": 5391.9} {"step": 26095, "train_loss": 3.1476621627807617, "lr": 5.957058222823956e-05, "tps": 316899, "wall": 5396.7} {"step": 26096, "train_loss": 3.0813071727752686, "lr": 5.956189567186059e-05, "tps": 316625, "wall": 5401.6} {"step": 26097, "train_loss": 3.0982015132904053, "lr": 5.9553210932933166e-05, "tps": 316349, "wall": 5406.6} {"step": 26098, "train_loss": 3.187337636947632, "lr": 5.95445280115556e-05, "tps": 316073, "wall": 5411.5} {"step": 26099, "train_loss": 3.0906996726989746, "lr": 5.953584690782633e-05, "tps": 315797, "wall": 5416.4} {"step": 26100, "train_loss": 3.1345834732055664, "lr": 5.952716762184369e-05, "tps": 315523, "wall": 5421.3} {"step": 26101, "train_loss": 3.102579116821289, "lr": 5.951849015370594e-05, "tps": 315246, "wall": 5426.3} {"step": 26102, "train_loss": 2.926337718963623, "lr": 5.9509814503511426e-05, "tps": 314973, "wall": 5431.2} {"step": 26103, "train_loss": 3.068291425704956, "lr": 5.9501140671358403e-05, "tps": 314699, "wall": 5436.1} {"step": 26104, "train_loss": 3.084010362625122, "lr": 5.9492468657345176e-05, "tps": 314425, "wall": 5441.1} {"step": 26105, "train_loss": 3.1166391372680664, "lr": 5.9483798461569926e-05, "tps": 314153, "wall": 5446.0} {"step": 26106, "train_loss": 3.057795524597168, "lr": 5.947513008413088e-05, "tps": 313882, "wall": 5450.9} {"step": 26107, "train_loss": 3.076051712036133, "lr": 5.9466463525126284e-05, "tps": 313612, "wall": 5455.8} {"step": 26108, "train_loss": 2.9936208724975586, "lr": 5.945779878465424e-05, "tps": 313342, "wall": 5460.7} {"step": 26109, "train_loss": 3.020512342453003, "lr": 5.944913586281292e-05, "tps": 313068, "wall": 5465.7} {"step": 26110, "train_loss": 3.0889892578125, "lr": 5.944047475970051e-05, "tps": 312804, "wall": 5470.5} {"step": 26111, "train_loss": 3.110687732696533, "lr": 5.94318154754151e-05, "tps": 312540, "wall": 5475.4} {"step": 26112, "train_loss": 3.048373222351074, "lr": 5.942315801005474e-05, "tps": 312273, "wall": 5480.3} {"step": 26113, "train_loss": 3.0390844345092773, "lr": 5.941450236371754e-05, "tps": 312010, "wall": 5485.1} {"step": 26114, "train_loss": 3.058126926422119, "lr": 5.940584853650155e-05, "tps": 311749, "wall": 5489.9} {"step": 26115, "train_loss": 3.1802210807800293, "lr": 5.9397196528504774e-05, "tps": 311485, "wall": 5494.8} {"step": 26116, "train_loss": 3.2110185623168945, "lr": 5.9388546339825276e-05, "tps": 311217, "wall": 5499.7} {"step": 26117, "train_loss": 3.1535205841064453, "lr": 5.9379897970561016e-05, "tps": 310951, "wall": 5504.6} {"step": 26118, "train_loss": 3.070723533630371, "lr": 5.937125142080992e-05, "tps": 310685, "wall": 5509.5} {"step": 26119, "train_loss": 3.0405375957489014, "lr": 5.936260669067002e-05, "tps": 310419, "wall": 5514.5} {"step": 26120, "train_loss": 3.049516439437866, "lr": 5.9353963780239155e-05, "tps": 310156, "wall": 5519.4} {"step": 26121, "train_loss": 3.1649484634399414, "lr": 5.9345322689615326e-05, "tps": 309885, "wall": 5524.4} {"step": 26122, "train_loss": 3.1368441581726074, "lr": 5.9336683418896354e-05, "tps": 309621, "wall": 5529.3} {"step": 26123, "train_loss": 3.201594352722168, "lr": 5.9328045968180114e-05, "tps": 309353, "wall": 5534.3} {"step": 26124, "train_loss": 3.130115509033203, "lr": 5.931941033756448e-05, "tps": 309086, "wall": 5539.3} {"step": 26125, "train_loss": 3.2017860412597656, "lr": 5.931077652714727e-05, "tps": 308820, "wall": 5544.3} {"step": 26126, "train_loss": 3.1858654022216797, "lr": 5.930214453702623e-05, "tps": 308555, "wall": 5549.3} {"step": 26127, "train_loss": 3.154435634613037, "lr": 5.929351436729923e-05, "tps": 308290, "wall": 5554.3} {"step": 26128, "train_loss": 3.1220757961273193, "lr": 5.9284886018064e-05, "tps": 308026, "wall": 5559.2} {"step": 26129, "train_loss": 3.0411369800567627, "lr": 5.927625948941822e-05, "tps": 307762, "wall": 5564.2} {"step": 26130, "train_loss": 3.077542304992676, "lr": 5.9267634781459723e-05, "tps": 307498, "wall": 5569.2} {"step": 26131, "train_loss": 3.0475354194641113, "lr": 5.925901189428616e-05, "tps": 307237, "wall": 5574.1} {"step": 26132, "train_loss": 3.2616987228393555, "lr": 5.925039082799515e-05, "tps": 306980, "wall": 5579.0} {"step": 26133, "train_loss": 3.121699333190918, "lr": 5.924177158268447e-05, "tps": 306716, "wall": 5584.0} {"step": 26134, "train_loss": 3.1182913780212402, "lr": 5.923315415845168e-05, "tps": 306458, "wall": 5589.0} {"step": 26135, "train_loss": 3.2284319400787354, "lr": 5.922453855539437e-05, "tps": 306201, "wall": 5593.9} {"step": 26136, "train_loss": 3.0895493030548096, "lr": 5.921592477361024e-05, "tps": 305946, "wall": 5598.7} {"step": 26137, "train_loss": 3.1340043544769287, "lr": 5.9207312813196804e-05, "tps": 305694, "wall": 5603.6} {"step": 26138, "train_loss": 3.122070550918579, "lr": 5.919870267425161e-05, "tps": 305443, "wall": 5608.4} {"step": 26139, "train_loss": 3.0202829837799072, "lr": 5.919009435687222e-05, "tps": 305194, "wall": 5613.2} {"step": 26140, "train_loss": 3.092475652694702, "lr": 5.918148786115612e-05, "tps": 304944, "wall": 5618.0} {"step": 26141, "train_loss": 3.084988832473755, "lr": 5.9172883187200845e-05, "tps": 304696, "wall": 5622.8} {"step": 26142, "train_loss": 3.126025676727295, "lr": 5.916428033510386e-05, "tps": 304445, "wall": 5627.6} {"step": 26143, "train_loss": 3.0153603553771973, "lr": 5.9155679304962574e-05, "tps": 304196, "wall": 5632.5} {"step": 26144, "train_loss": 3.1116976737976074, "lr": 5.9147080096874494e-05, "tps": 303947, "wall": 5637.3} {"step": 26145, "train_loss": 3.1922366619110107, "lr": 5.9138482710937006e-05, "tps": 303696, "wall": 5642.2} {"step": 26146, "train_loss": 3.0921456813812256, "lr": 5.912988714724743e-05, "tps": 303443, "wall": 5647.1} {"step": 26147, "train_loss": 3.0915985107421875, "lr": 5.912129340590322e-05, "tps": 303196, "wall": 5651.9} {"step": 26148, "train_loss": 3.1109814643859863, "lr": 5.9112701487001746e-05, "tps": 302947, "wall": 5656.7} {"step": 26149, "train_loss": 3.197814464569092, "lr": 5.910411139064022e-05, "tps": 302700, "wall": 5661.6} {"step": 26150, "train_loss": 3.0615005493164062, "lr": 5.9095523116916066e-05, "tps": 302453, "wall": 5666.4} {"step": 26151, "train_loss": 3.098379135131836, "lr": 5.908693666592654e-05, "tps": 302207, "wall": 5671.3} {"step": 26152, "train_loss": 3.1128110885620117, "lr": 5.907835203776887e-05, "tps": 301961, "wall": 5676.1} {"step": 26153, "train_loss": 3.130728006362915, "lr": 5.906976923254035e-05, "tps": 301716, "wall": 5680.9} {"step": 26154, "train_loss": 3.1447644233703613, "lr": 5.906118825033819e-05, "tps": 301471, "wall": 5685.8} {"step": 26155, "train_loss": 3.1287589073181152, "lr": 5.905260909125959e-05, "tps": 301220, "wall": 5690.7} {"step": 26156, "train_loss": 3.1159653663635254, "lr": 5.9044031755401754e-05, "tps": 300935, "wall": 5696.3} {"step": 26157, "train_loss": 3.1700148582458496, "lr": 5.9035456242861795e-05, "tps": 300689, "wall": 5701.2} {"step": 26158, "train_loss": 3.10628080368042, "lr": 5.902688255373694e-05, "tps": 300438, "wall": 5706.2} {"step": 26159, "train_loss": 3.014042615890503, "lr": 5.901831068812429e-05, "tps": 300194, "wall": 5711.0} {"step": 26160, "train_loss": 3.1495885848999023, "lr": 5.900974064612085e-05, "tps": 299949, "wall": 5715.9} {"step": 26161, "train_loss": 3.0652594566345215, "lr": 5.900117242782382e-05, "tps": 299705, "wall": 5720.8} {"step": 26162, "train_loss": 3.1927855014801025, "lr": 5.899260603333024e-05, "tps": 299463, "wall": 5725.6} {"step": 26163, "train_loss": 3.096827507019043, "lr": 5.898404146273708e-05, "tps": 299220, "wall": 5730.5} {"step": 26164, "train_loss": 3.1187334060668945, "lr": 5.897547871614144e-05, "tps": 298979, "wall": 5735.3} {"step": 26165, "train_loss": 3.114607334136963, "lr": 5.89669177936403e-05, "tps": 298737, "wall": 5740.2} {"step": 26166, "train_loss": 3.012773036956787, "lr": 5.895835869533059e-05, "tps": 298495, "wall": 5745.1} {"step": 26167, "train_loss": 3.0694146156311035, "lr": 5.8949801421309335e-05, "tps": 298254, "wall": 5749.9} {"step": 26168, "train_loss": 3.0308384895324707, "lr": 5.894124597167344e-05, "tps": 298015, "wall": 5754.8} {"step": 26169, "train_loss": 3.0933048725128174, "lr": 5.8932692346519814e-05, "tps": 297777, "wall": 5759.6} {"step": 26170, "train_loss": 2.9856081008911133, "lr": 5.892414054594536e-05, "tps": 297533, "wall": 5764.5} {"step": 26171, "train_loss": 3.1372315883636475, "lr": 5.891559057004696e-05, "tps": 297296, "wall": 5769.4} {"step": 26172, "train_loss": 3.0459742546081543, "lr": 5.890704241892147e-05, "tps": 297058, "wall": 5774.2} {"step": 26173, "train_loss": 3.141341209411621, "lr": 5.889849609266571e-05, "tps": 296820, "wall": 5779.1} {"step": 26174, "train_loss": 3.1593332290649414, "lr": 5.888995159137652e-05, "tps": 296583, "wall": 5783.9} {"step": 26175, "train_loss": 3.048879623413086, "lr": 5.8881408915150636e-05, "tps": 296346, "wall": 5788.7} {"step": 26176, "train_loss": 3.094586133956909, "lr": 5.8872868064084916e-05, "tps": 296109, "wall": 5793.6} {"step": 26177, "train_loss": 3.0821220874786377, "lr": 5.8864329038276014e-05, "tps": 295872, "wall": 5798.5} {"step": 26178, "train_loss": 3.099804162979126, "lr": 5.885579183782074e-05, "tps": 295634, "wall": 5803.3} {"step": 26179, "train_loss": 3.0553524494171143, "lr": 5.884725646281578e-05, "tps": 295398, "wall": 5808.2} {"step": 26180, "train_loss": 3.0110116004943848, "lr": 5.883872291335777e-05, "tps": 295164, "wall": 5813.0} {"step": 26181, "train_loss": 3.1147332191467285, "lr": 5.883019118954348e-05, "tps": 294929, "wall": 5817.9} {"step": 26182, "train_loss": 3.0363149642944336, "lr": 5.882166129146951e-05, "tps": 294696, "wall": 5822.7} {"step": 26183, "train_loss": 3.1172358989715576, "lr": 5.881313321923242e-05, "tps": 294457, "wall": 5827.6} {"step": 26184, "train_loss": 3.011322021484375, "lr": 5.880460697292893e-05, "tps": 294221, "wall": 5832.5} {"step": 26185, "train_loss": 3.034838914871216, "lr": 5.879608255265557e-05, "tps": 293949, "wall": 5838.2} {"step": 26186, "train_loss": 3.171208143234253, "lr": 5.878755995850887e-05, "tps": 293715, "wall": 5843.0} {"step": 26187, "train_loss": 3.080232858657837, "lr": 5.877903919058545e-05, "tps": 293482, "wall": 5847.9} {"step": 26188, "train_loss": 2.9907889366149902, "lr": 5.877052024898179e-05, "tps": 293250, "wall": 5852.8} {"step": 26189, "train_loss": 3.2217023372650146, "lr": 5.876200313379436e-05, "tps": 293018, "wall": 5857.6} {"step": 26190, "train_loss": 3.1658518314361572, "lr": 5.8753487845119714e-05, "tps": 292786, "wall": 5862.5} {"step": 26191, "train_loss": 3.0818450450897217, "lr": 5.874497438305431e-05, "tps": 292556, "wall": 5867.3} {"step": 26192, "train_loss": 3.0404319763183594, "lr": 5.873646274769449e-05, "tps": 292327, "wall": 5872.1} {"step": 26193, "train_loss": 3.0975046157836914, "lr": 5.872795293913681e-05, "tps": 292097, "wall": 5877.0} {"step": 26194, "train_loss": 3.121281385421753, "lr": 5.8719444957477545e-05, "tps": 291867, "wall": 5881.8} {"step": 26195, "train_loss": 3.123009204864502, "lr": 5.871093880281316e-05, "tps": 291636, "wall": 5886.7} {"step": 26196, "train_loss": 3.1460022926330566, "lr": 5.870243447524001e-05, "tps": 291407, "wall": 5891.6} {"step": 26197, "train_loss": 3.1583948135375977, "lr": 5.8693931974854375e-05, "tps": 291180, "wall": 5896.4} {"step": 26198, "train_loss": 3.0580151081085205, "lr": 5.8685431301752625e-05, "tps": 290951, "wall": 5901.2} {"step": 26199, "train_loss": 3.2274012565612793, "lr": 5.867693245603104e-05, "tps": 290723, "wall": 5906.1} {"step": 26200, "train_loss": 3.1639766693115234, "lr": 5.866843543778585e-05, "tps": 290496, "wall": 5910.9} {"step": 26201, "train_loss": 3.2007651329040527, "lr": 5.8659940247113385e-05, "tps": 290269, "wall": 5915.8} {"step": 26202, "train_loss": 3.084545135498047, "lr": 5.865144688410986e-05, "tps": 290041, "wall": 5920.7} {"step": 26203, "train_loss": 3.1481733322143555, "lr": 5.864295534887144e-05, "tps": 289814, "wall": 5925.5} {"step": 26204, "train_loss": 3.162827253341675, "lr": 5.8634465641494385e-05, "tps": 289562, "wall": 5930.9} {"step": 26205, "train_loss": 3.162504196166992, "lr": 5.8625977762074826e-05, "tps": 289306, "wall": 5936.4} {"step": 26206, "train_loss": 3.127453088760376, "lr": 5.861749171070887e-05, "tps": 289079, "wall": 5941.3} {"step": 26207, "train_loss": 3.082982063293457, "lr": 5.8609007487492764e-05, "tps": 288846, "wall": 5946.3} {"step": 26208, "train_loss": 3.1421921253204346, "lr": 5.860052509252254e-05, "tps": 288619, "wall": 5951.2} {"step": 26209, "train_loss": 3.0784354209899902, "lr": 5.8592044525894254e-05, "tps": 288393, "wall": 5956.1} {"step": 26210, "train_loss": 3.0333375930786133, "lr": 5.858356578770407e-05, "tps": 288168, "wall": 5961.0} {"step": 26211, "train_loss": 3.0984249114990234, "lr": 5.8575088878047955e-05, "tps": 287945, "wall": 5965.8} {"step": 26212, "train_loss": 3.093930721282959, "lr": 5.8566613797021986e-05, "tps": 287721, "wall": 5970.7} {"step": 26213, "train_loss": 3.13006329536438, "lr": 5.855814054472214e-05, "tps": 287497, "wall": 5975.6} {"step": 26214, "train_loss": 3.1437013149261475, "lr": 5.85496691212444e-05, "tps": 287274, "wall": 5980.4} {"step": 26215, "train_loss": 3.1024985313415527, "lr": 5.8541199526684767e-05, "tps": 287052, "wall": 5985.3} {"step": 26216, "train_loss": 3.1045618057250977, "lr": 5.853273176113919e-05, "tps": 286829, "wall": 5990.2} {"step": 26217, "train_loss": 3.1423869132995605, "lr": 5.852426582470351e-05, "tps": 286607, "wall": 5995.0} {"step": 26218, "train_loss": 3.1425769329071045, "lr": 5.8515801717473704e-05, "tps": 286385, "wall": 5999.9} {"step": 26219, "train_loss": 3.049175500869751, "lr": 5.850733943954559e-05, "tps": 286151, "wall": 6005.1} {"step": 26220, "train_loss": 3.0780019760131836, "lr": 5.8498878991015114e-05, "tps": 285924, "wall": 6010.0} {"step": 26221, "train_loss": 3.1134047508239746, "lr": 5.849042037197808e-05, "tps": 285701, "wall": 6015.0} {"step": 26222, "train_loss": 3.097151041030884, "lr": 5.8481963582530266e-05, "tps": 285480, "wall": 6019.9} {"step": 26223, "train_loss": 3.1435561180114746, "lr": 5.847350862276753e-05, "tps": 285258, "wall": 6024.8} {"step": 26224, "train_loss": 3.136239767074585, "lr": 5.8465055492785636e-05, "tps": 285034, "wall": 6029.7} {"step": 26225, "train_loss": 3.146470546722412, "lr": 5.84566041926803e-05, "tps": 284813, "wall": 6034.6} {"step": 26226, "train_loss": 3.1018993854522705, "lr": 5.844815472254731e-05, "tps": 284593, "wall": 6039.5} {"step": 26227, "train_loss": 3.1037330627441406, "lr": 5.843970708248239e-05, "tps": 284374, "wall": 6044.4} {"step": 26228, "train_loss": 3.318605899810791, "lr": 5.843126127258116e-05, "tps": 284155, "wall": 6049.3} {"step": 26229, "train_loss": 3.0441970825195312, "lr": 5.842281729293937e-05, "tps": 283936, "wall": 6054.2} {"step": 26230, "train_loss": 3.1091318130493164, "lr": 5.8414375143652654e-05, "tps": 283717, "wall": 6059.1} {"step": 26231, "train_loss": 3.046349048614502, "lr": 5.84059348248166e-05, "tps": 283494, "wall": 6064.1} {"step": 26232, "train_loss": 3.0975565910339355, "lr": 5.83974963365269e-05, "tps": 283278, "wall": 6069.0} {"step": 26233, "train_loss": 2.986440896987915, "lr": 5.8389059678879087e-05, "tps": 283060, "wall": 6073.9} {"step": 26234, "train_loss": 3.0667190551757812, "lr": 5.838062485196874e-05, "tps": 282842, "wall": 6078.8} {"step": 26235, "train_loss": 3.122272491455078, "lr": 5.837219185589143e-05, "tps": 282625, "wall": 6083.7} {"step": 26236, "train_loss": 3.1121296882629395, "lr": 5.836376069074265e-05, "tps": 282409, "wall": 6088.6} {"step": 26237, "train_loss": 3.1505768299102783, "lr": 5.835533135661797e-05, "tps": 282192, "wall": 6093.5} {"step": 26238, "train_loss": 3.1569318771362305, "lr": 5.8346903853612845e-05, "tps": 281977, "wall": 6098.4} {"step": 26239, "train_loss": 3.0309059619903564, "lr": 5.83384781818227e-05, "tps": 281762, "wall": 6103.3} {"step": 26240, "train_loss": 3.1065025329589844, "lr": 5.8330054341343056e-05, "tps": 281546, "wall": 6108.1} {"step": 26241, "train_loss": 3.1056528091430664, "lr": 5.8321632332269295e-05, "tps": 281332, "wall": 6113.0} {"step": 26242, "train_loss": 3.137424945831299, "lr": 5.831321215469678e-05, "tps": 281118, "wall": 6117.9} {"step": 26243, "train_loss": 3.123065710067749, "lr": 5.8304793808721016e-05, "tps": 280904, "wall": 6122.8} {"step": 26244, "train_loss": 3.1391351222991943, "lr": 5.8296377294437275e-05, "tps": 280688, "wall": 6127.8} {"step": 26245, "train_loss": 3.0862722396850586, "lr": 5.828796261194088e-05, "tps": 280474, "wall": 6132.7} {"step": 26246, "train_loss": 3.22021222114563, "lr": 5.827954976132724e-05, "tps": 280261, "wall": 6137.6} {"step": 26247, "train_loss": 3.2290258407592773, "lr": 5.827113874269161e-05, "tps": 280049, "wall": 6142.5} {"step": 26248, "train_loss": 3.209346055984497, "lr": 5.8262729556129225e-05, "tps": 279835, "wall": 6147.4} {"step": 26249, "train_loss": 3.16335129737854, "lr": 5.8254322201735434e-05, "tps": 279622, "wall": 6152.3} {"step": 26250, "train_loss": 3.068141460418701, "lr": 5.824591667960543e-05, "tps": 279410, "wall": 6157.2} {"step": 26251, "train_loss": 3.179053544998169, "lr": 5.8237512989834387e-05, "tps": 279197, "wall": 6162.1} {"step": 26252, "train_loss": 3.1718430519104004, "lr": 5.822911113251759e-05, "tps": 278986, "wall": 6167.0} {"step": 26253, "train_loss": 3.13454270362854, "lr": 5.8220711107750146e-05, "tps": 278775, "wall": 6171.9} {"step": 26254, "train_loss": 3.077788829803467, "lr": 5.8212312915627266e-05, "tps": 278565, "wall": 6176.8} {"step": 26255, "train_loss": 3.0956740379333496, "lr": 5.8203916556244054e-05, "tps": 278355, "wall": 6181.7} {"step": 26256, "train_loss": 3.0469789505004883, "lr": 5.8195522029695595e-05, "tps": 278144, "wall": 6186.6} {"step": 26257, "train_loss": 3.1041409969329834, "lr": 5.818712933607706e-05, "tps": 277934, "wall": 6191.5} {"step": 26258, "train_loss": 3.03482723236084, "lr": 5.817873847548347e-05, "tps": 277726, "wall": 6196.4} {"step": 26259, "train_loss": 3.1916747093200684, "lr": 5.817034944800984e-05, "tps": 277517, "wall": 6201.3} {"step": 26260, "train_loss": 3.1018035411834717, "lr": 5.8161962253751304e-05, "tps": 277307, "wall": 6206.2} {"step": 26261, "train_loss": 3.115788459777832, "lr": 5.81535768928028e-05, "tps": 277098, "wall": 6211.2} {"step": 26262, "train_loss": 3.145681142807007, "lr": 5.81451933652593e-05, "tps": 276891, "wall": 6216.1} {"step": 26263, "train_loss": 3.0378332138061523, "lr": 5.813681167121583e-05, "tps": 276683, "wall": 6221.0} {"step": 26264, "train_loss": 3.0847277641296387, "lr": 5.812843181076733e-05, "tps": 276475, "wall": 6225.9} {"step": 26265, "train_loss": 2.9639930725097656, "lr": 5.812005378400868e-05, "tps": 276266, "wall": 6230.8} {"step": 26266, "train_loss": 3.112351894378662, "lr": 5.811167759103483e-05, "tps": 276059, "wall": 6235.7} {"step": 26267, "train_loss": 3.0951943397521973, "lr": 5.810330323194068e-05, "tps": 275853, "wall": 6240.6} {"step": 26268, "train_loss": 2.9773623943328857, "lr": 5.809493070682103e-05, "tps": 275644, "wall": 6245.6} {"step": 26269, "train_loss": 3.0109286308288574, "lr": 5.808656001577079e-05, "tps": 275437, "wall": 6250.5} {"step": 26270, "train_loss": 3.1857776641845703, "lr": 5.807819115888475e-05, "tps": 275231, "wall": 6255.4} {"step": 26271, "train_loss": 3.046658992767334, "lr": 5.8069824136257714e-05, "tps": 275026, "wall": 6260.3} {"step": 26272, "train_loss": 3.105465888977051, "lr": 5.806145894798448e-05, "tps": 274821, "wall": 6265.2} {"step": 26273, "train_loss": 3.1472854614257812, "lr": 5.805309559415978e-05, "tps": 274616, "wall": 6270.2} {"step": 26274, "train_loss": 3.1397135257720947, "lr": 5.804473407487839e-05, "tps": 274412, "wall": 6275.1} {"step": 26275, "train_loss": 3.145291805267334, "lr": 5.803637439023504e-05, "tps": 274207, "wall": 6280.0} {"step": 26276, "train_loss": 3.1800267696380615, "lr": 5.8028016540324334e-05, "tps": 274003, "wall": 6284.9} {"step": 26277, "train_loss": 3.121127128601074, "lr": 5.801966052524109e-05, "tps": 273799, "wall": 6289.8} {"step": 26278, "train_loss": 3.1733856201171875, "lr": 5.8011306345079875e-05, "tps": 273596, "wall": 6294.8} {"step": 26279, "train_loss": 3.0577099323272705, "lr": 5.800295399993531e-05, "tps": 273393, "wall": 6299.7} {"step": 26280, "train_loss": 3.200441360473633, "lr": 5.799460348990209e-05, "tps": 273187, "wall": 6304.7} {"step": 26281, "train_loss": 3.0536060333251953, "lr": 5.7986254815074745e-05, "tps": 272985, "wall": 6309.6} {"step": 26282, "train_loss": 3.0680348873138428, "lr": 5.797790797554786e-05, "tps": 272783, "wall": 6314.5} {"step": 26283, "train_loss": 3.072049379348755, "lr": 5.7969562971416026e-05, "tps": 272582, "wall": 6319.4} {"step": 26284, "train_loss": 3.1318912506103516, "lr": 5.796121980277375e-05, "tps": 272381, "wall": 6324.3} {"step": 26285, "train_loss": 3.036320686340332, "lr": 5.79528784697155e-05, "tps": 272178, "wall": 6329.2} {"step": 26286, "train_loss": 3.1251368522644043, "lr": 5.794453897233584e-05, "tps": 271976, "wall": 6334.2} {"step": 26287, "train_loss": 3.080312728881836, "lr": 5.793620131072923e-05, "tps": 271776, "wall": 6339.1} {"step": 26288, "train_loss": 3.087378740310669, "lr": 5.792786548499004e-05, "tps": 271576, "wall": 6344.0} {"step": 26289, "train_loss": 3.137883186340332, "lr": 5.791953149521281e-05, "tps": 271377, "wall": 6348.9} {"step": 26290, "train_loss": 3.129608631134033, "lr": 5.791119934149185e-05, "tps": 271177, "wall": 6353.8} {"step": 26291, "train_loss": 3.082030773162842, "lr": 5.7902869023921646e-05, "tps": 270977, "wall": 6358.7} {"step": 26292, "train_loss": 3.0504636764526367, "lr": 5.789454054259649e-05, "tps": 270778, "wall": 6363.7} {"step": 26293, "train_loss": 3.1237106323242188, "lr": 5.788621389761072e-05, "tps": 270578, "wall": 6368.6} {"step": 26294, "train_loss": 3.116490364074707, "lr": 5.787788908905873e-05, "tps": 270381, "wall": 6373.5} {"step": 26295, "train_loss": 3.0637729167938232, "lr": 5.786956611703478e-05, "tps": 270182, "wall": 6378.4} {"step": 26296, "train_loss": 3.0966691970825195, "lr": 5.786124498163311e-05, "tps": 269985, "wall": 6383.3} {"step": 26297, "train_loss": 3.1092844009399414, "lr": 5.785292568294809e-05, "tps": 269789, "wall": 6388.2} {"step": 26298, "train_loss": 3.085261821746826, "lr": 5.784460822107387e-05, "tps": 269575, "wall": 6393.5} {"step": 26299, "train_loss": 3.0352745056152344, "lr": 5.7836292596104667e-05, "tps": 269379, "wall": 6398.4} {"step": 26300, "train_loss": 3.103684663772583, "lr": 5.782797880813478e-05, "tps": 269183, "wall": 6403.3} {"step": 26301, "train_loss": 3.17740535736084, "lr": 5.7819666857258293e-05, "tps": 268987, "wall": 6408.2} {"step": 26302, "train_loss": 2.9618988037109375, "lr": 5.781135674356937e-05, "tps": 268792, "wall": 6413.1} {"step": 26303, "train_loss": 3.1014068126678467, "lr": 5.780304846716221e-05, "tps": 268595, "wall": 6418.0} {"step": 26304, "train_loss": 3.209697961807251, "lr": 5.779474202813089e-05, "tps": 268400, "wall": 6423.0} {"step": 26305, "train_loss": 3.092273712158203, "lr": 5.778643742656946e-05, "tps": 268190, "wall": 6428.2} {"step": 26306, "train_loss": 3.05080509185791, "lr": 5.7778134662572104e-05, "tps": 267993, "wall": 6433.2} {"step": 26307, "train_loss": 3.171149730682373, "lr": 5.776983373623276e-05, "tps": 267799, "wall": 6438.1} {"step": 26308, "train_loss": 3.1258695125579834, "lr": 5.776153464764556e-05, "tps": 267606, "wall": 6443.0} {"step": 26309, "train_loss": 3.073415756225586, "lr": 5.7753237396904456e-05, "tps": 267412, "wall": 6447.9} {"step": 26310, "train_loss": 3.0970375537872314, "lr": 5.7744941984103426e-05, "tps": 267218, "wall": 6452.8} {"step": 26311, "train_loss": 3.028956413269043, "lr": 5.7736648409336515e-05, "tps": 267022, "wall": 6457.8} {"step": 26312, "train_loss": 3.143845558166504, "lr": 5.7728356672697616e-05, "tps": 266823, "wall": 6462.9} {"step": 26313, "train_loss": 3.0528106689453125, "lr": 5.7720066774280654e-05, "tps": 266631, "wall": 6467.8} {"step": 26314, "train_loss": 3.127141237258911, "lr": 5.771177871417959e-05, "tps": 266431, "wall": 6472.9} {"step": 26315, "train_loss": 3.208131790161133, "lr": 5.7703492492488265e-05, "tps": 266239, "wall": 6477.8} {"step": 26316, "train_loss": 3.052912950515747, "lr": 5.769520810930051e-05, "tps": 266048, "wall": 6482.7} {"step": 26317, "train_loss": 3.181476354598999, "lr": 5.768692556471028e-05, "tps": 265856, "wall": 6487.6} {"step": 26318, "train_loss": 3.160614252090454, "lr": 5.7678644858811314e-05, "tps": 265665, "wall": 6492.5} {"step": 26319, "train_loss": 3.035858631134033, "lr": 5.767036599169743e-05, "tps": 265469, "wall": 6497.6} {"step": 26320, "train_loss": 3.2301883697509766, "lr": 5.766208896346245e-05, "tps": 265273, "wall": 6502.6} {"step": 26321, "train_loss": 3.1379010677337646, "lr": 5.76538137742001e-05, "tps": 265075, "wall": 6507.7} {"step": 26322, "train_loss": 3.163158416748047, "lr": 5.76455404240041e-05, "tps": 264884, "wall": 6512.7} {"step": 26323, "train_loss": 3.1662864685058594, "lr": 5.763726891296823e-05, "tps": 264680, "wall": 6517.9} {"step": 26324, "train_loss": 3.0739970207214355, "lr": 5.762899924118618e-05, "tps": 264479, "wall": 6523.1} {"step": 26325, "train_loss": 3.131908416748047, "lr": 5.762073140875155e-05, "tps": 264280, "wall": 6528.3} {"step": 26326, "train_loss": 3.1943509578704834, "lr": 5.761246541575811e-05, "tps": 264082, "wall": 6533.4} {"step": 26327, "train_loss": 3.090818166732788, "lr": 5.7604201262299415e-05, "tps": 263884, "wall": 6538.6} {"step": 26328, "train_loss": 3.082615852355957, "lr": 5.759593894846914e-05, "tps": 263683, "wall": 6543.8} {"step": 26329, "train_loss": 3.2479665279388428, "lr": 5.758767847436085e-05, "tps": 263482, "wall": 6549.1} {"step": 26330, "train_loss": 3.0791282653808594, "lr": 5.757941984006809e-05, "tps": 263287, "wall": 6554.2} {"step": 26331, "train_loss": 3.1989145278930664, "lr": 5.7571163045684506e-05, "tps": 263091, "wall": 6559.3} {"step": 26332, "train_loss": 3.1778311729431152, "lr": 5.7562908091303544e-05, "tps": 262895, "wall": 6564.4} {"step": 26333, "train_loss": 3.089677572250366, "lr": 5.755465497701874e-05, "tps": 262698, "wall": 6569.6} {"step": 26334, "train_loss": 3.044121742248535, "lr": 5.754640370292361e-05, "tps": 262502, "wall": 6574.7} {"step": 26335, "train_loss": 3.0364248752593994, "lr": 5.75381542691116e-05, "tps": 262307, "wall": 6579.9} {"step": 26336, "train_loss": 3.062011957168579, "lr": 5.752990667567615e-05, "tps": 262113, "wall": 6585.0} {"step": 26337, "train_loss": 3.1268811225891113, "lr": 5.752166092271074e-05, "tps": 261927, "wall": 6589.9} {"step": 26338, "train_loss": 3.0797226428985596, "lr": 5.7513417010308734e-05, "tps": 261731, "wall": 6595.1} {"step": 26339, "train_loss": 3.1417746543884277, "lr": 5.750517493856351e-05, "tps": 261547, "wall": 6600.0} {"step": 26340, "train_loss": 2.976529121398926, "lr": 5.7496934707568486e-05, "tps": 261360, "wall": 6605.0} {"step": 26341, "train_loss": 3.0823867321014404, "lr": 5.748869631741696e-05, "tps": 261176, "wall": 6609.9} {"step": 26342, "train_loss": 3.2134573459625244, "lr": 5.748045976820227e-05, "tps": 260993, "wall": 6614.8} {"step": 26343, "train_loss": 3.22139310836792, "lr": 5.747222506001773e-05, "tps": 260808, "wall": 6619.7} {"step": 26344, "train_loss": 3.047610282897949, "lr": 5.7463992192956594e-05, "tps": 260624, "wall": 6624.6} {"step": 26345, "train_loss": 3.0807456970214844, "lr": 5.7455761167112167e-05, "tps": 260440, "wall": 6629.6} {"step": 26346, "train_loss": 3.0980653762817383, "lr": 5.744753198257769e-05, "tps": 260246, "wall": 6634.8} {"step": 26347, "train_loss": 3.1960906982421875, "lr": 5.7439304639446336e-05, "tps": 260050, "wall": 6640.0} {"step": 26348, "train_loss": 3.0548315048217773, "lr": 5.743107913781136e-05, "tps": 259866, "wall": 6645.0} {"step": 26349, "train_loss": 3.1552963256835938, "lr": 5.7422855477765904e-05, "tps": 259679, "wall": 6650.0} {"step": 26350, "train_loss": 3.0471713542938232, "lr": 5.74146336594031e-05, "tps": 259476, "wall": 6655.5} {"step": 26351, "train_loss": 3.181793212890625, "lr": 5.740641368281617e-05, "tps": 259282, "wall": 6660.7} {"step": 26352, "train_loss": 3.157644033432007, "lr": 5.739819554809816e-05, "tps": 259090, "wall": 6665.9} {"step": 26353, "train_loss": 2.9970579147338867, "lr": 5.7389979255342195e-05, "tps": 258907, "wall": 6670.9} {"step": 26354, "train_loss": 3.2145378589630127, "lr": 5.738176480464135e-05, "tps": 258716, "wall": 6676.1} {"step": 26355, "train_loss": 3.1385498046875, "lr": 5.737355219608867e-05, "tps": 258521, "wall": 6681.3} {"step": 26356, "train_loss": 3.0489039421081543, "lr": 5.7365341429777155e-05, "tps": 258327, "wall": 6686.6} {"step": 26357, "train_loss": 3.0517430305480957, "lr": 5.7357132505799884e-05, "tps": 258137, "wall": 6691.8} {"step": 26358, "train_loss": 3.060563325881958, "lr": 5.734892542424982e-05, "tps": 257945, "wall": 6697.0} {"step": 26359, "train_loss": 3.088960647583008, "lr": 5.73407201852199e-05, "tps": 257751, "wall": 6702.3} {"step": 26360, "train_loss": 3.1690261363983154, "lr": 5.7332516788803116e-05, "tps": 257563, "wall": 6707.5} {"step": 26361, "train_loss": 3.1309447288513184, "lr": 5.7324315235092365e-05, "tps": 257381, "wall": 6712.4} {"step": 26362, "train_loss": 3.084291934967041, "lr": 5.73161155241806e-05, "tps": 257199, "wall": 6717.4} {"step": 26363, "train_loss": 3.1266698837280273, "lr": 5.730791765616068e-05, "tps": 257016, "wall": 6722.5} {"step": 26364, "train_loss": 3.0521390438079834, "lr": 5.729972163112542e-05, "tps": 256832, "wall": 6727.6} {"step": 26365, "train_loss": 3.083387851715088, "lr": 5.729152744916777e-05, "tps": 256653, "wall": 6732.5} {"step": 26366, "train_loss": 3.1335630416870117, "lr": 5.7283335110380485e-05, "tps": 256474, "wall": 6737.5} {"step": 26367, "train_loss": 3.0920650959014893, "lr": 5.727514461485638e-05, "tps": 256294, "wall": 6742.5} {"step": 26368, "train_loss": 3.1443490982055664, "lr": 5.726695596268824e-05, "tps": 256112, "wall": 6747.5} {"step": 26369, "train_loss": 3.1542725563049316, "lr": 5.725876915396884e-05, "tps": 255935, "wall": 6752.4} {"step": 26370, "train_loss": 3.0313010215759277, "lr": 5.725058418879087e-05, "tps": 255757, "wall": 6757.4} {"step": 26371, "train_loss": 3.0484628677368164, "lr": 5.724240106724712e-05, "tps": 255581, "wall": 6762.3} {"step": 26372, "train_loss": 3.057483196258545, "lr": 5.7234219789430255e-05, "tps": 255404, "wall": 6767.2} {"step": 26373, "train_loss": 3.1201393604278564, "lr": 5.722604035543292e-05, "tps": 255227, "wall": 6772.2} {"step": 26374, "train_loss": 3.1401147842407227, "lr": 5.721786276534785e-05, "tps": 255050, "wall": 6777.1} {"step": 26375, "train_loss": 3.144366502761841, "lr": 5.7209687019267635e-05, "tps": 254871, "wall": 6782.1} {"step": 26376, "train_loss": 3.0690903663635254, "lr": 5.7201513117284844e-05, "tps": 254689, "wall": 6787.3} {"step": 26377, "train_loss": 3.08736515045166, "lr": 5.719334105949216e-05, "tps": 254508, "wall": 6792.3} {"step": 26378, "train_loss": 3.1319990158081055, "lr": 5.718517084598212e-05, "tps": 254329, "wall": 6797.4} {"step": 26379, "train_loss": 3.0769174098968506, "lr": 5.717700247684723e-05, "tps": 254151, "wall": 6802.4} {"step": 26380, "train_loss": 3.1303820610046387, "lr": 5.71688359521801e-05, "tps": 253972, "wall": 6807.4} {"step": 26381, "train_loss": 3.15950870513916, "lr": 5.716067127207321e-05, "tps": 253794, "wall": 6812.5} {"step": 26382, "train_loss": 3.072097063064575, "lr": 5.715250843661904e-05, "tps": 253619, "wall": 6817.4} {"step": 26383, "train_loss": 3.129711389541626, "lr": 5.714434744591005e-05, "tps": 253441, "wall": 6822.5} {"step": 26384, "train_loss": 3.0498404502868652, "lr": 5.71361883000387e-05, "tps": 253264, "wall": 6827.5} {"step": 26385, "train_loss": 3.122856616973877, "lr": 5.7128030999097474e-05, "tps": 253087, "wall": 6832.5} {"step": 26386, "train_loss": 3.1623024940490723, "lr": 5.711987554317866e-05, "tps": 252892, "wall": 6838.1} {"step": 26387, "train_loss": 3.2266664505004883, "lr": 5.711172193237473e-05, "tps": 252709, "wall": 6843.3} {"step": 26388, "train_loss": 3.0738816261291504, "lr": 5.7103570166778054e-05, "tps": 252530, "wall": 6848.4} {"step": 26389, "train_loss": 3.2223682403564453, "lr": 5.709542024648088e-05, "tps": 252344, "wall": 6853.7} {"step": 26390, "train_loss": 3.1025772094726562, "lr": 5.708727217157566e-05, "tps": 252169, "wall": 6858.7} {"step": 26391, "train_loss": 3.1090903282165527, "lr": 5.7079125942154634e-05, "tps": 251994, "wall": 6863.7} {"step": 26392, "train_loss": 3.108321189880371, "lr": 5.7070981558310035e-05, "tps": 251819, "wall": 6868.8} {"step": 26393, "train_loss": 3.0623929500579834, "lr": 5.706283902013421e-05, "tps": 251647, "wall": 6873.7} {"step": 26394, "train_loss": 3.107017755508423, "lr": 5.705469832771935e-05, "tps": 251474, "wall": 6878.7} {"step": 26395, "train_loss": 3.127373218536377, "lr": 5.7046559481157647e-05, "tps": 251303, "wall": 6883.7} {"step": 26396, "train_loss": 3.1828720569610596, "lr": 5.703842248054139e-05, "tps": 251134, "wall": 6888.5} {"step": 26397, "train_loss": 3.115692138671875, "lr": 5.7030287325962686e-05, "tps": 250964, "wall": 6893.5} {"step": 26398, "train_loss": 3.0829851627349854, "lr": 5.702215401751367e-05, "tps": 250796, "wall": 6898.4} {"step": 26399, "train_loss": 3.083709478378296, "lr": 5.7014022555286537e-05, "tps": 250628, "wall": 6903.3} {"step": 26400, "train_loss": 3.1278340816497803, "lr": 5.700589293937338e-05, "tps": 250455, "wall": 6908.3} {"step": 26401, "train_loss": 3.146404981613159, "lr": 5.699776516986626e-05, "tps": 250284, "wall": 6913.3} {"step": 26402, "train_loss": 3.0905020236968994, "lr": 5.69896392468573e-05, "tps": 250112, "wall": 6918.3} {"step": 26403, "train_loss": 3.1570053100585938, "lr": 5.6981515170438524e-05, "tps": 249943, "wall": 6923.2} {"step": 26404, "train_loss": 3.0619287490844727, "lr": 5.697339294070192e-05, "tps": 249775, "wall": 6928.1} {"step": 26405, "train_loss": 3.068809747695923, "lr": 5.696527255773959e-05, "tps": 249606, "wall": 6933.1} {"step": 26406, "train_loss": 3.041781425476074, "lr": 5.6957154021643445e-05, "tps": 249434, "wall": 6938.1} {"step": 26407, "train_loss": 3.020585536956787, "lr": 5.6949037332505495e-05, "tps": 249263, "wall": 6943.1} {"step": 26408, "train_loss": 3.2148027420043945, "lr": 5.694092249041769e-05, "tps": 249090, "wall": 6948.2} {"step": 26409, "train_loss": 3.1402275562286377, "lr": 5.69328094954719e-05, "tps": 248922, "wall": 6953.2} {"step": 26410, "train_loss": 3.0958101749420166, "lr": 5.6924698347760065e-05, "tps": 248755, "wall": 6958.1} {"step": 26411, "train_loss": 3.2054526805877686, "lr": 5.691658904737411e-05, "tps": 248589, "wall": 6963.0} {"step": 26412, "train_loss": 3.142463207244873, "lr": 5.690848159440579e-05, "tps": 248422, "wall": 6968.0} {"step": 26413, "train_loss": 3.0364160537719727, "lr": 5.690037598894708e-05, "tps": 248255, "wall": 6972.9} {"step": 26414, "train_loss": 3.156719923019409, "lr": 5.6892272231089725e-05, "tps": 248090, "wall": 6977.8} {"step": 26415, "train_loss": 3.076993227005005, "lr": 5.688417032092549e-05, "tps": 247925, "wall": 6982.7} {"step": 26416, "train_loss": 3.1048226356506348, "lr": 5.687607025854623e-05, "tps": 247760, "wall": 6987.7} {"step": 26417, "train_loss": 3.0746817588806152, "lr": 5.6867972044043696e-05, "tps": 247595, "wall": 6992.6} {"step": 26418, "train_loss": 3.1917929649353027, "lr": 5.685987567750954e-05, "tps": 247430, "wall": 6997.5} {"step": 26419, "train_loss": 3.0301289558410645, "lr": 5.685178115903559e-05, "tps": 247265, "wall": 7002.4} {"step": 26420, "train_loss": 3.060886859893799, "lr": 5.6843688488713473e-05, "tps": 247101, "wall": 7007.4} {"step": 26421, "train_loss": 3.0842843055725098, "lr": 5.6835597666634845e-05, "tps": 246937, "wall": 7012.3} {"step": 26422, "train_loss": 3.103848457336426, "lr": 5.682750869289144e-05, "tps": 246773, "wall": 7017.2} {"step": 26423, "train_loss": 3.0441088676452637, "lr": 5.681942156757481e-05, "tps": 246609, "wall": 7022.1} {"step": 26424, "train_loss": 3.036024570465088, "lr": 5.681133629077663e-05, "tps": 246440, "wall": 7027.2} {"step": 26425, "train_loss": 3.089858055114746, "lr": 5.6803252862588464e-05, "tps": 246273, "wall": 7032.2} {"step": 26426, "train_loss": 3.077406644821167, "lr": 5.6795171283101845e-05, "tps": 246106, "wall": 7037.3} {"step": 26427, "train_loss": 3.012606143951416, "lr": 5.678709155240838e-05, "tps": 245940, "wall": 7042.3} {"step": 26428, "train_loss": 3.1624879837036133, "lr": 5.677901367059957e-05, "tps": 245771, "wall": 7047.4} {"step": 26429, "train_loss": 3.081909656524658, "lr": 5.677093763776689e-05, "tps": 245603, "wall": 7052.5} {"step": 26430, "train_loss": 3.1728084087371826, "lr": 5.6762863454001905e-05, "tps": 245436, "wall": 7057.6} {"step": 26431, "train_loss": 3.1100258827209473, "lr": 5.6754791119396026e-05, "tps": 245271, "wall": 7062.6} {"step": 26432, "train_loss": 3.1686387062072754, "lr": 5.674672063404068e-05, "tps": 245106, "wall": 7067.6} {"step": 26433, "train_loss": 3.081380844116211, "lr": 5.6738651998027336e-05, "tps": 244942, "wall": 7072.6} {"step": 26434, "train_loss": 3.1510260105133057, "lr": 5.673058521144738e-05, "tps": 244777, "wall": 7077.6} {"step": 26435, "train_loss": 3.108433961868286, "lr": 5.6722520274392155e-05, "tps": 244611, "wall": 7082.7} {"step": 26436, "train_loss": 3.0899429321289062, "lr": 5.671445718695306e-05, "tps": 244448, "wall": 7087.7} {"step": 26437, "train_loss": 3.0918118953704834, "lr": 5.670639594922147e-05, "tps": 244288, "wall": 7092.6} {"step": 26438, "train_loss": 3.1020827293395996, "lr": 5.66983365612886e-05, "tps": 244126, "wall": 7097.6} {"step": 26439, "train_loss": 3.0257225036621094, "lr": 5.669027902324586e-05, "tps": 243964, "wall": 7102.5} {"step": 26440, "train_loss": 3.0725691318511963, "lr": 5.668222333518442e-05, "tps": 243803, "wall": 7107.5} {"step": 26441, "train_loss": 2.9081532955169678, "lr": 5.667416949719565e-05, "tps": 243642, "wall": 7112.5} {"step": 26442, "train_loss": 3.1074013710021973, "lr": 5.6666117509370706e-05, "tps": 243481, "wall": 7117.4} {"step": 26443, "train_loss": 3.1048521995544434, "lr": 5.6658067371800784e-05, "tps": 243320, "wall": 7122.4} {"step": 26444, "train_loss": 2.991763114929199, "lr": 5.665001908457714e-05, "tps": 243161, "wall": 7127.4} {"step": 26445, "train_loss": 3.117934226989746, "lr": 5.6641972647790944e-05, "tps": 242999, "wall": 7132.4} {"step": 26446, "train_loss": 3.1172666549682617, "lr": 5.663392806153326e-05, "tps": 242835, "wall": 7137.5} {"step": 26447, "train_loss": 3.129587411880493, "lr": 5.6625885325895325e-05, "tps": 242672, "wall": 7142.5} {"step": 26448, "train_loss": 3.123035430908203, "lr": 5.6617844440968184e-05, "tps": 242506, "wall": 7147.7} {"step": 26449, "train_loss": 2.922356128692627, "lr": 5.6609805406842896e-05, "tps": 242343, "wall": 7152.8} {"step": 26450, "train_loss": 3.025728225708008, "lr": 5.660176822361063e-05, "tps": 242182, "wall": 7157.8} {"step": 26451, "train_loss": 3.1083669662475586, "lr": 5.659373289136237e-05, "tps": 242021, "wall": 7162.8} {"step": 26452, "train_loss": 3.0483646392822266, "lr": 5.658569941018911e-05, "tps": 241861, "wall": 7167.8} {"step": 26453, "train_loss": 3.078563690185547, "lr": 5.657766778018192e-05, "tps": 241701, "wall": 7172.9} {"step": 26454, "train_loss": 2.8903069496154785, "lr": 5.656963800143175e-05, "tps": 241542, "wall": 7177.9} {"step": 26455, "train_loss": 3.156702995300293, "lr": 5.6561610074029526e-05, "tps": 241380, "wall": 7182.9} {"step": 26456, "train_loss": 3.006823778152466, "lr": 5.655358399806626e-05, "tps": 241219, "wall": 7188.0} {"step": 26457, "train_loss": 3.0542006492614746, "lr": 5.654555977363283e-05, "tps": 241059, "wall": 7193.0} {"step": 26458, "train_loss": 3.1795730590820312, "lr": 5.653753740082012e-05, "tps": 240887, "wall": 7198.5} {"step": 26459, "train_loss": 3.171356201171875, "lr": 5.652951687971906e-05, "tps": 240725, "wall": 7203.6} {"step": 26460, "train_loss": 3.1672139167785645, "lr": 5.6521498210420445e-05, "tps": 240563, "wall": 7208.7} {"step": 26461, "train_loss": 3.0767250061035156, "lr": 5.6513481393015164e-05, "tps": 240402, "wall": 7213.8} {"step": 26462, "train_loss": 3.194086790084839, "lr": 5.6505466427594026e-05, "tps": 240244, "wall": 7218.8} {"step": 26463, "train_loss": 3.0365633964538574, "lr": 5.6497453314247764e-05, "tps": 240087, "wall": 7223.8} {"step": 26464, "train_loss": 3.0440444946289062, "lr": 5.6489442053067234e-05, "tps": 239929, "wall": 7228.8} {"step": 26465, "train_loss": 3.122565746307373, "lr": 5.648143264414315e-05, "tps": 239770, "wall": 7233.9} {"step": 26466, "train_loss": 3.1605162620544434, "lr": 5.64734250875662e-05, "tps": 239600, "wall": 7239.3} {"step": 26467, "train_loss": 3.0991735458374023, "lr": 5.6465419383427185e-05, "tps": 239428, "wall": 7244.8} {"step": 26468, "train_loss": 3.182699680328369, "lr": 5.645741553181674e-05, "tps": 239268, "wall": 7249.9} {"step": 26469, "train_loss": 3.1375300884246826, "lr": 5.644941353282551e-05, "tps": 239110, "wall": 7255.0} {"step": 26470, "train_loss": 3.0451767444610596, "lr": 5.64414133865442e-05, "tps": 238953, "wall": 7260.0} {"step": 26471, "train_loss": 3.0237534046173096, "lr": 5.643341509306341e-05, "tps": 238782, "wall": 7265.5} {"step": 26472, "train_loss": 3.0961084365844727, "lr": 5.642541865247371e-05, "tps": 238620, "wall": 7270.7} {"step": 26473, "train_loss": 2.986755847930908, "lr": 5.641742406486574e-05, "tps": 238461, "wall": 7275.8} {"step": 26474, "train_loss": 3.164503574371338, "lr": 5.640943133033006e-05, "tps": 238297, "wall": 7281.1} {"step": 26475, "train_loss": 3.1970386505126953, "lr": 5.640144044895714e-05, "tps": 238136, "wall": 7286.3} {"step": 26476, "train_loss": 3.0517733097076416, "lr": 5.6393451420837594e-05, "tps": 237981, "wall": 7291.3} {"step": 26477, "train_loss": 3.0524935722351074, "lr": 5.638546424606185e-05, "tps": 237829, "wall": 7296.3} {"step": 26478, "train_loss": 3.1908669471740723, "lr": 5.637747892472044e-05, "tps": 237676, "wall": 7301.2} {"step": 26479, "train_loss": 3.1673688888549805, "lr": 5.636949545690381e-05, "tps": 237525, "wall": 7306.1} {"step": 26480, "train_loss": 3.0471646785736084, "lr": 5.636151384270236e-05, "tps": 237372, "wall": 7311.1} {"step": 26481, "train_loss": 3.0788328647613525, "lr": 5.635353408220656e-05, "tps": 237218, "wall": 7316.1} {"step": 26482, "train_loss": 3.054572582244873, "lr": 5.634555617550678e-05, "tps": 237066, "wall": 7321.1} {"step": 26483, "train_loss": 3.0033607482910156, "lr": 5.6337580122693366e-05, "tps": 236909, "wall": 7326.2} {"step": 26484, "train_loss": 3.013603925704956, "lr": 5.632960592385672e-05, "tps": 236757, "wall": 7331.2} {"step": 26485, "train_loss": 3.078028917312622, "lr": 5.6321633579087176e-05, "tps": 236606, "wall": 7336.2} {"step": 26486, "train_loss": 3.057377815246582, "lr": 5.6313663088474944e-05, "tps": 236457, "wall": 7341.1} {"step": 26487, "train_loss": 3.0132579803466797, "lr": 5.630569445211047e-05, "tps": 236306, "wall": 7346.0} {"step": 26488, "train_loss": 3.025733709335327, "lr": 5.6297727670083924e-05, "tps": 236156, "wall": 7351.0} {"step": 26489, "train_loss": 3.126284122467041, "lr": 5.628976274248554e-05, "tps": 236007, "wall": 7355.9} {"step": 26490, "train_loss": 3.1440322399139404, "lr": 5.628179966940562e-05, "tps": 235855, "wall": 7360.9} {"step": 26491, "train_loss": 3.1348838806152344, "lr": 5.627383845093435e-05, "tps": 235704, "wall": 7365.9} {"step": 26492, "train_loss": 2.9852077960968018, "lr": 5.626587908716181e-05, "tps": 235553, "wall": 7370.9} {"step": 26493, "train_loss": 3.15030574798584, "lr": 5.6257921578178327e-05, "tps": 235404, "wall": 7375.9} {"step": 26494, "train_loss": 3.011242628097534, "lr": 5.624996592407391e-05, "tps": 235255, "wall": 7380.8} {"step": 26495, "train_loss": 3.1463699340820312, "lr": 5.624201212493879e-05, "tps": 235104, "wall": 7385.8} {"step": 26496, "train_loss": 3.0098962783813477, "lr": 5.623406018086299e-05, "tps": 234951, "wall": 7390.9} {"step": 26497, "train_loss": 3.0620079040527344, "lr": 5.622611009193661e-05, "tps": 234798, "wall": 7396.0} {"step": 26498, "train_loss": 3.1183156967163086, "lr": 5.621816185824974e-05, "tps": 234642, "wall": 7401.2} {"step": 26499, "train_loss": 3.1299519538879395, "lr": 5.621021547989239e-05, "tps": 234488, "wall": 7406.3} {"step": 26500, "train_loss": 2.938682794570923, "lr": 5.620227095695455e-05, "tps": 234333, "wall": 7411.5} {"step": 26501, "train_loss": 3.087489128112793, "lr": 5.6194328289526285e-05, "tps": 234173, "wall": 7416.9} {"step": 26502, "train_loss": 3.036247730255127, "lr": 5.618638747769751e-05, "tps": 234018, "wall": 7422.1} {"step": 26503, "train_loss": 3.1703686714172363, "lr": 5.617844852155819e-05, "tps": 233862, "wall": 7427.3} {"step": 26504, "train_loss": 3.084076404571533, "lr": 5.617051142119827e-05, "tps": 233710, "wall": 7432.4} {"step": 26505, "train_loss": 3.008909225463867, "lr": 5.616257617670769e-05, "tps": 233561, "wall": 7437.4} {"step": 26506, "train_loss": 2.978607654571533, "lr": 5.615464278817626e-05, "tps": 233412, "wall": 7442.5} {"step": 26507, "train_loss": 3.0882656574249268, "lr": 5.614671125569395e-05, "tps": 233259, "wall": 7447.6} {"step": 26508, "train_loss": 3.096935749053955, "lr": 5.613878157935055e-05, "tps": 233106, "wall": 7452.8} {"step": 26509, "train_loss": 3.1480138301849365, "lr": 5.613085375923587e-05, "tps": 232954, "wall": 7457.9} {"step": 26510, "train_loss": 3.0445594787597656, "lr": 5.612292779543976e-05, "tps": 232795, "wall": 7463.3} {"step": 26511, "train_loss": 3.1116204261779785, "lr": 5.6115003688052e-05, "tps": 232647, "wall": 7468.4} {"step": 26512, "train_loss": 3.159287691116333, "lr": 5.61070814371623e-05, "tps": 232499, "wall": 7473.4} {"step": 26513, "train_loss": 3.2193140983581543, "lr": 5.6099161042860504e-05, "tps": 232352, "wall": 7478.4} {"step": 26514, "train_loss": 3.1163992881774902, "lr": 5.609124250523624e-05, "tps": 232206, "wall": 7483.4} {"step": 26515, "train_loss": 3.135955810546875, "lr": 5.6083325824379275e-05, "tps": 232049, "wall": 7488.7} {"step": 26516, "train_loss": 3.0880472660064697, "lr": 5.607541100037925e-05, "tps": 231901, "wall": 7493.8} {"step": 26517, "train_loss": 3.1253232955932617, "lr": 5.6067498033325826e-05, "tps": 231750, "wall": 7499.0} {"step": 26518, "train_loss": 3.1796324253082275, "lr": 5.6059586923308674e-05, "tps": 231593, "wall": 7504.3} {"step": 26519, "train_loss": 2.982114791870117, "lr": 5.605167767041739e-05, "tps": 231439, "wall": 7509.6} {"step": 26520, "train_loss": 3.13132643699646, "lr": 5.6043770274741545e-05, "tps": 231294, "wall": 7514.6} {"step": 26521, "train_loss": 3.161588668823242, "lr": 5.603586473637077e-05, "tps": 231148, "wall": 7519.6} {"step": 26522, "train_loss": 3.038426637649536, "lr": 5.602796105539459e-05, "tps": 231003, "wall": 7524.6} {"step": 26523, "train_loss": 3.0910286903381348, "lr": 5.60200592319025e-05, "tps": 230858, "wall": 7529.6} {"step": 26524, "train_loss": 3.1622884273529053, "lr": 5.601215926598409e-05, "tps": 230714, "wall": 7534.6} {"step": 26525, "train_loss": 2.986318826675415, "lr": 5.60042611577288e-05, "tps": 230570, "wall": 7539.6} {"step": 26526, "train_loss": 2.949165105819702, "lr": 5.599636490722608e-05, "tps": 230428, "wall": 7544.5} {"step": 26527, "train_loss": 3.0082895755767822, "lr": 5.598847051456546e-05, "tps": 230285, "wall": 7549.5} {"step": 26528, "train_loss": 3.0997443199157715, "lr": 5.598057797983631e-05, "tps": 230143, "wall": 7554.4} {"step": 26529, "train_loss": 3.217611312866211, "lr": 5.597268730312801e-05, "tps": 230001, "wall": 7559.4} {"step": 26530, "train_loss": 3.1403825283050537, "lr": 5.596479848453001e-05, "tps": 229856, "wall": 7564.4} {"step": 26531, "train_loss": 3.115530490875244, "lr": 5.595691152413164e-05, "tps": 229713, "wall": 7569.4} {"step": 26532, "train_loss": 3.0531721115112305, "lr": 5.594902642202225e-05, "tps": 229571, "wall": 7574.4} {"step": 26533, "train_loss": 3.0956246852874756, "lr": 5.594114317829119e-05, "tps": 229421, "wall": 7579.6} {"step": 26534, "train_loss": 3.047107458114624, "lr": 5.5933261793027694e-05, "tps": 229279, "wall": 7584.6} {"step": 26535, "train_loss": 3.160407781600952, "lr": 5.592538226632109e-05, "tps": 229138, "wall": 7589.6} {"step": 26536, "train_loss": 3.031327486038208, "lr": 5.5917504598260664e-05, "tps": 228994, "wall": 7594.6} {"step": 26537, "train_loss": 3.084980010986328, "lr": 5.5909628788935595e-05, "tps": 228848, "wall": 7599.8} {"step": 26538, "train_loss": 3.0931379795074463, "lr": 5.590175483843514e-05, "tps": 228707, "wall": 7604.7} {"step": 26539, "train_loss": 3.0670132637023926, "lr": 5.589388274684848e-05, "tps": 228566, "wall": 7609.7} {"step": 26540, "train_loss": 3.023488759994507, "lr": 5.5886012514264784e-05, "tps": 228424, "wall": 7614.7} {"step": 26541, "train_loss": 3.0784754753112793, "lr": 5.587814414077325e-05, "tps": 228284, "wall": 7619.7} {"step": 26542, "train_loss": 3.1616063117980957, "lr": 5.5870277626462955e-05, "tps": 228139, "wall": 7624.8} {"step": 26543, "train_loss": 3.1057281494140625, "lr": 5.586241297142303e-05, "tps": 227996, "wall": 7629.9} {"step": 26544, "train_loss": 3.0741076469421387, "lr": 5.585455017574257e-05, "tps": 227852, "wall": 7635.0} {"step": 26545, "train_loss": 3.110962390899658, "lr": 5.5846689239510667e-05, "tps": 227710, "wall": 7640.1} {"step": 26546, "train_loss": 3.048649311065674, "lr": 5.5838830162816314e-05, "tps": 227569, "wall": 7645.1} {"step": 26547, "train_loss": 3.1453967094421387, "lr": 5.5830972945748604e-05, "tps": 227428, "wall": 7650.1} {"step": 26548, "train_loss": 3.061842918395996, "lr": 5.582311758839647e-05, "tps": 227286, "wall": 7655.2} {"step": 26549, "train_loss": 3.1602563858032227, "lr": 5.581526409084898e-05, "tps": 227142, "wall": 7660.3} {"step": 26550, "train_loss": 3.1446661949157715, "lr": 5.580741245319508e-05, "tps": 226999, "wall": 7665.4} {"step": 26551, "train_loss": 3.150986671447754, "lr": 5.5799562675523646e-05, "tps": 226855, "wall": 7670.6} {"step": 26552, "train_loss": 3.112468719482422, "lr": 5.579171475792369e-05, "tps": 226713, "wall": 7675.7} {"step": 26553, "train_loss": 3.129660129547119, "lr": 5.5783868700484056e-05, "tps": 226574, "wall": 7680.7} {"step": 26554, "train_loss": 3.1007332801818848, "lr": 5.577602450329366e-05, "tps": 226431, "wall": 7685.8} {"step": 26555, "train_loss": 3.139219284057617, "lr": 5.576818216644134e-05, "tps": 226288, "wall": 7691.0} {"step": 26556, "train_loss": 3.199368476867676, "lr": 5.5760341690015896e-05, "tps": 226146, "wall": 7696.1} {"step": 26557, "train_loss": 3.0703494548797607, "lr": 5.575250307410622e-05, "tps": 226003, "wall": 7701.2} {"step": 26558, "train_loss": 3.1000783443450928, "lr": 5.5744666318801065e-05, "tps": 225861, "wall": 7706.4} {"step": 26559, "train_loss": 3.1534290313720703, "lr": 5.573683142418922e-05, "tps": 225722, "wall": 7711.4} {"step": 26560, "train_loss": 3.0614266395568848, "lr": 5.572899839035943e-05, "tps": 225586, "wall": 7716.3} {"step": 26561, "train_loss": 3.0030455589294434, "lr": 5.572116721740045e-05, "tps": 225445, "wall": 7721.5} {"step": 26562, "train_loss": 3.1033082008361816, "lr": 5.571333790540093e-05, "tps": 225307, "wall": 7726.5} {"step": 26563, "train_loss": 3.040513753890991, "lr": 5.570551045444965e-05, "tps": 225167, "wall": 7731.6} {"step": 26564, "train_loss": 3.1267998218536377, "lr": 5.5697684864635224e-05, "tps": 225027, "wall": 7736.7} {"step": 26565, "train_loss": 3.1209359169006348, "lr": 5.568986113604631e-05, "tps": 224888, "wall": 7741.8} {"step": 26566, "train_loss": 3.015604257583618, "lr": 5.5682039268771536e-05, "tps": 224750, "wall": 7746.8} {"step": 26567, "train_loss": 3.122699499130249, "lr": 5.5674219262899526e-05, "tps": 224616, "wall": 7751.7} {"step": 26568, "train_loss": 3.135620355606079, "lr": 5.566640111851882e-05, "tps": 224481, "wall": 7756.7} {"step": 26569, "train_loss": 3.12332820892334, "lr": 5.565858483571804e-05, "tps": 224345, "wall": 7761.6} {"step": 26570, "train_loss": 3.0501086711883545, "lr": 5.565077041458571e-05, "tps": 224211, "wall": 7766.6} {"step": 26571, "train_loss": 3.1144638061523438, "lr": 5.564295785521029e-05, "tps": 224076, "wall": 7771.5} {"step": 26572, "train_loss": 3.1388936042785645, "lr": 5.563514715768038e-05, "tps": 223942, "wall": 7776.5} {"step": 26573, "train_loss": 3.143632650375366, "lr": 5.5627338322084386e-05, "tps": 223807, "wall": 7781.5} {"step": 26574, "train_loss": 3.093839406967163, "lr": 5.561953134851082e-05, "tps": 223673, "wall": 7786.4} {"step": 26575, "train_loss": 3.171689510345459, "lr": 5.561172623704811e-05, "tps": 223539, "wall": 7791.4} {"step": 26576, "train_loss": 3.16654634475708, "lr": 5.560392298778463e-05, "tps": 223406, "wall": 7796.3} {"step": 26577, "train_loss": 3.162947416305542, "lr": 5.55961216008088e-05, "tps": 223272, "wall": 7801.3} {"step": 26578, "train_loss": 3.128941059112549, "lr": 5.558832207620903e-05, "tps": 223136, "wall": 7806.4} {"step": 26579, "train_loss": 3.0689902305603027, "lr": 5.55805244140736e-05, "tps": 223002, "wall": 7811.3} {"step": 26580, "train_loss": 3.1359665393829346, "lr": 5.557272861449092e-05, "tps": 222868, "wall": 7816.3} {"step": 26581, "train_loss": 3.0895438194274902, "lr": 5.5564934677549264e-05, "tps": 222730, "wall": 7821.5} {"step": 26582, "train_loss": 3.083076000213623, "lr": 5.555714260333691e-05, "tps": 222592, "wall": 7826.6} {"step": 26583, "train_loss": 3.0885019302368164, "lr": 5.554935239194216e-05, "tps": 222452, "wall": 7831.8} {"step": 26584, "train_loss": 3.168407678604126, "lr": 5.554156404345322e-05, "tps": 222311, "wall": 7837.1} {"step": 26585, "train_loss": 3.126077890396118, "lr": 5.553377755795832e-05, "tps": 222177, "wall": 7842.1} {"step": 26586, "train_loss": 3.1010053157806396, "lr": 5.5525992935545744e-05, "tps": 222042, "wall": 7847.2} {"step": 26587, "train_loss": 3.2194790840148926, "lr": 5.5518210176303586e-05, "tps": 221906, "wall": 7852.3} {"step": 26588, "train_loss": 3.090818405151367, "lr": 5.5510429280320034e-05, "tps": 221772, "wall": 7857.3} {"step": 26589, "train_loss": 3.051905393600464, "lr": 5.550265024768324e-05, "tps": 221639, "wall": 7862.3} {"step": 26590, "train_loss": 3.1417837142944336, "lr": 5.5494873078481345e-05, "tps": 221502, "wall": 7867.5} {"step": 26591, "train_loss": 3.2205090522766113, "lr": 5.548709777280238e-05, "tps": 221368, "wall": 7872.5} {"step": 26592, "train_loss": 3.091717004776001, "lr": 5.5479324330734526e-05, "tps": 221235, "wall": 7877.6} {"step": 26593, "train_loss": 3.1344845294952393, "lr": 5.547155275236574e-05, "tps": 221101, "wall": 7882.7} {"step": 26594, "train_loss": 3.0778965950012207, "lr": 5.5463783037784143e-05, "tps": 220966, "wall": 7887.8} {"step": 26595, "train_loss": 3.1044836044311523, "lr": 5.54560151870777e-05, "tps": 220830, "wall": 7892.9} {"step": 26596, "train_loss": 3.0240774154663086, "lr": 5.54482492003344e-05, "tps": 220694, "wall": 7898.1} {"step": 26597, "train_loss": 3.092508316040039, "lr": 5.5440485077642256e-05, "tps": 220561, "wall": 7903.1} {"step": 26598, "train_loss": 3.143646717071533, "lr": 5.543272281908921e-05, "tps": 220425, "wall": 7908.3} {"step": 26599, "train_loss": 3.1479291915893555, "lr": 5.542496242476314e-05, "tps": 220288, "wall": 7913.5} {"step": 26600, "train_loss": 3.18349027633667, "lr": 5.541720389475204e-05, "tps": 220147, "wall": 7918.9} {"step": 26601, "train_loss": 3.0879874229431152, "lr": 5.540944722914375e-05, "tps": 220008, "wall": 7924.2} {"step": 26602, "train_loss": 3.0964179039001465, "lr": 5.5401692428026145e-05, "tps": 219873, "wall": 7929.4} {"step": 26603, "train_loss": 3.0511183738708496, "lr": 5.539393949148706e-05, "tps": 219739, "wall": 7934.5} {"step": 26604, "train_loss": 3.226313591003418, "lr": 5.538618841961436e-05, "tps": 219605, "wall": 7939.6} {"step": 26605, "train_loss": 3.0512442588806152, "lr": 5.5378439212495784e-05, "tps": 219470, "wall": 7944.8} {"step": 26606, "train_loss": 3.074202299118042, "lr": 5.537069187021917e-05, "tps": 219337, "wall": 7949.9} {"step": 26607, "train_loss": 3.071510076522827, "lr": 5.5362946392872296e-05, "tps": 219205, "wall": 7955.0} {"step": 26608, "train_loss": 3.1530613899230957, "lr": 5.535520278054281e-05, "tps": 219074, "wall": 7960.1} {"step": 26609, "train_loss": 3.0498571395874023, "lr": 5.534746103331855e-05, "tps": 218944, "wall": 7965.1} {"step": 26610, "train_loss": 3.1558375358581543, "lr": 5.533972115128712e-05, "tps": 218814, "wall": 7970.1} {"step": 26611, "train_loss": 3.0480329990386963, "lr": 5.533198313453628e-05, "tps": 218685, "wall": 7975.1} {"step": 26612, "train_loss": 3.0937886238098145, "lr": 5.532424698315363e-05, "tps": 218553, "wall": 7980.2} {"step": 26613, "train_loss": 3.1171507835388184, "lr": 5.531651269722677e-05, "tps": 218418, "wall": 7985.5} {"step": 26614, "train_loss": 3.0796844959259033, "lr": 5.530878027684343e-05, "tps": 218286, "wall": 7990.6} {"step": 26615, "train_loss": 3.0550537109375, "lr": 5.5301049722091114e-05, "tps": 218155, "wall": 7995.7} {"step": 26616, "train_loss": 2.986374616622925, "lr": 5.529332103305739e-05, "tps": 218024, "wall": 8000.8} {"step": 26617, "train_loss": 3.0472421646118164, "lr": 5.528559420982986e-05, "tps": 217893, "wall": 8005.9} {"step": 26618, "train_loss": 3.1317601203918457, "lr": 5.527786925249605e-05, "tps": 217761, "wall": 8011.1} {"step": 26619, "train_loss": 3.0978918075561523, "lr": 5.527014616114339e-05, "tps": 217631, "wall": 8016.2} {"step": 26620, "train_loss": 3.177297592163086, "lr": 5.526242493585949e-05, "tps": 217499, "wall": 8021.3} {"step": 26621, "train_loss": 3.0977492332458496, "lr": 5.5254705576731715e-05, "tps": 217368, "wall": 8026.5} {"step": 26622, "train_loss": 3.05586576461792, "lr": 5.524698808384755e-05, "tps": 217237, "wall": 8031.6} {"step": 26623, "train_loss": 3.0517349243164062, "lr": 5.523927245729444e-05, "tps": 217106, "wall": 8036.7} {"step": 26624, "train_loss": 3.0326719284057617, "lr": 5.523155869715977e-05, "tps": 216977, "wall": 8041.8} {"step": 26625, "train_loss": 2.9776620864868164, "lr": 5.522384680353086e-05, "tps": 216848, "wall": 8046.9} {"step": 26626, "train_loss": 3.112767457962036, "lr": 5.5216136776495174e-05, "tps": 216720, "wall": 8052.0} {"step": 26627, "train_loss": 3.2307450771331787, "lr": 5.520842861613997e-05, "tps": 216591, "wall": 8057.1} {"step": 26628, "train_loss": 3.0942697525024414, "lr": 5.5200722322552635e-05, "tps": 216462, "wall": 8062.2} {"step": 26629, "train_loss": 3.1097679138183594, "lr": 5.5193017895820444e-05, "tps": 216333, "wall": 8067.3} {"step": 26630, "train_loss": 3.0695862770080566, "lr": 5.518531533603062e-05, "tps": 216203, "wall": 8072.4} {"step": 26631, "train_loss": 3.1720638275146484, "lr": 5.5177614643270495e-05, "tps": 216074, "wall": 8077.5} {"step": 26632, "train_loss": 3.164245128631592, "lr": 5.5169915817627246e-05, "tps": 215944, "wall": 8082.7} {"step": 26633, "train_loss": 3.1203815937042236, "lr": 5.516221885918811e-05, "tps": 215815, "wall": 8087.9} {"step": 26634, "train_loss": 3.0802178382873535, "lr": 5.51545237680403e-05, "tps": 215689, "wall": 8092.9} {"step": 26635, "train_loss": 3.118741035461426, "lr": 5.514683054427094e-05, "tps": 215557, "wall": 8098.1} {"step": 26636, "train_loss": 2.92626953125, "lr": 5.513913918796719e-05, "tps": 215431, "wall": 8103.2} {"step": 26637, "train_loss": 3.1525678634643555, "lr": 5.5131449699216244e-05, "tps": 215303, "wall": 8108.3} {"step": 26638, "train_loss": 3.064112901687622, "lr": 5.512376207810512e-05, "tps": 215178, "wall": 8113.3} {"step": 26639, "train_loss": 3.138836622238159, "lr": 5.511607632472091e-05, "tps": 215052, "wall": 8118.4} {"step": 26640, "train_loss": 3.126746416091919, "lr": 5.510839243915076e-05, "tps": 214927, "wall": 8123.4} {"step": 26641, "train_loss": 3.097167491912842, "lr": 5.510071042148165e-05, "tps": 214802, "wall": 8128.5} {"step": 26642, "train_loss": 3.1360666751861572, "lr": 5.509303027180057e-05, "tps": 214672, "wall": 8133.7} {"step": 26643, "train_loss": 3.108402967453003, "lr": 5.50853519901946e-05, "tps": 214546, "wall": 8138.8} {"step": 26644, "train_loss": 3.1296863555908203, "lr": 5.50776755767507e-05, "tps": 214416, "wall": 8144.0} {"step": 26645, "train_loss": 3.1721253395080566, "lr": 5.5070001031555774e-05, "tps": 214289, "wall": 8149.1} {"step": 26646, "train_loss": 3.1190218925476074, "lr": 5.5062328354696815e-05, "tps": 214161, "wall": 8154.3} {"step": 26647, "train_loss": 3.0239386558532715, "lr": 5.505465754626071e-05, "tps": 214035, "wall": 8159.4} {"step": 26648, "train_loss": 3.14277982711792, "lr": 5.504698860633439e-05, "tps": 213907, "wall": 8164.6} {"step": 26649, "train_loss": 3.12373948097229, "lr": 5.503932153500471e-05, "tps": 213781, "wall": 8169.7} {"step": 26650, "train_loss": 3.190685749053955, "lr": 5.503165633235849e-05, "tps": 213654, "wall": 8174.9} {"step": 26651, "train_loss": 3.221393346786499, "lr": 5.502399299848262e-05, "tps": 213527, "wall": 8180.1} {"step": 26652, "train_loss": 3.1093811988830566, "lr": 5.501633153346391e-05, "tps": 213400, "wall": 8185.2} {"step": 26653, "train_loss": 3.1476082801818848, "lr": 5.500867193738906e-05, "tps": 213272, "wall": 8190.4} {"step": 26654, "train_loss": 3.120896339416504, "lr": 5.5001014210344914e-05, "tps": 213146, "wall": 8195.6} {"step": 26655, "train_loss": 3.102200508117676, "lr": 5.499335835241822e-05, "tps": 213020, "wall": 8200.8} {"step": 26656, "train_loss": 3.038332223892212, "lr": 5.4985704363695675e-05, "tps": 212896, "wall": 8205.8} {"step": 26657, "train_loss": 3.0179519653320312, "lr": 5.4978052244264024e-05, "tps": 212770, "wall": 8211.0} {"step": 26658, "train_loss": 3.0444602966308594, "lr": 5.497040199420992e-05, "tps": 212644, "wall": 8216.2} {"step": 26659, "train_loss": 3.0820608139038086, "lr": 5.496275361362001e-05, "tps": 212518, "wall": 8221.3} {"step": 26660, "train_loss": 3.043107509613037, "lr": 5.495510710258096e-05, "tps": 212391, "wall": 8226.6} {"step": 26661, "train_loss": 3.151589870452881, "lr": 5.494746246117941e-05, "tps": 212265, "wall": 8231.8} {"step": 26662, "train_loss": 3.163846969604492, "lr": 5.4939819689501906e-05, "tps": 212140, "wall": 8236.9} {"step": 26663, "train_loss": 3.144243001937866, "lr": 5.4932178787635055e-05, "tps": 212016, "wall": 8242.1} {"step": 26664, "train_loss": 3.074059247970581, "lr": 5.492453975566541e-05, "tps": 211891, "wall": 8247.2} {"step": 26665, "train_loss": 3.210881233215332, "lr": 5.491690259367954e-05, "tps": 211766, "wall": 8252.4} {"step": 26666, "train_loss": 3.1153922080993652, "lr": 5.490926730176392e-05, "tps": 211642, "wall": 8257.6} {"step": 26667, "train_loss": 3.033040761947632, "lr": 5.490163388000501e-05, "tps": 211517, "wall": 8262.7} {"step": 26668, "train_loss": 3.147712230682373, "lr": 5.489400232848936e-05, "tps": 211394, "wall": 8267.9} {"step": 26669, "train_loss": 3.0739777088165283, "lr": 5.48863726473034e-05, "tps": 211270, "wall": 8273.0} {"step": 26670, "train_loss": 3.158933162689209, "lr": 5.48787448365335e-05, "tps": 211145, "wall": 8278.2} {"step": 26671, "train_loss": 3.0602641105651855, "lr": 5.487111889626614e-05, "tps": 211020, "wall": 8283.4} {"step": 26672, "train_loss": 3.084592580795288, "lr": 5.486349482658768e-05, "tps": 210895, "wall": 8288.7} {"step": 26673, "train_loss": 3.0574774742126465, "lr": 5.4855872627584445e-05, "tps": 210771, "wall": 8293.9} {"step": 26674, "train_loss": 3.0765719413757324, "lr": 5.484825229934287e-05, "tps": 210649, "wall": 8298.9} {"step": 26675, "train_loss": 3.0865039825439453, "lr": 5.4840633841949206e-05, "tps": 210522, "wall": 8304.3} {"step": 26676, "train_loss": 3.1569900512695312, "lr": 5.483301725548975e-05, "tps": 210396, "wall": 8309.6} {"step": 26677, "train_loss": 3.00070858001709, "lr": 5.4825402540050864e-05, "tps": 210272, "wall": 8314.8} {"step": 26678, "train_loss": 3.1410515308380127, "lr": 5.4817789695718736e-05, "tps": 210152, "wall": 8319.8} {"step": 26679, "train_loss": 3.071636915206909, "lr": 5.481017872257959e-05, "tps": 210033, "wall": 8324.9} {"step": 26680, "train_loss": 2.966843366622925, "lr": 5.48025696207197e-05, "tps": 209909, "wall": 8330.1} {"step": 26681, "train_loss": 3.098206043243408, "lr": 5.4794962390225235e-05, "tps": 209787, "wall": 8335.3} {"step": 26682, "train_loss": 3.108980178833008, "lr": 5.478735703118237e-05, "tps": 209665, "wall": 8340.4} {"step": 26683, "train_loss": 3.090776205062866, "lr": 5.4779753543677284e-05, "tps": 209539, "wall": 8345.8} {"step": 26684, "train_loss": 3.0159752368927, "lr": 5.477215192779606e-05, "tps": 209419, "wall": 8350.8} {"step": 26685, "train_loss": 3.176069498062134, "lr": 5.4764552183624853e-05, "tps": 209296, "wall": 8356.0} {"step": 26686, "train_loss": 3.1142756938934326, "lr": 5.475695431124974e-05, "tps": 209176, "wall": 8361.2} {"step": 26687, "train_loss": 3.1396915912628174, "lr": 5.474935831075677e-05, "tps": 209053, "wall": 8366.4} {"step": 26688, "train_loss": 3.113035202026367, "lr": 5.474176418223202e-05, "tps": 208931, "wall": 8371.6} {"step": 26689, "train_loss": 3.113431930541992, "lr": 5.473417192576153e-05, "tps": 208813, "wall": 8376.7} {"step": 26690, "train_loss": 3.1142210960388184, "lr": 5.4726581541431246e-05, "tps": 208693, "wall": 8381.8} {"step": 26691, "train_loss": 3.0900964736938477, "lr": 5.471899302932721e-05, "tps": 208572, "wall": 8386.9} {"step": 26692, "train_loss": 3.1392993927001953, "lr": 5.471140638953536e-05, "tps": 208456, "wall": 8391.9} {"step": 26693, "train_loss": 3.0902762413024902, "lr": 5.470382162214161e-05, "tps": 208337, "wall": 8397.0} {"step": 26694, "train_loss": 3.120368003845215, "lr": 5.469623872723194e-05, "tps": 208218, "wall": 8402.1} {"step": 26695, "train_loss": 3.136636257171631, "lr": 5.468865770489223e-05, "tps": 208098, "wall": 8407.3} {"step": 26696, "train_loss": 3.087406873703003, "lr": 5.468107855520832e-05, "tps": 207981, "wall": 8412.3} {"step": 26697, "train_loss": 3.1480982303619385, "lr": 5.4673501278266105e-05, "tps": 207864, "wall": 8417.4} {"step": 26698, "train_loss": 3.1771202087402344, "lr": 5.466592587415142e-05, "tps": 207747, "wall": 8422.5} {"step": 26699, "train_loss": 3.123178005218506, "lr": 5.465835234295007e-05, "tps": 207630, "wall": 8427.5} {"step": 26700, "train_loss": 3.1007089614868164, "lr": 5.4650780684747845e-05, "tps": 207512, "wall": 8432.7} {"step": 26701, "train_loss": 3.071293592453003, "lr": 5.4643210899630515e-05, "tps": 207394, "wall": 8437.7} {"step": 26702, "train_loss": 3.1501593589782715, "lr": 5.463564298768383e-05, "tps": 207273, "wall": 8443.0} {"step": 26703, "train_loss": 3.12858510017395, "lr": 5.462807694899357e-05, "tps": 207152, "wall": 8448.2} {"step": 26704, "train_loss": 3.204829692840576, "lr": 5.462051278364535e-05, "tps": 207030, "wall": 8453.5} {"step": 26705, "train_loss": 3.147947072982788, "lr": 5.461295049172494e-05, "tps": 206914, "wall": 8458.6} {"step": 26706, "train_loss": 3.1102685928344727, "lr": 5.4605390073317976e-05, "tps": 206796, "wall": 8463.7} {"step": 26707, "train_loss": 3.0543222427368164, "lr": 5.459783152851008e-05, "tps": 206678, "wall": 8468.9} {"step": 26708, "train_loss": 3.1981170177459717, "lr": 5.4590274857386916e-05, "tps": 206554, "wall": 8474.3} {"step": 26709, "train_loss": 3.0412075519561768, "lr": 5.4582720060034066e-05, "tps": 206437, "wall": 8479.4} {"step": 26710, "train_loss": 3.1889567375183105, "lr": 5.457516713653708e-05, "tps": 206316, "wall": 8484.7} {"step": 26711, "train_loss": 3.126417398452759, "lr": 5.456761608698159e-05, "tps": 206197, "wall": 8489.9} {"step": 26712, "train_loss": 3.1568636894226074, "lr": 5.456006691145309e-05, "tps": 206078, "wall": 8495.1} {"step": 26713, "train_loss": 3.1138181686401367, "lr": 5.455251961003707e-05, "tps": 205956, "wall": 8500.5} {"step": 26714, "train_loss": 3.1441407203674316, "lr": 5.4544974182819074e-05, "tps": 205836, "wall": 8505.8} {"step": 26715, "train_loss": 3.0457489490509033, "lr": 5.453743062988459e-05, "tps": 205719, "wall": 8510.9} {"step": 26716, "train_loss": 3.0506906509399414, "lr": 5.4529888951318995e-05, "tps": 205598, "wall": 8516.3} {"step": 26717, "train_loss": 2.9916012287139893, "lr": 5.4522349147207806e-05, "tps": 205482, "wall": 8521.4} {"step": 26718, "train_loss": 3.1275343894958496, "lr": 5.451481121763637e-05, "tps": 205364, "wall": 8526.6} {"step": 26719, "train_loss": 3.0635528564453125, "lr": 5.450727516269013e-05, "tps": 205249, "wall": 8531.7} {"step": 26720, "train_loss": 2.956437110900879, "lr": 5.4499740982454426e-05, "tps": 205131, "wall": 8536.9} {"step": 26721, "train_loss": 3.057053565979004, "lr": 5.449220867701459e-05, "tps": 205013, "wall": 8542.1} {"step": 26722, "train_loss": 3.132476329803467, "lr": 5.4484678246456023e-05, "tps": 204894, "wall": 8547.4} {"step": 26723, "train_loss": 3.0060620307922363, "lr": 5.4477149690863926e-05, "tps": 204780, "wall": 8552.5} {"step": 26724, "train_loss": 3.238870143890381, "lr": 5.4469623010323645e-05, "tps": 204666, "wall": 8557.6} {"step": 26725, "train_loss": 2.9328150749206543, "lr": 5.446209820492044e-05, "tps": 204552, "wall": 8562.7} {"step": 26726, "train_loss": 3.223217010498047, "lr": 5.44545752747395e-05, "tps": 204438, "wall": 8567.8} {"step": 26727, "train_loss": 3.09322452545166, "lr": 5.444705421986612e-05, "tps": 204324, "wall": 8572.9} {"step": 26728, "train_loss": 3.1286752223968506, "lr": 5.443953504038549e-05, "tps": 204211, "wall": 8577.9} {"step": 26729, "train_loss": 3.07505464553833, "lr": 5.443201773638271e-05, "tps": 204098, "wall": 8583.0} {"step": 26730, "train_loss": 3.040072441101074, "lr": 5.4424502307943015e-05, "tps": 203980, "wall": 8588.3} {"step": 26731, "train_loss": 3.155377149581909, "lr": 5.4416988755151534e-05, "tps": 203865, "wall": 8593.4} {"step": 26732, "train_loss": 3.122591018676758, "lr": 5.440947707809333e-05, "tps": 203751, "wall": 8598.6} {"step": 26733, "train_loss": 3.197577953338623, "lr": 5.440196727685354e-05, "tps": 203637, "wall": 8603.7} {"step": 26734, "train_loss": 3.143637180328369, "lr": 5.439445935151725e-05, "tps": 203524, "wall": 8608.8} {"step": 26735, "train_loss": 3.1506452560424805, "lr": 5.438695330216943e-05, "tps": 203410, "wall": 8614.0} {"step": 26736, "train_loss": 3.082792043685913, "lr": 5.4379449128895196e-05, "tps": 203298, "wall": 8619.0} {"step": 26737, "train_loss": 3.0958921909332275, "lr": 5.437194683177953e-05, "tps": 203183, "wall": 8624.2} {"step": 26738, "train_loss": 3.1031925678253174, "lr": 5.436444641090739e-05, "tps": 203069, "wall": 8629.4} {"step": 26739, "train_loss": 3.104102849960327, "lr": 5.4356947866363774e-05, "tps": 202956, "wall": 8634.5} {"step": 26740, "train_loss": 3.130321502685547, "lr": 5.4349451198233626e-05, "tps": 202842, "wall": 8639.7} {"step": 26741, "train_loss": 3.0835723876953125, "lr": 5.4341956406601804e-05, "tps": 202726, "wall": 8645.0} {"step": 26742, "train_loss": 3.0997188091278076, "lr": 5.43344634915533e-05, "tps": 202613, "wall": 8650.1} {"step": 26743, "train_loss": 3.1019675731658936, "lr": 5.432697245317294e-05, "tps": 202497, "wall": 8655.4} {"step": 26744, "train_loss": 3.098573684692383, "lr": 5.431948329154564e-05, "tps": 202386, "wall": 8660.5} {"step": 26745, "train_loss": 3.078134536743164, "lr": 5.431199600675616e-05, "tps": 202272, "wall": 8665.7} {"step": 26746, "train_loss": 2.98013973236084, "lr": 5.4304510598889335e-05, "tps": 202156, "wall": 8671.0} {"step": 26747, "train_loss": 3.1361687183380127, "lr": 5.429702706803001e-05, "tps": 202043, "wall": 8676.1} {"step": 26748, "train_loss": 2.9873838424682617, "lr": 5.428954541426294e-05, "tps": 201930, "wall": 8681.3} {"step": 26749, "train_loss": 3.079167127609253, "lr": 5.428206563767284e-05, "tps": 201816, "wall": 8686.5} {"step": 26750, "train_loss": 3.09132981300354, "lr": 5.427458773834446e-05, "tps": 201705, "wall": 8691.6} {"step": 26751, "train_loss": 3.0570108890533447, "lr": 5.426711171636255e-05, "tps": 201592, "wall": 8696.8} {"step": 26752, "train_loss": 3.1100072860717773, "lr": 5.4259637571811715e-05, "tps": 201476, "wall": 8702.2} {"step": 26753, "train_loss": 3.148995876312256, "lr": 5.425216530477671e-05, "tps": 201349, "wall": 8708.0} {"step": 26754, "train_loss": 3.2612075805664062, "lr": 5.4244694915342146e-05, "tps": 201228, "wall": 8713.5} {"step": 26755, "train_loss": 3.151446580886841, "lr": 5.42372264035926e-05, "tps": 201108, "wall": 8719.1} {"step": 26756, "train_loss": 3.052232027053833, "lr": 5.4229759769612775e-05, "tps": 200988, "wall": 8724.6} {"step": 26757, "train_loss": 3.0975146293640137, "lr": 5.422229501348719e-05, "tps": 200875, "wall": 8729.8} {"step": 26758, "train_loss": 3.0845351219177246, "lr": 5.421483213530038e-05, "tps": 200756, "wall": 8735.4} {"step": 26759, "train_loss": 3.141709804534912, "lr": 5.420737113513695e-05, "tps": 200642, "wall": 8740.6} {"step": 26760, "train_loss": 3.0910701751708984, "lr": 5.4199912013081355e-05, "tps": 200529, "wall": 8745.9} {"step": 26761, "train_loss": 3.172593593597412, "lr": 5.419245476921816e-05, "tps": 200413, "wall": 8751.3} {"step": 26762, "train_loss": 3.04145884513855, "lr": 5.418499940363182e-05, "tps": 200298, "wall": 8756.6} {"step": 26763, "train_loss": 3.117751359939575, "lr": 5.417754591640674e-05, "tps": 200185, "wall": 8761.9} {"step": 26764, "train_loss": 3.087432861328125, "lr": 5.417009430762742e-05, "tps": 200067, "wall": 8767.4} {"step": 26765, "train_loss": 3.07763671875, "lr": 5.416264457737823e-05, "tps": 199956, "wall": 8772.6} {"step": 26766, "train_loss": 3.1738815307617188, "lr": 5.415519672574355e-05, "tps": 199844, "wall": 8777.8} {"step": 26767, "train_loss": 3.1423697471618652, "lr": 5.414775075280782e-05, "tps": 199733, "wall": 8783.1} {"step": 26768, "train_loss": 3.0987114906311035, "lr": 5.4140306658655324e-05, "tps": 199624, "wall": 8788.2} {"step": 26769, "train_loss": 3.1983799934387207, "lr": 5.413286444337039e-05, "tps": 199514, "wall": 8793.3} {"step": 26770, "train_loss": 3.133754253387451, "lr": 5.412542410703736e-05, "tps": 199401, "wall": 8798.7} {"step": 26771, "train_loss": 2.9642868041992188, "lr": 5.4117985649740486e-05, "tps": 199284, "wall": 8804.1} {"step": 26772, "train_loss": 3.0341036319732666, "lr": 5.4110549071564056e-05, "tps": 199167, "wall": 8809.7} {"step": 26773, "train_loss": 3.1730856895446777, "lr": 5.410311437259229e-05, "tps": 199053, "wall": 8815.0} {"step": 26774, "train_loss": 3.035085916519165, "lr": 5.409568155290945e-05, "tps": 198938, "wall": 8820.4} {"step": 26775, "train_loss": 3.1323471069335938, "lr": 5.4088250612599644e-05, "tps": 198827, "wall": 8825.7} {"step": 26776, "train_loss": 3.0108070373535156, "lr": 5.4080821551747155e-05, "tps": 198717, "wall": 8830.9} {"step": 26777, "train_loss": 3.092461347579956, "lr": 5.407339437043608e-05, "tps": 198607, "wall": 8836.1} {"step": 26778, "train_loss": 3.104736089706421, "lr": 5.406596906875059e-05, "tps": 198496, "wall": 8841.4} {"step": 26779, "train_loss": 3.0043106079101562, "lr": 5.405854564677476e-05, "tps": 198381, "wall": 8846.9} {"step": 26780, "train_loss": 3.0342278480529785, "lr": 5.40511241045927e-05, "tps": 198270, "wall": 8852.2} {"step": 26781, "train_loss": 3.1813344955444336, "lr": 5.40437044422885e-05, "tps": 198155, "wall": 8857.6} {"step": 26782, "train_loss": 3.1039414405822754, "lr": 5.403628665994619e-05, "tps": 198043, "wall": 8863.0} {"step": 26783, "train_loss": 3.232046127319336, "lr": 5.402887075764979e-05, "tps": 197937, "wall": 8868.0} {"step": 26784, "train_loss": 3.1346373558044434, "lr": 5.4021456735483334e-05, "tps": 197829, "wall": 8873.2} {"step": 26785, "train_loss": 3.130378484725952, "lr": 5.401404459353081e-05, "tps": 197723, "wall": 8878.3} {"step": 26786, "train_loss": 2.966508388519287, "lr": 5.400663433187611e-05, "tps": 197616, "wall": 8883.4} {"step": 26787, "train_loss": 3.1684200763702393, "lr": 5.3999225950603296e-05, "tps": 197510, "wall": 8888.5} {"step": 26788, "train_loss": 3.1243090629577637, "lr": 5.399181944979623e-05, "tps": 197405, "wall": 8893.6} {"step": 26789, "train_loss": 3.169497489929199, "lr": 5.398441482953878e-05, "tps": 197301, "wall": 8898.6} {"step": 26790, "train_loss": 3.0595932006835938, "lr": 5.397701208991488e-05, "tps": 197197, "wall": 8903.7} {"step": 26791, "train_loss": 3.134718418121338, "lr": 5.396961123100838e-05, "tps": 197092, "wall": 8908.7} {"step": 26792, "train_loss": 3.112525463104248, "lr": 5.3962212252903055e-05, "tps": 196988, "wall": 8913.7} {"step": 26793, "train_loss": 3.0623955726623535, "lr": 5.395481515568283e-05, "tps": 196884, "wall": 8918.8} {"step": 26794, "train_loss": 3.1421260833740234, "lr": 5.3947419939431445e-05, "tps": 196780, "wall": 8923.8} {"step": 26795, "train_loss": 3.188063859939575, "lr": 5.394002660423262e-05, "tps": 196676, "wall": 8928.9} {"step": 26796, "train_loss": 3.0666446685791016, "lr": 5.393263515017019e-05, "tps": 196572, "wall": 8933.9} {"step": 26797, "train_loss": 3.0896825790405273, "lr": 5.3925245577327824e-05, "tps": 196468, "wall": 8939.0} {"step": 26798, "train_loss": 2.997537136077881, "lr": 5.39178578857893e-05, "tps": 196362, "wall": 8944.2} {"step": 26799, "train_loss": 3.062347650527954, "lr": 5.391047207563824e-05, "tps": 196256, "wall": 8949.3} {"step": 26800, "train_loss": 3.021373987197876, "lr": 5.3903088146958335e-05, "tps": 196148, "wall": 8954.6} {"step": 26801, "train_loss": 3.0622448921203613, "lr": 5.389570609983325e-05, "tps": 196039, "wall": 8959.9} {"step": 26802, "train_loss": 3.1546831130981445, "lr": 5.388832593434662e-05, "tps": 195926, "wall": 8965.4} {"step": 26803, "train_loss": 3.041215419769287, "lr": 5.388094765058196e-05, "tps": 195819, "wall": 8970.6} {"step": 26804, "train_loss": 3.130514144897461, "lr": 5.3873571248622946e-05, "tps": 195704, "wall": 8976.2} {"step": 26805, "train_loss": 3.0843892097473145, "lr": 5.386619672855311e-05, "tps": 195595, "wall": 8981.6} {"step": 26806, "train_loss": 3.12850284576416, "lr": 5.385882409045594e-05, "tps": 195489, "wall": 8986.8} {"step": 26807, "train_loss": 3.1322989463806152, "lr": 5.385145333441505e-05, "tps": 195384, "wall": 8992.0} {"step": 26808, "train_loss": 3.019897937774658, "lr": 5.3844084460513875e-05, "tps": 195281, "wall": 8997.0} {"step": 26809, "train_loss": 3.117772102355957, "lr": 5.383671746883586e-05, "tps": 195177, "wall": 9002.2} {"step": 26810, "train_loss": 3.062458038330078, "lr": 5.382935235946454e-05, "tps": 195073, "wall": 9007.3} {"step": 26811, "train_loss": 3.242617130279541, "lr": 5.3821989132483316e-05, "tps": 194971, "wall": 9012.4} {"step": 26812, "train_loss": 3.1308069229125977, "lr": 5.3814627787975545e-05, "tps": 194869, "wall": 9017.4} {"step": 26813, "train_loss": 3.0379176139831543, "lr": 5.3807268326024704e-05, "tps": 194768, "wall": 9022.4} {"step": 26814, "train_loss": 3.0154929161071777, "lr": 5.3799910746714086e-05, "tps": 194666, "wall": 9027.5} {"step": 26815, "train_loss": 3.1329989433288574, "lr": 5.379255505012709e-05, "tps": 194565, "wall": 9032.5} {"step": 26816, "train_loss": 3.160694122314453, "lr": 5.378520123634702e-05, "tps": 194463, "wall": 9037.6} {"step": 26817, "train_loss": 3.186504364013672, "lr": 5.377784930545715e-05, "tps": 194360, "wall": 9042.7} {"step": 26818, "train_loss": 3.204636335372925, "lr": 5.377049925754084e-05, "tps": 194260, "wall": 9047.7} {"step": 26819, "train_loss": 3.0593600273132324, "lr": 5.376315109268131e-05, "tps": 194156, "wall": 9052.9} {"step": 26820, "train_loss": 3.1880974769592285, "lr": 5.375580481096176e-05, "tps": 194046, "wall": 9058.4} {"step": 26821, "train_loss": 3.155536413192749, "lr": 5.374846041246547e-05, "tps": 193945, "wall": 9063.4} {"step": 26822, "train_loss": 3.077646255493164, "lr": 5.3741117897275614e-05, "tps": 193838, "wall": 9068.7} {"step": 26823, "train_loss": 3.084465265274048, "lr": 5.3733777265475346e-05, "tps": 193735, "wall": 9073.9} {"step": 26824, "train_loss": 3.0661025047302246, "lr": 5.3726438517147894e-05, "tps": 193632, "wall": 9079.1} {"step": 26825, "train_loss": 3.052388906478882, "lr": 5.3719101652376314e-05, "tps": 193530, "wall": 9084.2} {"step": 26826, "train_loss": 3.145781993865967, "lr": 5.371176667124371e-05, "tps": 193429, "wall": 9089.3} {"step": 26827, "train_loss": 3.040736436843872, "lr": 5.370443357383327e-05, "tps": 193329, "wall": 9094.3} {"step": 26828, "train_loss": 2.9586780071258545, "lr": 5.369710236022798e-05, "tps": 193229, "wall": 9099.4} {"step": 26829, "train_loss": 3.0930228233337402, "lr": 5.368977303051088e-05, "tps": 193128, "wall": 9104.5} {"step": 26830, "train_loss": 3.113043785095215, "lr": 5.3682445584765075e-05, "tps": 193028, "wall": 9109.5} {"step": 26831, "train_loss": 2.97737455368042, "lr": 5.367512002307351e-05, "tps": 192927, "wall": 9114.6} {"step": 26832, "train_loss": 3.105564832687378, "lr": 5.366779634551916e-05, "tps": 192826, "wall": 9119.7} {"step": 26833, "train_loss": 3.1908836364746094, "lr": 5.3660474552185035e-05, "tps": 192726, "wall": 9124.8} {"step": 26834, "train_loss": 3.1440751552581787, "lr": 5.3653154643154025e-05, "tps": 192625, "wall": 9129.9} {"step": 26835, "train_loss": 3.145817756652832, "lr": 5.3645836618509115e-05, "tps": 192526, "wall": 9135.0} {"step": 26836, "train_loss": 3.1804208755493164, "lr": 5.363852047833315e-05, "tps": 192427, "wall": 9140.0} {"step": 26837, "train_loss": 3.0546822547912598, "lr": 5.363120622270903e-05, "tps": 192329, "wall": 9145.0} {"step": 26838, "train_loss": 3.180136203765869, "lr": 5.362389385171961e-05, "tps": 192229, "wall": 9150.1} {"step": 26839, "train_loss": 3.0472640991210938, "lr": 5.361658336544773e-05, "tps": 192130, "wall": 9155.2} {"step": 26840, "train_loss": 3.039619207382202, "lr": 5.3609274763976146e-05, "tps": 192032, "wall": 9160.2} {"step": 26841, "train_loss": 3.1500589847564697, "lr": 5.360196804738775e-05, "tps": 191933, "wall": 9165.3} {"step": 26842, "train_loss": 3.1771013736724854, "lr": 5.359466321576524e-05, "tps": 191834, "wall": 9170.3} {"step": 26843, "train_loss": 3.0871644020080566, "lr": 5.3587360269191386e-05, "tps": 191736, "wall": 9175.3} {"step": 26844, "train_loss": 3.052194833755493, "lr": 5.3580059207748925e-05, "tps": 191636, "wall": 9180.5} {"step": 26845, "train_loss": 3.173586845397949, "lr": 5.357276003152056e-05, "tps": 191534, "wall": 9185.7} {"step": 26846, "train_loss": 3.1860663890838623, "lr": 5.356546274058897e-05, "tps": 191435, "wall": 9190.8} {"step": 26847, "train_loss": 3.106414318084717, "lr": 5.355816733503682e-05, "tps": 191337, "wall": 9195.9} {"step": 26848, "train_loss": 3.105569362640381, "lr": 5.3550873814946765e-05, "tps": 191239, "wall": 9200.9} {"step": 26849, "train_loss": 3.0407049655914307, "lr": 5.3543582180401386e-05, "tps": 191141, "wall": 9206.0} {"step": 26850, "train_loss": 3.078277111053467, "lr": 5.353629243148335e-05, "tps": 191043, "wall": 9211.0} {"step": 26851, "train_loss": 3.140911102294922, "lr": 5.352900456827516e-05, "tps": 190946, "wall": 9216.0} {"step": 26852, "train_loss": 3.079150438308716, "lr": 5.352171859085945e-05, "tps": 190848, "wall": 9221.1} {"step": 26853, "train_loss": 3.1232147216796875, "lr": 5.351443449931871e-05, "tps": 190749, "wall": 9226.3} {"step": 26854, "train_loss": 3.0405712127685547, "lr": 5.350715229373543e-05, "tps": 190646, "wall": 9231.6} {"step": 26855, "train_loss": 3.1672706604003906, "lr": 5.349987197419218e-05, "tps": 190538, "wall": 9237.2} {"step": 26856, "train_loss": 3.2083024978637695, "lr": 5.349259354077137e-05, "tps": 190437, "wall": 9242.4} {"step": 26857, "train_loss": 2.9804511070251465, "lr": 5.348531699355544e-05, "tps": 190336, "wall": 9247.6} {"step": 26858, "train_loss": 3.027287483215332, "lr": 5.34780423326269e-05, "tps": 190238, "wall": 9252.7} {"step": 26859, "train_loss": 3.1734414100646973, "lr": 5.347076955806809e-05, "tps": 190141, "wall": 9257.8} {"step": 26860, "train_loss": 3.0122995376586914, "lr": 5.3463498669961376e-05, "tps": 190043, "wall": 9263.0} {"step": 26861, "train_loss": 3.1670913696289062, "lr": 5.345622966838919e-05, "tps": 189944, "wall": 9268.1} {"step": 26862, "train_loss": 3.0962955951690674, "lr": 5.344896255343386e-05, "tps": 189845, "wall": 9273.3} {"step": 26863, "train_loss": 3.117410182952881, "lr": 5.3441697325177655e-05, "tps": 189747, "wall": 9278.4} {"step": 26864, "train_loss": 3.106424331665039, "lr": 5.3434433983702935e-05, "tps": 189649, "wall": 9283.6} {"step": 26865, "train_loss": 3.0701792240142822, "lr": 5.3427172529091954e-05, "tps": 189551, "wall": 9288.7} {"step": 26866, "train_loss": 3.0285162925720215, "lr": 5.341991296142697e-05, "tps": 189453, "wall": 9293.8} {"step": 26867, "train_loss": 3.0544114112854004, "lr": 5.3412655280790224e-05, "tps": 189357, "wall": 9298.9} {"step": 26868, "train_loss": 3.1481921672821045, "lr": 5.340539948726391e-05, "tps": 189258, "wall": 9304.1} {"step": 26869, "train_loss": 3.0318117141723633, "lr": 5.339814558093028e-05, "tps": 189161, "wall": 9309.2} {"step": 26870, "train_loss": 3.091123104095459, "lr": 5.339089356187147e-05, "tps": 189065, "wall": 9314.3} {"step": 26871, "train_loss": 3.093416929244995, "lr": 5.338364343016959e-05, "tps": 188968, "wall": 9319.5} {"step": 26872, "train_loss": 3.0146753787994385, "lr": 5.3376395185906845e-05, "tps": 188871, "wall": 9324.6} {"step": 26873, "train_loss": 3.0443129539489746, "lr": 5.3369148829165304e-05, "tps": 188775, "wall": 9329.7} {"step": 26874, "train_loss": 3.039757490158081, "lr": 5.336190436002705e-05, "tps": 188679, "wall": 9334.8} {"step": 26875, "train_loss": 3.1662089824676514, "lr": 5.335466177857418e-05, "tps": 188581, "wall": 9339.9} {"step": 26876, "train_loss": 3.046009063720703, "lr": 5.3347421084888715e-05, "tps": 188485, "wall": 9345.1} {"step": 26877, "train_loss": 3.1728475093841553, "lr": 5.3340182279052645e-05, "tps": 188387, "wall": 9350.3} {"step": 26878, "train_loss": 3.151693820953369, "lr": 5.333294536114804e-05, "tps": 188291, "wall": 9355.4} {"step": 26879, "train_loss": 3.1043612957000732, "lr": 5.332571033125684e-05, "tps": 188195, "wall": 9360.5} {"step": 26880, "train_loss": 3.123880624771118, "lr": 5.3318477189460994e-05, "tps": 188098, "wall": 9365.7} {"step": 26881, "train_loss": 3.2374536991119385, "lr": 5.331124593584247e-05, "tps": 188003, "wall": 9370.8} {"step": 26882, "train_loss": 3.064321517944336, "lr": 5.330401657048318e-05, "tps": 187908, "wall": 9375.8} {"step": 26883, "train_loss": 3.1192331314086914, "lr": 5.3296789093464974e-05, "tps": 187814, "wall": 9380.9} {"step": 26884, "train_loss": 3.115298271179199, "lr": 5.32895635048698e-05, "tps": 187720, "wall": 9386.0} {"step": 26885, "train_loss": 3.266413927078247, "lr": 5.328233980477946e-05, "tps": 187625, "wall": 9391.0} {"step": 26886, "train_loss": 3.071998357772827, "lr": 5.327511799327577e-05, "tps": 187530, "wall": 9396.1} {"step": 26887, "train_loss": 3.1238207817077637, "lr": 5.326789807044058e-05, "tps": 187435, "wall": 9401.3} {"step": 26888, "train_loss": 3.1800193786621094, "lr": 5.3260680036355645e-05, "tps": 187340, "wall": 9406.4} {"step": 26889, "train_loss": 3.1143810749053955, "lr": 5.325346389110277e-05, "tps": 187246, "wall": 9411.4} {"step": 26890, "train_loss": 3.0932183265686035, "lr": 5.324624963476368e-05, "tps": 187152, "wall": 9416.5} {"step": 26891, "train_loss": 2.9950196743011475, "lr": 5.32390372674201e-05, "tps": 187059, "wall": 9421.6} {"step": 26892, "train_loss": 3.1366348266601562, "lr": 5.3231826789153714e-05, "tps": 186963, "wall": 9426.8} {"step": 26893, "train_loss": 3.1174116134643555, "lr": 5.3224618200046185e-05, "tps": 186862, "wall": 9432.2} {"step": 26894, "train_loss": 3.158076047897339, "lr": 5.321741150017925e-05, "tps": 186766, "wall": 9437.4} {"step": 26895, "train_loss": 3.1236472129821777, "lr": 5.321020668963448e-05, "tps": 186662, "wall": 9443.0} {"step": 26896, "train_loss": 3.246959924697876, "lr": 5.320300376849351e-05, "tps": 186569, "wall": 9448.1} {"step": 26897, "train_loss": 3.1362433433532715, "lr": 5.319580273683794e-05, "tps": 186476, "wall": 9453.1} {"step": 26898, "train_loss": 3.041635513305664, "lr": 5.318860359474935e-05, "tps": 186382, "wall": 9458.3} {"step": 26899, "train_loss": 3.1886465549468994, "lr": 5.3181406342309245e-05, "tps": 186288, "wall": 9463.4} {"step": 26900, "train_loss": 3.13546085357666, "lr": 5.3174210979599225e-05, "tps": 186194, "wall": 9468.5} {"step": 26901, "train_loss": 3.0207576751708984, "lr": 5.316701750670079e-05, "tps": 186101, "wall": 9473.6} {"step": 26902, "train_loss": 3.0940604209899902, "lr": 5.315982592369536e-05, "tps": 186006, "wall": 9478.8} {"step": 26903, "train_loss": 3.1895041465759277, "lr": 5.315263623066449e-05, "tps": 185912, "wall": 9483.9} {"step": 26904, "train_loss": 3.0822103023529053, "lr": 5.3145448427689574e-05, "tps": 185817, "wall": 9489.1} {"step": 26905, "train_loss": 3.090175151824951, "lr": 5.3138262514852e-05, "tps": 185725, "wall": 9494.2} {"step": 26906, "train_loss": 3.036423921585083, "lr": 5.3131078492233265e-05, "tps": 185632, "wall": 9499.3} {"step": 26907, "train_loss": 3.0986227989196777, "lr": 5.3123896359914705e-05, "tps": 185539, "wall": 9504.4} {"step": 26908, "train_loss": 3.1004137992858887, "lr": 5.311671611797762e-05, "tps": 185446, "wall": 9509.5} {"step": 26909, "train_loss": 3.1902287006378174, "lr": 5.310953776650345e-05, "tps": 185353, "wall": 9514.6} {"step": 26910, "train_loss": 3.0882890224456787, "lr": 5.3102361305573426e-05, "tps": 185261, "wall": 9519.7} {"step": 26911, "train_loss": 3.0335943698883057, "lr": 5.309518673526891e-05, "tps": 185168, "wall": 9524.9} {"step": 26912, "train_loss": 3.097090482711792, "lr": 5.308801405567116e-05, "tps": 185076, "wall": 9529.9} {"step": 26913, "train_loss": 3.211549997329712, "lr": 5.308084326686138e-05, "tps": 184984, "wall": 9535.0} {"step": 26914, "train_loss": 3.062445878982544, "lr": 5.307367436892088e-05, "tps": 184893, "wall": 9540.1} {"step": 26915, "train_loss": 3.118818759918213, "lr": 5.306650736193082e-05, "tps": 184801, "wall": 9545.2} {"step": 26916, "train_loss": 3.0501277446746826, "lr": 5.305934224597237e-05, "tps": 184710, "wall": 9550.2} {"step": 26917, "train_loss": 3.056056022644043, "lr": 5.3052179021126746e-05, "tps": 184620, "wall": 9555.3} {"step": 26918, "train_loss": 3.065732955932617, "lr": 5.3045017687475065e-05, "tps": 184525, "wall": 9560.5} {"step": 26919, "train_loss": 2.9917197227478027, "lr": 5.303785824509842e-05, "tps": 184432, "wall": 9565.7} {"step": 26920, "train_loss": 3.095648765563965, "lr": 5.3030700694077994e-05, "tps": 184335, "wall": 9571.1} {"step": 26921, "train_loss": 3.099748134613037, "lr": 5.30235450344948e-05, "tps": 184245, "wall": 9576.2} {"step": 26922, "train_loss": 3.122163772583008, "lr": 5.301639126642992e-05, "tps": 184155, "wall": 9581.2} {"step": 26923, "train_loss": 3.066976547241211, "lr": 5.30092393899644e-05, "tps": 184067, "wall": 9586.1} {"step": 26924, "train_loss": 3.0446629524230957, "lr": 5.3002089405179276e-05, "tps": 183979, "wall": 9591.1} {"step": 26925, "train_loss": 2.9925553798675537, "lr": 5.2994941312155475e-05, "tps": 183890, "wall": 9596.0} {"step": 26926, "train_loss": 3.0262253284454346, "lr": 5.2987795110974056e-05, "tps": 183802, "wall": 9601.0} {"step": 26927, "train_loss": 3.061426877975464, "lr": 5.29806508017159e-05, "tps": 183712, "wall": 9606.1} {"step": 26928, "train_loss": 3.082648754119873, "lr": 5.2973508384461965e-05, "tps": 183624, "wall": 9611.0} {"step": 26929, "train_loss": 3.1430234909057617, "lr": 5.2966367859293185e-05, "tps": 183537, "wall": 9615.9} {"step": 26930, "train_loss": 3.160454273223877, "lr": 5.295922922629037e-05, "tps": 183450, "wall": 9620.9} {"step": 26931, "train_loss": 3.067046642303467, "lr": 5.295209248553452e-05, "tps": 183362, "wall": 9625.8} {"step": 26932, "train_loss": 3.0604987144470215, "lr": 5.294495763710636e-05, "tps": 183275, "wall": 9630.8} {"step": 26933, "train_loss": 3.0854732990264893, "lr": 5.2937824681086764e-05, "tps": 183188, "wall": 9635.7} {"step": 26934, "train_loss": 3.2064740657806396, "lr": 5.2930693617556535e-05, "tps": 183100, "wall": 9640.6} {"step": 26935, "train_loss": 3.1286449432373047, "lr": 5.292356444659645e-05, "tps": 183012, "wall": 9645.7} {"step": 26936, "train_loss": 3.061228036880493, "lr": 5.2916437168287234e-05, "tps": 182926, "wall": 9650.6} {"step": 26937, "train_loss": 3.1560277938842773, "lr": 5.2909311782709714e-05, "tps": 182839, "wall": 9655.5} {"step": 26938, "train_loss": 3.1190590858459473, "lr": 5.290218828994451e-05, "tps": 182752, "wall": 9660.4} {"step": 26939, "train_loss": 3.1484134197235107, "lr": 5.2895066690072356e-05, "tps": 182665, "wall": 9665.4} {"step": 26940, "train_loss": 3.1218626499176025, "lr": 5.288794698317394e-05, "tps": 182578, "wall": 9670.4} {"step": 26941, "train_loss": 3.010918617248535, "lr": 5.2880829169329905e-05, "tps": 182492, "wall": 9675.3} {"step": 26942, "train_loss": 3.0753207206726074, "lr": 5.287371324862085e-05, "tps": 182406, "wall": 9680.2} {"step": 26943, "train_loss": 3.0799403190612793, "lr": 5.286659922112744e-05, "tps": 182320, "wall": 9685.1} {"step": 26944, "train_loss": 3.046156406402588, "lr": 5.285948708693025e-05, "tps": 182234, "wall": 9690.1} {"step": 26945, "train_loss": 3.042497158050537, "lr": 5.2852376846109786e-05, "tps": 182148, "wall": 9695.0} {"step": 26946, "train_loss": 3.068143367767334, "lr": 5.284526849874666e-05, "tps": 182060, "wall": 9700.1} {"step": 26947, "train_loss": 3.027806282043457, "lr": 5.283816204492136e-05, "tps": 181970, "wall": 9705.2} {"step": 26948, "train_loss": 3.1341609954833984, "lr": 5.283105748471444e-05, "tps": 181881, "wall": 9710.3} {"step": 26949, "train_loss": 3.0830183029174805, "lr": 5.2823954818206344e-05, "tps": 181793, "wall": 9715.4} {"step": 26950, "train_loss": 3.144055128097534, "lr": 5.281685404547749e-05, "tps": 181707, "wall": 9720.3} {"step": 26951, "train_loss": 3.0576205253601074, "lr": 5.28097551666084e-05, "tps": 181620, "wall": 9725.4} {"step": 26952, "train_loss": 3.1218132972717285, "lr": 5.280265818167944e-05, "tps": 181534, "wall": 9730.3} {"step": 26953, "train_loss": 2.9904351234436035, "lr": 5.279556309077096e-05, "tps": 181448, "wall": 9735.3} {"step": 26954, "train_loss": 3.092054605484009, "lr": 5.2788469893963444e-05, "tps": 181361, "wall": 9740.3} {"step": 26955, "train_loss": 3.0379343032836914, "lr": 5.27813785913372e-05, "tps": 181276, "wall": 9745.3} {"step": 26956, "train_loss": 3.087944507598877, "lr": 5.2774289182972504e-05, "tps": 181190, "wall": 9750.3} {"step": 26957, "train_loss": 3.0627894401550293, "lr": 5.2767201668949726e-05, "tps": 181104, "wall": 9755.2} {"step": 26958, "train_loss": 3.1142265796661377, "lr": 5.276011604934914e-05, "tps": 181018, "wall": 9760.2} {"step": 26959, "train_loss": 3.0648727416992188, "lr": 5.275303232425097e-05, "tps": 180932, "wall": 9765.3} {"step": 26960, "train_loss": 3.131004571914673, "lr": 5.274595049373554e-05, "tps": 180846, "wall": 9770.3} {"step": 26961, "train_loss": 3.1095166206359863, "lr": 5.2738870557883027e-05, "tps": 180761, "wall": 9775.2} {"step": 26962, "train_loss": 3.209930181503296, "lr": 5.273179251677363e-05, "tps": 180675, "wall": 9780.2} {"step": 26963, "train_loss": 3.0359840393066406, "lr": 5.2724716370487526e-05, "tps": 180589, "wall": 9785.3} {"step": 26964, "train_loss": 3.101301670074463, "lr": 5.2717642119104874e-05, "tps": 180502, "wall": 9790.3} {"step": 26965, "train_loss": 3.0672717094421387, "lr": 5.2710569762705855e-05, "tps": 180417, "wall": 9795.3} {"step": 26966, "train_loss": 3.121481418609619, "lr": 5.270349930137054e-05, "tps": 180325, "wall": 9800.7} {"step": 26967, "train_loss": 3.130310297012329, "lr": 5.2696430735179016e-05, "tps": 180239, "wall": 9805.7} {"step": 26968, "train_loss": 2.986035108566284, "lr": 5.26893640642114e-05, "tps": 180156, "wall": 9810.6} {"step": 26969, "train_loss": 3.0880932807922363, "lr": 5.268229928854772e-05, "tps": 180072, "wall": 9815.5} {"step": 26970, "train_loss": 3.0149025917053223, "lr": 5.267523640826797e-05, "tps": 179987, "wall": 9820.5} {"step": 26971, "train_loss": 3.170731544494629, "lr": 5.266817542345225e-05, "tps": 179904, "wall": 9825.4} {"step": 26972, "train_loss": 3.031885862350464, "lr": 5.266111633418047e-05, "tps": 179820, "wall": 9830.4} {"step": 26973, "train_loss": 3.2158305644989014, "lr": 5.265405914053259e-05, "tps": 179736, "wall": 9835.3} {"step": 26974, "train_loss": 3.118694305419922, "lr": 5.264700384258859e-05, "tps": 179653, "wall": 9840.2} {"step": 26975, "train_loss": 3.1008691787719727, "lr": 5.263995044042841e-05, "tps": 179568, "wall": 9845.3} {"step": 26976, "train_loss": 3.1070432662963867, "lr": 5.2632898934131905e-05, "tps": 179485, "wall": 9850.2} {"step": 26977, "train_loss": 3.036670684814453, "lr": 5.262584932377899e-05, "tps": 179402, "wall": 9855.1} {"step": 26978, "train_loss": 3.179859161376953, "lr": 5.26188016094495e-05, "tps": 179319, "wall": 9860.0} {"step": 26979, "train_loss": 3.0407729148864746, "lr": 5.261175579122326e-05, "tps": 179237, "wall": 9864.9} {"step": 26980, "train_loss": 3.128732681274414, "lr": 5.2604711869180126e-05, "tps": 179154, "wall": 9869.8} {"step": 26981, "train_loss": 3.061480760574341, "lr": 5.259766984339989e-05, "tps": 179071, "wall": 9874.8} {"step": 26982, "train_loss": 3.1401541233062744, "lr": 5.259062971396227e-05, "tps": 178989, "wall": 9879.7} {"step": 26983, "train_loss": 3.0781521797180176, "lr": 5.2583591480947094e-05, "tps": 178906, "wall": 9884.6} {"step": 26984, "train_loss": 3.060896873474121, "lr": 5.257655514443398e-05, "tps": 178823, "wall": 9889.6} {"step": 26985, "train_loss": 3.023159980773926, "lr": 5.2569520704502774e-05, "tps": 178740, "wall": 9894.5} {"step": 26986, "train_loss": 3.157618999481201, "lr": 5.256248816123308e-05, "tps": 178658, "wall": 9899.4} {"step": 26987, "train_loss": 3.149416923522949, "lr": 5.255545751470456e-05, "tps": 178575, "wall": 9904.4} {"step": 26988, "train_loss": 3.18564772605896, "lr": 5.25484287649969e-05, "tps": 178493, "wall": 9909.4} {"step": 26989, "train_loss": 3.158339262008667, "lr": 5.2541401912189704e-05, "tps": 178410, "wall": 9914.3} {"step": 26990, "train_loss": 3.029574394226074, "lr": 5.253437695636253e-05, "tps": 178328, "wall": 9919.2} {"step": 26991, "train_loss": 3.1308279037475586, "lr": 5.252735389759502e-05, "tps": 178246, "wall": 9924.2} {"step": 26992, "train_loss": 3.0444679260253906, "lr": 5.2520332735966714e-05, "tps": 178164, "wall": 9929.1} {"step": 26993, "train_loss": 3.1303303241729736, "lr": 5.25133134715571e-05, "tps": 178081, "wall": 9934.1} {"step": 26994, "train_loss": 3.0671544075012207, "lr": 5.250629610444576e-05, "tps": 177999, "wall": 9939.0} {"step": 26995, "train_loss": 3.051252841949463, "lr": 5.2499280634712165e-05, "tps": 177917, "wall": 9944.0} {"step": 26996, "train_loss": 3.167360305786133, "lr": 5.249226706243575e-05, "tps": 177836, "wall": 9948.9} {"step": 26997, "train_loss": 3.0311968326568604, "lr": 5.2485255387696034e-05, "tps": 177755, "wall": 9953.8} {"step": 26998, "train_loss": 3.2034449577331543, "lr": 5.2478245610572395e-05, "tps": 177673, "wall": 9958.7} {"step": 26999, "train_loss": 3.1177072525024414, "lr": 5.247123773114422e-05, "tps": 177592, "wall": 9963.7} {"step": 27000, "train_loss": 3.127882957458496, "lr": 5.246423174949097e-05, "tps": 177510, "wall": 9968.7, "val_loss_monitor": 3.326191087096106} {"step": 27001, "train_loss": 3.022836923599243, "lr": 5.245722766569193e-05, "tps": 176568, "wall": 10022.2} {"step": 27002, "train_loss": 3.0431454181671143, "lr": 5.2450225479826495e-05, "tps": 176484, "wall": 10027.4} {"step": 27003, "train_loss": 3.0007729530334473, "lr": 5.2443225191974e-05, "tps": 176399, "wall": 10032.5} {"step": 27004, "train_loss": 3.109316825866699, "lr": 5.243622680221367e-05, "tps": 176316, "wall": 10037.6} {"step": 27005, "train_loss": 3.0389842987060547, "lr": 5.242923031062487e-05, "tps": 176234, "wall": 10042.7} {"step": 27006, "train_loss": 3.198599100112915, "lr": 5.2422235717286795e-05, "tps": 176153, "wall": 10047.7} {"step": 27007, "train_loss": 3.193061351776123, "lr": 5.241524302227866e-05, "tps": 176071, "wall": 10052.7} {"step": 27008, "train_loss": 3.1342062950134277, "lr": 5.240825222567978e-05, "tps": 175989, "wall": 10057.8} {"step": 27009, "train_loss": 3.126300573348999, "lr": 5.240126332756926e-05, "tps": 175908, "wall": 10062.8} {"step": 27010, "train_loss": 3.004380226135254, "lr": 5.2394276328026284e-05, "tps": 175824, "wall": 10068.0} {"step": 27011, "train_loss": 3.1425633430480957, "lr": 5.238729122713003e-05, "tps": 175742, "wall": 10073.0} {"step": 27012, "train_loss": 2.9187734127044678, "lr": 5.2380308024959614e-05, "tps": 175661, "wall": 10078.0} {"step": 27013, "train_loss": 3.0928337574005127, "lr": 5.237332672159411e-05, "tps": 175581, "wall": 10083.0} {"step": 27014, "train_loss": 3.0821444988250732, "lr": 5.236634731711265e-05, "tps": 175500, "wall": 10088.0} {"step": 27015, "train_loss": 3.041710376739502, "lr": 5.235936981159428e-05, "tps": 175419, "wall": 10093.1} {"step": 27016, "train_loss": 3.0241036415100098, "lr": 5.2352394205118014e-05, "tps": 175337, "wall": 10098.1} {"step": 27017, "train_loss": 3.0470736026763916, "lr": 5.234542049776293e-05, "tps": 175252, "wall": 10103.4} {"step": 27018, "train_loss": 3.0305376052856445, "lr": 5.233844868960794e-05, "tps": 175171, "wall": 10108.5} {"step": 27019, "train_loss": 3.118306875228882, "lr": 5.233147878073213e-05, "tps": 175091, "wall": 10113.5} {"step": 27020, "train_loss": 3.115532159805298, "lr": 5.232451077121439e-05, "tps": 175012, "wall": 10118.4} {"step": 27021, "train_loss": 3.2529404163360596, "lr": 5.231754466113361e-05, "tps": 174932, "wall": 10123.4} {"step": 27022, "train_loss": 3.1149144172668457, "lr": 5.231058045056883e-05, "tps": 174853, "wall": 10128.3} {"step": 27023, "train_loss": 3.2362613677978516, "lr": 5.230361813959883e-05, "tps": 174775, "wall": 10133.3} {"step": 27024, "train_loss": 3.1136045455932617, "lr": 5.22966577283025e-05, "tps": 174696, "wall": 10138.2} {"step": 27025, "train_loss": 3.120161533355713, "lr": 5.2289699216758725e-05, "tps": 174618, "wall": 10143.1} {"step": 27026, "train_loss": 3.164907932281494, "lr": 5.228274260504633e-05, "tps": 174537, "wall": 10148.2} {"step": 27027, "train_loss": 3.0469884872436523, "lr": 5.227578789324405e-05, "tps": 174454, "wall": 10153.4} {"step": 27028, "train_loss": 3.0793089866638184, "lr": 5.2268835081430765e-05, "tps": 174370, "wall": 10158.6} {"step": 27029, "train_loss": 3.1028895378112793, "lr": 5.226188416968518e-05, "tps": 174287, "wall": 10163.9} {"step": 27030, "train_loss": 3.07340407371521, "lr": 5.225493515808602e-05, "tps": 174205, "wall": 10169.1} {"step": 27031, "train_loss": 3.076385736465454, "lr": 5.224798804671205e-05, "tps": 174122, "wall": 10174.3} {"step": 27032, "train_loss": 3.2180652618408203, "lr": 5.224104283564195e-05, "tps": 174039, "wall": 10179.5} {"step": 27033, "train_loss": 3.1040399074554443, "lr": 5.2234099524954374e-05, "tps": 173955, "wall": 10184.8} {"step": 27034, "train_loss": 3.0276405811309814, "lr": 5.2227158114728e-05, "tps": 173876, "wall": 10189.8} {"step": 27035, "train_loss": 3.105678081512451, "lr": 5.222021860504147e-05, "tps": 173793, "wall": 10195.1} {"step": 27036, "train_loss": 3.1330432891845703, "lr": 5.2213280995973366e-05, "tps": 173710, "wall": 10200.3} {"step": 27037, "train_loss": 3.004931926727295, "lr": 5.22063452876023e-05, "tps": 173627, "wall": 10205.5} {"step": 27038, "train_loss": 3.109564781188965, "lr": 5.219941148000681e-05, "tps": 173545, "wall": 10210.7} {"step": 27039, "train_loss": 3.0759634971618652, "lr": 5.2192479573265496e-05, "tps": 173462, "wall": 10216.0} {"step": 27040, "train_loss": 3.0606398582458496, "lr": 5.218554956745684e-05, "tps": 173379, "wall": 10221.2} {"step": 27041, "train_loss": 3.1003220081329346, "lr": 5.2178621462659336e-05, "tps": 173302, "wall": 10226.2} {"step": 27042, "train_loss": 3.025275707244873, "lr": 5.217169525895154e-05, "tps": 173225, "wall": 10231.1} {"step": 27043, "train_loss": 3.108220338821411, "lr": 5.2164770956411827e-05, "tps": 173148, "wall": 10236.0} {"step": 27044, "train_loss": 3.0121333599090576, "lr": 5.2157848555118636e-05, "tps": 173067, "wall": 10241.2} {"step": 27045, "train_loss": 3.1120622158050537, "lr": 5.215092805515047e-05, "tps": 172983, "wall": 10246.6} {"step": 27046, "train_loss": 3.118255138397217, "lr": 5.214400945658566e-05, "tps": 172900, "wall": 10251.8} {"step": 27047, "train_loss": 3.054849147796631, "lr": 5.213709275950256e-05, "tps": 172818, "wall": 10257.1} {"step": 27048, "train_loss": 3.092973232269287, "lr": 5.213017796397959e-05, "tps": 172737, "wall": 10262.3} {"step": 27049, "train_loss": 3.11915922164917, "lr": 5.212326507009504e-05, "tps": 172654, "wall": 10267.6} {"step": 27050, "train_loss": 3.034071445465088, "lr": 5.2116354077927196e-05, "tps": 172572, "wall": 10272.9} {"step": 27051, "train_loss": 3.20234751701355, "lr": 5.21094449875544e-05, "tps": 172489, "wall": 10278.2} {"step": 27052, "train_loss": 3.0887739658355713, "lr": 5.210253779905492e-05, "tps": 172405, "wall": 10283.6} {"step": 27053, "train_loss": 3.054351806640625, "lr": 5.209563251250692e-05, "tps": 172321, "wall": 10289.0} {"step": 27054, "train_loss": 3.139756917953491, "lr": 5.20887291279887e-05, "tps": 172239, "wall": 10294.2} {"step": 27055, "train_loss": 3.1093671321868896, "lr": 5.208182764557844e-05, "tps": 172149, "wall": 10300.0} {"step": 27056, "train_loss": 3.141995906829834, "lr": 5.207492806535433e-05, "tps": 172065, "wall": 10305.4} {"step": 27057, "train_loss": 2.967158079147339, "lr": 5.206803038739453e-05, "tps": 171979, "wall": 10311.0} {"step": 27058, "train_loss": 3.090933322906494, "lr": 5.206113461177713e-05, "tps": 171902, "wall": 10315.9} {"step": 27059, "train_loss": 3.186152458190918, "lr": 5.205424073858031e-05, "tps": 171826, "wall": 10320.9} {"step": 27060, "train_loss": 3.0662333965301514, "lr": 5.204734876788217e-05, "tps": 171749, "wall": 10325.9} {"step": 27061, "train_loss": 3.1944828033447266, "lr": 5.204045869976067e-05, "tps": 171673, "wall": 10330.9} {"step": 27062, "train_loss": 3.0080606937408447, "lr": 5.2033570534294005e-05, "tps": 171597, "wall": 10335.8} {"step": 27063, "train_loss": 3.116776943206787, "lr": 5.202668427156011e-05, "tps": 171521, "wall": 10340.8} {"step": 27064, "train_loss": 3.1159183979034424, "lr": 5.2019799911637035e-05, "tps": 171446, "wall": 10345.7} {"step": 27065, "train_loss": 3.0119893550872803, "lr": 5.201291745460275e-05, "tps": 171369, "wall": 10350.7} {"step": 27066, "train_loss": 3.1727166175842285, "lr": 5.20060369005352e-05, "tps": 171294, "wall": 10355.6} {"step": 27067, "train_loss": 3.1194303035736084, "lr": 5.199915824951239e-05, "tps": 171219, "wall": 10360.6} {"step": 27068, "train_loss": 3.1533203125, "lr": 5.1992281501612195e-05, "tps": 171143, "wall": 10365.5} {"step": 27069, "train_loss": 3.0396103858947754, "lr": 5.198540665691248e-05, "tps": 171067, "wall": 10370.5} {"step": 27070, "train_loss": 3.166437864303589, "lr": 5.197853371549122e-05, "tps": 170985, "wall": 10375.9} {"step": 27071, "train_loss": 3.156937599182129, "lr": 5.1971662677426226e-05, "tps": 170909, "wall": 10380.9} {"step": 27072, "train_loss": 3.086514711380005, "lr": 5.1964793542795276e-05, "tps": 170828, "wall": 10386.2} {"step": 27073, "train_loss": 3.1040663719177246, "lr": 5.195792631167629e-05, "tps": 170750, "wall": 10391.3} {"step": 27074, "train_loss": 3.142709493637085, "lr": 5.195106098414697e-05, "tps": 170675, "wall": 10396.2} {"step": 27075, "train_loss": 3.0549492835998535, "lr": 5.1944197560285123e-05, "tps": 170600, "wall": 10401.2} {"step": 27076, "train_loss": 3.08798885345459, "lr": 5.193733604016852e-05, "tps": 170522, "wall": 10406.4} {"step": 27077, "train_loss": 3.0544676780700684, "lr": 5.193047642387485e-05, "tps": 170438, "wall": 10411.9} {"step": 27078, "train_loss": 3.252178192138672, "lr": 5.1923618711481826e-05, "tps": 170365, "wall": 10416.7} {"step": 27079, "train_loss": 3.0666561126708984, "lr": 5.191676290306717e-05, "tps": 170290, "wall": 10421.7} {"step": 27080, "train_loss": 3.050617218017578, "lr": 5.1909908998708465e-05, "tps": 170215, "wall": 10426.7} {"step": 27081, "train_loss": 3.109071731567383, "lr": 5.1903056998483455e-05, "tps": 170138, "wall": 10431.7} {"step": 27082, "train_loss": 3.037968635559082, "lr": 5.189620690246971e-05, "tps": 170061, "wall": 10436.9} {"step": 27083, "train_loss": 3.0123772621154785, "lr": 5.188935871074481e-05, "tps": 169982, "wall": 10442.1} {"step": 27084, "train_loss": 3.143731117248535, "lr": 5.188251242338635e-05, "tps": 169899, "wall": 10447.6} {"step": 27085, "train_loss": 3.0824825763702393, "lr": 5.1875668040471906e-05, "tps": 169821, "wall": 10452.8} {"step": 27086, "train_loss": 3.087207317352295, "lr": 5.1868825562078937e-05, "tps": 169743, "wall": 10457.9} {"step": 27087, "train_loss": 2.97285795211792, "lr": 5.1861984988285065e-05, "tps": 169666, "wall": 10463.1} {"step": 27088, "train_loss": 3.1490087509155273, "lr": 5.185514631916769e-05, "tps": 169587, "wall": 10468.3} {"step": 27089, "train_loss": 3.1991987228393555, "lr": 5.184830955480432e-05, "tps": 169512, "wall": 10473.4} {"step": 27090, "train_loss": 3.071162223815918, "lr": 5.184147469527241e-05, "tps": 169439, "wall": 10478.3} {"step": 27091, "train_loss": 3.0760750770568848, "lr": 5.183464174064937e-05, "tps": 169360, "wall": 10483.6} {"step": 27092, "train_loss": 3.2144556045532227, "lr": 5.182781069101257e-05, "tps": 169280, "wall": 10488.9} {"step": 27093, "train_loss": 3.0805160999298096, "lr": 5.182098154643947e-05, "tps": 169207, "wall": 10493.8} {"step": 27094, "train_loss": 3.1172163486480713, "lr": 5.181415430700739e-05, "tps": 169132, "wall": 10498.8} {"step": 27095, "train_loss": 3.13657546043396, "lr": 5.180732897279362e-05, "tps": 169059, "wall": 10503.8} {"step": 27096, "train_loss": 3.147190809249878, "lr": 5.180050554387558e-05, "tps": 168985, "wall": 10508.8} {"step": 27097, "train_loss": 3.0848186016082764, "lr": 5.179368402033048e-05, "tps": 168910, "wall": 10513.8} {"step": 27098, "train_loss": 3.1174750328063965, "lr": 5.1786864402235644e-05, "tps": 168830, "wall": 10519.2} {"step": 27099, "train_loss": 3.0290637016296387, "lr": 5.1780046689668315e-05, "tps": 168755, "wall": 10524.3} {"step": 27100, "train_loss": 3.0968873500823975, "lr": 5.1773230882705695e-05, "tps": 168682, "wall": 10529.2} {"step": 27101, "train_loss": 3.090912103652954, "lr": 5.1766416981425034e-05, "tps": 168609, "wall": 10534.1} {"step": 27102, "train_loss": 3.1524930000305176, "lr": 5.17596049859035e-05, "tps": 168536, "wall": 10539.1} {"step": 27103, "train_loss": 3.1209018230438232, "lr": 5.175279489621825e-05, "tps": 168462, "wall": 10544.1} {"step": 27104, "train_loss": 3.0726613998413086, "lr": 5.1745986712446456e-05, "tps": 168389, "wall": 10549.1} {"step": 27105, "train_loss": 3.126791000366211, "lr": 5.1739180434665236e-05, "tps": 168316, "wall": 10554.0} {"step": 27106, "train_loss": 3.0798566341400146, "lr": 5.173237606295165e-05, "tps": 168243, "wall": 10559.0} {"step": 27107, "train_loss": 2.9821081161499023, "lr": 5.1725573597382825e-05, "tps": 168169, "wall": 10564.0} {"step": 27108, "train_loss": 3.0028345584869385, "lr": 5.171877303803584e-05, "tps": 168093, "wall": 10569.2} {"step": 27109, "train_loss": 3.1119959354400635, "lr": 5.171197438498764e-05, "tps": 168016, "wall": 10574.4} {"step": 27110, "train_loss": 3.1382462978363037, "lr": 5.1705177638315326e-05, "tps": 167939, "wall": 10579.7} {"step": 27111, "train_loss": 3.0409975051879883, "lr": 5.169838279809588e-05, "tps": 167859, "wall": 10585.1} {"step": 27112, "train_loss": 3.087428569793701, "lr": 5.169158986440623e-05, "tps": 167780, "wall": 10590.5} {"step": 27113, "train_loss": 3.1303532123565674, "lr": 5.168479883732338e-05, "tps": 167703, "wall": 10595.7} {"step": 27114, "train_loss": 3.062274217605591, "lr": 5.1678009716924235e-05, "tps": 167630, "wall": 10600.7} {"step": 27115, "train_loss": 3.168778419494629, "lr": 5.167122250328567e-05, "tps": 167556, "wall": 10605.8} {"step": 27116, "train_loss": 3.0129528045654297, "lr": 5.166443719648464e-05, "tps": 167484, "wall": 10610.8} {"step": 27117, "train_loss": 3.086493492126465, "lr": 5.165765379659794e-05, "tps": 167411, "wall": 10615.8} {"step": 27118, "train_loss": 3.2325439453125, "lr": 5.165087230370246e-05, "tps": 167338, "wall": 10620.8} {"step": 27119, "train_loss": 3.0205607414245605, "lr": 5.1644092717875006e-05, "tps": 167264, "wall": 10625.9} {"step": 27120, "train_loss": 3.1634678840637207, "lr": 5.163731503919238e-05, "tps": 167191, "wall": 10630.9} {"step": 27121, "train_loss": 3.1025309562683105, "lr": 5.1630539267731346e-05, "tps": 167120, "wall": 10635.8} {"step": 27122, "train_loss": 2.985858678817749, "lr": 5.162376540356869e-05, "tps": 167048, "wall": 10640.8} {"step": 27123, "train_loss": 3.088772773742676, "lr": 5.1616993446781106e-05, "tps": 166976, "wall": 10645.8} {"step": 27124, "train_loss": 3.082838296890259, "lr": 5.161022339744537e-05, "tps": 166904, "wall": 10650.8} {"step": 27125, "train_loss": 3.0917584896087646, "lr": 5.160345525563811e-05, "tps": 166829, "wall": 10656.0} {"step": 27126, "train_loss": 3.0843098163604736, "lr": 5.1596689021435995e-05, "tps": 166751, "wall": 10661.3} {"step": 27127, "train_loss": 3.090991973876953, "lr": 5.158992469491573e-05, "tps": 166679, "wall": 10666.3} {"step": 27128, "train_loss": 3.1020565032958984, "lr": 5.1583162276153904e-05, "tps": 166608, "wall": 10671.3} {"step": 27129, "train_loss": 3.0543060302734375, "lr": 5.157640176522709e-05, "tps": 166530, "wall": 10676.7} {"step": 27130, "train_loss": 3.1286427974700928, "lr": 5.1569643162211945e-05, "tps": 166454, "wall": 10681.9} {"step": 27131, "train_loss": 3.164106845855713, "lr": 5.156288646718501e-05, "tps": 166379, "wall": 10687.2} {"step": 27132, "train_loss": 3.1014204025268555, "lr": 5.1556131680222755e-05, "tps": 166303, "wall": 10692.4} {"step": 27133, "train_loss": 3.0027475357055664, "lr": 5.154937880140182e-05, "tps": 166227, "wall": 10697.7} {"step": 27134, "train_loss": 3.046377182006836, "lr": 5.1542627830798576e-05, "tps": 166151, "wall": 10703.0} {"step": 27135, "train_loss": 3.1344387531280518, "lr": 5.153587876848956e-05, "tps": 166079, "wall": 10708.0} {"step": 27136, "train_loss": 3.11020565032959, "lr": 5.1529131614551276e-05, "tps": 166006, "wall": 10713.2} {"step": 27137, "train_loss": 3.20650577545166, "lr": 5.152238636906005e-05, "tps": 165929, "wall": 10718.5} {"step": 27138, "train_loss": 3.181199550628662, "lr": 5.1515643032092374e-05, "tps": 165856, "wall": 10723.6} {"step": 27139, "train_loss": 3.1040737628936768, "lr": 5.150890160372461e-05, "tps": 165785, "wall": 10728.6} {"step": 27140, "train_loss": 3.042128086090088, "lr": 5.150216208403309e-05, "tps": 165716, "wall": 10733.5} {"step": 27141, "train_loss": 3.0489635467529297, "lr": 5.149542447309425e-05, "tps": 165645, "wall": 10738.4} {"step": 27142, "train_loss": 3.1077330112457275, "lr": 5.148868877098433e-05, "tps": 165575, "wall": 10743.4} {"step": 27143, "train_loss": 3.036825180053711, "lr": 5.148195497777963e-05, "tps": 165502, "wall": 10748.6} {"step": 27144, "train_loss": 3.132643222808838, "lr": 5.147522309355651e-05, "tps": 165431, "wall": 10753.5} {"step": 27145, "train_loss": 3.0725772380828857, "lr": 5.146849311839116e-05, "tps": 165361, "wall": 10758.5} {"step": 27146, "train_loss": 3.130110740661621, "lr": 5.146176505235981e-05, "tps": 165291, "wall": 10763.4} {"step": 27147, "train_loss": 3.260617733001709, "lr": 5.145503889553874e-05, "tps": 165222, "wall": 10768.3} {"step": 27148, "train_loss": 3.1451504230499268, "lr": 5.144831464800409e-05, "tps": 165153, "wall": 10773.2} {"step": 27149, "train_loss": 3.061971426010132, "lr": 5.1441592309832045e-05, "tps": 165084, "wall": 10778.1} {"step": 27150, "train_loss": 3.07149600982666, "lr": 5.143487188109879e-05, "tps": 165015, "wall": 10783.1} {"step": 27151, "train_loss": 3.011888027191162, "lr": 5.142815336188038e-05, "tps": 164945, "wall": 10788.0} {"step": 27152, "train_loss": 3.16928768157959, "lr": 5.1421436752253003e-05, "tps": 164876, "wall": 10792.9} {"step": 27153, "train_loss": 3.1137521266937256, "lr": 5.141472205229272e-05, "tps": 164806, "wall": 10797.9} {"step": 27154, "train_loss": 3.1657350063323975, "lr": 5.140800926207555e-05, "tps": 164735, "wall": 10803.0} {"step": 27155, "train_loss": 3.0684123039245605, "lr": 5.14012983816776e-05, "tps": 164664, "wall": 10808.0} {"step": 27156, "train_loss": 3.125703811645508, "lr": 5.139458941117485e-05, "tps": 164594, "wall": 10813.0} {"step": 27157, "train_loss": 3.1118650436401367, "lr": 5.1387882350643316e-05, "tps": 164517, "wall": 10818.4} {"step": 27158, "train_loss": 3.011110305786133, "lr": 5.138117720015897e-05, "tps": 164443, "wall": 10823.7} {"step": 27159, "train_loss": 3.143012523651123, "lr": 5.1374473959797787e-05, "tps": 164372, "wall": 10828.8} {"step": 27160, "train_loss": 3.0743231773376465, "lr": 5.136777262963565e-05, "tps": 164301, "wall": 10833.9} {"step": 27161, "train_loss": 3.175333023071289, "lr": 5.136107320974853e-05, "tps": 164230, "wall": 10839.0} {"step": 27162, "train_loss": 3.100092887878418, "lr": 5.135437570021231e-05, "tps": 164162, "wall": 10843.9} {"step": 27163, "train_loss": 3.090515375137329, "lr": 5.134768010110281e-05, "tps": 164093, "wall": 10848.8} {"step": 27164, "train_loss": 3.102593421936035, "lr": 5.134098641249594e-05, "tps": 164025, "wall": 10853.7} {"step": 27165, "train_loss": 3.0915560722351074, "lr": 5.133429463446752e-05, "tps": 163957, "wall": 10858.6} {"step": 27166, "train_loss": 3.1125364303588867, "lr": 5.1327604767093275e-05, "tps": 163888, "wall": 10863.6} {"step": 27167, "train_loss": 3.036628484725952, "lr": 5.13209168104491e-05, "tps": 163818, "wall": 10868.6} {"step": 27168, "train_loss": 3.0753285884857178, "lr": 5.1314230764610685e-05, "tps": 163745, "wall": 10873.9} {"step": 27169, "train_loss": 3.043421983718872, "lr": 5.130754662965378e-05, "tps": 163670, "wall": 10879.3} {"step": 27170, "train_loss": 3.001180648803711, "lr": 5.1300864405654124e-05, "tps": 163600, "wall": 10884.3} {"step": 27171, "train_loss": 3.1478354930877686, "lr": 5.1294184092687404e-05, "tps": 163531, "wall": 10889.3} {"step": 27172, "train_loss": 3.1069753170013428, "lr": 5.12875056908293e-05, "tps": 163462, "wall": 10894.3} {"step": 27173, "train_loss": 3.025425434112549, "lr": 5.1280829200155456e-05, "tps": 163394, "wall": 10899.2} {"step": 27174, "train_loss": 3.154367208480835, "lr": 5.127415462074149e-05, "tps": 163327, "wall": 10904.1} {"step": 27175, "train_loss": 3.0172417163848877, "lr": 5.126748195266303e-05, "tps": 163259, "wall": 10909.1} {"step": 27176, "train_loss": 3.1248669624328613, "lr": 5.1260811195995684e-05, "tps": 163191, "wall": 10914.0} {"step": 27177, "train_loss": 3.133453607559204, "lr": 5.125414235081498e-05, "tps": 163122, "wall": 10919.0} {"step": 27178, "train_loss": 3.0757994651794434, "lr": 5.12474754171965e-05, "tps": 163053, "wall": 10924.0} {"step": 27179, "train_loss": 3.140467643737793, "lr": 5.1240810395215734e-05, "tps": 162985, "wall": 10929.0} {"step": 27180, "train_loss": 3.085118293762207, "lr": 5.123414728494818e-05, "tps": 162918, "wall": 10933.9} {"step": 27181, "train_loss": 3.011308193206787, "lr": 5.1227486086469364e-05, "tps": 162850, "wall": 10938.9} {"step": 27182, "train_loss": 3.0738844871520996, "lr": 5.12208267998547e-05, "tps": 162782, "wall": 10943.8} {"step": 27183, "train_loss": 3.022524833679199, "lr": 5.121416942517966e-05, "tps": 162714, "wall": 10948.8} {"step": 27184, "train_loss": 3.141772985458374, "lr": 5.1207513962519624e-05, "tps": 162646, "wall": 10953.8} {"step": 27185, "train_loss": 3.157972574234009, "lr": 5.1200860411950005e-05, "tps": 162578, "wall": 10958.8} {"step": 27186, "train_loss": 3.114757537841797, "lr": 5.119420877354617e-05, "tps": 162511, "wall": 10963.7} {"step": 27187, "train_loss": 2.998662233352661, "lr": 5.118755904738348e-05, "tps": 162443, "wall": 10968.7} {"step": 27188, "train_loss": 3.1077280044555664, "lr": 5.118091123353721e-05, "tps": 162376, "wall": 10973.7} {"step": 27189, "train_loss": 3.159209728240967, "lr": 5.117426533208275e-05, "tps": 162308, "wall": 10978.6} {"step": 27190, "train_loss": 3.1099181175231934, "lr": 5.116762134309535e-05, "tps": 162240, "wall": 10983.6} {"step": 27191, "train_loss": 3.0788238048553467, "lr": 5.1160979266650244e-05, "tps": 162172, "wall": 10988.6} {"step": 27192, "train_loss": 3.129446268081665, "lr": 5.115433910282274e-05, "tps": 162106, "wall": 10993.5} {"step": 27193, "train_loss": 3.1367225646972656, "lr": 5.1147700851687995e-05, "tps": 162038, "wall": 10998.5} {"step": 27194, "train_loss": 3.1254518032073975, "lr": 5.114106451332119e-05, "tps": 161971, "wall": 11003.5} {"step": 27195, "train_loss": 3.063060998916626, "lr": 5.11344300877976e-05, "tps": 161904, "wall": 11008.5} {"step": 27196, "train_loss": 3.0808918476104736, "lr": 5.1127797575192306e-05, "tps": 161837, "wall": 11013.4} {"step": 27197, "train_loss": 3.146695137023926, "lr": 5.1121166975580424e-05, "tps": 161770, "wall": 11018.4} {"step": 27198, "train_loss": 3.0362770557403564, "lr": 5.111453828903714e-05, "tps": 161703, "wall": 11023.3} {"step": 27199, "train_loss": 3.1705892086029053, "lr": 5.1107911515637496e-05, "tps": 161636, "wall": 11028.3} {"step": 27200, "train_loss": 3.02510929107666, "lr": 5.110128665545654e-05, "tps": 161569, "wall": 11033.3} {"step": 27201, "train_loss": 3.072323799133301, "lr": 5.109466370856937e-05, "tps": 161502, "wall": 11038.3} {"step": 27202, "train_loss": 3.15928053855896, "lr": 5.1088042675050996e-05, "tps": 161435, "wall": 11043.2} {"step": 27203, "train_loss": 3.113053560256958, "lr": 5.108142355497637e-05, "tps": 161368, "wall": 11048.2} {"step": 27204, "train_loss": 3.1042613983154297, "lr": 5.107480634842057e-05, "tps": 161302, "wall": 11053.2} {"step": 27205, "train_loss": 3.1083905696868896, "lr": 5.106819105545845e-05, "tps": 161236, "wall": 11058.1} {"step": 27206, "train_loss": 3.0901808738708496, "lr": 5.1061577676165026e-05, "tps": 161169, "wall": 11063.1} {"step": 27207, "train_loss": 3.0726943016052246, "lr": 5.1054966210615215e-05, "tps": 161102, "wall": 11068.1} {"step": 27208, "train_loss": 3.057312488555908, "lr": 5.104835665888382e-05, "tps": 161034, "wall": 11073.2} {"step": 27209, "train_loss": 3.0846657752990723, "lr": 5.104174902104584e-05, "tps": 160967, "wall": 11078.2} {"step": 27210, "train_loss": 3.073817729949951, "lr": 5.103514329717606e-05, "tps": 160899, "wall": 11083.3} {"step": 27211, "train_loss": 3.0643362998962402, "lr": 5.1028539487349305e-05, "tps": 160831, "wall": 11088.4} {"step": 27212, "train_loss": 3.114123582839966, "lr": 5.102193759164041e-05, "tps": 160763, "wall": 11093.5} {"step": 27213, "train_loss": 3.160693883895874, "lr": 5.1015337610124134e-05, "tps": 160695, "wall": 11098.6} {"step": 27214, "train_loss": 3.0236656665802, "lr": 5.100873954287524e-05, "tps": 160628, "wall": 11103.6} {"step": 27215, "train_loss": 3.0602030754089355, "lr": 5.1002143389968516e-05, "tps": 160560, "wall": 11108.8} {"step": 27216, "train_loss": 3.126629114151001, "lr": 5.099554915147866e-05, "tps": 160493, "wall": 11113.8} {"step": 27217, "train_loss": 3.0554704666137695, "lr": 5.098895682748034e-05, "tps": 160425, "wall": 11118.9} {"step": 27218, "train_loss": 3.100998878479004, "lr": 5.098236641804827e-05, "tps": 160358, "wall": 11124.0} {"step": 27219, "train_loss": 3.0327348709106445, "lr": 5.0975777923257094e-05, "tps": 160291, "wall": 11129.0} {"step": 27220, "train_loss": 3.0592150688171387, "lr": 5.0969191343181445e-05, "tps": 160225, "wall": 11134.0} {"step": 27221, "train_loss": 3.186194896697998, "lr": 5.0962606677895953e-05, "tps": 160159, "wall": 11139.0} {"step": 27222, "train_loss": 3.02372145652771, "lr": 5.095602392747519e-05, "tps": 160093, "wall": 11144.1} {"step": 27223, "train_loss": 2.9282875061035156, "lr": 5.094944309199373e-05, "tps": 160027, "wall": 11149.1} {"step": 27224, "train_loss": 3.0309805870056152, "lr": 5.094286417152614e-05, "tps": 159961, "wall": 11154.0} {"step": 27225, "train_loss": 3.090064764022827, "lr": 5.0936287166146915e-05, "tps": 159897, "wall": 11158.9} {"step": 27226, "train_loss": 3.151602268218994, "lr": 5.092971207593058e-05, "tps": 159832, "wall": 11163.8} {"step": 27227, "train_loss": 3.0271031856536865, "lr": 5.092313890095162e-05, "tps": 159767, "wall": 11168.8} {"step": 27228, "train_loss": 3.221184253692627, "lr": 5.091656764128449e-05, "tps": 159702, "wall": 11173.8} {"step": 27229, "train_loss": 3.0597691535949707, "lr": 5.090999829700363e-05, "tps": 159638, "wall": 11178.7} {"step": 27230, "train_loss": 3.0275840759277344, "lr": 5.090343086818344e-05, "tps": 159573, "wall": 11183.6} {"step": 27231, "train_loss": 3.0564727783203125, "lr": 5.0896865354898336e-05, "tps": 159509, "wall": 11188.5} {"step": 27232, "train_loss": 2.9565110206604004, "lr": 5.0890301757222714e-05, "tps": 159445, "wall": 11193.4} {"step": 27233, "train_loss": 2.965916633605957, "lr": 5.0883740075230856e-05, "tps": 159381, "wall": 11198.4} {"step": 27234, "train_loss": 3.1589179039001465, "lr": 5.08771803089972e-05, "tps": 159316, "wall": 11203.3} {"step": 27235, "train_loss": 3.13905930519104, "lr": 5.0870622458595964e-05, "tps": 159252, "wall": 11208.2} {"step": 27236, "train_loss": 3.052485942840576, "lr": 5.086406652410144e-05, "tps": 159188, "wall": 11213.2} {"step": 27237, "train_loss": 3.150541305541992, "lr": 5.0857512505587954e-05, "tps": 159124, "wall": 11218.1} {"step": 27238, "train_loss": 3.1409599781036377, "lr": 5.085096040312972e-05, "tps": 159060, "wall": 11223.0} {"step": 27239, "train_loss": 3.1696009635925293, "lr": 5.0844410216800934e-05, "tps": 158995, "wall": 11228.0} {"step": 27240, "train_loss": 3.156109571456909, "lr": 5.083786194667583e-05, "tps": 158931, "wall": 11232.9} {"step": 27241, "train_loss": 3.093064308166504, "lr": 5.0831315592828585e-05, "tps": 158867, "wall": 11237.9} {"step": 27242, "train_loss": 3.1182477474212646, "lr": 5.0824771155333316e-05, "tps": 158803, "wall": 11242.8} {"step": 27243, "train_loss": 3.143925189971924, "lr": 5.081822863426423e-05, "tps": 158739, "wall": 11247.7} {"step": 27244, "train_loss": 3.114591598510742, "lr": 5.0811688029695404e-05, "tps": 158676, "wall": 11252.7} {"step": 27245, "train_loss": 3.0300612449645996, "lr": 5.080514934170091e-05, "tps": 158612, "wall": 11257.6} {"step": 27246, "train_loss": 3.0777430534362793, "lr": 5.0798612570354844e-05, "tps": 158549, "wall": 11262.5} {"step": 27247, "train_loss": 3.1512577533721924, "lr": 5.0792077715731255e-05, "tps": 158485, "wall": 11267.4} {"step": 27248, "train_loss": 3.085435628890991, "lr": 5.0785544777904146e-05, "tps": 158422, "wall": 11272.4} {"step": 27249, "train_loss": 3.1366381645202637, "lr": 5.0779013756947556e-05, "tps": 158358, "wall": 11277.3} {"step": 27250, "train_loss": 3.0631747245788574, "lr": 5.0772484652935434e-05, "tps": 158295, "wall": 11282.2} {"step": 27251, "train_loss": 3.117079019546509, "lr": 5.076595746594177e-05, "tps": 158231, "wall": 11287.2} {"step": 27252, "train_loss": 2.937730550765991, "lr": 5.0759432196040526e-05, "tps": 158167, "wall": 11292.2} {"step": 27253, "train_loss": 3.055426836013794, "lr": 5.0752908843305537e-05, "tps": 158104, "wall": 11297.1} {"step": 27254, "train_loss": 3.1686489582061768, "lr": 5.074638740781079e-05, "tps": 158041, "wall": 11302.0} {"step": 27255, "train_loss": 3.1652140617370605, "lr": 5.073986788963012e-05, "tps": 157978, "wall": 11306.9} {"step": 27256, "train_loss": 3.138472080230713, "lr": 5.0733350288837355e-05, "tps": 157914, "wall": 11311.9} {"step": 27257, "train_loss": 2.997141122817993, "lr": 5.072683460550639e-05, "tps": 157851, "wall": 11316.8} {"step": 27258, "train_loss": 3.151703119277954, "lr": 5.072032083971099e-05, "tps": 157788, "wall": 11321.7} {"step": 27259, "train_loss": 3.119391918182373, "lr": 5.0713808991524934e-05, "tps": 157725, "wall": 11326.7} {"step": 27260, "train_loss": 2.96419358253479, "lr": 5.070729906102203e-05, "tps": 157662, "wall": 11331.6} {"step": 27261, "train_loss": 3.0551257133483887, "lr": 5.0700791048275995e-05, "tps": 157600, "wall": 11336.5} {"step": 27262, "train_loss": 3.114259719848633, "lr": 5.069428495336055e-05, "tps": 157537, "wall": 11341.5} {"step": 27263, "train_loss": 3.0960800647735596, "lr": 5.068778077634943e-05, "tps": 157473, "wall": 11346.5} {"step": 27264, "train_loss": 3.2159371376037598, "lr": 5.0681278517316264e-05, "tps": 157411, "wall": 11351.4} {"step": 27265, "train_loss": 3.1017072200775146, "lr": 5.0674778176334714e-05, "tps": 157348, "wall": 11356.3} {"step": 27266, "train_loss": 3.0394344329833984, "lr": 5.066827975347849e-05, "tps": 157286, "wall": 11361.3} {"step": 27267, "train_loss": 3.1087918281555176, "lr": 5.06617832488211e-05, "tps": 157224, "wall": 11366.2} {"step": 27268, "train_loss": 3.139954090118408, "lr": 5.065528866243624e-05, "tps": 157161, "wall": 11371.1} {"step": 27269, "train_loss": 3.090970993041992, "lr": 5.064879599439741e-05, "tps": 157099, "wall": 11376.0} {"step": 27270, "train_loss": 3.1801114082336426, "lr": 5.064230524477818e-05, "tps": 157036, "wall": 11381.0} {"step": 27271, "train_loss": 3.147475481033325, "lr": 5.063581641365207e-05, "tps": 156973, "wall": 11385.9} {"step": 27272, "train_loss": 3.0190582275390625, "lr": 5.062932950109263e-05, "tps": 156912, "wall": 11390.9} {"step": 27273, "train_loss": 3.1168713569641113, "lr": 5.062284450717324e-05, "tps": 156849, "wall": 11395.8} {"step": 27274, "train_loss": 3.1186976432800293, "lr": 5.061636143196748e-05, "tps": 156787, "wall": 11400.8} {"step": 27275, "train_loss": 3.0207877159118652, "lr": 5.060988027554876e-05, "tps": 156724, "wall": 11405.8} {"step": 27276, "train_loss": 3.0225207805633545, "lr": 5.060340103799042e-05, "tps": 156662, "wall": 11410.7} {"step": 27277, "train_loss": 3.118317127227783, "lr": 5.059692371936597e-05, "tps": 156600, "wall": 11415.6} {"step": 27278, "train_loss": 3.025468587875366, "lr": 5.059044831974872e-05, "tps": 156539, "wall": 11420.5} {"step": 27279, "train_loss": 3.16375994682312, "lr": 5.0583974839212e-05, "tps": 156477, "wall": 11425.4} {"step": 27280, "train_loss": 3.0895185470581055, "lr": 5.057750327782922e-05, "tps": 156416, "wall": 11430.3} {"step": 27281, "train_loss": 3.028186082839966, "lr": 5.057103363567366e-05, "tps": 156354, "wall": 11435.3} {"step": 27282, "train_loss": 3.094428539276123, "lr": 5.056456591281855e-05, "tps": 156293, "wall": 11440.2} {"step": 27283, "train_loss": 3.084895610809326, "lr": 5.055810010933723e-05, "tps": 156231, "wall": 11445.1} {"step": 27284, "train_loss": 3.042553186416626, "lr": 5.05516362253029e-05, "tps": 156170, "wall": 11450.0} {"step": 27285, "train_loss": 3.1601548194885254, "lr": 5.054517426078882e-05, "tps": 156109, "wall": 11454.9} {"step": 27286, "train_loss": 3.115809917449951, "lr": 5.0538714215868186e-05, "tps": 156047, "wall": 11459.8} {"step": 27287, "train_loss": 3.0484204292297363, "lr": 5.0532256090614125e-05, "tps": 155985, "wall": 11464.8} {"step": 27288, "train_loss": 3.1464219093322754, "lr": 5.052579988509987e-05, "tps": 155924, "wall": 11469.7} {"step": 27289, "train_loss": 3.0214743614196777, "lr": 5.0519345599398514e-05, "tps": 155863, "wall": 11474.6} {"step": 27290, "train_loss": 2.9846503734588623, "lr": 5.051289323358317e-05, "tps": 155802, "wall": 11479.5} {"step": 27291, "train_loss": 3.0277633666992188, "lr": 5.050644278772695e-05, "tps": 155741, "wall": 11484.4} {"step": 27292, "train_loss": 3.1369848251342773, "lr": 5.049999426190293e-05, "tps": 155681, "wall": 11489.3} {"step": 27293, "train_loss": 3.062032461166382, "lr": 5.04935476561841e-05, "tps": 155620, "wall": 11494.3} {"step": 27294, "train_loss": 3.1004509925842285, "lr": 5.0487102970643574e-05, "tps": 155559, "wall": 11499.2} {"step": 27295, "train_loss": 3.1244306564331055, "lr": 5.0480660205354325e-05, "tps": 155498, "wall": 11504.1} {"step": 27296, "train_loss": 3.0889649391174316, "lr": 5.0474219360389274e-05, "tps": 155437, "wall": 11509.0} {"step": 27297, "train_loss": 3.1274898052215576, "lr": 5.0467780435821474e-05, "tps": 155377, "wall": 11513.9} {"step": 27298, "train_loss": 3.122027635574341, "lr": 5.046134343172383e-05, "tps": 155316, "wall": 11518.8} {"step": 27299, "train_loss": 3.14145565032959, "lr": 5.045490834816925e-05, "tps": 155256, "wall": 11523.7} {"step": 27300, "train_loss": 3.118293523788452, "lr": 5.044847518523065e-05, "tps": 155194, "wall": 11528.7} {"step": 27301, "train_loss": 3.0677614212036133, "lr": 5.0442043942980896e-05, "tps": 155134, "wall": 11533.6} {"step": 27302, "train_loss": 3.0043153762817383, "lr": 5.043561462149282e-05, "tps": 155074, "wall": 11538.5} {"step": 27303, "train_loss": 3.081939935684204, "lr": 5.042918722083929e-05, "tps": 155013, "wall": 11543.4} {"step": 27304, "train_loss": 3.032339096069336, "lr": 5.042276174109308e-05, "tps": 154953, "wall": 11548.4} {"step": 27305, "train_loss": 3.1389689445495605, "lr": 5.041633818232704e-05, "tps": 154893, "wall": 11553.3} {"step": 27306, "train_loss": 3.101861000061035, "lr": 5.040991654461388e-05, "tps": 154833, "wall": 11558.2} {"step": 27307, "train_loss": 3.095776319503784, "lr": 5.040349682802633e-05, "tps": 154773, "wall": 11563.1} {"step": 27308, "train_loss": 3.0722010135650635, "lr": 5.0397079032637184e-05, "tps": 154712, "wall": 11568.1} {"step": 27309, "train_loss": 3.18886137008667, "lr": 5.039066315851908e-05, "tps": 154652, "wall": 11573.0} {"step": 27310, "train_loss": 3.0386245250701904, "lr": 5.038424920574471e-05, "tps": 154592, "wall": 11577.9} {"step": 27311, "train_loss": 3.0747995376586914, "lr": 5.0377837174386776e-05, "tps": 154532, "wall": 11582.8} {"step": 27312, "train_loss": 3.0664427280426025, "lr": 5.0371427064517874e-05, "tps": 154471, "wall": 11587.8} {"step": 27313, "train_loss": 3.0995242595672607, "lr": 5.036501887621058e-05, "tps": 154411, "wall": 11592.7} {"step": 27314, "train_loss": 3.094710350036621, "lr": 5.035861260953757e-05, "tps": 154351, "wall": 11597.6} {"step": 27315, "train_loss": 3.1147396564483643, "lr": 5.035220826457137e-05, "tps": 154291, "wall": 11602.6} {"step": 27316, "train_loss": 3.164473056793213, "lr": 5.03458058413845e-05, "tps": 154232, "wall": 11607.5} {"step": 27317, "train_loss": 3.0708956718444824, "lr": 5.0339405340049564e-05, "tps": 154172, "wall": 11612.4} {"step": 27318, "train_loss": 3.165010452270508, "lr": 5.0333006760639e-05, "tps": 154112, "wall": 11617.3} {"step": 27319, "train_loss": 3.1301052570343018, "lr": 5.0326610103225304e-05, "tps": 154053, "wall": 11622.2} {"step": 27320, "train_loss": 3.015477180480957, "lr": 5.032021536788095e-05, "tps": 153993, "wall": 11627.2} {"step": 27321, "train_loss": 3.060563325881958, "lr": 5.0313822554678366e-05, "tps": 153933, "wall": 11632.1} {"step": 27322, "train_loss": 3.1482043266296387, "lr": 5.030743166369002e-05, "tps": 153874, "wall": 11637.0} {"step": 27323, "train_loss": 3.070568799972534, "lr": 5.030104269498826e-05, "tps": 153814, "wall": 11642.0} {"step": 27324, "train_loss": 3.0956931114196777, "lr": 5.0294655648645425e-05, "tps": 153754, "wall": 11647.0} {"step": 27325, "train_loss": 3.0944294929504395, "lr": 5.028827052473397e-05, "tps": 153695, "wall": 11651.9} {"step": 27326, "train_loss": 3.1361708641052246, "lr": 5.028188732332615e-05, "tps": 153635, "wall": 11656.8} {"step": 27327, "train_loss": 3.0411059856414795, "lr": 5.027550604449426e-05, "tps": 153576, "wall": 11661.7} {"step": 27328, "train_loss": 3.0996248722076416, "lr": 5.0269126688310656e-05, "tps": 153517, "wall": 11666.7} {"step": 27329, "train_loss": 3.1727683544158936, "lr": 5.026274925484755e-05, "tps": 153457, "wall": 11671.6} {"step": 27330, "train_loss": 3.0872881412506104, "lr": 5.0256373744177196e-05, "tps": 153398, "wall": 11676.5} {"step": 27331, "train_loss": 3.0417330265045166, "lr": 5.0250000156371845e-05, "tps": 153339, "wall": 11681.5} {"step": 27332, "train_loss": 3.103449821472168, "lr": 5.024362849150368e-05, "tps": 153280, "wall": 11686.4} {"step": 27333, "train_loss": 3.054882526397705, "lr": 5.023725874964483e-05, "tps": 153221, "wall": 11691.3} {"step": 27334, "train_loss": 3.046006202697754, "lr": 5.023089093086754e-05, "tps": 153162, "wall": 11696.3} {"step": 27335, "train_loss": 3.022700309753418, "lr": 5.02245250352439e-05, "tps": 153103, "wall": 11701.2} {"step": 27336, "train_loss": 3.0658230781555176, "lr": 5.0218161062846e-05, "tps": 153043, "wall": 11706.2} {"step": 27337, "train_loss": 3.1087262630462646, "lr": 5.021179901374597e-05, "tps": 152984, "wall": 11711.2} {"step": 27338, "train_loss": 3.095122814178467, "lr": 5.020543888801587e-05, "tps": 152925, "wall": 11716.1} {"step": 27339, "train_loss": 3.129390239715576, "lr": 5.019908068572773e-05, "tps": 152866, "wall": 11721.0} {"step": 27340, "train_loss": 3.1554551124572754, "lr": 5.019272440695361e-05, "tps": 152807, "wall": 11726.0} {"step": 27341, "train_loss": 3.016284942626953, "lr": 5.018637005176547e-05, "tps": 152749, "wall": 11730.9} {"step": 27342, "train_loss": 3.0539987087249756, "lr": 5.018001762023534e-05, "tps": 152690, "wall": 11735.9} {"step": 27343, "train_loss": 3.089155435562134, "lr": 5.0173667112435154e-05, "tps": 152631, "wall": 11740.8} {"step": 27344, "train_loss": 3.1346983909606934, "lr": 5.016731852843684e-05, "tps": 152572, "wall": 11745.7} {"step": 27345, "train_loss": 3.162975549697876, "lr": 5.016097186831234e-05, "tps": 152514, "wall": 11750.7} {"step": 27346, "train_loss": 3.120765447616577, "lr": 5.0154627132133545e-05, "tps": 152455, "wall": 11755.6} {"step": 27347, "train_loss": 3.0375938415527344, "lr": 5.0148284319972305e-05, "tps": 152397, "wall": 11760.6} {"step": 27348, "train_loss": 3.1404902935028076, "lr": 5.014194343190052e-05, "tps": 152337, "wall": 11765.6} {"step": 27349, "train_loss": 3.107975959777832, "lr": 5.013560446798996e-05, "tps": 152279, "wall": 11770.5} {"step": 27350, "train_loss": 3.077446937561035, "lr": 5.012926742831245e-05, "tps": 152221, "wall": 11775.4} {"step": 27351, "train_loss": 3.047640800476074, "lr": 5.012293231293982e-05, "tps": 152162, "wall": 11780.4} {"step": 27352, "train_loss": 3.118943214416504, "lr": 5.011659912194381e-05, "tps": 152104, "wall": 11785.4} {"step": 27353, "train_loss": 3.03621506690979, "lr": 5.011026785539611e-05, "tps": 152046, "wall": 11790.3} {"step": 27354, "train_loss": 3.112327814102173, "lr": 5.010393851336852e-05, "tps": 151988, "wall": 11795.2} {"step": 27355, "train_loss": 3.0908095836639404, "lr": 5.009761109593272e-05, "tps": 151930, "wall": 11800.2} {"step": 27356, "train_loss": 3.1123430728912354, "lr": 5.009128560316033e-05, "tps": 151872, "wall": 11805.1} {"step": 27357, "train_loss": 3.028308391571045, "lr": 5.0084962035123084e-05, "tps": 151813, "wall": 11810.1} {"step": 27358, "train_loss": 3.10028076171875, "lr": 5.007864039189255e-05, "tps": 151755, "wall": 11815.0} {"step": 27359, "train_loss": 2.9857301712036133, "lr": 5.0072320673540406e-05, "tps": 151698, "wall": 11820.0} {"step": 27360, "train_loss": 3.190673828125, "lr": 5.006600288013818e-05, "tps": 151639, "wall": 11825.0} {"step": 27361, "train_loss": 3.0045218467712402, "lr": 5.005968701175746e-05, "tps": 151581, "wall": 11829.9} {"step": 27362, "train_loss": 3.047288417816162, "lr": 5.005337306846983e-05, "tps": 151523, "wall": 11834.8} {"step": 27363, "train_loss": 3.0407493114471436, "lr": 5.0047061050346775e-05, "tps": 151465, "wall": 11839.8} {"step": 27364, "train_loss": 3.1325788497924805, "lr": 5.004075095745979e-05, "tps": 151408, "wall": 11844.7} {"step": 27365, "train_loss": 3.0585875511169434, "lr": 5.003444278988037e-05, "tps": 151351, "wall": 11849.7} {"step": 27366, "train_loss": 3.093249797821045, "lr": 5.002813654768001e-05, "tps": 151293, "wall": 11854.6} {"step": 27367, "train_loss": 3.1981544494628906, "lr": 5.002183223093008e-05, "tps": 151236, "wall": 11859.5} {"step": 27368, "train_loss": 3.0852248668670654, "lr": 5.0015529839702035e-05, "tps": 151178, "wall": 11864.5} {"step": 27369, "train_loss": 3.025879383087158, "lr": 5.000922937406729e-05, "tps": 151121, "wall": 11869.4} {"step": 27370, "train_loss": 3.019392728805542, "lr": 5.000293083409716e-05, "tps": 151064, "wall": 11874.3} {"step": 27371, "train_loss": 3.172971248626709, "lr": 4.999663421986305e-05, "tps": 151007, "wall": 11879.2} {"step": 27372, "train_loss": 3.155683994293213, "lr": 4.999033953143627e-05, "tps": 150948, "wall": 11884.3} {"step": 27373, "train_loss": 3.19978666305542, "lr": 4.998404676888809e-05, "tps": 150891, "wall": 11889.2} {"step": 27374, "train_loss": 3.0144903659820557, "lr": 4.997775593228984e-05, "tps": 150834, "wall": 11894.2} {"step": 27375, "train_loss": 3.1435742378234863, "lr": 4.997146702171276e-05, "tps": 150777, "wall": 11899.1} {"step": 27376, "train_loss": 3.009817123413086, "lr": 4.996518003722811e-05, "tps": 150720, "wall": 11904.0} {"step": 27377, "train_loss": 3.112964391708374, "lr": 4.995889497890712e-05, "tps": 150663, "wall": 11908.9} {"step": 27378, "train_loss": 3.1219732761383057, "lr": 4.995261184682092e-05, "tps": 150606, "wall": 11913.9} {"step": 27379, "train_loss": 3.031404972076416, "lr": 4.9946330641040764e-05, "tps": 150550, "wall": 11918.8} {"step": 27380, "train_loss": 3.1158316135406494, "lr": 4.994005136163778e-05, "tps": 150493, "wall": 11923.7} {"step": 27381, "train_loss": 3.17582368850708, "lr": 4.993377400868308e-05, "tps": 150436, "wall": 11928.7} {"step": 27382, "train_loss": 3.1728744506835938, "lr": 4.99274985822478e-05, "tps": 150379, "wall": 11933.6} {"step": 27383, "train_loss": 3.1290504932403564, "lr": 4.9921225082403005e-05, "tps": 150322, "wall": 11938.5} {"step": 27384, "train_loss": 3.1695547103881836, "lr": 4.9914953509219766e-05, "tps": 150266, "wall": 11943.5} {"step": 27385, "train_loss": 3.134852170944214, "lr": 4.990868386276916e-05, "tps": 150208, "wall": 11948.5} {"step": 27386, "train_loss": 3.167910575866699, "lr": 4.990241614312216e-05, "tps": 150152, "wall": 11953.4} {"step": 27387, "train_loss": 3.055201530456543, "lr": 4.9896150350349796e-05, "tps": 150095, "wall": 11958.4} {"step": 27388, "train_loss": 3.086880683898926, "lr": 4.9889886484523066e-05, "tps": 150038, "wall": 11963.3} {"step": 27389, "train_loss": 3.0954384803771973, "lr": 4.9883624545712886e-05, "tps": 149982, "wall": 11968.3} {"step": 27390, "train_loss": 3.1070871353149414, "lr": 4.9877364533990196e-05, "tps": 149925, "wall": 11973.2} {"step": 27391, "train_loss": 3.177682876586914, "lr": 4.987110644942596e-05, "tps": 149869, "wall": 11978.2} {"step": 27392, "train_loss": 3.2219629287719727, "lr": 4.986485029209099e-05, "tps": 149812, "wall": 11983.1} {"step": 27393, "train_loss": 3.0874810218811035, "lr": 4.985859606205623e-05, "tps": 149756, "wall": 11988.1} {"step": 27394, "train_loss": 2.9929652214050293, "lr": 4.985234375939251e-05, "tps": 149700, "wall": 11993.0} {"step": 27395, "train_loss": 3.187859535217285, "lr": 4.984609338417062e-05, "tps": 149643, "wall": 11998.0} {"step": 27396, "train_loss": 3.0283010005950928, "lr": 4.983984493646139e-05, "tps": 149587, "wall": 12003.0} {"step": 27397, "train_loss": 3.111530065536499, "lr": 4.983359841633566e-05, "tps": 149530, "wall": 12007.9} {"step": 27398, "train_loss": 3.066929578781128, "lr": 4.982735382386406e-05, "tps": 149474, "wall": 12012.9} {"step": 27399, "train_loss": 2.975933074951172, "lr": 4.982111115911743e-05, "tps": 149418, "wall": 12017.8} {"step": 27400, "train_loss": 3.026186943054199, "lr": 4.981487042216643e-05, "tps": 149362, "wall": 12022.8} {"step": 27401, "train_loss": 3.1854958534240723, "lr": 4.9808631613081825e-05, "tps": 149306, "wall": 12027.7} {"step": 27402, "train_loss": 3.1217029094696045, "lr": 4.980239473193425e-05, "tps": 149250, "wall": 12032.7} {"step": 27403, "train_loss": 3.120361089706421, "lr": 4.97961597787943e-05, "tps": 149194, "wall": 12037.6} {"step": 27404, "train_loss": 3.0498836040496826, "lr": 4.9789926753732716e-05, "tps": 149138, "wall": 12042.6} {"step": 27405, "train_loss": 3.2175381183624268, "lr": 4.978369565682003e-05, "tps": 149082, "wall": 12047.5} {"step": 27406, "train_loss": 3.0581085681915283, "lr": 4.9777466488126855e-05, "tps": 149027, "wall": 12052.5} {"step": 27407, "train_loss": 3.133498191833496, "lr": 4.977123924772374e-05, "tps": 148971, "wall": 12057.4} {"step": 27408, "train_loss": 3.1474993228912354, "lr": 4.976501393568126e-05, "tps": 148915, "wall": 12062.4} {"step": 27409, "train_loss": 3.1422648429870605, "lr": 4.9758790552069866e-05, "tps": 148859, "wall": 12067.4} {"step": 27410, "train_loss": 3.090862274169922, "lr": 4.9752569096960136e-05, "tps": 148803, "wall": 12072.4} {"step": 27411, "train_loss": 3.096273422241211, "lr": 4.974634957042251e-05, "tps": 148747, "wall": 12077.3} {"step": 27412, "train_loss": 2.977552890777588, "lr": 4.974013197252743e-05, "tps": 148692, "wall": 12082.3} {"step": 27413, "train_loss": 2.958425521850586, "lr": 4.973391630334536e-05, "tps": 148636, "wall": 12087.2} {"step": 27414, "train_loss": 3.0613341331481934, "lr": 4.9727702562946696e-05, "tps": 148581, "wall": 12092.2} {"step": 27415, "train_loss": 3.213012456893921, "lr": 4.972149075140182e-05, "tps": 148526, "wall": 12097.1} {"step": 27416, "train_loss": 3.140432357788086, "lr": 4.971528086878111e-05, "tps": 148470, "wall": 12102.0} {"step": 27417, "train_loss": 3.0792648792266846, "lr": 4.970907291515491e-05, "tps": 148415, "wall": 12107.0} {"step": 27418, "train_loss": 3.1144518852233887, "lr": 4.970286689059356e-05, "tps": 148360, "wall": 12112.0} {"step": 27419, "train_loss": 3.000439167022705, "lr": 4.969666279516735e-05, "tps": 148305, "wall": 12116.9} {"step": 27420, "train_loss": 3.030851364135742, "lr": 4.969046062894652e-05, "tps": 148250, "wall": 12121.8} {"step": 27421, "train_loss": 3.082850217819214, "lr": 4.96842603920014e-05, "tps": 148194, "wall": 12126.9} {"step": 27422, "train_loss": 3.1783645153045654, "lr": 4.96780620844022e-05, "tps": 148139, "wall": 12131.8} {"step": 27423, "train_loss": 3.258035182952881, "lr": 4.9671865706219085e-05, "tps": 148084, "wall": 12136.7} {"step": 27424, "train_loss": 3.1458840370178223, "lr": 4.966567125752232e-05, "tps": 148029, "wall": 12141.7} {"step": 27425, "train_loss": 3.0884780883789062, "lr": 4.965947873838205e-05, "tps": 147974, "wall": 12146.6} {"step": 27426, "train_loss": 3.0835962295532227, "lr": 4.96532881488684e-05, "tps": 147919, "wall": 12151.6} {"step": 27427, "train_loss": 3.1640939712524414, "lr": 4.9647099489051526e-05, "tps": 147864, "wall": 12156.5} {"step": 27428, "train_loss": 3.1553659439086914, "lr": 4.964091275900155e-05, "tps": 147809, "wall": 12161.5} {"step": 27429, "train_loss": 3.0982930660247803, "lr": 4.963472795878848e-05, "tps": 147754, "wall": 12166.4} {"step": 27430, "train_loss": 3.0329344272613525, "lr": 4.962854508848246e-05, "tps": 147700, "wall": 12171.4} {"step": 27431, "train_loss": 3.1121838092803955, "lr": 4.962236414815352e-05, "tps": 147645, "wall": 12176.4} {"step": 27432, "train_loss": 3.084566116333008, "lr": 4.961618513787161e-05, "tps": 147590, "wall": 12181.3} {"step": 27433, "train_loss": 3.1404953002929688, "lr": 4.961000805770679e-05, "tps": 147534, "wall": 12186.4} {"step": 27434, "train_loss": 3.0683560371398926, "lr": 4.960383290772903e-05, "tps": 147480, "wall": 12191.3} {"step": 27435, "train_loss": 3.1565158367156982, "lr": 4.9597659688008247e-05, "tps": 147425, "wall": 12196.3} {"step": 27436, "train_loss": 2.945314884185791, "lr": 4.959148839861442e-05, "tps": 147371, "wall": 12201.3} {"step": 27437, "train_loss": 3.0841574668884277, "lr": 4.95853190396174e-05, "tps": 147316, "wall": 12206.2} {"step": 27438, "train_loss": 3.1519041061401367, "lr": 4.9579151611087116e-05, "tps": 147262, "wall": 12211.2} {"step": 27439, "train_loss": 3.122633934020996, "lr": 4.957298611309344e-05, "tps": 147207, "wall": 12216.1} {"step": 27440, "train_loss": 3.031343460083008, "lr": 4.956682254570617e-05, "tps": 147153, "wall": 12221.1} {"step": 27441, "train_loss": 3.1578915119171143, "lr": 4.9560660908995175e-05, "tps": 147099, "wall": 12226.0} {"step": 27442, "train_loss": 3.0600156784057617, "lr": 4.9554501203030244e-05, "tps": 147044, "wall": 12231.0} {"step": 27443, "train_loss": 3.093966484069824, "lr": 4.95483434278811e-05, "tps": 146990, "wall": 12235.9} {"step": 27444, "train_loss": 3.1797451972961426, "lr": 4.9542187583617585e-05, "tps": 146936, "wall": 12240.9} {"step": 27445, "train_loss": 3.0414505004882812, "lr": 4.953603367030939e-05, "tps": 146881, "wall": 12245.9} {"step": 27446, "train_loss": 3.1489782333374023, "lr": 4.952988168802619e-05, "tps": 146827, "wall": 12250.8} {"step": 27447, "train_loss": 3.1161346435546875, "lr": 4.952373163683776e-05, "tps": 146773, "wall": 12255.8} {"step": 27448, "train_loss": 3.1300220489501953, "lr": 4.951758351681369e-05, "tps": 146719, "wall": 12260.8} {"step": 27449, "train_loss": 3.1857993602752686, "lr": 4.9511437328023656e-05, "tps": 146665, "wall": 12265.7} {"step": 27450, "train_loss": 3.0052075386047363, "lr": 4.95052930705373e-05, "tps": 146612, "wall": 12270.7} {"step": 27451, "train_loss": 3.100879669189453, "lr": 4.949915074442421e-05, "tps": 146558, "wall": 12275.6} {"step": 27452, "train_loss": 3.0502660274505615, "lr": 4.949301034975394e-05, "tps": 146504, "wall": 12280.6} {"step": 27453, "train_loss": 3.085580587387085, "lr": 4.9486871886596084e-05, "tps": 146451, "wall": 12285.5} {"step": 27454, "train_loss": 3.1466288566589355, "lr": 4.9480735355020156e-05, "tps": 146397, "wall": 12290.5} {"step": 27455, "train_loss": 3.052032470703125, "lr": 4.9474600755095716e-05, "tps": 146343, "wall": 12295.4} {"step": 27456, "train_loss": 3.096210479736328, "lr": 4.9468468086892206e-05, "tps": 146289, "wall": 12300.4} {"step": 27457, "train_loss": 3.0718250274658203, "lr": 4.9462337350479096e-05, "tps": 146235, "wall": 12305.4} {"step": 27458, "train_loss": 3.1808042526245117, "lr": 4.945620854592589e-05, "tps": 146181, "wall": 12310.4} {"step": 27459, "train_loss": 3.213717460632324, "lr": 4.945008167330196e-05, "tps": 146128, "wall": 12315.3} {"step": 27460, "train_loss": 3.0199286937713623, "lr": 4.944395673267672e-05, "tps": 146075, "wall": 12320.3} {"step": 27461, "train_loss": 3.079704761505127, "lr": 4.9437833724119596e-05, "tps": 146021, "wall": 12325.2} {"step": 27462, "train_loss": 3.0560152530670166, "lr": 4.9431712647699914e-05, "tps": 145968, "wall": 12330.2} {"step": 27463, "train_loss": 3.014922857284546, "lr": 4.942559350348698e-05, "tps": 145915, "wall": 12335.1} {"step": 27464, "train_loss": 3.1448798179626465, "lr": 4.941947629155018e-05, "tps": 145861, "wall": 12340.1} {"step": 27465, "train_loss": 3.1702895164489746, "lr": 4.941336101195879e-05, "tps": 145808, "wall": 12345.1} {"step": 27466, "train_loss": 3.0995595455169678, "lr": 4.9407247664782044e-05, "tps": 145754, "wall": 12350.0} {"step": 27467, "train_loss": 3.0577552318573, "lr": 4.940113625008925e-05, "tps": 145701, "wall": 12355.0} {"step": 27468, "train_loss": 3.1121299266815186, "lr": 4.939502676794962e-05, "tps": 145648, "wall": 12360.0} {"step": 27469, "train_loss": 3.1476247310638428, "lr": 4.938891921843233e-05, "tps": 145594, "wall": 12365.0} {"step": 27470, "train_loss": 3.167214870452881, "lr": 4.938281360160663e-05, "tps": 145541, "wall": 12370.0} {"step": 27471, "train_loss": 3.1827821731567383, "lr": 4.937670991754159e-05, "tps": 145488, "wall": 12374.9} {"step": 27472, "train_loss": 3.1949191093444824, "lr": 4.9370608166306476e-05, "tps": 145435, "wall": 12379.9} {"step": 27473, "train_loss": 3.0869550704956055, "lr": 4.9364508347970317e-05, "tps": 145382, "wall": 12384.8} {"step": 27474, "train_loss": 3.1491997241973877, "lr": 4.9358410462602205e-05, "tps": 145329, "wall": 12389.7} {"step": 27475, "train_loss": 3.097651481628418, "lr": 4.9352314510271286e-05, "tps": 145277, "wall": 12394.7} {"step": 27476, "train_loss": 3.1104588508605957, "lr": 4.93462204910466e-05, "tps": 145224, "wall": 12399.6} {"step": 27477, "train_loss": 3.157538414001465, "lr": 4.934012840499712e-05, "tps": 145171, "wall": 12404.6} {"step": 27478, "train_loss": 3.1962826251983643, "lr": 4.933403825219191e-05, "tps": 145119, "wall": 12409.5} {"step": 27479, "train_loss": 3.118853807449341, "lr": 4.932795003269997e-05, "tps": 145066, "wall": 12414.5} {"step": 27480, "train_loss": 3.075934886932373, "lr": 4.9321863746590207e-05, "tps": 145013, "wall": 12419.5} {"step": 27481, "train_loss": 3.1524605751037598, "lr": 4.9315779393931634e-05, "tps": 144960, "wall": 12424.5} {"step": 27482, "train_loss": 3.084196090698242, "lr": 4.930969697479314e-05, "tps": 144908, "wall": 12429.4} {"step": 27483, "train_loss": 3.0636801719665527, "lr": 4.930361648924361e-05, "tps": 144855, "wall": 12434.4} {"step": 27484, "train_loss": 2.9628677368164062, "lr": 4.9297537937351984e-05, "tps": 144803, "wall": 12439.4} {"step": 27485, "train_loss": 3.11873197555542, "lr": 4.9291461319187074e-05, "tps": 144750, "wall": 12444.3} {"step": 27486, "train_loss": 3.135650157928467, "lr": 4.92853866348177e-05, "tps": 144698, "wall": 12449.2} {"step": 27487, "train_loss": 3.0815107822418213, "lr": 4.927931388431272e-05, "tps": 144646, "wall": 12454.2} {"step": 27488, "train_loss": 3.1401383876800537, "lr": 4.9273243067740917e-05, "tps": 144594, "wall": 12459.1} {"step": 27489, "train_loss": 2.990060329437256, "lr": 4.926717418517103e-05, "tps": 144541, "wall": 12464.1} {"step": 27490, "train_loss": 2.9574358463287354, "lr": 4.926110723667184e-05, "tps": 144489, "wall": 12469.1} {"step": 27491, "train_loss": 3.086348533630371, "lr": 4.9255042222312054e-05, "tps": 144437, "wall": 12474.0} {"step": 27492, "train_loss": 3.0630147457122803, "lr": 4.924897914216041e-05, "tps": 144385, "wall": 12479.0} {"step": 27493, "train_loss": 3.0939855575561523, "lr": 4.924291799628556e-05, "tps": 144332, "wall": 12484.0} {"step": 27494, "train_loss": 3.128577470779419, "lr": 4.9236858784756166e-05, "tps": 144280, "wall": 12489.0} {"step": 27495, "train_loss": 3.0603160858154297, "lr": 4.923080150764088e-05, "tps": 144228, "wall": 12493.9} {"step": 27496, "train_loss": 3.0461602210998535, "lr": 4.922474616500832e-05, "tps": 144176, "wall": 12498.9} {"step": 27497, "train_loss": 3.0116708278656006, "lr": 4.921869275692704e-05, "tps": 144124, "wall": 12503.8} {"step": 27498, "train_loss": 3.112231731414795, "lr": 4.921264128346569e-05, "tps": 144072, "wall": 12508.8} {"step": 27499, "train_loss": 3.1183183193206787, "lr": 4.920659174469277e-05, "tps": 144020, "wall": 12513.7} {"step": 27500, "train_loss": 3.1297426223754883, "lr": 4.92005441406768e-05, "tps": 143969, "wall": 12518.7} {"step": 27501, "train_loss": 3.041682243347168, "lr": 4.9194498471486314e-05, "tps": 143915, "wall": 12523.8} {"step": 27502, "train_loss": 3.1382815837860107, "lr": 4.918845473718981e-05, "tps": 143863, "wall": 12528.8} {"step": 27503, "train_loss": 3.1239173412323, "lr": 4.9182412937855694e-05, "tps": 143811, "wall": 12533.8} {"step": 27504, "train_loss": 3.1110031604766846, "lr": 4.917637307355248e-05, "tps": 143760, "wall": 12538.7} {"step": 27505, "train_loss": 3.09175968170166, "lr": 4.917033514434854e-05, "tps": 143708, "wall": 12543.7} {"step": 27506, "train_loss": 3.1569056510925293, "lr": 4.916429915031227e-05, "tps": 143656, "wall": 12548.7} {"step": 27507, "train_loss": 3.0643227100372314, "lr": 4.915826509151207e-05, "tps": 143605, "wall": 12553.6} {"step": 27508, "train_loss": 2.9944233894348145, "lr": 4.915223296801626e-05, "tps": 143554, "wall": 12558.5} {"step": 27509, "train_loss": 3.181187629699707, "lr": 4.9146202779893246e-05, "tps": 143502, "wall": 12563.5} {"step": 27510, "train_loss": 3.093550205230713, "lr": 4.9140174527211294e-05, "tps": 143451, "wall": 12568.4} {"step": 27511, "train_loss": 3.0149717330932617, "lr": 4.913414821003863e-05, "tps": 143400, "wall": 12573.4} {"step": 27512, "train_loss": 3.1274619102478027, "lr": 4.912812382844363e-05, "tps": 143349, "wall": 12578.3} {"step": 27513, "train_loss": 3.0337634086608887, "lr": 4.912210138249449e-05, "tps": 143298, "wall": 12583.3} {"step": 27514, "train_loss": 3.0001778602600098, "lr": 4.9116080872259385e-05, "tps": 143246, "wall": 12588.2} {"step": 27515, "train_loss": 3.1222362518310547, "lr": 4.9110062297806605e-05, "tps": 143195, "wall": 12593.2} {"step": 27516, "train_loss": 3.120288848876953, "lr": 4.910404565920427e-05, "tps": 143144, "wall": 12598.1} {"step": 27517, "train_loss": 3.0747807025909424, "lr": 4.9098030956520526e-05, "tps": 143093, "wall": 12603.1} {"step": 27518, "train_loss": 3.057858943939209, "lr": 4.9092018189823566e-05, "tps": 143041, "wall": 12608.1} {"step": 27519, "train_loss": 3.1388540267944336, "lr": 4.9086007359181465e-05, "tps": 142991, "wall": 12613.0} {"step": 27520, "train_loss": 3.0845015048980713, "lr": 4.9079998464662304e-05, "tps": 142940, "wall": 12618.0} {"step": 27521, "train_loss": 3.073570489883423, "lr": 4.9073991506334165e-05, "tps": 142889, "wall": 12622.9} {"step": 27522, "train_loss": 3.1183924674987793, "lr": 4.906798648426513e-05, "tps": 142838, "wall": 12627.9} {"step": 27523, "train_loss": 3.1228764057159424, "lr": 4.9061983398523146e-05, "tps": 142788, "wall": 12632.8} {"step": 27524, "train_loss": 3.1291370391845703, "lr": 4.905598224917629e-05, "tps": 142737, "wall": 12637.7} {"step": 27525, "train_loss": 3.1460676193237305, "lr": 4.90499830362925e-05, "tps": 142687, "wall": 12642.6} {"step": 27526, "train_loss": 3.096846580505371, "lr": 4.904398575993977e-05, "tps": 142636, "wall": 12647.6} {"step": 27527, "train_loss": 3.1042261123657227, "lr": 4.903799042018602e-05, "tps": 142586, "wall": 12652.5} {"step": 27528, "train_loss": 3.154261589050293, "lr": 4.9031997017099135e-05, "tps": 142536, "wall": 12657.4} {"step": 27529, "train_loss": 3.055778980255127, "lr": 4.9026005550747044e-05, "tps": 142485, "wall": 12662.4} {"step": 27530, "train_loss": 3.1637020111083984, "lr": 4.9020016021197635e-05, "tps": 142434, "wall": 12667.4} {"step": 27531, "train_loss": 3.116461992263794, "lr": 4.90140284285187e-05, "tps": 142384, "wall": 12672.3} {"step": 27532, "train_loss": 3.1038331985473633, "lr": 4.900804277277815e-05, "tps": 142333, "wall": 12677.3} {"step": 27533, "train_loss": 3.0019404888153076, "lr": 4.90020590540437e-05, "tps": 142283, "wall": 12682.2} {"step": 27534, "train_loss": 3.087982177734375, "lr": 4.899607727238318e-05, "tps": 142233, "wall": 12687.1} {"step": 27535, "train_loss": 3.060805320739746, "lr": 4.8990097427864364e-05, "tps": 142183, "wall": 12692.0} {"step": 27536, "train_loss": 3.0880777835845947, "lr": 4.898411952055498e-05, "tps": 142133, "wall": 12696.9} {"step": 27537, "train_loss": 3.155867576599121, "lr": 4.897814355052272e-05, "tps": 142084, "wall": 12701.8} {"step": 27538, "train_loss": 3.123326301574707, "lr": 4.897216951783532e-05, "tps": 142034, "wall": 12706.7} {"step": 27539, "train_loss": 3.0086870193481445, "lr": 4.896619742256043e-05, "tps": 141984, "wall": 12711.7} {"step": 27540, "train_loss": 3.101759672164917, "lr": 4.8960227264765694e-05, "tps": 141934, "wall": 12716.6} {"step": 27541, "train_loss": 2.969987154006958, "lr": 4.895425904451877e-05, "tps": 141885, "wall": 12721.5} {"step": 27542, "train_loss": 3.105598211288452, "lr": 4.894829276188726e-05, "tps": 141834, "wall": 12726.5} {"step": 27543, "train_loss": 3.1791346073150635, "lr": 4.894232841693872e-05, "tps": 141784, "wall": 12731.4} {"step": 27544, "train_loss": 3.1540298461914062, "lr": 4.893636600974077e-05, "tps": 141735, "wall": 12736.3} {"step": 27545, "train_loss": 3.2095608711242676, "lr": 4.893040554036088e-05, "tps": 141686, "wall": 12741.2} {"step": 27546, "train_loss": 3.0112807750701904, "lr": 4.892444700886666e-05, "tps": 141636, "wall": 12746.1} {"step": 27547, "train_loss": 3.1612462997436523, "lr": 4.8918490415325525e-05, "tps": 141587, "wall": 12751.0} {"step": 27548, "train_loss": 3.027904510498047, "lr": 4.891253575980498e-05, "tps": 141538, "wall": 12755.9} {"step": 27549, "train_loss": 3.191244602203369, "lr": 4.8906583042372515e-05, "tps": 141489, "wall": 12760.8} {"step": 27550, "train_loss": 3.107313632965088, "lr": 4.890063226309551e-05, "tps": 141440, "wall": 12765.7} {"step": 27551, "train_loss": 3.0426173210144043, "lr": 4.88946834220414e-05, "tps": 141391, "wall": 12770.6} {"step": 27552, "train_loss": 3.1578497886657715, "lr": 4.8888736519277584e-05, "tps": 141342, "wall": 12775.4} {"step": 27553, "train_loss": 3.0496201515197754, "lr": 4.8882791554871424e-05, "tps": 141293, "wall": 12780.3} {"step": 27554, "train_loss": 3.1598970890045166, "lr": 4.887684852889023e-05, "tps": 141243, "wall": 12785.3} {"step": 27555, "train_loss": 3.137280225753784, "lr": 4.8870907441401384e-05, "tps": 141195, "wall": 12790.2} {"step": 27556, "train_loss": 3.070108652114868, "lr": 4.886496829247216e-05, "tps": 141146, "wall": 12795.1} {"step": 27557, "train_loss": 3.067812919616699, "lr": 4.8859031082169805e-05, "tps": 141097, "wall": 12799.9} {"step": 27558, "train_loss": 3.0565788745880127, "lr": 4.8853095810561614e-05, "tps": 141049, "wall": 12804.8} {"step": 27559, "train_loss": 2.992910385131836, "lr": 4.884716247771483e-05, "tps": 141000, "wall": 12809.7} {"step": 27560, "train_loss": 3.071089744567871, "lr": 4.884123108369663e-05, "tps": 140952, "wall": 12814.5} {"step": 27561, "train_loss": 3.0923829078674316, "lr": 4.8835301628574225e-05, "tps": 140903, "wall": 12819.4} {"step": 27562, "train_loss": 3.188934803009033, "lr": 4.8829374112414776e-05, "tps": 140855, "wall": 12824.3} {"step": 27563, "train_loss": 3.0670738220214844, "lr": 4.882344853528544e-05, "tps": 140806, "wall": 12829.2} {"step": 27564, "train_loss": 3.1115612983703613, "lr": 4.881752489725337e-05, "tps": 140758, "wall": 12834.0} {"step": 27565, "train_loss": 3.1301894187927246, "lr": 4.881160319838559e-05, "tps": 140710, "wall": 12838.9} {"step": 27566, "train_loss": 3.1091442108154297, "lr": 4.880568343874929e-05, "tps": 140662, "wall": 12843.8} {"step": 27567, "train_loss": 3.114590883255005, "lr": 4.879976561841143e-05, "tps": 140613, "wall": 12848.7} {"step": 27568, "train_loss": 3.135486125946045, "lr": 4.879384973743911e-05, "tps": 140565, "wall": 12853.5} {"step": 27569, "train_loss": 3.1541635990142822, "lr": 4.8787935795899306e-05, "tps": 140517, "wall": 12858.4} {"step": 27570, "train_loss": 3.080984592437744, "lr": 4.878202379385901e-05, "tps": 140469, "wall": 12863.3} {"step": 27571, "train_loss": 3.132779121398926, "lr": 4.877611373138523e-05, "tps": 140421, "wall": 12868.1} {"step": 27572, "train_loss": 2.987633466720581, "lr": 4.8770205608544895e-05, "tps": 140373, "wall": 12873.0} {"step": 27573, "train_loss": 3.192920684814453, "lr": 4.876429942540491e-05, "tps": 140325, "wall": 12877.8} {"step": 27574, "train_loss": 3.1295385360717773, "lr": 4.875839518203225e-05, "tps": 140278, "wall": 12882.7} {"step": 27575, "train_loss": 3.054863691329956, "lr": 4.8752492878493746e-05, "tps": 140230, "wall": 12887.5} {"step": 27576, "train_loss": 3.0664710998535156, "lr": 4.874659251485623e-05, "tps": 140182, "wall": 12892.4} {"step": 27577, "train_loss": 3.0589652061462402, "lr": 4.874069409118661e-05, "tps": 140134, "wall": 12897.2} {"step": 27578, "train_loss": 3.093663215637207, "lr": 4.873479760755167e-05, "tps": 140087, "wall": 12902.1} {"step": 27579, "train_loss": 3.031341075897217, "lr": 4.8728903064018196e-05, "tps": 140038, "wall": 12907.0} {"step": 27580, "train_loss": 3.0622692108154297, "lr": 4.872301046065298e-05, "tps": 139991, "wall": 12911.8} {"step": 27581, "train_loss": 3.0939102172851562, "lr": 4.871711979752278e-05, "tps": 139944, "wall": 12916.7} {"step": 27582, "train_loss": 3.1678571701049805, "lr": 4.871123107469427e-05, "tps": 139896, "wall": 12921.5} {"step": 27583, "train_loss": 3.1780006885528564, "lr": 4.870534429223424e-05, "tps": 139849, "wall": 12926.4} {"step": 27584, "train_loss": 3.1414005756378174, "lr": 4.869945945020934e-05, "tps": 139802, "wall": 12931.2} {"step": 27585, "train_loss": 3.098196029663086, "lr": 4.869357654868622e-05, "tps": 139754, "wall": 12936.1} {"step": 27586, "train_loss": 3.090550422668457, "lr": 4.8687695587731535e-05, "tps": 139707, "wall": 12940.9} {"step": 27587, "train_loss": 2.9969353675842285, "lr": 4.868181656741187e-05, "tps": 139660, "wall": 12945.7} {"step": 27588, "train_loss": 3.108081340789795, "lr": 4.86759394877939e-05, "tps": 139613, "wall": 12950.6} {"step": 27589, "train_loss": 3.0811877250671387, "lr": 4.867006434894414e-05, "tps": 139566, "wall": 12955.4} {"step": 27590, "train_loss": 3.229343891143799, "lr": 4.866419115092913e-05, "tps": 139518, "wall": 12960.3} {"step": 27591, "train_loss": 3.111868381500244, "lr": 4.8658319893815485e-05, "tps": 139471, "wall": 12965.2} {"step": 27592, "train_loss": 3.0348076820373535, "lr": 4.8652450577669645e-05, "tps": 139424, "wall": 12970.0} {"step": 27593, "train_loss": 3.174022674560547, "lr": 4.864658320255808e-05, "tps": 139377, "wall": 12974.9} {"step": 27594, "train_loss": 3.0682530403137207, "lr": 4.8640717768547325e-05, "tps": 139330, "wall": 12979.7} {"step": 27595, "train_loss": 3.030790090560913, "lr": 4.863485427570379e-05, "tps": 139283, "wall": 12984.6} {"step": 27596, "train_loss": 3.0940256118774414, "lr": 4.8628992724093883e-05, "tps": 139236, "wall": 12989.4} {"step": 27597, "train_loss": 3.163116455078125, "lr": 4.862313311378404e-05, "tps": 139189, "wall": 12994.2} {"step": 27598, "train_loss": 3.1847786903381348, "lr": 4.86172754448406e-05, "tps": 139142, "wall": 12999.1} {"step": 27599, "train_loss": 3.12484073638916, "lr": 4.8611419717329915e-05, "tps": 139096, "wall": 13003.9} {"step": 27600, "train_loss": 3.1643264293670654, "lr": 4.860556593131837e-05, "tps": 139049, "wall": 13008.8} {"step": 27601, "train_loss": 3.115691661834717, "lr": 4.859971408687224e-05, "tps": 139002, "wall": 13013.6} {"step": 27602, "train_loss": 3.0847694873809814, "lr": 4.85938641840578e-05, "tps": 138955, "wall": 13018.4} {"step": 27603, "train_loss": 3.0379281044006348, "lr": 4.858801622294136e-05, "tps": 138909, "wall": 13023.3} {"step": 27604, "train_loss": 3.1793150901794434, "lr": 4.8582170203589134e-05, "tps": 138862, "wall": 13028.2} {"step": 27605, "train_loss": 3.134632110595703, "lr": 4.8576326126067365e-05, "tps": 138815, "wall": 13033.0} {"step": 27606, "train_loss": 3.138932704925537, "lr": 4.857048399044226e-05, "tps": 138769, "wall": 13037.8} {"step": 27607, "train_loss": 3.1096224784851074, "lr": 4.856464379677996e-05, "tps": 138722, "wall": 13042.7} {"step": 27608, "train_loss": 3.171252965927124, "lr": 4.8558805545146665e-05, "tps": 138676, "wall": 13047.5} {"step": 27609, "train_loss": 3.0354976654052734, "lr": 4.8552969235608505e-05, "tps": 138630, "wall": 13052.3} {"step": 27610, "train_loss": 3.059251308441162, "lr": 4.854713486823157e-05, "tps": 138583, "wall": 13057.2} {"step": 27611, "train_loss": 3.103712320327759, "lr": 4.854130244308196e-05, "tps": 138537, "wall": 13062.0} {"step": 27612, "train_loss": 3.0439653396606445, "lr": 4.8535471960225786e-05, "tps": 138491, "wall": 13066.9} {"step": 27613, "train_loss": 3.1326379776000977, "lr": 4.852964341972902e-05, "tps": 138444, "wall": 13071.7} {"step": 27614, "train_loss": 3.083667278289795, "lr": 4.852381682165776e-05, "tps": 138398, "wall": 13076.5} {"step": 27615, "train_loss": 3.1070709228515625, "lr": 4.8517992166077964e-05, "tps": 138352, "wall": 13081.4} {"step": 27616, "train_loss": 3.034092903137207, "lr": 4.8512169453055624e-05, "tps": 138305, "wall": 13086.3} {"step": 27617, "train_loss": 3.029771327972412, "lr": 4.850634868265672e-05, "tps": 138259, "wall": 13091.1} {"step": 27618, "train_loss": 3.1176552772521973, "lr": 4.8500529854947176e-05, "tps": 138213, "wall": 13095.9} {"step": 27619, "train_loss": 3.1555471420288086, "lr": 4.849471296999288e-05, "tps": 138168, "wall": 13100.7} {"step": 27620, "train_loss": 3.224165439605713, "lr": 4.848889802785979e-05, "tps": 138122, "wall": 13105.6} {"step": 27621, "train_loss": 3.056441307067871, "lr": 4.848308502861371e-05, "tps": 138076, "wall": 13110.4} {"step": 27622, "train_loss": 3.062182903289795, "lr": 4.8477273972320555e-05, "tps": 138030, "wall": 13115.2} {"step": 27623, "train_loss": 3.055529832839966, "lr": 4.8471464859046104e-05, "tps": 137984, "wall": 13120.1} {"step": 27624, "train_loss": 3.004150629043579, "lr": 4.846565768885616e-05, "tps": 137938, "wall": 13124.9} {"step": 27625, "train_loss": 3.1106367111206055, "lr": 4.845985246181656e-05, "tps": 137892, "wall": 13129.8} {"step": 27626, "train_loss": 3.0041165351867676, "lr": 4.845404917799301e-05, "tps": 137846, "wall": 13134.6} {"step": 27627, "train_loss": 3.100928544998169, "lr": 4.844824783745128e-05, "tps": 137801, "wall": 13139.4} {"step": 27628, "train_loss": 3.115316152572632, "lr": 4.8442448440257084e-05, "tps": 137755, "wall": 13144.3} {"step": 27629, "train_loss": 3.114762544631958, "lr": 4.84366509864761e-05, "tps": 137709, "wall": 13149.2} {"step": 27630, "train_loss": 3.064394474029541, "lr": 4.843085547617401e-05, "tps": 137663, "wall": 13154.0} {"step": 27631, "train_loss": 3.1258347034454346, "lr": 4.8425061909416495e-05, "tps": 137618, "wall": 13158.8} {"step": 27632, "train_loss": 3.1073379516601562, "lr": 4.841927028626915e-05, "tps": 137572, "wall": 13163.6} {"step": 27633, "train_loss": 3.035679817199707, "lr": 4.841348060679758e-05, "tps": 137527, "wall": 13168.5} {"step": 27634, "train_loss": 3.0119457244873047, "lr": 4.8407692871067404e-05, "tps": 137481, "wall": 13173.3} {"step": 27635, "train_loss": 3.1202666759490967, "lr": 4.840190707914416e-05, "tps": 137436, "wall": 13178.1} {"step": 27636, "train_loss": 2.985283613204956, "lr": 4.839612323109338e-05, "tps": 137391, "wall": 13182.9} {"step": 27637, "train_loss": 3.1474289894104004, "lr": 4.839034132698061e-05, "tps": 137346, "wall": 13187.7} {"step": 27638, "train_loss": 3.0669708251953125, "lr": 4.838456136687136e-05, "tps": 137300, "wall": 13192.6} {"step": 27639, "train_loss": 3.2147297859191895, "lr": 4.837878335083104e-05, "tps": 137255, "wall": 13197.4} {"step": 27640, "train_loss": 2.9818243980407715, "lr": 4.837300727892518e-05, "tps": 137210, "wall": 13202.2} {"step": 27641, "train_loss": 3.1566505432128906, "lr": 4.8367233151219156e-05, "tps": 137164, "wall": 13207.1} {"step": 27642, "train_loss": 2.9776415824890137, "lr": 4.836146096777841e-05, "tps": 137119, "wall": 13211.9} {"step": 27643, "train_loss": 3.00038480758667, "lr": 4.835569072866835e-05, "tps": 137074, "wall": 13216.7} {"step": 27644, "train_loss": 3.0915932655334473, "lr": 4.834992243395427e-05, "tps": 137029, "wall": 13221.6} {"step": 27645, "train_loss": 3.0695388317108154, "lr": 4.834415608370155e-05, "tps": 136984, "wall": 13226.4} {"step": 27646, "train_loss": 3.0029706954956055, "lr": 4.8338391677975566e-05, "tps": 136939, "wall": 13231.2} {"step": 27647, "train_loss": 3.0661284923553467, "lr": 4.83326292168415e-05, "tps": 136894, "wall": 13236.0} {"step": 27648, "train_loss": 3.0257608890533447, "lr": 4.832686870036476e-05, "tps": 136849, "wall": 13240.9} {"step": 27649, "train_loss": 3.1084046363830566, "lr": 4.8321110128610516e-05, "tps": 136804, "wall": 13245.7} {"step": 27650, "train_loss": 3.0712811946868896, "lr": 4.8315353501644e-05, "tps": 136759, "wall": 13250.5} {"step": 27651, "train_loss": 3.2127881050109863, "lr": 4.830959881953048e-05, "tps": 136714, "wall": 13255.4} {"step": 27652, "train_loss": 3.037479877471924, "lr": 4.8303846082335115e-05, "tps": 136669, "wall": 13260.2} {"step": 27653, "train_loss": 2.9639194011688232, "lr": 4.8298095290123025e-05, "tps": 136624, "wall": 13265.1} {"step": 27654, "train_loss": 3.117032289505005, "lr": 4.8292346442959455e-05, "tps": 136579, "wall": 13269.9} {"step": 27655, "train_loss": 3.0372531414031982, "lr": 4.828659954090945e-05, "tps": 136535, "wall": 13274.7} {"step": 27656, "train_loss": 3.081364870071411, "lr": 4.828085458403813e-05, "tps": 136490, "wall": 13279.5} {"step": 27657, "train_loss": 3.0609617233276367, "lr": 4.827511157241059e-05, "tps": 136446, "wall": 13284.3} {"step": 27658, "train_loss": 3.1790802478790283, "lr": 4.8269370506091846e-05, "tps": 136401, "wall": 13289.1} {"step": 27659, "train_loss": 3.1037588119506836, "lr": 4.826363138514699e-05, "tps": 136357, "wall": 13294.0} {"step": 27660, "train_loss": 3.0498158931732178, "lr": 4.8257894209641015e-05, "tps": 136312, "wall": 13298.8} {"step": 27661, "train_loss": 3.1073057651519775, "lr": 4.8252158979638886e-05, "tps": 136268, "wall": 13303.6} {"step": 27662, "train_loss": 3.1105732917785645, "lr": 4.824642569520561e-05, "tps": 136223, "wall": 13308.4} {"step": 27663, "train_loss": 3.047891616821289, "lr": 4.8240694356406125e-05, "tps": 136178, "wall": 13313.3} {"step": 27664, "train_loss": 3.017833948135376, "lr": 4.823496496330531e-05, "tps": 136134, "wall": 13318.1} {"step": 27665, "train_loss": 3.067622423171997, "lr": 4.822923751596813e-05, "tps": 136090, "wall": 13322.9} {"step": 27666, "train_loss": 3.1092138290405273, "lr": 4.8223512014459424e-05, "tps": 136045, "wall": 13327.8} {"step": 27667, "train_loss": 3.1661229133605957, "lr": 4.821778845884407e-05, "tps": 136000, "wall": 13332.6} {"step": 27668, "train_loss": 3.108593702316284, "lr": 4.821206684918691e-05, "tps": 135956, "wall": 13337.5} {"step": 27669, "train_loss": 3.0217411518096924, "lr": 4.820634718555275e-05, "tps": 135912, "wall": 13342.3} {"step": 27670, "train_loss": 3.0710277557373047, "lr": 4.8200629468006384e-05, "tps": 135868, "wall": 13347.1} {"step": 27671, "train_loss": 3.192296028137207, "lr": 4.819491369661258e-05, "tps": 135823, "wall": 13352.0} {"step": 27672, "train_loss": 3.158569574356079, "lr": 4.8189199871436095e-05, "tps": 135779, "wall": 13356.8} {"step": 27673, "train_loss": 3.1791446208953857, "lr": 4.818348799254163e-05, "tps": 135735, "wall": 13361.6} {"step": 27674, "train_loss": 3.211604595184326, "lr": 4.8177778059993925e-05, "tps": 135691, "wall": 13366.4} {"step": 27675, "train_loss": 3.1264944076538086, "lr": 4.8172070073857624e-05, "tps": 135647, "wall": 13371.3} {"step": 27676, "train_loss": 3.047321081161499, "lr": 4.816636403419743e-05, "tps": 135603, "wall": 13376.1} {"step": 27677, "train_loss": 3.124629497528076, "lr": 4.8160659941077954e-05, "tps": 135559, "wall": 13380.9} {"step": 27678, "train_loss": 2.9916844367980957, "lr": 4.81549577945638e-05, "tps": 135514, "wall": 13385.8} {"step": 27679, "train_loss": 3.098557710647583, "lr": 4.814925759471961e-05, "tps": 135470, "wall": 13390.6} {"step": 27680, "train_loss": 3.1050868034362793, "lr": 4.8143559341609925e-05, "tps": 135426, "wall": 13395.5} {"step": 27681, "train_loss": 3.147677421569824, "lr": 4.813786303529928e-05, "tps": 135382, "wall": 13400.3} {"step": 27682, "train_loss": 3.0952882766723633, "lr": 4.813216867585223e-05, "tps": 135338, "wall": 13405.1} {"step": 27683, "train_loss": 3.1246862411499023, "lr": 4.8126476263333296e-05, "tps": 135295, "wall": 13409.9} {"step": 27684, "train_loss": 3.169931411743164, "lr": 4.812078579780689e-05, "tps": 135251, "wall": 13414.8} {"step": 27685, "train_loss": 3.077195644378662, "lr": 4.8115097279337535e-05, "tps": 135207, "wall": 13419.6} {"step": 27686, "train_loss": 3.0656967163085938, "lr": 4.810941070798969e-05, "tps": 135163, "wall": 13424.4} {"step": 27687, "train_loss": 3.0016727447509766, "lr": 4.8103726083827696e-05, "tps": 135119, "wall": 13429.3} {"step": 27688, "train_loss": 3.191079616546631, "lr": 4.8098043406916e-05, "tps": 135076, "wall": 13434.1} {"step": 27689, "train_loss": 3.1263794898986816, "lr": 4.8092362677318997e-05, "tps": 135032, "wall": 13438.9} {"step": 27690, "train_loss": 3.205441474914551, "lr": 4.808668389510097e-05, "tps": 134988, "wall": 13443.7} {"step": 27691, "train_loss": 3.156920909881592, "lr": 4.808100706032631e-05, "tps": 134944, "wall": 13448.6} {"step": 27692, "train_loss": 3.188196897506714, "lr": 4.8075332173059305e-05, "tps": 134901, "wall": 13453.5} {"step": 27693, "train_loss": 3.1719400882720947, "lr": 4.806965923336423e-05, "tps": 134857, "wall": 13458.3} {"step": 27694, "train_loss": 3.080932140350342, "lr": 4.8063988241305355e-05, "tps": 134814, "wall": 13463.1} {"step": 27695, "train_loss": 3.160892963409424, "lr": 4.805831919694693e-05, "tps": 134771, "wall": 13467.9} {"step": 27696, "train_loss": 3.1881608963012695, "lr": 4.8052652100353174e-05, "tps": 134727, "wall": 13472.7} {"step": 27697, "train_loss": 3.0313591957092285, "lr": 4.804698695158827e-05, "tps": 134684, "wall": 13477.6} {"step": 27698, "train_loss": 3.0906331539154053, "lr": 4.8041323750716383e-05, "tps": 134641, "wall": 13482.4} {"step": 27699, "train_loss": 3.1407370567321777, "lr": 4.8035662497801705e-05, "tps": 134597, "wall": 13487.2} {"step": 27700, "train_loss": 3.0995402336120605, "lr": 4.803000319290835e-05, "tps": 134554, "wall": 13492.0} {"step": 27701, "train_loss": 3.0464015007019043, "lr": 4.802434583610039e-05, "tps": 134511, "wall": 13496.9} {"step": 27702, "train_loss": 3.0815823078155518, "lr": 4.801869042744197e-05, "tps": 134468, "wall": 13501.7} {"step": 27703, "train_loss": 3.0805344581604004, "lr": 4.801303696699714e-05, "tps": 134424, "wall": 13506.6} {"step": 27704, "train_loss": 3.1253886222839355, "lr": 4.8007385454829895e-05, "tps": 134381, "wall": 13511.4} {"step": 27705, "train_loss": 3.123401641845703, "lr": 4.800173589100433e-05, "tps": 134338, "wall": 13516.2} {"step": 27706, "train_loss": 3.015596389770508, "lr": 4.799608827558439e-05, "tps": 134295, "wall": 13521.0} {"step": 27707, "train_loss": 3.1871495246887207, "lr": 4.7990442608634056e-05, "tps": 134252, "wall": 13525.8} {"step": 27708, "train_loss": 3.0742619037628174, "lr": 4.7984798890217306e-05, "tps": 134209, "wall": 13530.6} {"step": 27709, "train_loss": 3.08828067779541, "lr": 4.7979157120398075e-05, "tps": 134166, "wall": 13535.5} {"step": 27710, "train_loss": 3.0763139724731445, "lr": 4.7973517299240224e-05, "tps": 134123, "wall": 13540.3} {"step": 27711, "train_loss": 3.1418368816375732, "lr": 4.796787942680769e-05, "tps": 134080, "wall": 13545.1} {"step": 27712, "train_loss": 3.1404027938842773, "lr": 4.7962243503164314e-05, "tps": 134037, "wall": 13549.9} {"step": 27713, "train_loss": 3.0890142917633057, "lr": 4.795660952837398e-05, "tps": 133994, "wall": 13554.7} {"step": 27714, "train_loss": 3.1352791786193848, "lr": 4.795097750250047e-05, "tps": 133952, "wall": 13559.5} {"step": 27715, "train_loss": 3.017202377319336, "lr": 4.794534742560758e-05, "tps": 133908, "wall": 13564.5} {"step": 27716, "train_loss": 3.11029052734375, "lr": 4.7939719297759135e-05, "tps": 133865, "wall": 13569.3} {"step": 27717, "train_loss": 3.2173449993133545, "lr": 4.793409311901884e-05, "tps": 133822, "wall": 13574.1} {"step": 27718, "train_loss": 3.123781442642212, "lr": 4.792846888945041e-05, "tps": 133779, "wall": 13579.0} {"step": 27719, "train_loss": 3.0258126258850098, "lr": 4.7922846609117636e-05, "tps": 133737, "wall": 13583.8} {"step": 27720, "train_loss": 3.0934386253356934, "lr": 4.791722627808416e-05, "tps": 133694, "wall": 13588.6} {"step": 27721, "train_loss": 3.0088632106781006, "lr": 4.791160789641364e-05, "tps": 133652, "wall": 13593.4} {"step": 27722, "train_loss": 3.0829243659973145, "lr": 4.790599146416976e-05, "tps": 133609, "wall": 13598.2} {"step": 27723, "train_loss": 3.164088487625122, "lr": 4.790037698141611e-05, "tps": 133567, "wall": 13603.0} {"step": 27724, "train_loss": 3.1077356338500977, "lr": 4.789476444821627e-05, "tps": 133524, "wall": 13607.9} {"step": 27725, "train_loss": 3.1092939376831055, "lr": 4.7889153864633886e-05, "tps": 133481, "wall": 13612.8} {"step": 27726, "train_loss": 3.038266181945801, "lr": 4.788354523073247e-05, "tps": 133437, "wall": 13617.7} {"step": 27727, "train_loss": 3.090181350708008, "lr": 4.787793854657554e-05, "tps": 133394, "wall": 13622.6} {"step": 27728, "train_loss": 3.063037872314453, "lr": 4.787233381222666e-05, "tps": 133351, "wall": 13627.5} {"step": 27729, "train_loss": 3.016968250274658, "lr": 4.786673102774929e-05, "tps": 133309, "wall": 13632.3} {"step": 27730, "train_loss": 3.0742359161376953, "lr": 4.7861130193206884e-05, "tps": 133266, "wall": 13637.1} {"step": 27731, "train_loss": 3.140537738800049, "lr": 4.7855531308662934e-05, "tps": 133224, "wall": 13641.9} {"step": 27732, "train_loss": 3.13584303855896, "lr": 4.784993437418081e-05, "tps": 133182, "wall": 13646.8} {"step": 27733, "train_loss": 3.1496007442474365, "lr": 4.7844339389823975e-05, "tps": 133140, "wall": 13651.6} {"step": 27734, "train_loss": 3.095975399017334, "lr": 4.78387463556558e-05, "tps": 133098, "wall": 13656.4} {"step": 27735, "train_loss": 3.0869202613830566, "lr": 4.783315527173955e-05, "tps": 133056, "wall": 13661.2} {"step": 27736, "train_loss": 3.113246202468872, "lr": 4.782756613813867e-05, "tps": 133014, "wall": 13666.0} {"step": 27737, "train_loss": 3.0791614055633545, "lr": 4.7821978954916414e-05, "tps": 132971, "wall": 13670.9} {"step": 27738, "train_loss": 3.0209803581237793, "lr": 4.781639372213612e-05, "tps": 132929, "wall": 13675.7} {"step": 27739, "train_loss": 3.0088002681732178, "lr": 4.781081043986103e-05, "tps": 132888, "wall": 13680.5} {"step": 27740, "train_loss": 3.1196627616882324, "lr": 4.7805229108154385e-05, "tps": 132845, "wall": 13685.4} {"step": 27741, "train_loss": 3.19592547416687, "lr": 4.779964972707942e-05, "tps": 132803, "wall": 13690.2} {"step": 27742, "train_loss": 3.1414873600006104, "lr": 4.779407229669935e-05, "tps": 132761, "wall": 13695.0} {"step": 27743, "train_loss": 3.125875473022461, "lr": 4.778849681707732e-05, "tps": 132719, "wall": 13699.8} {"step": 27744, "train_loss": 3.140866756439209, "lr": 4.778292328827654e-05, "tps": 132677, "wall": 13704.7} {"step": 27745, "train_loss": 3.0450053215026855, "lr": 4.777735171036013e-05, "tps": 132635, "wall": 13709.5} {"step": 27746, "train_loss": 3.1419625282287598, "lr": 4.7771782083391166e-05, "tps": 132593, "wall": 13714.3} {"step": 27747, "train_loss": 3.0688912868499756, "lr": 4.776621440743279e-05, "tps": 132551, "wall": 13719.1} {"step": 27748, "train_loss": 3.0910277366638184, "lr": 4.776064868254806e-05, "tps": 132510, "wall": 13723.9} {"step": 27749, "train_loss": 3.043698787689209, "lr": 4.775508490879998e-05, "tps": 132468, "wall": 13728.7} {"step": 27750, "train_loss": 2.977970600128174, "lr": 4.774952308625166e-05, "tps": 132427, "wall": 13733.5} {"step": 27751, "train_loss": 3.078242778778076, "lr": 4.774396321496606e-05, "tps": 132385, "wall": 13738.4} {"step": 27752, "train_loss": 3.070648193359375, "lr": 4.7738405295006136e-05, "tps": 132343, "wall": 13743.2} {"step": 27753, "train_loss": 3.0785531997680664, "lr": 4.77328493264349e-05, "tps": 132297, "wall": 13748.4} {"step": 27754, "train_loss": 3.032216787338257, "lr": 4.772729530931524e-05, "tps": 132254, "wall": 13753.4} {"step": 27755, "train_loss": 3.114037036895752, "lr": 4.772174324371013e-05, "tps": 132212, "wall": 13758.2} {"step": 27756, "train_loss": 3.167375326156616, "lr": 4.771619312968242e-05, "tps": 132169, "wall": 13763.3} {"step": 27757, "train_loss": 3.036057233810425, "lr": 4.771064496729499e-05, "tps": 132124, "wall": 13768.4} {"step": 27758, "train_loss": 3.1594932079315186, "lr": 4.770509875661069e-05, "tps": 132083, "wall": 13773.2} {"step": 27759, "train_loss": 3.107020854949951, "lr": 4.769955449769238e-05, "tps": 132042, "wall": 13778.0} {"step": 27760, "train_loss": 3.038484573364258, "lr": 4.76940121906028e-05, "tps": 132000, "wall": 13782.8} {"step": 27761, "train_loss": 3.098707914352417, "lr": 4.7688471835404794e-05, "tps": 131959, "wall": 13787.6} {"step": 27762, "train_loss": 3.1202824115753174, "lr": 4.7682933432161096e-05, "tps": 131917, "wall": 13792.5} {"step": 27763, "train_loss": 2.970681667327881, "lr": 4.7677396980934444e-05, "tps": 131875, "wall": 13797.4} {"step": 27764, "train_loss": 3.089956283569336, "lr": 4.7671862481787586e-05, "tps": 131833, "wall": 13802.3} {"step": 27765, "train_loss": 3.123561382293701, "lr": 4.766632993478318e-05, "tps": 131791, "wall": 13807.3} {"step": 27766, "train_loss": 3.0932483673095703, "lr": 4.7660799339983894e-05, "tps": 131750, "wall": 13812.1} {"step": 27767, "train_loss": 3.1396212577819824, "lr": 4.7655270697452406e-05, "tps": 131708, "wall": 13816.9} {"step": 27768, "train_loss": 3.0944671630859375, "lr": 4.764974400725134e-05, "tps": 131666, "wall": 13821.8} {"step": 27769, "train_loss": 3.0893678665161133, "lr": 4.764421926944329e-05, "tps": 131625, "wall": 13826.6} {"step": 27770, "train_loss": 3.0388567447662354, "lr": 4.763869648409086e-05, "tps": 131584, "wall": 13831.4} {"step": 27771, "train_loss": 3.214250087738037, "lr": 4.763317565125661e-05, "tps": 131543, "wall": 13836.2} {"step": 27772, "train_loss": 3.022041082382202, "lr": 4.762765677100303e-05, "tps": 131502, "wall": 13841.0} {"step": 27773, "train_loss": 3.0191493034362793, "lr": 4.7622139843392724e-05, "tps": 131462, "wall": 13845.8} {"step": 27774, "train_loss": 3.051783561706543, "lr": 4.7616624868488115e-05, "tps": 131420, "wall": 13850.6} {"step": 27775, "train_loss": 3.0142953395843506, "lr": 4.761111184635171e-05, "tps": 131380, "wall": 13855.4} {"step": 27776, "train_loss": 3.030719041824341, "lr": 4.760560077704598e-05, "tps": 131338, "wall": 13860.3} {"step": 27777, "train_loss": 3.118584394454956, "lr": 4.760009166063329e-05, "tps": 131297, "wall": 13865.2} {"step": 27778, "train_loss": 3.0955355167388916, "lr": 4.7594584497176115e-05, "tps": 131256, "wall": 13870.0} {"step": 27779, "train_loss": 3.112806797027588, "lr": 4.758907928673682e-05, "tps": 131215, "wall": 13874.8} {"step": 27780, "train_loss": 3.0089070796966553, "lr": 4.758357602937774e-05, "tps": 131175, "wall": 13879.6} {"step": 27781, "train_loss": 3.130821466445923, "lr": 4.757807472516125e-05, "tps": 131134, "wall": 13884.4} {"step": 27782, "train_loss": 3.163789987564087, "lr": 4.7572575374149676e-05, "tps": 131093, "wall": 13889.2} {"step": 27783, "train_loss": 2.980487823486328, "lr": 4.756707797640525e-05, "tps": 131053, "wall": 13894.0} {"step": 27784, "train_loss": 3.140010356903076, "lr": 4.7561582531990345e-05, "tps": 131012, "wall": 13898.8} {"step": 27785, "train_loss": 3.1599783897399902, "lr": 4.755608904096714e-05, "tps": 130971, "wall": 13903.6} {"step": 27786, "train_loss": 3.221062183380127, "lr": 4.7550597503397864e-05, "tps": 130931, "wall": 13908.4} {"step": 27787, "train_loss": 3.053269863128662, "lr": 4.754510791934477e-05, "tps": 130890, "wall": 13913.3} {"step": 27788, "train_loss": 3.199838638305664, "lr": 4.753962028887004e-05, "tps": 130850, "wall": 13918.1} {"step": 27789, "train_loss": 3.1517457962036133, "lr": 4.753413461203578e-05, "tps": 130809, "wall": 13922.9} {"step": 27790, "train_loss": 3.004295825958252, "lr": 4.752865088890421e-05, "tps": 130768, "wall": 13927.8} {"step": 27791, "train_loss": 2.977642297744751, "lr": 4.7523169119537384e-05, "tps": 130728, "wall": 13932.6} {"step": 27792, "train_loss": 3.1552038192749023, "lr": 4.7517689303997445e-05, "tps": 130687, "wall": 13937.4} {"step": 27793, "train_loss": 3.1640830039978027, "lr": 4.751221144234647e-05, "tps": 130647, "wall": 13942.2} {"step": 27794, "train_loss": 3.1192965507507324, "lr": 4.750673553464647e-05, "tps": 130607, "wall": 13947.0} {"step": 27795, "train_loss": 3.0581464767456055, "lr": 4.7501261580959514e-05, "tps": 130566, "wall": 13951.8} {"step": 27796, "train_loss": 3.055039882659912, "lr": 4.749578958134761e-05, "tps": 130526, "wall": 13956.6} {"step": 27797, "train_loss": 3.036879539489746, "lr": 4.74903195358727e-05, "tps": 130486, "wall": 13961.4} {"step": 27798, "train_loss": 3.0338287353515625, "lr": 4.74848514445968e-05, "tps": 130445, "wall": 13966.2} {"step": 27799, "train_loss": 3.1017773151397705, "lr": 4.747938530758186e-05, "tps": 130405, "wall": 13971.0} {"step": 27800, "train_loss": 3.1113181114196777, "lr": 4.7473921124889726e-05, "tps": 130365, "wall": 13975.9} {"step": 27801, "train_loss": 3.0769782066345215, "lr": 4.746845889658238e-05, "tps": 130325, "wall": 13980.7} {"step": 27802, "train_loss": 3.052591323852539, "lr": 4.746299862272168e-05, "tps": 130284, "wall": 13985.5} {"step": 27803, "train_loss": 3.0134196281433105, "lr": 4.745754030336942e-05, "tps": 130244, "wall": 13990.4} {"step": 27804, "train_loss": 3.0744705200195312, "lr": 4.745208393858752e-05, "tps": 130203, "wall": 13995.2} {"step": 27805, "train_loss": 3.186582565307617, "lr": 4.744662952843774e-05, "tps": 130163, "wall": 14000.0} {"step": 27806, "train_loss": 2.9841437339782715, "lr": 4.744117707298185e-05, "tps": 130123, "wall": 14004.8} {"step": 27807, "train_loss": 3.1419191360473633, "lr": 4.743572657228167e-05, "tps": 130083, "wall": 14009.7} {"step": 27808, "train_loss": 2.9711782932281494, "lr": 4.7430278026398885e-05, "tps": 130043, "wall": 14014.5} {"step": 27809, "train_loss": 3.135859489440918, "lr": 4.7424831435395276e-05, "tps": 130003, "wall": 14019.3} {"step": 27810, "train_loss": 3.1162052154541016, "lr": 4.741938679933251e-05, "tps": 129963, "wall": 14024.1} {"step": 27811, "train_loss": 3.07291579246521, "lr": 4.7413944118272244e-05, "tps": 129923, "wall": 14028.9} {"step": 27812, "train_loss": 3.0880379676818848, "lr": 4.740850339227618e-05, "tps": 129883, "wall": 14033.7} {"step": 27813, "train_loss": 3.170614242553711, "lr": 4.740306462140593e-05, "tps": 129843, "wall": 14038.6} {"step": 27814, "train_loss": 3.2201991081237793, "lr": 4.739762780572307e-05, "tps": 129800, "wall": 14043.7} {"step": 27815, "train_loss": 3.0001204013824463, "lr": 4.739219294528924e-05, "tps": 129757, "wall": 14048.9} {"step": 27816, "train_loss": 3.1353540420532227, "lr": 4.738676004016599e-05, "tps": 129716, "wall": 14053.8} {"step": 27817, "train_loss": 3.054466962814331, "lr": 4.738132909041484e-05, "tps": 129676, "wall": 14058.7} {"step": 27818, "train_loss": 3.121870517730713, "lr": 4.737590009609735e-05, "tps": 129637, "wall": 14063.5} {"step": 27819, "train_loss": 3.1039557456970215, "lr": 4.7370473057275015e-05, "tps": 129597, "wall": 14068.3} {"step": 27820, "train_loss": 3.0965042114257812, "lr": 4.736504797400928e-05, "tps": 129556, "wall": 14073.2} {"step": 27821, "train_loss": 3.2059831619262695, "lr": 4.735962484636163e-05, "tps": 129516, "wall": 14078.0} {"step": 27822, "train_loss": 3.124542236328125, "lr": 4.7354203674393494e-05, "tps": 129476, "wall": 14083.0} {"step": 27823, "train_loss": 3.1319401264190674, "lr": 4.7348784458166246e-05, "tps": 129436, "wall": 14087.8} {"step": 27824, "train_loss": 3.049974203109741, "lr": 4.734336719774134e-05, "tps": 129394, "wall": 14092.9} {"step": 27825, "train_loss": 3.016770601272583, "lr": 4.733795189318011e-05, "tps": 129350, "wall": 14098.1} {"step": 27826, "train_loss": 3.101174831390381, "lr": 4.7332538544543874e-05, "tps": 129307, "wall": 14103.4} {"step": 27827, "train_loss": 3.1010117530822754, "lr": 4.732712715189402e-05, "tps": 129266, "wall": 14108.3} {"step": 27828, "train_loss": 3.0665807723999023, "lr": 4.732171771529178e-05, "tps": 129225, "wall": 14113.3} {"step": 27829, "train_loss": 3.1581411361694336, "lr": 4.731631023479848e-05, "tps": 129186, "wall": 14118.1} {"step": 27830, "train_loss": 3.098142147064209, "lr": 4.7310904710475365e-05, "tps": 129146, "wall": 14122.9} {"step": 27831, "train_loss": 3.1124768257141113, "lr": 4.730550114238365e-05, "tps": 129107, "wall": 14127.8} {"step": 27832, "train_loss": 3.1322975158691406, "lr": 4.730009953058458e-05, "tps": 129067, "wall": 14132.7} {"step": 27833, "train_loss": 3.0213537216186523, "lr": 4.7294699875139307e-05, "tps": 129027, "wall": 14137.5} {"step": 27834, "train_loss": 3.119629383087158, "lr": 4.7289302176109005e-05, "tps": 128988, "wall": 14142.3} {"step": 27835, "train_loss": 3.1669487953186035, "lr": 4.728390643355487e-05, "tps": 128948, "wall": 14147.2} {"step": 27836, "train_loss": 3.2042181491851807, "lr": 4.727851264753798e-05, "tps": 128909, "wall": 14152.0} {"step": 27837, "train_loss": 3.0913310050964355, "lr": 4.72731208181194e-05, "tps": 128870, "wall": 14156.8} {"step": 27838, "train_loss": 3.09567928314209, "lr": 4.726773094536029e-05, "tps": 128830, "wall": 14161.7} {"step": 27839, "train_loss": 3.1208295822143555, "lr": 4.7262343029321666e-05, "tps": 128789, "wall": 14166.7} {"step": 27840, "train_loss": 3.105226993560791, "lr": 4.7256957070064554e-05, "tps": 128748, "wall": 14171.7} {"step": 27841, "train_loss": 3.069403886795044, "lr": 4.725157306764998e-05, "tps": 128708, "wall": 14176.6} {"step": 27842, "train_loss": 3.257178783416748, "lr": 4.7246191022138945e-05, "tps": 128669, "wall": 14181.4} {"step": 27843, "train_loss": 3.037604331970215, "lr": 4.724081093359237e-05, "tps": 128630, "wall": 14186.3} {"step": 27844, "train_loss": 3.0899128913879395, "lr": 4.723543280207126e-05, "tps": 128591, "wall": 14191.1} {"step": 27845, "train_loss": 3.058458089828491, "lr": 4.723005662763651e-05, "tps": 128552, "wall": 14195.9} {"step": 27846, "train_loss": 3.119187116622925, "lr": 4.7224682410349034e-05, "tps": 128512, "wall": 14200.8} {"step": 27847, "train_loss": 3.105614185333252, "lr": 4.72193101502697e-05, "tps": 128473, "wall": 14205.6} {"step": 27848, "train_loss": 3.091454267501831, "lr": 4.7213939847459356e-05, "tps": 128434, "wall": 14210.4} {"step": 27849, "train_loss": 3.1221048831939697, "lr": 4.7208571501978844e-05, "tps": 128395, "wall": 14215.2} {"step": 27850, "train_loss": 3.0697507858276367, "lr": 4.7203205113889003e-05, "tps": 128356, "wall": 14220.1} {"step": 27851, "train_loss": 3.092933416366577, "lr": 4.719784068325058e-05, "tps": 128317, "wall": 14225.0} {"step": 27852, "train_loss": 3.094142198562622, "lr": 4.71924782101244e-05, "tps": 128278, "wall": 14229.8} {"step": 27853, "train_loss": 3.0974485874176025, "lr": 4.718711769457115e-05, "tps": 128239, "wall": 14234.6} {"step": 27854, "train_loss": 3.0931670665740967, "lr": 4.7181759136651565e-05, "tps": 128201, "wall": 14239.4} {"step": 27855, "train_loss": 3.064055919647217, "lr": 4.717640253642641e-05, "tps": 128162, "wall": 14244.2} {"step": 27856, "train_loss": 3.0872437953948975, "lr": 4.7171047893956284e-05, "tps": 128123, "wall": 14249.0} {"step": 27857, "train_loss": 3.084419012069702, "lr": 4.716569520930187e-05, "tps": 128084, "wall": 14253.8} {"step": 27858, "train_loss": 3.0569100379943848, "lr": 4.7160344482523835e-05, "tps": 128046, "wall": 14258.6} {"step": 27859, "train_loss": 3.076760768890381, "lr": 4.715499571368275e-05, "tps": 128007, "wall": 14263.5} {"step": 27860, "train_loss": 3.0573291778564453, "lr": 4.7149648902839216e-05, "tps": 127968, "wall": 14268.3} {"step": 27861, "train_loss": 3.141068458557129, "lr": 4.714430405005384e-05, "tps": 127927, "wall": 14273.5} {"step": 27862, "train_loss": 3.1605048179626465, "lr": 4.713896115538711e-05, "tps": 127887, "wall": 14278.4} {"step": 27863, "train_loss": 2.988943576812744, "lr": 4.7133620218899585e-05, "tps": 127848, "wall": 14283.2} {"step": 27864, "train_loss": 3.106208562850952, "lr": 4.7128281240651786e-05, "tps": 127809, "wall": 14288.1} {"step": 27865, "train_loss": 3.071091890335083, "lr": 4.712294422070415e-05, "tps": 127770, "wall": 14293.0} {"step": 27866, "train_loss": 3.079545259475708, "lr": 4.7117609159117154e-05, "tps": 127732, "wall": 14297.8} {"step": 27867, "train_loss": 3.133599042892456, "lr": 4.711227605595123e-05, "tps": 127693, "wall": 14302.6} {"step": 27868, "train_loss": 3.1694231033325195, "lr": 4.7106944911266805e-05, "tps": 127655, "wall": 14307.5} {"step": 27869, "train_loss": 3.034963607788086, "lr": 4.710161572512427e-05, "tps": 127616, "wall": 14312.3} {"step": 27870, "train_loss": 3.0617787837982178, "lr": 4.7096288497583974e-05, "tps": 127578, "wall": 14317.1} {"step": 27871, "train_loss": 3.0731446743011475, "lr": 4.709096322870627e-05, "tps": 127539, "wall": 14321.9} {"step": 27872, "train_loss": 3.1786837577819824, "lr": 4.7085639918551505e-05, "tps": 127501, "wall": 14326.8} {"step": 27873, "train_loss": 3.0540807247161865, "lr": 4.708031856717996e-05, "tps": 127462, "wall": 14331.6} {"step": 27874, "train_loss": 3.1139631271362305, "lr": 4.70749991746519e-05, "tps": 127424, "wall": 14336.4} {"step": 27875, "train_loss": 3.087224006652832, "lr": 4.706968174102762e-05, "tps": 127386, "wall": 14341.3} {"step": 27876, "train_loss": 3.049848794937134, "lr": 4.7064366266367355e-05, "tps": 127347, "wall": 14346.2} {"step": 27877, "train_loss": 3.0310206413269043, "lr": 4.705905275073129e-05, "tps": 127309, "wall": 14351.0} {"step": 27878, "train_loss": 3.110154151916504, "lr": 4.705374119417964e-05, "tps": 127271, "wall": 14355.8} {"step": 27879, "train_loss": 3.1896262168884277, "lr": 4.7048431596772557e-05, "tps": 127232, "wall": 14360.6} {"step": 27880, "train_loss": 3.0506129264831543, "lr": 4.704312395857019e-05, "tps": 127194, "wall": 14365.5} {"step": 27881, "train_loss": 3.079317331314087, "lr": 4.7037818279632696e-05, "tps": 127156, "wall": 14370.3} {"step": 27882, "train_loss": 3.250436782836914, "lr": 4.703251456002012e-05, "tps": 127118, "wall": 14375.1} {"step": 27883, "train_loss": 3.140054702758789, "lr": 4.70272127997926e-05, "tps": 127080, "wall": 14379.9} {"step": 27884, "train_loss": 3.129159927368164, "lr": 4.702191299901017e-05, "tps": 127042, "wall": 14384.8} {"step": 27885, "train_loss": 3.1099705696105957, "lr": 4.701661515773286e-05, "tps": 127003, "wall": 14389.6} {"step": 27886, "train_loss": 3.0805187225341797, "lr": 4.7011319276020696e-05, "tps": 126965, "wall": 14394.4} {"step": 27887, "train_loss": 3.091485023498535, "lr": 4.700602535393367e-05, "tps": 126927, "wall": 14399.3} {"step": 27888, "train_loss": 3.115610122680664, "lr": 4.7000733391531726e-05, "tps": 126889, "wall": 14404.1} {"step": 27889, "train_loss": 3.1396541595458984, "lr": 4.699544338887486e-05, "tps": 126851, "wall": 14409.0} {"step": 27890, "train_loss": 3.035274028778076, "lr": 4.699015534602298e-05, "tps": 126813, "wall": 14413.8} {"step": 27891, "train_loss": 3.0714449882507324, "lr": 4.6984869263035944e-05, "tps": 126775, "wall": 14418.6} {"step": 27892, "train_loss": 3.168952226638794, "lr": 4.69795851399737e-05, "tps": 126737, "wall": 14423.5} {"step": 27893, "train_loss": 3.1463305950164795, "lr": 4.697430297689606e-05, "tps": 126699, "wall": 14428.3} {"step": 27894, "train_loss": 3.125758647918701, "lr": 4.696902277386287e-05, "tps": 126661, "wall": 14433.1} {"step": 27895, "train_loss": 2.9939987659454346, "lr": 4.696374453093396e-05, "tps": 126623, "wall": 14438.0} {"step": 27896, "train_loss": 3.0657219886779785, "lr": 4.695846824816913e-05, "tps": 126586, "wall": 14442.8} {"step": 27897, "train_loss": 3.1111772060394287, "lr": 4.695319392562809e-05, "tps": 126548, "wall": 14447.6} {"step": 27898, "train_loss": 3.153154134750366, "lr": 4.694792156337067e-05, "tps": 126510, "wall": 14452.4} {"step": 27899, "train_loss": 3.0659775733947754, "lr": 4.6942651161456514e-05, "tps": 126472, "wall": 14457.3} {"step": 27900, "train_loss": 3.169829845428467, "lr": 4.69373827199454e-05, "tps": 126435, "wall": 14462.1} {"step": 27901, "train_loss": 3.1066300868988037, "lr": 4.6932116238897e-05, "tps": 126397, "wall": 14467.0} {"step": 27902, "train_loss": 3.1287994384765625, "lr": 4.6926851718370905e-05, "tps": 126359, "wall": 14471.8} {"step": 27903, "train_loss": 3.0954408645629883, "lr": 4.692158915842685e-05, "tps": 126321, "wall": 14476.7} {"step": 27904, "train_loss": 3.1388890743255615, "lr": 4.6916328559124355e-05, "tps": 126283, "wall": 14481.5} {"step": 27905, "train_loss": 3.0745484828948975, "lr": 4.691106992052305e-05, "tps": 126246, "wall": 14486.3} {"step": 27906, "train_loss": 3.0510363578796387, "lr": 4.690581324268253e-05, "tps": 126208, "wall": 14491.2} {"step": 27907, "train_loss": 3.126854181289673, "lr": 4.6900558525662306e-05, "tps": 126171, "wall": 14496.0} {"step": 27908, "train_loss": 3.08787202835083, "lr": 4.6895305769521916e-05, "tps": 126133, "wall": 14500.8} {"step": 27909, "train_loss": 2.986281156539917, "lr": 4.68900549743209e-05, "tps": 126096, "wall": 14505.7} {"step": 27910, "train_loss": 3.1890981197357178, "lr": 4.688480614011866e-05, "tps": 126058, "wall": 14510.5} {"step": 27911, "train_loss": 3.0213565826416016, "lr": 4.6879559266974714e-05, "tps": 126021, "wall": 14515.3} {"step": 27912, "train_loss": 3.0650150775909424, "lr": 4.6874314354948524e-05, "tps": 125983, "wall": 14520.2} {"step": 27913, "train_loss": 3.2626781463623047, "lr": 4.686907140409941e-05, "tps": 125945, "wall": 14525.1} {"step": 27914, "train_loss": 3.062002182006836, "lr": 4.686383041448685e-05, "tps": 125908, "wall": 14529.9} {"step": 27915, "train_loss": 3.0355923175811768, "lr": 4.68585913861702e-05, "tps": 125871, "wall": 14534.7} {"step": 27916, "train_loss": 3.056337594985962, "lr": 4.685335431920877e-05, "tps": 125834, "wall": 14539.5} {"step": 27917, "train_loss": 3.142062187194824, "lr": 4.684811921366192e-05, "tps": 125796, "wall": 14544.4} {"step": 27918, "train_loss": 3.0959067344665527, "lr": 4.684288606958897e-05, "tps": 125759, "wall": 14549.2} {"step": 27919, "train_loss": 3.0299980640411377, "lr": 4.683765488704912e-05, "tps": 125722, "wall": 14554.0} {"step": 27920, "train_loss": 3.0569915771484375, "lr": 4.6832425666101706e-05, "tps": 125684, "wall": 14558.9} {"step": 27921, "train_loss": 3.002448558807373, "lr": 4.682719840680597e-05, "tps": 125647, "wall": 14563.7} {"step": 27922, "train_loss": 3.189943790435791, "lr": 4.682197310922105e-05, "tps": 125610, "wall": 14568.6} {"step": 27923, "train_loss": 3.1016435623168945, "lr": 4.681674977340622e-05, "tps": 125573, "wall": 14573.4} {"step": 27924, "train_loss": 3.1381821632385254, "lr": 4.68115283994206e-05, "tps": 125536, "wall": 14578.2} {"step": 27925, "train_loss": 2.9939475059509277, "lr": 4.680630898732338e-05, "tps": 125499, "wall": 14583.0} {"step": 27926, "train_loss": 3.148752212524414, "lr": 4.6801091537173635e-05, "tps": 125461, "wall": 14588.0} {"step": 27927, "train_loss": 3.108558177947998, "lr": 4.679587604903049e-05, "tps": 125424, "wall": 14592.8} {"step": 27928, "train_loss": 3.094238758087158, "lr": 4.679066252295306e-05, "tps": 125387, "wall": 14597.6} {"step": 27929, "train_loss": 3.187401294708252, "lr": 4.6785450959000374e-05, "tps": 125350, "wall": 14602.5} {"step": 27930, "train_loss": 3.1243133544921875, "lr": 4.678024135723144e-05, "tps": 125313, "wall": 14607.3} {"step": 27931, "train_loss": 3.114902973175049, "lr": 4.677503371770533e-05, "tps": 125276, "wall": 14612.1} {"step": 27932, "train_loss": 3.08842396736145, "lr": 4.676982804048101e-05, "tps": 125239, "wall": 14616.9} {"step": 27933, "train_loss": 3.1283211708068848, "lr": 4.676462432561744e-05, "tps": 125202, "wall": 14621.8} {"step": 27934, "train_loss": 3.1110754013061523, "lr": 4.6759422573173574e-05, "tps": 125165, "wall": 14626.6} {"step": 27935, "train_loss": 2.999429702758789, "lr": 4.6754222783208344e-05, "tps": 125128, "wall": 14631.5} {"step": 27936, "train_loss": 3.052527666091919, "lr": 4.6749024955780656e-05, "tps": 125091, "wall": 14636.3} {"step": 27937, "train_loss": 3.0801312923431396, "lr": 4.674382909094939e-05, "tps": 125054, "wall": 14641.2} {"step": 27938, "train_loss": 3.079962730407715, "lr": 4.67386351887734e-05, "tps": 125016, "wall": 14646.1} {"step": 27939, "train_loss": 3.075972557067871, "lr": 4.67334432493115e-05, "tps": 124979, "wall": 14651.0} {"step": 27940, "train_loss": 3.1358518600463867, "lr": 4.672825327262255e-05, "tps": 124943, "wall": 14655.8} {"step": 27941, "train_loss": 3.0879111289978027, "lr": 4.67230652587653e-05, "tps": 124906, "wall": 14660.6} {"step": 27942, "train_loss": 3.082420825958252, "lr": 4.671787920779857e-05, "tps": 124869, "wall": 14665.5} {"step": 27943, "train_loss": 3.057359218597412, "lr": 4.671269511978107e-05, "tps": 124833, "wall": 14670.3} {"step": 27944, "train_loss": 3.1277239322662354, "lr": 4.670751299477152e-05, "tps": 124796, "wall": 14675.1} {"step": 27945, "train_loss": 3.06563663482666, "lr": 4.670233283282867e-05, "tps": 124760, "wall": 14679.9} {"step": 27946, "train_loss": 3.163301944732666, "lr": 4.669715463401113e-05, "tps": 124723, "wall": 14684.7} {"step": 27947, "train_loss": 3.0961177349090576, "lr": 4.669197839837761e-05, "tps": 124687, "wall": 14689.6} {"step": 27948, "train_loss": 3.022038459777832, "lr": 4.668680412598674e-05, "tps": 124650, "wall": 14694.4} {"step": 27949, "train_loss": 3.104402780532837, "lr": 4.668163181689715e-05, "tps": 124613, "wall": 14699.3} {"step": 27950, "train_loss": 3.1021885871887207, "lr": 4.6676461471167375e-05, "tps": 124577, "wall": 14704.1} {"step": 27951, "train_loss": 3.0660767555236816, "lr": 4.667129308885603e-05, "tps": 124539, "wall": 14709.0} {"step": 27952, "train_loss": 3.1162796020507812, "lr": 4.6666126670021684e-05, "tps": 124503, "wall": 14713.9} {"step": 27953, "train_loss": 3.1179211139678955, "lr": 4.666096221472279e-05, "tps": 124466, "wall": 14718.7} {"step": 27954, "train_loss": 3.125434637069702, "lr": 4.6655799723017903e-05, "tps": 124430, "wall": 14723.5} {"step": 27955, "train_loss": 3.042226791381836, "lr": 4.665063919496552e-05, "tps": 124394, "wall": 14728.4} {"step": 27956, "train_loss": 3.0780978202819824, "lr": 4.664548063062405e-05, "tps": 124358, "wall": 14733.2} {"step": 27957, "train_loss": 3.04491925239563, "lr": 4.664032403005197e-05, "tps": 124321, "wall": 14738.0} {"step": 27958, "train_loss": 3.080906867980957, "lr": 4.6635169393307666e-05, "tps": 124285, "wall": 14742.8} {"step": 27959, "train_loss": 3.1580052375793457, "lr": 4.6630016720449534e-05, "tps": 124249, "wall": 14747.6} {"step": 27960, "train_loss": 3.119518280029297, "lr": 4.662486601153598e-05, "tps": 124213, "wall": 14752.5} {"step": 27961, "train_loss": 3.214604377746582, "lr": 4.6619717266625274e-05, "tps": 124177, "wall": 14757.3} {"step": 27962, "train_loss": 3.093208074569702, "lr": 4.6614570485775825e-05, "tps": 124140, "wall": 14762.1} {"step": 27963, "train_loss": 3.048215389251709, "lr": 4.660942566904591e-05, "tps": 124104, "wall": 14767.0} {"step": 27964, "train_loss": 3.1312692165374756, "lr": 4.6604282816493785e-05, "tps": 124068, "wall": 14771.8} {"step": 27965, "train_loss": 3.1106038093566895, "lr": 4.659914192817774e-05, "tps": 124032, "wall": 14776.6} {"step": 27966, "train_loss": 3.0813040733337402, "lr": 4.659400300415599e-05, "tps": 123996, "wall": 14781.4} {"step": 27967, "train_loss": 3.0554912090301514, "lr": 4.6588866044486744e-05, "tps": 123960, "wall": 14786.2} {"step": 27968, "train_loss": 3.0939197540283203, "lr": 4.658373104922822e-05, "tps": 123924, "wall": 14791.0} {"step": 27969, "train_loss": 3.0184597969055176, "lr": 4.657859801843856e-05, "tps": 123888, "wall": 14795.9} {"step": 27970, "train_loss": 3.098682403564453, "lr": 4.6573466952175903e-05, "tps": 123852, "wall": 14800.7} {"step": 27971, "train_loss": 3.0970420837402344, "lr": 4.6568337850498444e-05, "tps": 123816, "wall": 14805.5} {"step": 27972, "train_loss": 3.2425131797790527, "lr": 4.656321071346421e-05, "tps": 123781, "wall": 14810.3} {"step": 27973, "train_loss": 2.9718453884124756, "lr": 4.6558085541131304e-05, "tps": 123745, "wall": 14815.1} {"step": 27974, "train_loss": 3.0886917114257812, "lr": 4.65529623335578e-05, "tps": 123709, "wall": 14819.9} {"step": 27975, "train_loss": 3.226992607116699, "lr": 4.6547841090801716e-05, "tps": 123673, "wall": 14824.8} {"step": 27976, "train_loss": 3.0600247383117676, "lr": 4.6542721812921055e-05, "tps": 123637, "wall": 14829.6} {"step": 27977, "train_loss": 3.126763105392456, "lr": 4.6537604499973866e-05, "tps": 123601, "wall": 14834.5} {"step": 27978, "train_loss": 3.0343496799468994, "lr": 4.6532489152018025e-05, "tps": 123565, "wall": 14839.4} {"step": 27979, "train_loss": 3.012822389602661, "lr": 4.6527375769111563e-05, "tps": 123529, "wall": 14844.2} {"step": 27980, "train_loss": 3.104599952697754, "lr": 4.6522264351312385e-05, "tps": 123493, "wall": 14849.0} {"step": 27981, "train_loss": 3.1591153144836426, "lr": 4.651715489867834e-05, "tps": 123457, "wall": 14853.9} {"step": 27982, "train_loss": 3.1575682163238525, "lr": 4.651204741126739e-05, "tps": 123422, "wall": 14858.7} {"step": 27983, "train_loss": 3.081528663635254, "lr": 4.650694188913735e-05, "tps": 123386, "wall": 14863.5} {"step": 27984, "train_loss": 3.0856680870056152, "lr": 4.6501838332346035e-05, "tps": 123351, "wall": 14868.3} {"step": 27985, "train_loss": 3.066112995147705, "lr": 4.649673674095128e-05, "tps": 123315, "wall": 14873.1} {"step": 27986, "train_loss": 3.200338363647461, "lr": 4.649163711501091e-05, "tps": 123279, "wall": 14878.0} {"step": 27987, "train_loss": 3.0996294021606445, "lr": 4.6486539454582636e-05, "tps": 123243, "wall": 14882.9} {"step": 27988, "train_loss": 3.1133830547332764, "lr": 4.648144375972422e-05, "tps": 123207, "wall": 14887.8} {"step": 27989, "train_loss": 3.100950241088867, "lr": 4.6476350030493434e-05, "tps": 123170, "wall": 14892.7} {"step": 27990, "train_loss": 3.073698043823242, "lr": 4.64712582669479e-05, "tps": 123134, "wall": 14897.7} {"step": 27991, "train_loss": 3.1297173500061035, "lr": 4.646616846914537e-05, "tps": 123099, "wall": 14902.5} {"step": 27992, "train_loss": 3.1738715171813965, "lr": 4.646108063714347e-05, "tps": 123062, "wall": 14907.4} {"step": 27993, "train_loss": 3.145638942718506, "lr": 4.645599477099982e-05, "tps": 123026, "wall": 14912.3} {"step": 27994, "train_loss": 3.0491294860839844, "lr": 4.645091087077206e-05, "tps": 122990, "wall": 14917.2} {"step": 27995, "train_loss": 3.080564022064209, "lr": 4.644582893651775e-05, "tps": 122954, "wall": 14922.1} {"step": 27996, "train_loss": 3.0347886085510254, "lr": 4.644074896829451e-05, "tps": 122918, "wall": 14927.1} {"step": 27997, "train_loss": 3.0163145065307617, "lr": 4.643567096615985e-05, "tps": 122881, "wall": 14932.0} {"step": 27998, "train_loss": 3.0163612365722656, "lr": 4.643059493017127e-05, "tps": 122845, "wall": 14937.0} {"step": 27999, "train_loss": 3.0979199409484863, "lr": 4.6425520860386326e-05, "tps": 122809, "wall": 14941.9} {"step": 28000, "train_loss": 3.142759084701538, "lr": 4.642044875686249e-05, "tps": 122772, "wall": 14946.9, "val_loss_monitor": 3.3246549134854773} {"step": 28001, "train_loss": 3.178520917892456, "lr": 4.6415378619657154e-05, "tps": 122349, "wall": 14999.2} {"step": 28002, "train_loss": 3.1496779918670654, "lr": 4.6410310448827837e-05, "tps": 122310, "wall": 15004.4} {"step": 28003, "train_loss": 3.0828542709350586, "lr": 4.64052442444319e-05, "tps": 122274, "wall": 15009.4} {"step": 28004, "train_loss": 2.998363733291626, "lr": 4.640018000652675e-05, "tps": 122238, "wall": 15014.4} {"step": 28005, "train_loss": 3.115877866744995, "lr": 4.639511773516974e-05, "tps": 122202, "wall": 15019.3} {"step": 28006, "train_loss": 3.1173510551452637, "lr": 4.639005743041826e-05, "tps": 122165, "wall": 15024.4} {"step": 28007, "train_loss": 3.2038726806640625, "lr": 4.638499909232957e-05, "tps": 122129, "wall": 15029.4} {"step": 28008, "train_loss": 3.0616488456726074, "lr": 4.6379942720961025e-05, "tps": 122093, "wall": 15034.4} {"step": 28009, "train_loss": 3.2187626361846924, "lr": 4.637488831636988e-05, "tps": 122057, "wall": 15039.3} {"step": 28010, "train_loss": 3.119476318359375, "lr": 4.6369835878613365e-05, "tps": 122021, "wall": 15044.3} {"step": 28011, "train_loss": 3.0981760025024414, "lr": 4.6364785407748765e-05, "tps": 121985, "wall": 15049.3} {"step": 28012, "train_loss": 3.086792469024658, "lr": 4.635973690383327e-05, "tps": 121949, "wall": 15054.2} {"step": 28013, "train_loss": 3.1590771675109863, "lr": 4.635469036692405e-05, "tps": 121914, "wall": 15059.1} {"step": 28014, "train_loss": 3.1115760803222656, "lr": 4.634964579707832e-05, "tps": 121879, "wall": 15064.0} {"step": 28015, "train_loss": 3.134707450866699, "lr": 4.6344603194353165e-05, "tps": 121844, "wall": 15068.9} {"step": 28016, "train_loss": 3.1142578125, "lr": 4.6339562558805764e-05, "tps": 121809, "wall": 15073.7} {"step": 28017, "train_loss": 3.1796860694885254, "lr": 4.6334523890493196e-05, "tps": 121774, "wall": 15078.6} {"step": 28018, "train_loss": 3.19828724861145, "lr": 4.6329487189472504e-05, "tps": 121738, "wall": 15083.5} {"step": 28019, "train_loss": 3.1512882709503174, "lr": 4.632445245580082e-05, "tps": 121703, "wall": 15088.5} {"step": 28020, "train_loss": 3.1302337646484375, "lr": 4.631941968953512e-05, "tps": 121668, "wall": 15093.4} {"step": 28021, "train_loss": 3.258742094039917, "lr": 4.63143888907324e-05, "tps": 121632, "wall": 15098.4} {"step": 28022, "train_loss": 3.242755889892578, "lr": 4.6309360059449724e-05, "tps": 121597, "wall": 15103.3} {"step": 28023, "train_loss": 3.1213912963867188, "lr": 4.6304333195743995e-05, "tps": 121561, "wall": 15108.2} {"step": 28024, "train_loss": 3.1771955490112305, "lr": 4.629930829967215e-05, "tps": 121526, "wall": 15113.2} {"step": 28025, "train_loss": 3.134366035461426, "lr": 4.629428537129117e-05, "tps": 121491, "wall": 15118.0} {"step": 28026, "train_loss": 3.148197650909424, "lr": 4.628926441065793e-05, "tps": 121456, "wall": 15122.9} {"step": 28027, "train_loss": 3.17425537109375, "lr": 4.628424541782927e-05, "tps": 121421, "wall": 15127.8} {"step": 28028, "train_loss": 3.1301820278167725, "lr": 4.627922839286209e-05, "tps": 121386, "wall": 15132.7} {"step": 28029, "train_loss": 3.013094186782837, "lr": 4.627421333581323e-05, "tps": 121352, "wall": 15137.5} {"step": 28030, "train_loss": 3.0758297443389893, "lr": 4.626920024673944e-05, "tps": 121318, "wall": 15142.3} {"step": 28031, "train_loss": 3.155254602432251, "lr": 4.6264189125697575e-05, "tps": 121283, "wall": 15147.2} {"step": 28032, "train_loss": 3.1361517906188965, "lr": 4.625917997274435e-05, "tps": 121249, "wall": 15152.0} {"step": 28033, "train_loss": 3.137416362762451, "lr": 4.625417278793657e-05, "tps": 121215, "wall": 15156.8} {"step": 28034, "train_loss": 3.2622251510620117, "lr": 4.6249167571330886e-05, "tps": 121181, "wall": 15161.6} {"step": 28035, "train_loss": 3.187171459197998, "lr": 4.624416432298404e-05, "tps": 121146, "wall": 15166.4} {"step": 28036, "train_loss": 3.130145311355591, "lr": 4.623916304295271e-05, "tps": 121112, "wall": 15171.2} {"step": 28037, "train_loss": 3.12630558013916, "lr": 4.623416373129356e-05, "tps": 121078, "wall": 15176.1} {"step": 28038, "train_loss": 3.1476051807403564, "lr": 4.622916638806315e-05, "tps": 121044, "wall": 15180.9} {"step": 28039, "train_loss": 3.121342420578003, "lr": 4.6224171013318195e-05, "tps": 121009, "wall": 15185.8} {"step": 28040, "train_loss": 3.2265799045562744, "lr": 4.621917760711522e-05, "tps": 120975, "wall": 15190.6} {"step": 28041, "train_loss": 3.2474169731140137, "lr": 4.621418616951078e-05, "tps": 120941, "wall": 15195.4} {"step": 28042, "train_loss": 3.2177138328552246, "lr": 4.620919670056145e-05, "tps": 120907, "wall": 15200.3} {"step": 28043, "train_loss": 3.153989553451538, "lr": 4.6204209200323765e-05, "tps": 120873, "wall": 15205.1} {"step": 28044, "train_loss": 3.2019588947296143, "lr": 4.6199223668854165e-05, "tps": 120839, "wall": 15209.9} {"step": 28045, "train_loss": 3.1653828620910645, "lr": 4.619424010620919e-05, "tps": 120805, "wall": 15214.8} {"step": 28046, "train_loss": 3.0515966415405273, "lr": 4.618925851244527e-05, "tps": 120771, "wall": 15219.6} {"step": 28047, "train_loss": 3.100698232650757, "lr": 4.6184278887618786e-05, "tps": 120735, "wall": 15224.6} {"step": 28048, "train_loss": 3.204845428466797, "lr": 4.617930123178625e-05, "tps": 120700, "wall": 15229.5} {"step": 28049, "train_loss": 3.1330668926239014, "lr": 4.617432554500396e-05, "tps": 120666, "wall": 15234.5} {"step": 28050, "train_loss": 3.1261565685272217, "lr": 4.616935182732832e-05, "tps": 120632, "wall": 15239.3} {"step": 28051, "train_loss": 3.21292781829834, "lr": 4.616438007881568e-05, "tps": 120598, "wall": 15244.2} {"step": 28052, "train_loss": 3.0759525299072266, "lr": 4.615941029952232e-05, "tps": 120563, "wall": 15249.1} {"step": 28053, "train_loss": 3.1820008754730225, "lr": 4.615444248950459e-05, "tps": 120529, "wall": 15254.0} {"step": 28054, "train_loss": 3.250222682952881, "lr": 4.614947664881874e-05, "tps": 120495, "wall": 15258.8} {"step": 28055, "train_loss": 3.1228792667388916, "lr": 4.614451277752099e-05, "tps": 120461, "wall": 15263.7} {"step": 28056, "train_loss": 3.1391215324401855, "lr": 4.613955087566764e-05, "tps": 120427, "wall": 15268.5} {"step": 28057, "train_loss": 3.1236045360565186, "lr": 4.613459094331487e-05, "tps": 120393, "wall": 15273.3} {"step": 28058, "train_loss": 3.1446313858032227, "lr": 4.612963298051883e-05, "tps": 120358, "wall": 15278.2} {"step": 28059, "train_loss": 3.2695484161376953, "lr": 4.6124676987335725e-05, "tps": 120324, "wall": 15283.1} {"step": 28060, "train_loss": 3.1085870265960693, "lr": 4.611972296382169e-05, "tps": 120289, "wall": 15288.1} {"step": 28061, "train_loss": 3.1465582847595215, "lr": 4.611477091003284e-05, "tps": 120253, "wall": 15293.3} {"step": 28062, "train_loss": 3.1856279373168945, "lr": 4.610982082602527e-05, "tps": 120218, "wall": 15298.3} {"step": 28063, "train_loss": 3.206632137298584, "lr": 4.610487271185507e-05, "tps": 120184, "wall": 15303.1} {"step": 28064, "train_loss": 3.0943212509155273, "lr": 4.609992656757823e-05, "tps": 120150, "wall": 15308.0} {"step": 28065, "train_loss": 3.143986225128174, "lr": 4.6094982393250884e-05, "tps": 120116, "wall": 15312.9} {"step": 28066, "train_loss": 3.120015859603882, "lr": 4.609004018892898e-05, "tps": 120083, "wall": 15317.7} {"step": 28067, "train_loss": 3.1732335090637207, "lr": 4.608509995466848e-05, "tps": 120049, "wall": 15322.5} {"step": 28068, "train_loss": 3.25705885887146, "lr": 4.6080161690525395e-05, "tps": 120016, "wall": 15327.4} {"step": 28069, "train_loss": 3.1273016929626465, "lr": 4.6075225396555636e-05, "tps": 119981, "wall": 15332.3} {"step": 28070, "train_loss": 3.1041359901428223, "lr": 4.6070291072815154e-05, "tps": 119947, "wall": 15337.2} {"step": 28071, "train_loss": 3.1580891609191895, "lr": 4.6065358719359806e-05, "tps": 119912, "wall": 15342.2} {"step": 28072, "train_loss": 3.2780466079711914, "lr": 4.606042833624551e-05, "tps": 119876, "wall": 15347.4} {"step": 28073, "train_loss": 3.1653354167938232, "lr": 4.6055499923528076e-05, "tps": 119842, "wall": 15352.2} {"step": 28074, "train_loss": 3.0899832248687744, "lr": 4.6050573481263326e-05, "tps": 119809, "wall": 15357.1} {"step": 28075, "train_loss": 3.0774168968200684, "lr": 4.604564900950711e-05, "tps": 119775, "wall": 15362.0} {"step": 28076, "train_loss": 3.228440284729004, "lr": 4.604072650831521e-05, "tps": 119741, "wall": 15366.9} {"step": 28077, "train_loss": 3.1337952613830566, "lr": 4.603580597774334e-05, "tps": 119707, "wall": 15371.8} {"step": 28078, "train_loss": 3.185119152069092, "lr": 4.603088741784729e-05, "tps": 119672, "wall": 15376.8} {"step": 28079, "train_loss": 3.206406354904175, "lr": 4.602597082868275e-05, "tps": 119638, "wall": 15381.7} {"step": 28080, "train_loss": 3.1090645790100098, "lr": 4.602105621030543e-05, "tps": 119605, "wall": 15386.6} {"step": 28081, "train_loss": 3.1144285202026367, "lr": 4.6016143562771e-05, "tps": 119571, "wall": 15391.5} {"step": 28082, "train_loss": 3.237173557281494, "lr": 4.601123288613512e-05, "tps": 119538, "wall": 15396.3} {"step": 28083, "train_loss": 3.1519217491149902, "lr": 4.600632418045336e-05, "tps": 119504, "wall": 15401.2} {"step": 28084, "train_loss": 3.10166335105896, "lr": 4.6001417445781415e-05, "tps": 119471, "wall": 15406.0} {"step": 28085, "train_loss": 3.2697601318359375, "lr": 4.599651268217481e-05, "tps": 119437, "wall": 15410.9} {"step": 28086, "train_loss": 3.071197032928467, "lr": 4.599160988968911e-05, "tps": 119404, "wall": 15415.8} {"step": 28087, "train_loss": 3.1781163215637207, "lr": 4.59867090683799e-05, "tps": 119370, "wall": 15420.6} {"step": 28088, "train_loss": 3.214524030685425, "lr": 4.5981810218302645e-05, "tps": 119336, "wall": 15425.7} {"step": 28089, "train_loss": 3.169924736022949, "lr": 4.597691333951285e-05, "tps": 119302, "wall": 15430.6} {"step": 28090, "train_loss": 3.0867555141448975, "lr": 4.597201843206601e-05, "tps": 119268, "wall": 15435.5} {"step": 28091, "train_loss": 3.2575390338897705, "lr": 4.5967125496017565e-05, "tps": 119235, "wall": 15440.4} {"step": 28092, "train_loss": 3.1166982650756836, "lr": 4.596223453142291e-05, "tps": 119200, "wall": 15445.4} {"step": 28093, "train_loss": 3.217268466949463, "lr": 4.5957345538337506e-05, "tps": 119165, "wall": 15450.5} {"step": 28094, "train_loss": 3.1136770248413086, "lr": 4.595245851681668e-05, "tps": 119132, "wall": 15455.3} {"step": 28095, "train_loss": 3.160036325454712, "lr": 4.594757346691585e-05, "tps": 119099, "wall": 15460.2} {"step": 28096, "train_loss": 3.3134689331054688, "lr": 4.594269038869032e-05, "tps": 119066, "wall": 15465.1} {"step": 28097, "train_loss": 3.224902868270874, "lr": 4.5937809282195366e-05, "tps": 119032, "wall": 15470.0} {"step": 28098, "train_loss": 3.133179187774658, "lr": 4.593293014748637e-05, "tps": 118998, "wall": 15475.0} {"step": 28099, "train_loss": 3.059112787246704, "lr": 4.592805298461856e-05, "tps": 118964, "wall": 15479.9} {"step": 28100, "train_loss": 3.169271945953369, "lr": 4.592317779364716e-05, "tps": 118930, "wall": 15484.9} {"step": 28101, "train_loss": 3.1791462898254395, "lr": 4.5918304574627424e-05, "tps": 118897, "wall": 15489.8} {"step": 28102, "train_loss": 3.0534229278564453, "lr": 4.591343332761457e-05, "tps": 118863, "wall": 15494.7} {"step": 28103, "train_loss": 3.183581829071045, "lr": 4.5908564052663736e-05, "tps": 118830, "wall": 15499.6} {"step": 28104, "train_loss": 3.082658529281616, "lr": 4.590369674983012e-05, "tps": 118797, "wall": 15504.4} {"step": 28105, "train_loss": 3.139720916748047, "lr": 4.589883141916885e-05, "tps": 118764, "wall": 15509.3} {"step": 28106, "train_loss": 3.1001219749450684, "lr": 4.589396806073502e-05, "tps": 118731, "wall": 15514.2} {"step": 28107, "train_loss": 3.124736785888672, "lr": 4.588910667458376e-05, "tps": 118697, "wall": 15519.1} {"step": 28108, "train_loss": 3.0737667083740234, "lr": 4.58842472607701e-05, "tps": 118664, "wall": 15524.0} {"step": 28109, "train_loss": 3.19643497467041, "lr": 4.587938981934911e-05, "tps": 118631, "wall": 15528.9} {"step": 28110, "train_loss": 3.2213165760040283, "lr": 4.5874534350375825e-05, "tps": 118598, "wall": 15533.8} {"step": 28111, "train_loss": 3.2037439346313477, "lr": 4.5869680853905214e-05, "tps": 118564, "wall": 15538.8} {"step": 28112, "train_loss": 3.1363956928253174, "lr": 4.5864829329992294e-05, "tps": 118528, "wall": 15544.1} {"step": 28113, "train_loss": 3.0991241931915283, "lr": 4.585997977869202e-05, "tps": 118493, "wall": 15549.2} {"step": 28114, "train_loss": 3.088273763656616, "lr": 4.585513220005927e-05, "tps": 118456, "wall": 15554.6} {"step": 28115, "train_loss": 3.165565013885498, "lr": 4.585028659414905e-05, "tps": 118421, "wall": 15559.7} {"step": 28116, "train_loss": 3.1745493412017822, "lr": 4.5845442961016194e-05, "tps": 118386, "wall": 15564.9} {"step": 28117, "train_loss": 3.142399549484253, "lr": 4.5840601300715554e-05, "tps": 118351, "wall": 15570.1} {"step": 28118, "train_loss": 3.146097183227539, "lr": 4.5835761613302045e-05, "tps": 118316, "wall": 15575.3} {"step": 28119, "train_loss": 3.0314135551452637, "lr": 4.583092389883043e-05, "tps": 118281, "wall": 15580.4} {"step": 28120, "train_loss": 3.050072431564331, "lr": 4.582608815735552e-05, "tps": 118246, "wall": 15585.6} {"step": 28121, "train_loss": 3.0715277194976807, "lr": 4.582125438893213e-05, "tps": 118211, "wall": 15590.7} {"step": 28122, "train_loss": 3.222212791442871, "lr": 4.5816422593615e-05, "tps": 118177, "wall": 15595.8} {"step": 28123, "train_loss": 3.150174379348755, "lr": 4.581159277145882e-05, "tps": 118142, "wall": 15600.9} {"step": 28001, "train_loss": 2.9647340774536133, "lr": 4.6415378619657154e-05, "tps": 382935313, "wall": 4.8} {"step": 28002, "train_loss": 2.9913859367370605, "lr": 4.6410310448827837e-05, "tps": 204521301, "wall": 9.0} {"step": 28003, "train_loss": 2.990828514099121, "lr": 4.64052442444319e-05, "tps": 138101494, "wall": 13.3} {"step": 28004, "train_loss": 3.0489695072174072, "lr": 4.640018000652675e-05, "tps": 103487365, "wall": 17.7} {"step": 28005, "train_loss": 2.9280641078948975, "lr": 4.639511773516974e-05, "tps": 82129936, "wall": 22.3} {"step": 28006, "train_loss": 2.9488472938537598, "lr": 4.639005743041826e-05, "tps": 67996884, "wall": 27.0} {"step": 28007, "train_loss": 2.946371078491211, "lr": 4.638499909232957e-05, "tps": 57530645, "wall": 31.9} {"step": 28008, "train_loss": 3.046123504638672, "lr": 4.6379942720961025e-05, "tps": 50124318, "wall": 36.6} {"step": 28009, "train_loss": 3.017887592315674, "lr": 4.637488831636988e-05, "tps": 44182996, "wall": 41.5} {"step": 28010, "train_loss": 3.04941463470459, "lr": 4.6369835878613365e-05, "tps": 39608443, "wall": 46.3} {"step": 28011, "train_loss": 2.9475555419921875, "lr": 4.6364785407748765e-05, "tps": 35975751, "wall": 51.0} {"step": 28012, "train_loss": 3.0279390811920166, "lr": 4.635973690383327e-05, "tps": 32972786, "wall": 55.7} {"step": 28013, "train_loss": 2.9172840118408203, "lr": 4.635469036692405e-05, "tps": 30410504, "wall": 60.4} {"step": 28014, "train_loss": 2.946443557739258, "lr": 4.634964579707832e-05, "tps": 28221759, "wall": 65.1} {"step": 28015, "train_loss": 3.1208858489990234, "lr": 4.6344603194353165e-05, "tps": 26308862, "wall": 69.8} {"step": 28016, "train_loss": 3.0101242065429688, "lr": 4.6339562558805764e-05, "tps": 24656050, "wall": 74.5} {"step": 28017, "train_loss": 2.9514262676239014, "lr": 4.6334523890493196e-05, "tps": 23198059, "wall": 79.2} {"step": 28018, "train_loss": 3.041865825653076, "lr": 4.6329487189472504e-05, "tps": 21852417, "wall": 84.0} {"step": 28019, "train_loss": 3.012661933898926, "lr": 4.632445245580082e-05, "tps": 20651021, "wall": 88.9} {"step": 28020, "train_loss": 3.0149662494659424, "lr": 4.631941968953512e-05, "tps": 19603408, "wall": 93.7} {"step": 28021, "train_loss": 3.080782413482666, "lr": 4.63143888907324e-05, "tps": 18666476, "wall": 98.4} {"step": 28022, "train_loss": 3.0706496238708496, "lr": 4.6309360059449724e-05, "tps": 17829345, "wall": 103.0} {"step": 28023, "train_loss": 2.969280242919922, "lr": 4.6304333195743995e-05, "tps": 17060059, "wall": 107.7} {"step": 28024, "train_loss": 2.9137985706329346, "lr": 4.629930829967215e-05, "tps": 16353284, "wall": 112.3} {"step": 28025, "train_loss": 2.9777050018310547, "lr": 4.629428537129117e-05, "tps": 15699450, "wall": 117.0} {"step": 28026, "train_loss": 2.833646297454834, "lr": 4.628926441065793e-05, "tps": 15098350, "wall": 121.7} {"step": 28027, "train_loss": 2.968886137008667, "lr": 4.628424541782927e-05, "tps": 14539844, "wall": 126.3} {"step": 28028, "train_loss": 3.0664494037628174, "lr": 4.627922839286209e-05, "tps": 14023800, "wall": 131.0} {"step": 28029, "train_loss": 2.9663848876953125, "lr": 4.627421333581323e-05, "tps": 13543030, "wall": 135.6} {"step": 28030, "train_loss": 3.0022165775299072, "lr": 4.626920024673944e-05, "tps": 13087783, "wall": 140.4} {"step": 28031, "train_loss": 2.978928804397583, "lr": 4.6264189125697575e-05, "tps": 12665846, "wall": 145.0} {"step": 28032, "train_loss": 3.0229527950286865, "lr": 4.625917997274435e-05, "tps": 12266013, "wall": 149.8} {"step": 28033, "train_loss": 2.9948372840881348, "lr": 4.625417278793657e-05, "tps": 11869702, "wall": 154.8} {"step": 28034, "train_loss": 2.881392478942871, "lr": 4.6249167571330886e-05, "tps": 11515514, "wall": 159.6} {"step": 28035, "train_loss": 3.021763563156128, "lr": 4.624416432298404e-05, "tps": 11187638, "wall": 164.2} {"step": 28036, "train_loss": 2.9799749851226807, "lr": 4.623916304295271e-05, "tps": 10871806, "wall": 169.0} {"step": 28037, "train_loss": 3.0101704597473145, "lr": 4.623416373129356e-05, "tps": 10567942, "wall": 173.9} {"step": 28038, "train_loss": 2.975006103515625, "lr": 4.622916638806315e-05, "tps": 10282026, "wall": 178.7} {"step": 28039, "train_loss": 2.9525115489959717, "lr": 4.6224171013318195e-05, "tps": 10018578, "wall": 183.4} {"step": 28040, "train_loss": 2.9541807174682617, "lr": 4.621917760711522e-05, "tps": 9758182, "wall": 188.3} {"step": 28041, "train_loss": 2.965052604675293, "lr": 4.621418616951078e-05, "tps": 9516445, "wall": 193.1} {"step": 28042, "train_loss": 3.0730886459350586, "lr": 4.620919670056145e-05, "tps": 9288373, "wall": 197.9} {"step": 28043, "train_loss": 2.873682737350464, "lr": 4.6204209200323765e-05, "tps": 9072165, "wall": 202.6} {"step": 28044, "train_loss": 3.04799747467041, "lr": 4.6199223668854165e-05, "tps": 8866794, "wall": 207.3} {"step": 28045, "train_loss": 2.891479015350342, "lr": 4.619424010620919e-05, "tps": 8668299, "wall": 212.0} {"step": 28046, "train_loss": 3.0923218727111816, "lr": 4.618925851244527e-05, "tps": 8479740, "wall": 216.8} {"step": 28047, "train_loss": 2.8404009342193604, "lr": 4.6184278887618786e-05, "tps": 8301008, "wall": 221.4} {"step": 28048, "train_loss": 3.0094192028045654, "lr": 4.617930123178625e-05, "tps": 8128400, "wall": 226.1} {"step": 28049, "train_loss": 3.069896936416626, "lr": 4.617432554500396e-05, "tps": 7963169, "wall": 230.8} {"step": 28050, "train_loss": 2.99208927154541, "lr": 4.616935182732832e-05, "tps": 7804535, "wall": 235.5} {"step": 28051, "train_loss": 2.8750948905944824, "lr": 4.616438007881568e-05, "tps": 7651067, "wall": 240.3} {"step": 28052, "train_loss": 3.0085906982421875, "lr": 4.615941029952232e-05, "tps": 7502165, "wall": 245.1} {"step": 28053, "train_loss": 3.039923667907715, "lr": 4.615444248950459e-05, "tps": 7360280, "wall": 249.8} {"step": 28054, "train_loss": 2.988448143005371, "lr": 4.614947664881874e-05, "tps": 7222165, "wall": 254.6} {"step": 28055, "train_loss": 2.955883741378784, "lr": 4.614451277752099e-05, "tps": 7087553, "wall": 259.4} {"step": 28056, "train_loss": 2.927325487136841, "lr": 4.613955087566764e-05, "tps": 6959493, "wall": 264.2} {"step": 28057, "train_loss": 3.0131921768188477, "lr": 4.613459094331487e-05, "tps": 6837803, "wall": 268.9} {"step": 28058, "train_loss": 3.0001375675201416, "lr": 4.612963298051883e-05, "tps": 6719157, "wall": 273.7} {"step": 28059, "train_loss": 2.9944980144500732, "lr": 4.6124676987335725e-05, "tps": 6605785, "wall": 278.4} {"step": 28060, "train_loss": 3.093909502029419, "lr": 4.611972296382169e-05, "tps": 6495696, "wall": 283.1} {"step": 28061, "train_loss": 3.0271377563476562, "lr": 4.611477091003284e-05, "tps": 6389346, "wall": 287.8} {"step": 28062, "train_loss": 2.981889247894287, "lr": 4.610982082602527e-05, "tps": 6286432, "wall": 292.6} {"step": 28063, "train_loss": 3.0344996452331543, "lr": 4.610487271185507e-05, "tps": 6186297, "wall": 297.3} {"step": 28064, "train_loss": 2.984103202819824, "lr": 4.609992656757823e-05, "tps": 6089581, "wall": 302.0} {"step": 28065, "train_loss": 3.0106749534606934, "lr": 4.6094982393250884e-05, "tps": 5995613, "wall": 306.8} {"step": 28066, "train_loss": 3.041428327560425, "lr": 4.609004018892898e-05, "tps": 5904046, "wall": 311.5} {"step": 28067, "train_loss": 3.074711322784424, "lr": 4.608509995466848e-05, "tps": 5812507, "wall": 316.5} {"step": 28068, "train_loss": 2.9691288471221924, "lr": 4.6080161690525395e-05, "tps": 5724909, "wall": 321.3} {"step": 28069, "train_loss": 2.8787856101989746, "lr": 4.6075225396555636e-05, "tps": 5640177, "wall": 326.2} {"step": 28070, "train_loss": 3.0910823345184326, "lr": 4.6070291072815154e-05, "tps": 5557043, "wall": 331.1} {"step": 28071, "train_loss": 3.008664131164551, "lr": 4.6065358719359806e-05, "tps": 5477994, "wall": 335.8} {"step": 28072, "train_loss": 2.9624948501586914, "lr": 4.606042833624551e-05, "tps": 5398882, "wall": 340.8} {"step": 28073, "train_loss": 2.9929773807525635, "lr": 4.6055499923528076e-05, "tps": 5316228, "wall": 346.1} {"step": 28074, "train_loss": 2.9183976650238037, "lr": 4.6050573481263326e-05, "tps": 5235419, "wall": 351.4} {"step": 28075, "train_loss": 2.99074649810791, "lr": 4.604564900950711e-05, "tps": 5164931, "wall": 356.2} {"step": 28076, "train_loss": 3.039360284805298, "lr": 4.604072650831521e-05, "tps": 5095719, "wall": 361.1} {"step": 28077, "train_loss": 3.018338680267334, "lr": 4.603580597774334e-05, "tps": 5028527, "wall": 365.9} {"step": 28078, "train_loss": 3.000732183456421, "lr": 4.603088741784729e-05, "tps": 4961851, "wall": 370.9} {"step": 28079, "train_loss": 3.1017189025878906, "lr": 4.602597082868275e-05, "tps": 4898526, "wall": 375.7} {"step": 28080, "train_loss": 2.9512033462524414, "lr": 4.602105621030543e-05, "tps": 4835829, "wall": 380.6} {"step": 28081, "train_loss": 3.028001070022583, "lr": 4.6016143562771e-05, "tps": 4776203, "wall": 385.3} {"step": 28082, "train_loss": 2.9866013526916504, "lr": 4.601123288613512e-05, "tps": 4717150, "wall": 390.2} {"step": 28083, "train_loss": 2.961005687713623, "lr": 4.600632418045336e-05, "tps": 4659205, "wall": 395.0} {"step": 28084, "train_loss": 2.957371234893799, "lr": 4.6001417445781415e-05, "tps": 4603901, "wall": 399.8} {"step": 28085, "train_loss": 3.0494818687438965, "lr": 4.599651268217481e-05, "tps": 4550114, "wall": 404.5} {"step": 28086, "train_loss": 3.0017316341400146, "lr": 4.599160988968911e-05, "tps": 4496965, "wall": 409.3} {"step": 28087, "train_loss": 2.970675230026245, "lr": 4.59867090683799e-05, "tps": 4444330, "wall": 414.2} {"step": 28088, "train_loss": 2.999269485473633, "lr": 4.5981810218302645e-05, "tps": 4392820, "wall": 419.1} {"step": 28089, "train_loss": 2.9989800453186035, "lr": 4.597691333951285e-05, "tps": 4342860, "wall": 423.9} {"step": 28090, "train_loss": 2.9680488109588623, "lr": 4.597201843206601e-05, "tps": 4294579, "wall": 428.7} {"step": 28091, "train_loss": 2.912959575653076, "lr": 4.5967125496017565e-05, "tps": 4247761, "wall": 433.4} {"step": 28092, "train_loss": 3.0435187816619873, "lr": 4.596223453142291e-05, "tps": 4201669, "wall": 438.2} {"step": 28093, "train_loss": 3.0073680877685547, "lr": 4.5957345538337506e-05, "tps": 4155476, "wall": 443.1} {"step": 28094, "train_loss": 3.0194804668426514, "lr": 4.595245851681668e-05, "tps": 4110847, "wall": 447.9} {"step": 28095, "train_loss": 2.935454845428467, "lr": 4.594757346691585e-05, "tps": 4066729, "wall": 452.8} {"step": 28096, "train_loss": 2.990828037261963, "lr": 4.594269038869032e-05, "tps": 4023948, "wall": 457.6} {"step": 28097, "train_loss": 2.9930293560028076, "lr": 4.5937809282195366e-05, "tps": 3981827, "wall": 462.5} {"step": 28098, "train_loss": 3.050929069519043, "lr": 4.593293014748637e-05, "tps": 3940821, "wall": 467.3} {"step": 28099, "train_loss": 3.0558958053588867, "lr": 4.592805298461856e-05, "tps": 3900887, "wall": 472.1} {"step": 28100, "train_loss": 2.978278160095215, "lr": 4.592317779364716e-05, "tps": 3861773, "wall": 476.9} {"step": 28101, "train_loss": 2.8597395420074463, "lr": 4.5918304574627424e-05, "tps": 3823510, "wall": 481.7} {"step": 28102, "train_loss": 2.9151999950408936, "lr": 4.591343332761457e-05, "tps": 3786078, "wall": 486.5} {"step": 28103, "train_loss": 2.9452261924743652, "lr": 4.5908564052663736e-05, "tps": 3749381, "wall": 491.2} {"step": 28104, "train_loss": 2.8992133140563965, "lr": 4.590369674983012e-05, "tps": 3713345, "wall": 496.0} {"step": 28105, "train_loss": 2.941685676574707, "lr": 4.589883141916885e-05, "tps": 3677946, "wall": 500.8} {"step": 28106, "train_loss": 3.031895399093628, "lr": 4.589396806073502e-05, "tps": 3643372, "wall": 505.6} {"step": 28107, "train_loss": 2.888430595397949, "lr": 4.588910667458376e-05, "tps": 3608921, "wall": 510.4} {"step": 28108, "train_loss": 3.0846400260925293, "lr": 4.58842472607701e-05, "tps": 3575065, "wall": 515.3} {"step": 28109, "train_loss": 2.9562125205993652, "lr": 4.587938981934911e-05, "tps": 3541805, "wall": 520.1} {"step": 28110, "train_loss": 2.937410354614258, "lr": 4.5874534350375825e-05, "tps": 3509202, "wall": 525.0} {"step": 28111, "train_loss": 2.9241394996643066, "lr": 4.5869680853905214e-05, "tps": 3477516, "wall": 529.8} {"step": 28112, "train_loss": 2.957526683807373, "lr": 4.5864829329992294e-05, "tps": 3446426, "wall": 534.6} {"step": 28113, "train_loss": 2.977785587310791, "lr": 4.585997977869202e-05, "tps": 3415781, "wall": 539.4} {"step": 28114, "train_loss": 2.9673309326171875, "lr": 4.585513220005927e-05, "tps": 3385821, "wall": 544.2} {"step": 28115, "train_loss": 2.9921305179595947, "lr": 4.585028659414905e-05, "tps": 3356450, "wall": 549.0} {"step": 28116, "train_loss": 2.995830535888672, "lr": 4.5845442961016194e-05, "tps": 3327436, "wall": 553.8} {"step": 28117, "train_loss": 2.979175329208374, "lr": 4.5840601300715554e-05, "tps": 3298879, "wall": 558.6} {"step": 28118, "train_loss": 2.93005108833313, "lr": 4.5835761613302045e-05, "tps": 3270843, "wall": 563.4} {"step": 28119, "train_loss": 3.045231819152832, "lr": 4.583092389883043e-05, "tps": 3243264, "wall": 568.2} {"step": 28120, "train_loss": 3.044631004333496, "lr": 4.582608815735552e-05, "tps": 3215502, "wall": 573.1} {"step": 28121, "train_loss": 2.964582920074463, "lr": 4.582125438893213e-05, "tps": 3188849, "wall": 578.0} {"step": 28122, "train_loss": 3.020461082458496, "lr": 4.5816422593615e-05, "tps": 3162654, "wall": 582.8} {"step": 28123, "train_loss": 2.9725091457366943, "lr": 4.581159277145882e-05, "tps": 3136788, "wall": 587.6} {"step": 28124, "train_loss": 2.956298351287842, "lr": 4.580676492251836e-05, "tps": 3111396, "wall": 592.4} {"step": 28125, "train_loss": 2.9638876914978027, "lr": 4.5801939046848294e-05, "tps": 3086354, "wall": 597.2} {"step": 28126, "train_loss": 2.908252000808716, "lr": 4.579711514450328e-05, "tps": 3061784, "wall": 602.0} {"step": 28127, "train_loss": 3.0252838134765625, "lr": 4.579229321553799e-05, "tps": 3037585, "wall": 606.9} {"step": 28128, "train_loss": 3.0057005882263184, "lr": 4.578747326000699e-05, "tps": 3013682, "wall": 611.7} {"step": 28129, "train_loss": 2.9848709106445312, "lr": 4.578265527796494e-05, "tps": 2990172, "wall": 616.5} {"step": 28130, "train_loss": 2.9991204738616943, "lr": 4.57778392694664e-05, "tps": 2966926, "wall": 621.4} {"step": 28131, "train_loss": 2.961383819580078, "lr": 4.577302523456591e-05, "tps": 2944104, "wall": 626.2} {"step": 28132, "train_loss": 3.0618090629577637, "lr": 4.576821317331804e-05, "tps": 2921373, "wall": 631.1} {"step": 28133, "train_loss": 2.8864803314208984, "lr": 4.576340308577727e-05, "tps": 2899178, "wall": 636.0} {"step": 28134, "train_loss": 2.883056640625, "lr": 4.5758594971998065e-05, "tps": 2877343, "wall": 640.8} {"step": 28135, "train_loss": 2.8643879890441895, "lr": 4.575378883203494e-05, "tps": 2855812, "wall": 645.7} {"step": 28136, "train_loss": 3.1064000129699707, "lr": 4.574898466594233e-05, "tps": 2834559, "wall": 650.5} {"step": 28137, "train_loss": 2.9910168647766113, "lr": 4.574418247377463e-05, "tps": 2812766, "wall": 655.6} {"step": 28138, "train_loss": 2.889881134033203, "lr": 4.573938225558628e-05, "tps": 2791660, "wall": 660.6} {"step": 28139, "train_loss": 3.108880043029785, "lr": 4.5734584011431635e-05, "tps": 2770734, "wall": 665.6} {"step": 28140, "train_loss": 2.9031906127929688, "lr": 4.5729787741365026e-05, "tps": 2750175, "wall": 670.6} {"step": 28141, "train_loss": 3.003166913986206, "lr": 4.5724993445440825e-05, "tps": 2729646, "wall": 675.7} {"step": 28142, "train_loss": 2.952270984649658, "lr": 4.572020112371333e-05, "tps": 2709539, "wall": 680.7} {"step": 28143, "train_loss": 3.0134758949279785, "lr": 4.571541077623682e-05, "tps": 2688677, "wall": 686.0} {"step": 28144, "train_loss": 3.091421127319336, "lr": 4.571062240306557e-05, "tps": 2667737, "wall": 691.4} {"step": 28145, "train_loss": 2.998870372772217, "lr": 4.570583600425381e-05, "tps": 2648229, "wall": 696.5} {"step": 28146, "train_loss": 2.9098832607269287, "lr": 4.570105157985577e-05, "tps": 2629885, "wall": 701.4} {"step": 28147, "train_loss": 2.977994918823242, "lr": 4.569626912992566e-05, "tps": 2611778, "wall": 706.3} {"step": 28148, "train_loss": 3.0161242485046387, "lr": 4.569148865451763e-05, "tps": 2593992, "wall": 711.2} {"step": 28149, "train_loss": 3.003384590148926, "lr": 4.568671015368584e-05, "tps": 2575762, "wall": 716.2} {"step": 28150, "train_loss": 2.857990264892578, "lr": 4.568193362748445e-05, "tps": 2558285, "wall": 721.1} {"step": 28151, "train_loss": 2.9537699222564697, "lr": 4.5677159075967524e-05, "tps": 2541020, "wall": 726.1} {"step": 28152, "train_loss": 2.988422155380249, "lr": 4.5672386499189186e-05, "tps": 2523979, "wall": 731.0} {"step": 28153, "train_loss": 3.0489795207977295, "lr": 4.566761589720347e-05, "tps": 2507299, "wall": 735.9} {"step": 28154, "train_loss": 2.9689114093780518, "lr": 4.5662847270064435e-05, "tps": 2490607, "wall": 740.8} {"step": 28155, "train_loss": 2.907383680343628, "lr": 4.565808061782612e-05, "tps": 2474031, "wall": 745.8} {"step": 28156, "train_loss": 2.968083620071411, "lr": 4.565331594054247e-05, "tps": 2457078, "wall": 751.0} {"step": 28157, "train_loss": 2.954866886138916, "lr": 4.564855323826751e-05, "tps": 2441032, "wall": 756.0} {"step": 28158, "train_loss": 3.013956069946289, "lr": 4.5643792511055163e-05, "tps": 2425432, "wall": 760.9} {"step": 28159, "train_loss": 2.9151713848114014, "lr": 4.563903375895938e-05, "tps": 2409614, "wall": 765.9} {"step": 28160, "train_loss": 2.999917507171631, "lr": 4.563427698203403e-05, "tps": 2394388, "wall": 770.8} {"step": 28161, "train_loss": 3.1171512603759766, "lr": 4.5629522180333044e-05, "tps": 2379370, "wall": 775.7} {"step": 28162, "train_loss": 2.883025884628296, "lr": 4.562476935391026e-05, "tps": 2364651, "wall": 780.5} {"step": 28163, "train_loss": 3.0094692707061768, "lr": 4.562001850281951e-05, "tps": 2350090, "wall": 785.4} {"step": 28164, "train_loss": 2.9329819679260254, "lr": 4.561526962711463e-05, "tps": 2335556, "wall": 790.3} {"step": 28165, "train_loss": 2.9750494956970215, "lr": 4.5610522726849414e-05, "tps": 2320900, "wall": 795.3} {"step": 28166, "train_loss": 3.0769386291503906, "lr": 4.560577780207762e-05, "tps": 2306427, "wall": 800.4} {"step": 28167, "train_loss": 2.85817813873291, "lr": 4.560103485285303e-05, "tps": 2292608, "wall": 805.2} {"step": 28168, "train_loss": 2.862771987915039, "lr": 4.5596293879229323e-05, "tps": 2278605, "wall": 810.2} {"step": 28169, "train_loss": 2.907989025115967, "lr": 4.559155488126026e-05, "tps": 2265143, "wall": 815.0} {"step": 28170, "train_loss": 2.9890835285186768, "lr": 4.558681785899949e-05, "tps": 2251755, "wall": 819.9} {"step": 28171, "train_loss": 3.0023083686828613, "lr": 4.5582082812500684e-05, "tps": 2238546, "wall": 824.8} {"step": 28172, "train_loss": 3.054100275039673, "lr": 4.557734974181748e-05, "tps": 2225458, "wall": 829.6} {"step": 28173, "train_loss": 2.883533000946045, "lr": 4.55726186470035e-05, "tps": 2212551, "wall": 834.5} {"step": 28174, "train_loss": 2.99497127532959, "lr": 4.5567889528112315e-05, "tps": 2199689, "wall": 839.4} {"step": 28175, "train_loss": 3.105220079421997, "lr": 4.556316238519753e-05, "tps": 2187037, "wall": 844.3} {"step": 28176, "train_loss": 2.9587888717651367, "lr": 4.5558437218312675e-05, "tps": 2174360, "wall": 849.3} {"step": 28177, "train_loss": 2.9920403957366943, "lr": 4.5553714027511266e-05, "tps": 2161798, "wall": 854.2} {"step": 28178, "train_loss": 2.986302375793457, "lr": 4.554899281284685e-05, "tps": 2148916, "wall": 859.4} {"step": 28179, "train_loss": 2.9559309482574463, "lr": 4.554427357437287e-05, "tps": 2135634, "wall": 864.8} {"step": 28180, "train_loss": 2.9088125228881836, "lr": 4.5539556312142774e-05, "tps": 2122811, "wall": 870.0} {"step": 28181, "train_loss": 3.073908805847168, "lr": 4.553484102621006e-05, "tps": 2110535, "wall": 875.1} {"step": 28182, "train_loss": 2.883671760559082, "lr": 4.553012771662807e-05, "tps": 2098552, "wall": 880.1} {"step": 28183, "train_loss": 3.0465240478515625, "lr": 4.552541638345025e-05, "tps": 2086630, "wall": 885.2} {"step": 28184, "train_loss": 2.977893114089966, "lr": 4.552070702672996e-05, "tps": 2075228, "wall": 890.1} {"step": 28185, "train_loss": 3.0192501544952393, "lr": 4.551599964652052e-05, "tps": 2063982, "wall": 895.0} {"step": 28186, "train_loss": 3.0354809761047363, "lr": 4.551129424287528e-05, "tps": 2052977, "wall": 899.8} {"step": 28187, "train_loss": 3.03645658493042, "lr": 4.550659081584755e-05, "tps": 2042068, "wall": 904.6} {"step": 28188, "train_loss": 3.0439846515655518, "lr": 4.5501889365490585e-05, "tps": 2031255, "wall": 909.5} {"step": 28189, "train_loss": 2.9779012203216553, "lr": 4.5497189891857685e-05, "tps": 2020048, "wall": 914.6} {"step": 28190, "train_loss": 2.8464345932006836, "lr": 4.549249239500202e-05, "tps": 2009155, "wall": 919.6} {"step": 28191, "train_loss": 3.0812883377075195, "lr": 4.548779687497686e-05, "tps": 1998289, "wall": 924.6} {"step": 28192, "train_loss": 2.8938381671905518, "lr": 4.548310333183538e-05, "tps": 1987361, "wall": 929.7} {"step": 28193, "train_loss": 2.8507633209228516, "lr": 4.5478411765630755e-05, "tps": 1976953, "wall": 934.6} {"step": 28194, "train_loss": 2.9602584838867188, "lr": 4.54737221764161e-05, "tps": 1966489, "wall": 939.6} {"step": 28195, "train_loss": 2.9668383598327637, "lr": 4.546903456424459e-05, "tps": 1956279, "wall": 944.6} {"step": 28196, "train_loss": 3.0199708938598633, "lr": 4.546434892916929e-05, "tps": 1945955, "wall": 949.6} {"step": 28197, "train_loss": 2.885936975479126, "lr": 4.5459665271243266e-05, "tps": 1935984, "wall": 954.5} {"step": 28198, "train_loss": 2.946361780166626, "lr": 4.5454983590519615e-05, "tps": 1926243, "wall": 959.4} {"step": 28199, "train_loss": 3.020717144012451, "lr": 4.545030388705136e-05, "tps": 1916518, "wall": 964.3} {"step": 28200, "train_loss": 3.029210090637207, "lr": 4.544562616089148e-05, "tps": 1906795, "wall": 969.3} {"step": 28201, "train_loss": 3.0552892684936523, "lr": 4.5440950412093e-05, "tps": 1897217, "wall": 974.2} {"step": 28202, "train_loss": 2.9662013053894043, "lr": 4.5436276640708886e-05, "tps": 1887813, "wall": 979.1} {"step": 28203, "train_loss": 2.9826741218566895, "lr": 4.543160484679206e-05, "tps": 1878542, "wall": 983.9} {"step": 28204, "train_loss": 2.9054102897644043, "lr": 4.542693503039549e-05, "tps": 1869357, "wall": 988.8} {"step": 28205, "train_loss": 2.92069149017334, "lr": 4.5422267191572e-05, "tps": 1860210, "wall": 993.7} {"step": 28206, "train_loss": 2.986241340637207, "lr": 4.5417601330374535e-05, "tps": 1851266, "wall": 998.5} {"step": 28207, "train_loss": 2.927163600921631, "lr": 4.541293744685593e-05, "tps": 1842397, "wall": 1003.4} {"step": 28208, "train_loss": 2.861621379852295, "lr": 4.5408275541069e-05, "tps": 1833636, "wall": 1008.2} {"step": 28209, "train_loss": 2.9692325592041016, "lr": 4.540361561306659e-05, "tps": 1824933, "wall": 1013.1} {"step": 28210, "train_loss": 2.901357412338257, "lr": 4.5398957662901475e-05, "tps": 1816326, "wall": 1017.9} {"step": 28211, "train_loss": 2.9186229705810547, "lr": 4.539430169062637e-05, "tps": 1807796, "wall": 1022.7} {"step": 28212, "train_loss": 2.895019054412842, "lr": 4.5389647696294095e-05, "tps": 1799330, "wall": 1027.6} {"step": 28213, "train_loss": 2.99068021774292, "lr": 4.538499567995735e-05, "tps": 1790943, "wall": 1032.4} {"step": 28214, "train_loss": 2.96142578125, "lr": 4.5380345641668786e-05, "tps": 1782670, "wall": 1037.3} {"step": 28215, "train_loss": 3.026047706604004, "lr": 4.5375697581481124e-05, "tps": 1774324, "wall": 1042.2} {"step": 28216, "train_loss": 2.999701499938965, "lr": 4.5371051499447024e-05, "tps": 1766146, "wall": 1047.0} {"step": 28217, "train_loss": 2.960498809814453, "lr": 4.536640739561906e-05, "tps": 1757917, "wall": 1052.0} {"step": 28218, "train_loss": 2.947955846786499, "lr": 4.536176527004992e-05, "tps": 1749897, "wall": 1056.8} {"step": 28219, "train_loss": 2.925386905670166, "lr": 4.535712512279213e-05, "tps": 1741957, "wall": 1061.7} {"step": 28220, "train_loss": 3.015596866607666, "lr": 4.5352486953898275e-05, "tps": 1734079, "wall": 1066.6} {"step": 28221, "train_loss": 2.99869704246521, "lr": 4.534785076342091e-05, "tps": 1726252, "wall": 1071.4} {"step": 28222, "train_loss": 3.0407555103302, "lr": 4.534321655141254e-05, "tps": 1718400, "wall": 1076.4} {"step": 28223, "train_loss": 2.951537847518921, "lr": 4.533858431792565e-05, "tps": 1710616, "wall": 1081.3} {"step": 28224, "train_loss": 2.9915857315063477, "lr": 4.5333954063012743e-05, "tps": 1702885, "wall": 1086.2} {"step": 28225, "train_loss": 3.0667195320129395, "lr": 4.5329325786726216e-05, "tps": 1695292, "wall": 1091.2} {"step": 28226, "train_loss": 2.9658799171447754, "lr": 4.532469948911858e-05, "tps": 1687811, "wall": 1096.0} {"step": 28227, "train_loss": 2.8509607315063477, "lr": 4.5320075170242196e-05, "tps": 1680403, "wall": 1100.9} {"step": 28228, "train_loss": 2.990227699279785, "lr": 4.5315452830149404e-05, "tps": 1672957, "wall": 1105.8} {"step": 28229, "train_loss": 3.0392308235168457, "lr": 4.531083246889266e-05, "tps": 1665532, "wall": 1110.8} {"step": 28230, "train_loss": 2.893756866455078, "lr": 4.530621408652424e-05, "tps": 1658295, "wall": 1115.7} {"step": 28231, "train_loss": 2.954956293106079, "lr": 4.5301597683096475e-05, "tps": 1651132, "wall": 1120.6} {"step": 28232, "train_loss": 2.9146275520324707, "lr": 4.529698325866166e-05, "tps": 1644060, "wall": 1125.4} {"step": 28233, "train_loss": 2.9641079902648926, "lr": 4.529237081327209e-05, "tps": 1637022, "wall": 1130.3} {"step": 28234, "train_loss": 3.0530059337615967, "lr": 4.5287760346979967e-05, "tps": 1630017, "wall": 1135.2} {"step": 28235, "train_loss": 2.9419748783111572, "lr": 4.5283151859837544e-05, "tps": 1623118, "wall": 1140.1} {"step": 28236, "train_loss": 2.939213275909424, "lr": 4.527854535189705e-05, "tps": 1616285, "wall": 1144.9} {"step": 28237, "train_loss": 3.019314765930176, "lr": 4.527394082321064e-05, "tps": 1609502, "wall": 1149.8} {"step": 28238, "train_loss": 3.032491445541382, "lr": 4.526933827383047e-05, "tps": 1602775, "wall": 1154.7} {"step": 28239, "train_loss": 2.929872989654541, "lr": 4.52647377038087e-05, "tps": 1596133, "wall": 1159.5} {"step": 28240, "train_loss": 3.010662078857422, "lr": 4.526013911319745e-05, "tps": 1589486, "wall": 1164.4} {"step": 28241, "train_loss": 2.9388256072998047, "lr": 4.5255542502048804e-05, "tps": 1582899, "wall": 1169.3} {"step": 28242, "train_loss": 2.9437055587768555, "lr": 4.525094787041478e-05, "tps": 1576334, "wall": 1174.2} {"step": 28243, "train_loss": 2.975526809692383, "lr": 4.5246355218347514e-05, "tps": 1569853, "wall": 1179.1} {"step": 28244, "train_loss": 2.9627115726470947, "lr": 4.524176454589896e-05, "tps": 1563476, "wall": 1183.9} {"step": 28245, "train_loss": 3.0021002292633057, "lr": 4.523717585312117e-05, "tps": 1557074, "wall": 1188.9} {"step": 28246, "train_loss": 2.983780860900879, "lr": 4.52325891400661e-05, "tps": 1550715, "wall": 1193.8} {"step": 28247, "train_loss": 3.013648271560669, "lr": 4.5228004406785695e-05, "tps": 1544448, "wall": 1198.7} {"step": 28248, "train_loss": 2.923466444015503, "lr": 4.522342165333194e-05, "tps": 1538239, "wall": 1203.5} {"step": 28249, "train_loss": 3.034012794494629, "lr": 4.521884087975672e-05, "tps": 1532030, "wall": 1208.5} {"step": 28250, "train_loss": 3.002789258956909, "lr": 4.5214262086111905e-05, "tps": 1525908, "wall": 1213.3} {"step": 28251, "train_loss": 2.9149818420410156, "lr": 4.52096852724494e-05, "tps": 1519799, "wall": 1218.3} {"step": 28252, "train_loss": 2.9021716117858887, "lr": 4.5205110438821044e-05, "tps": 1513789, "wall": 1223.1} {"step": 28253, "train_loss": 2.9774556159973145, "lr": 4.520053758527863e-05, "tps": 1507818, "wall": 1228.0} {"step": 28254, "train_loss": 3.0184853076934814, "lr": 4.519596671187399e-05, "tps": 1501778, "wall": 1233.0} {"step": 28255, "train_loss": 3.0144104957580566, "lr": 4.5191397818658916e-05, "tps": 1495820, "wall": 1238.0} {"step": 28256, "train_loss": 3.0431039333343506, "lr": 4.51868309056851e-05, "tps": 1489732, "wall": 1243.1} {"step": 28257, "train_loss": 2.9278430938720703, "lr": 4.5182265973004365e-05, "tps": 1483738, "wall": 1248.1} {"step": 28258, "train_loss": 2.9695162773132324, "lr": 4.5177703020668364e-05, "tps": 1477990, "wall": 1253.0} {"step": 28259, "train_loss": 3.0123510360717773, "lr": 4.51731420487288e-05, "tps": 1472289, "wall": 1257.9} {"step": 28260, "train_loss": 2.8389110565185547, "lr": 4.5168583057237343e-05, "tps": 1466607, "wall": 1262.9} {"step": 28261, "train_loss": 2.9403953552246094, "lr": 4.516402604624562e-05, "tps": 1460920, "wall": 1267.8} {"step": 28262, "train_loss": 2.991696357727051, "lr": 4.515947101580529e-05, "tps": 1455263, "wall": 1272.8} {"step": 28263, "train_loss": 3.078782558441162, "lr": 4.515491796596794e-05, "tps": 1449649, "wall": 1277.8} {"step": 28264, "train_loss": 3.009716272354126, "lr": 4.51503668967851e-05, "tps": 1444113, "wall": 1282.7} {"step": 28265, "train_loss": 2.8419675827026367, "lr": 4.514581780830839e-05, "tps": 1438657, "wall": 1287.6} {"step": 28266, "train_loss": 2.8744752407073975, "lr": 4.514127070058932e-05, "tps": 1433132, "wall": 1292.6} {"step": 28267, "train_loss": 2.954357624053955, "lr": 4.5136725573679355e-05, "tps": 1427752, "wall": 1297.5} {"step": 28268, "train_loss": 3.0077202320098877, "lr": 4.513218242763008e-05, "tps": 1422373, "wall": 1302.5} {"step": 28269, "train_loss": 2.9289231300354004, "lr": 4.5127641262492864e-05, "tps": 1417115, "wall": 1307.4} {"step": 28270, "train_loss": 2.985823154449463, "lr": 4.512310207831919e-05, "tps": 1411849, "wall": 1312.3} {"step": 28271, "train_loss": 2.9745805263519287, "lr": 4.5118564875160486e-05, "tps": 1406620, "wall": 1317.2} {"step": 28272, "train_loss": 3.0038437843322754, "lr": 4.511402965306816e-05, "tps": 1401412, "wall": 1322.2} {"step": 28273, "train_loss": 2.9356954097747803, "lr": 4.510949641209351e-05, "tps": 1396296, "wall": 1327.1} {"step": 28274, "train_loss": 3.090249538421631, "lr": 4.5104965152288e-05, "tps": 1391219, "wall": 1331.9} {"step": 28275, "train_loss": 2.9504897594451904, "lr": 4.510043587370289e-05, "tps": 1386197, "wall": 1336.8} {"step": 28276, "train_loss": 2.9713425636291504, "lr": 4.509590857638949e-05, "tps": 1381158, "wall": 1341.7} {"step": 28277, "train_loss": 2.977505683898926, "lr": 4.5091383260399124e-05, "tps": 1376171, "wall": 1346.7} {"step": 28278, "train_loss": 2.997173309326172, "lr": 4.508685992578301e-05, "tps": 1371170, "wall": 1351.6} {"step": 28279, "train_loss": 3.016202449798584, "lr": 4.508233857259243e-05, "tps": 1366195, "wall": 1356.6} {"step": 28280, "train_loss": 3.053757667541504, "lr": 4.507781920087856e-05, "tps": 1361308, "wall": 1361.5} {"step": 28281, "train_loss": 2.9335713386535645, "lr": 4.507330181069262e-05, "tps": 1356469, "wall": 1366.4} {"step": 28282, "train_loss": 2.976332664489746, "lr": 4.506878640208581e-05, "tps": 1351658, "wall": 1371.3} {"step": 28283, "train_loss": 2.9182357788085938, "lr": 4.5064272975109226e-05, "tps": 1346904, "wall": 1376.2} {"step": 28284, "train_loss": 3.0159125328063965, "lr": 4.505976152981402e-05, "tps": 1342215, "wall": 1381.1} {"step": 28285, "train_loss": 2.974348783493042, "lr": 4.5055252066251296e-05, "tps": 1337525, "wall": 1386.0} {"step": 28286, "train_loss": 3.040196180343628, "lr": 4.5050744584472174e-05, "tps": 1332854, "wall": 1390.9} {"step": 28287, "train_loss": 2.9736950397491455, "lr": 4.504623908452764e-05, "tps": 1328214, "wall": 1395.8} {"step": 28288, "train_loss": 2.982377529144287, "lr": 4.504173556646879e-05, "tps": 1323626, "wall": 1400.7} {"step": 28289, "train_loss": 2.89981746673584, "lr": 4.503723403034663e-05, "tps": 1318991, "wall": 1405.6} {"step": 28290, "train_loss": 3.010770320892334, "lr": 4.503273447621215e-05, "tps": 1314300, "wall": 1410.7} {"step": 28291, "train_loss": 3.0752956867218018, "lr": 4.5028236904116316e-05, "tps": 1309710, "wall": 1415.7} {"step": 28292, "train_loss": 2.93583083152771, "lr": 4.502374131411007e-05, "tps": 1305190, "wall": 1420.6} {"step": 28293, "train_loss": 2.997637987136841, "lr": 4.501924770624435e-05, "tps": 1300724, "wall": 1425.6} {"step": 28294, "train_loss": 2.9607744216918945, "lr": 4.5014756080570066e-05, "tps": 1296288, "wall": 1430.5} {"step": 28295, "train_loss": 2.973130702972412, "lr": 4.5010266437138104e-05, "tps": 1291908, "wall": 1435.4} {"step": 28296, "train_loss": 2.972113609313965, "lr": 4.500577877599928e-05, "tps": 1287551, "wall": 1440.3} {"step": 28297, "train_loss": 3.0101327896118164, "lr": 4.500129309720448e-05, "tps": 1283241, "wall": 1445.2} {"step": 28298, "train_loss": 3.0587356090545654, "lr": 4.49968094008045e-05, "tps": 1278947, "wall": 1450.1} {"step": 28299, "train_loss": 3.0379109382629395, "lr": 4.4992327686850127e-05, "tps": 1274688, "wall": 1455.0} {"step": 28300, "train_loss": 2.888979434967041, "lr": 4.498784795539214e-05, "tps": 1270416, "wall": 1459.9} {"step": 28301, "train_loss": 3.0525295734405518, "lr": 4.498337020648127e-05, "tps": 1266187, "wall": 1464.9} {"step": 28302, "train_loss": 2.9639227390289307, "lr": 4.497889444016825e-05, "tps": 1261948, "wall": 1469.8} {"step": 28303, "train_loss": 2.975773572921753, "lr": 4.4974420656503805e-05, "tps": 1257838, "wall": 1474.7} {"step": 28304, "train_loss": 2.9140255451202393, "lr": 4.496994885553856e-05, "tps": 1253727, "wall": 1479.6} {"step": 28305, "train_loss": 2.924192428588867, "lr": 4.496547903732323e-05, "tps": 1249643, "wall": 1484.5} {"step": 28306, "train_loss": 2.9482548236846924, "lr": 4.496101120190841e-05, "tps": 1245593, "wall": 1489.4} {"step": 28307, "train_loss": 2.940474033355713, "lr": 4.4956545349344704e-05, "tps": 1241563, "wall": 1494.2} {"step": 28308, "train_loss": 2.9610471725463867, "lr": 4.495208147968275e-05, "tps": 1237524, "wall": 1499.2} {"step": 28309, "train_loss": 2.9155406951904297, "lr": 4.494761959297309e-05, "tps": 1233544, "wall": 1504.1} {"step": 28310, "train_loss": 2.8852856159210205, "lr": 4.4943159689266245e-05, "tps": 1229603, "wall": 1508.9} {"step": 28311, "train_loss": 2.971766471862793, "lr": 4.493870176861276e-05, "tps": 1225669, "wall": 1513.8} {"step": 28312, "train_loss": 3.01324462890625, "lr": 4.4934245831063134e-05, "tps": 1221726, "wall": 1518.8} {"step": 28313, "train_loss": 3.047027587890625, "lr": 4.492979187666784e-05, "tps": 1217804, "wall": 1523.7} {"step": 28314, "train_loss": 3.06050181388855, "lr": 4.492533990547736e-05, "tps": 1213940, "wall": 1528.6} {"step": 28315, "train_loss": 2.99812650680542, "lr": 4.492088991754206e-05, "tps": 1210062, "wall": 1533.6} {"step": 28316, "train_loss": 2.9092400074005127, "lr": 4.491644191291242e-05, "tps": 1206243, "wall": 1538.5} {"step": 28317, "train_loss": 2.943445920944214, "lr": 4.49119958916388e-05, "tps": 1202465, "wall": 1543.4} {"step": 28318, "train_loss": 2.9246928691864014, "lr": 4.490755185377154e-05, "tps": 1198699, "wall": 1548.3} {"step": 28319, "train_loss": 2.9639101028442383, "lr": 4.490310979936103e-05, "tps": 1194872, "wall": 1553.3} {"step": 28320, "train_loss": 2.8996686935424805, "lr": 4.489866972845757e-05, "tps": 1191112, "wall": 1558.2} {"step": 28321, "train_loss": 3.0253725051879883, "lr": 4.4894231641111404e-05, "tps": 1187340, "wall": 1563.2} {"step": 28322, "train_loss": 2.9776573181152344, "lr": 4.48897955373729e-05, "tps": 1183583, "wall": 1568.3} {"step": 28323, "train_loss": 2.928922176361084, "lr": 4.488536141729227e-05, "tps": 1179854, "wall": 1573.3} {"step": 28324, "train_loss": 2.8834404945373535, "lr": 4.4880929280919695e-05, "tps": 1176156, "wall": 1578.3} {"step": 28325, "train_loss": 2.944077253341675, "lr": 4.487649912830546e-05, "tps": 1172310, "wall": 1583.5} {"step": 28326, "train_loss": 3.0117359161376953, "lr": 4.4872070959499724e-05, "tps": 1168677, "wall": 1588.5} {"step": 28327, "train_loss": 3.0915491580963135, "lr": 4.48676447745526e-05, "tps": 1165015, "wall": 1593.5} {"step": 28328, "train_loss": 2.9523444175720215, "lr": 4.486322057351432e-05, "tps": 1161420, "wall": 1598.5} {"step": 28329, "train_loss": 2.907904863357544, "lr": 4.485879835643494e-05, "tps": 1157872, "wall": 1603.5} {"step": 28330, "train_loss": 2.915348529815674, "lr": 4.485437812336455e-05, "tps": 1154351, "wall": 1608.4} {"step": 28331, "train_loss": 3.05271577835083, "lr": 4.4849959874353236e-05, "tps": 1150881, "wall": 1613.3} {"step": 28332, "train_loss": 2.9134609699249268, "lr": 4.484554360945106e-05, "tps": 1147406, "wall": 1618.3} {"step": 28333, "train_loss": 2.9501874446868896, "lr": 4.484112932870805e-05, "tps": 1143981, "wall": 1623.2} {"step": 28334, "train_loss": 2.9018890857696533, "lr": 4.483671703217421e-05, "tps": 1140520, "wall": 1628.2} {"step": 28335, "train_loss": 3.052402973175049, "lr": 4.4832306719899486e-05, "tps": 1137037, "wall": 1633.2} {"step": 28336, "train_loss": 2.9733688831329346, "lr": 4.48278983919339e-05, "tps": 1133576, "wall": 1638.3} {"step": 28337, "train_loss": 2.9971814155578613, "lr": 4.482349204832735e-05, "tps": 1130164, "wall": 1643.3} {"step": 28338, "train_loss": 3.000227212905884, "lr": 4.481908768912973e-05, "tps": 1126795, "wall": 1648.2} {"step": 28339, "train_loss": 2.9148948192596436, "lr": 4.4814685314391005e-05, "tps": 1123403, "wall": 1653.3} {"step": 28340, "train_loss": 2.9266490936279297, "lr": 4.4810284924160986e-05, "tps": 1120109, "wall": 1658.2} {"step": 28341, "train_loss": 2.943782329559326, "lr": 4.4805886518489507e-05, "tps": 1116843, "wall": 1663.1} {"step": 28342, "train_loss": 3.2061684131622314, "lr": 4.480149009742646e-05, "tps": 1113574, "wall": 1668.0} {"step": 28343, "train_loss": 2.9613196849823, "lr": 4.4797095661021623e-05, "tps": 1110352, "wall": 1672.9} {"step": 28344, "train_loss": 2.9734349250793457, "lr": 4.4792703209324715e-05, "tps": 1107164, "wall": 1677.8} {"step": 28345, "train_loss": 2.9435372352600098, "lr": 4.478831274238558e-05, "tps": 1103991, "wall": 1682.7} {"step": 28346, "train_loss": 2.9632833003997803, "lr": 4.478392426025392e-05, "tps": 1100829, "wall": 1687.6} {"step": 28347, "train_loss": 3.018110752105713, "lr": 4.477953776297941e-05, "tps": 1097693, "wall": 1692.5} {"step": 28348, "train_loss": 2.9143319129943848, "lr": 4.477515325061181e-05, "tps": 1094576, "wall": 1697.4} {"step": 28349, "train_loss": 2.977053165435791, "lr": 4.477077072320074e-05, "tps": 1091472, "wall": 1702.2} {"step": 28350, "train_loss": 2.9082024097442627, "lr": 4.476639018079585e-05, "tps": 1088392, "wall": 1707.1} {"step": 28351, "train_loss": 3.065804958343506, "lr": 4.476201162344679e-05, "tps": 1085278, "wall": 1712.1} {"step": 28352, "train_loss": 2.9429421424865723, "lr": 4.475763505120312e-05, "tps": 1082231, "wall": 1717.0} {"step": 28353, "train_loss": 3.0340657234191895, "lr": 4.4753260464114466e-05, "tps": 1079192, "wall": 1721.8} {"step": 28354, "train_loss": 2.9772047996520996, "lr": 4.474888786223035e-05, "tps": 1076174, "wall": 1726.7} {"step": 28355, "train_loss": 3.0318784713745117, "lr": 4.47445172456003e-05, "tps": 1073160, "wall": 1731.6} {"step": 28356, "train_loss": 2.9063069820404053, "lr": 4.474014861427387e-05, "tps": 1070156, "wall": 1736.6} {"step": 28357, "train_loss": 2.955871343612671, "lr": 4.47357819683005e-05, "tps": 1067152, "wall": 1741.5} {"step": 28358, "train_loss": 2.9886279106140137, "lr": 4.4731417307729655e-05, "tps": 1064201, "wall": 1746.4} {"step": 28359, "train_loss": 2.9516243934631348, "lr": 4.472705463261081e-05, "tps": 1061266, "wall": 1751.3} {"step": 28360, "train_loss": 2.949749231338501, "lr": 4.47226939429934e-05, "tps": 1058353, "wall": 1756.2} {"step": 28361, "train_loss": 2.935171127319336, "lr": 4.4718335238926755e-05, "tps": 1055423, "wall": 1761.1} {"step": 28362, "train_loss": 3.0317094326019287, "lr": 4.47139785204603e-05, "tps": 1052482, "wall": 1766.1} {"step": 28363, "train_loss": 2.892622709274292, "lr": 4.4709623787643394e-05, "tps": 1049533, "wall": 1771.1} {"step": 28364, "train_loss": 2.9203569889068604, "lr": 4.470527104052534e-05, "tps": 1046624, "wall": 1776.1} {"step": 28365, "train_loss": 3.002228260040283, "lr": 4.4700920279155475e-05, "tps": 1043744, "wall": 1781.1} {"step": 28366, "train_loss": 2.9263956546783447, "lr": 4.469657150358307e-05, "tps": 1040841, "wall": 1786.1} {"step": 28367, "train_loss": 3.0845584869384766, "lr": 4.469222471385735e-05, "tps": 1037991, "wall": 1791.1} {"step": 28368, "train_loss": 2.7985243797302246, "lr": 4.468787991002763e-05, "tps": 1035190, "wall": 1796.0} {"step": 28369, "train_loss": 2.8886685371398926, "lr": 4.468353709214307e-05, "tps": 1032395, "wall": 1800.9} {"step": 28370, "train_loss": 2.832643985748291, "lr": 4.467919626025289e-05, "tps": 1029587, "wall": 1805.9} {"step": 28371, "train_loss": 2.9426307678222656, "lr": 4.4674857414406265e-05, "tps": 1026791, "wall": 1810.9} {"step": 28372, "train_loss": 2.84873628616333, "lr": 4.4670520554652326e-05, "tps": 1024008, "wall": 1815.9} {"step": 28373, "train_loss": 2.9941272735595703, "lr": 4.466618568104024e-05, "tps": 1021221, "wall": 1820.9} {"step": 28374, "train_loss": 2.865593433380127, "lr": 4.4661852793619086e-05, "tps": 1018400, "wall": 1826.0} {"step": 28375, "train_loss": 2.88150954246521, "lr": 4.4657521892437926e-05, "tps": 1015621, "wall": 1831.0} {"step": 28376, "train_loss": 3.027641534805298, "lr": 4.465319297754586e-05, "tps": 1012895, "wall": 1836.0} {"step": 28377, "train_loss": 2.9965100288391113, "lr": 4.4648866048991924e-05, "tps": 1010177, "wall": 1841.0} {"step": 28378, "train_loss": 3.0523297786712646, "lr": 4.464454110682508e-05, "tps": 1007452, "wall": 1846.1} {"step": 28379, "train_loss": 2.982651472091675, "lr": 4.464021815109439e-05, "tps": 1004739, "wall": 1851.1} {"step": 28380, "train_loss": 3.0697903633117676, "lr": 4.463589718184879e-05, "tps": 1002059, "wall": 1856.2} {"step": 28381, "train_loss": 2.874424934387207, "lr": 4.463157819913724e-05, "tps": 999388, "wall": 1861.2} {"step": 28382, "train_loss": 2.9638419151306152, "lr": 4.462726120300864e-05, "tps": 996758, "wall": 1866.2} {"step": 28383, "train_loss": 3.004816770553589, "lr": 4.462294619351193e-05, "tps": 994156, "wall": 1871.1} {"step": 28384, "train_loss": 3.000387668609619, "lr": 4.4618633170695953e-05, "tps": 991532, "wall": 1876.1} {"step": 28385, "train_loss": 2.9036924839019775, "lr": 4.461432213460962e-05, "tps": 988827, "wall": 1881.3} {"step": 28386, "train_loss": 2.9708597660064697, "lr": 4.461001308530171e-05, "tps": 986176, "wall": 1886.4} {"step": 28387, "train_loss": 2.9526286125183105, "lr": 4.460570602282106e-05, "tps": 983342, "wall": 1892.0} {"step": 28388, "train_loss": 2.9628543853759766, "lr": 4.460140094721648e-05, "tps": 980756, "wall": 1897.0} {"step": 28389, "train_loss": 2.899460554122925, "lr": 4.45970978585367e-05, "tps": 978181, "wall": 1902.1} {"step": 28390, "train_loss": 3.03256893157959, "lr": 4.4592796756830484e-05, "tps": 975669, "wall": 1907.0} {"step": 28391, "train_loss": 3.054354190826416, "lr": 4.4588497642146574e-05, "tps": 973029, "wall": 1912.3} {"step": 28392, "train_loss": 2.984915018081665, "lr": 4.458420051453364e-05, "tps": 970526, "wall": 1917.3} {"step": 28393, "train_loss": 2.9083845615386963, "lr": 4.457990537404037e-05, "tps": 968044, "wall": 1922.3} {"step": 28394, "train_loss": 2.978041410446167, "lr": 4.457561222071542e-05, "tps": 965549, "wall": 1927.3} {"step": 28395, "train_loss": 3.0120811462402344, "lr": 4.457132105460744e-05, "tps": 963095, "wall": 1932.3} {"step": 28396, "train_loss": 2.9391045570373535, "lr": 4.4567031875765017e-05, "tps": 960637, "wall": 1937.3} {"step": 28397, "train_loss": 3.002171516418457, "lr": 4.456274468423675e-05, "tps": 958207, "wall": 1942.3} {"step": 28398, "train_loss": 3.0058746337890625, "lr": 4.455845948007118e-05, "tps": 955802, "wall": 1947.2} {"step": 28399, "train_loss": 3.011500120162964, "lr": 4.4554176263316904e-05, "tps": 953348, "wall": 1952.3} {"step": 28400, "train_loss": 2.900923252105713, "lr": 4.4549895034022405e-05, "tps": 950937, "wall": 1957.3} {"step": 28401, "train_loss": 2.951165199279785, "lr": 4.454561579223617e-05, "tps": 948518, "wall": 1962.4} {"step": 28402, "train_loss": 2.9758107662200928, "lr": 4.45413385380067e-05, "tps": 946121, "wall": 1967.4} {"step": 28403, "train_loss": 3.0276551246643066, "lr": 4.453706327138245e-05, "tps": 943759, "wall": 1972.4} {"step": 28404, "train_loss": 3.032684803009033, "lr": 4.4532789992411826e-05, "tps": 941431, "wall": 1977.4} {"step": 28405, "train_loss": 2.94400691986084, "lr": 4.452851870114325e-05, "tps": 939108, "wall": 1982.3} {"step": 28406, "train_loss": 3.0509207248687744, "lr": 4.452424939762509e-05, "tps": 936763, "wall": 1987.4} {"step": 28407, "train_loss": 2.9308342933654785, "lr": 4.451998208190577e-05, "tps": 934439, "wall": 1992.4} {"step": 28408, "train_loss": 2.9884111881256104, "lr": 4.451571675403357e-05, "tps": 932137, "wall": 1997.4} {"step": 28409, "train_loss": 3.0068295001983643, "lr": 4.451145341405682e-05, "tps": 929845, "wall": 2002.4} {"step": 28410, "train_loss": 2.9590461254119873, "lr": 4.4507192062023816e-05, "tps": 927562, "wall": 2007.4} {"step": 28411, "train_loss": 2.937415838241577, "lr": 4.450293269798283e-05, "tps": 925293, "wall": 2012.3} {"step": 28412, "train_loss": 2.8906121253967285, "lr": 4.449867532198213e-05, "tps": 923045, "wall": 2017.3} {"step": 28413, "train_loss": 2.954728126525879, "lr": 4.4494419934069924e-05, "tps": 920784, "wall": 2022.3} {"step": 28414, "train_loss": 2.963411331176758, "lr": 4.44901665342944e-05, "tps": 918497, "wall": 2027.4} {"step": 28415, "train_loss": 3.070744514465332, "lr": 4.44859151227038e-05, "tps": 916232, "wall": 2032.5} {"step": 28416, "train_loss": 3.0230557918548584, "lr": 4.448166569934623e-05, "tps": 913996, "wall": 2037.6} {"step": 28417, "train_loss": 2.886889696121216, "lr": 4.447741826426984e-05, "tps": 911774, "wall": 2042.6} {"step": 28418, "train_loss": 2.8739256858825684, "lr": 4.447317281752278e-05, "tps": 909562, "wall": 2047.7} {"step": 28419, "train_loss": 3.000988721847534, "lr": 4.446892935915309e-05, "tps": 907355, "wall": 2052.7} {"step": 28420, "train_loss": 2.9420228004455566, "lr": 4.4464687889208865e-05, "tps": 905158, "wall": 2057.8} {"step": 28421, "train_loss": 2.9464144706726074, "lr": 4.4460448407738164e-05, "tps": 902943, "wall": 2062.9} {"step": 28422, "train_loss": 2.9830307960510254, "lr": 4.4456210914788993e-05, "tps": 900770, "wall": 2067.9} {"step": 28423, "train_loss": 2.951724052429199, "lr": 4.445197541040935e-05, "tps": 898570, "wall": 2073.1} {"step": 28424, "train_loss": 3.016854763031006, "lr": 4.4447741894647255e-05, "tps": 896408, "wall": 2078.1} {"step": 28425, "train_loss": 2.8602402210235596, "lr": 4.444351036755062e-05, "tps": 894224, "wall": 2083.3} {"step": 28426, "train_loss": 2.9611563682556152, "lr": 4.443928082916739e-05, "tps": 892117, "wall": 2088.3} {"step": 28427, "train_loss": 3.045725107192993, "lr": 4.44350532795455e-05, "tps": 890049, "wall": 2093.2} {"step": 28428, "train_loss": 3.008793592453003, "lr": 4.443082771873283e-05, "tps": 887981, "wall": 2098.2} {"step": 28429, "train_loss": 3.0012013912200928, "lr": 4.4426604146777207e-05, "tps": 885928, "wall": 2103.1} {"step": 28430, "train_loss": 2.9882428646087646, "lr": 4.4422382563726536e-05, "tps": 883880, "wall": 2108.0} {"step": 28431, "train_loss": 2.9521372318267822, "lr": 4.4418162969628604e-05, "tps": 881802, "wall": 2113.1} {"step": 28432, "train_loss": 2.949093818664551, "lr": 4.4413945364531215e-05, "tps": 879761, "wall": 2118.1} {"step": 28433, "train_loss": 3.0042030811309814, "lr": 4.440972974848218e-05, "tps": 877717, "wall": 2123.1} {"step": 28434, "train_loss": 3.0544049739837646, "lr": 4.44055161215292e-05, "tps": 875683, "wall": 2128.1} {"step": 28435, "train_loss": 3.061579704284668, "lr": 4.4401304483720034e-05, "tps": 873632, "wall": 2133.1} {"step": 28436, "train_loss": 2.990359306335449, "lr": 4.4397094835102426e-05, "tps": 871615, "wall": 2138.2} {"step": 28437, "train_loss": 3.0224759578704834, "lr": 4.439288717572398e-05, "tps": 869638, "wall": 2143.1} {"step": 28438, "train_loss": 3.0123841762542725, "lr": 4.438868150563242e-05, "tps": 867673, "wall": 2148.0} {"step": 28439, "train_loss": 2.9632623195648193, "lr": 4.438447782487539e-05, "tps": 865703, "wall": 2153.0} {"step": 28440, "train_loss": 2.9132232666015625, "lr": 4.4380276133500484e-05, "tps": 863760, "wall": 2157.9} {"step": 28441, "train_loss": 2.9955356121063232, "lr": 4.437607643155532e-05, "tps": 861829, "wall": 2162.8} {"step": 28442, "train_loss": 2.877596855163574, "lr": 4.4371878719087476e-05, "tps": 859902, "wall": 2167.7} {"step": 28443, "train_loss": 2.9791462421417236, "lr": 4.4367682996144454e-05, "tps": 857992, "wall": 2172.6} {"step": 28444, "train_loss": 2.980783462524414, "lr": 4.4363489262773865e-05, "tps": 856093, "wall": 2177.5} {"step": 28445, "train_loss": 2.922098159790039, "lr": 4.4359297519023144e-05, "tps": 854172, "wall": 2182.5} {"step": 28446, "train_loss": 2.955329418182373, "lr": 4.435510776493979e-05, "tps": 852207, "wall": 2187.6} {"step": 28447, "train_loss": 3.001694917678833, "lr": 4.435092000057131e-05, "tps": 850237, "wall": 2192.8} {"step": 28448, "train_loss": 3.0339179039001465, "lr": 4.4346734225965087e-05, "tps": 848314, "wall": 2197.8} {"step": 28449, "train_loss": 3.013763189315796, "lr": 4.434255044116858e-05, "tps": 846410, "wall": 2202.8} {"step": 28450, "train_loss": 2.9532175064086914, "lr": 4.433836864622915e-05, "tps": 844505, "wall": 2207.9} {"step": 28451, "train_loss": 3.079744815826416, "lr": 4.433418884119418e-05, "tps": 842625, "wall": 2212.9} {"step": 28452, "train_loss": 3.021303653717041, "lr": 4.433001102611104e-05, "tps": 840766, "wall": 2217.9} {"step": 28453, "train_loss": 3.002314805984497, "lr": 4.4325835201027025e-05, "tps": 838891, "wall": 2222.9} {"step": 28454, "train_loss": 2.994393825531006, "lr": 4.4321661365989444e-05, "tps": 836999, "wall": 2228.0} {"step": 28455, "train_loss": 3.104360580444336, "lr": 4.431748952104561e-05, "tps": 835125, "wall": 2233.1} {"step": 28456, "train_loss": 3.007009744644165, "lr": 4.431331966624276e-05, "tps": 833270, "wall": 2238.1} {"step": 28457, "train_loss": 2.9927818775177, "lr": 4.4309151801628104e-05, "tps": 831410, "wall": 2243.2} {"step": 28458, "train_loss": 2.9130563735961914, "lr": 4.430498592724889e-05, "tps": 829589, "wall": 2248.2} {"step": 28459, "train_loss": 2.9026527404785156, "lr": 4.4300822043152305e-05, "tps": 827742, "wall": 2253.3} {"step": 28460, "train_loss": 2.9158172607421875, "lr": 4.4296660149385505e-05, "tps": 825936, "wall": 2258.3} {"step": 28461, "train_loss": 2.905880928039551, "lr": 4.429250024599567e-05, "tps": 824116, "wall": 2263.4} {"step": 28462, "train_loss": 2.9129796028137207, "lr": 4.428834233302988e-05, "tps": 822337, "wall": 2268.4} {"step": 28463, "train_loss": 2.9207444190979004, "lr": 4.428418641053524e-05, "tps": 820564, "wall": 2273.3} {"step": 28464, "train_loss": 2.8555667400360107, "lr": 4.428003247855887e-05, "tps": 818808, "wall": 2278.3} {"step": 28465, "train_loss": 2.9654643535614014, "lr": 4.4275880537147766e-05, "tps": 817054, "wall": 2283.3} {"step": 28466, "train_loss": 2.9843292236328125, "lr": 4.4271730586349024e-05, "tps": 815320, "wall": 2288.2} {"step": 28467, "train_loss": 2.932863235473633, "lr": 4.426758262620962e-05, "tps": 813600, "wall": 2293.1} {"step": 28468, "train_loss": 2.9981069564819336, "lr": 4.426343665677651e-05, "tps": 811895, "wall": 2298.0} {"step": 28469, "train_loss": 2.9533495903015137, "lr": 4.425929267809675e-05, "tps": 810119, "wall": 2303.1} {"step": 28470, "train_loss": 2.9516406059265137, "lr": 4.4255150690217204e-05, "tps": 808377, "wall": 2308.2} {"step": 28471, "train_loss": 2.9373202323913574, "lr": 4.4251010693184816e-05, "tps": 806667, "wall": 2313.1} {"step": 28472, "train_loss": 3.0171494483947754, "lr": 4.424687268704649e-05, "tps": 804970, "wall": 2318.1} {"step": 28473, "train_loss": 2.9670603275299072, "lr": 4.42427366718491e-05, "tps": 803258, "wall": 2323.1} {"step": 28474, "train_loss": 2.9742698669433594, "lr": 4.423860264763951e-05, "tps": 801553, "wall": 2328.2} {"step": 28475, "train_loss": 2.9588851928710938, "lr": 4.423447061446452e-05, "tps": 799865, "wall": 2333.1} {"step": 28476, "train_loss": 3.0292789936065674, "lr": 4.4230340572370966e-05, "tps": 798208, "wall": 2338.1} {"step": 28477, "train_loss": 3.016773223876953, "lr": 4.4226212521405604e-05, "tps": 796561, "wall": 2343.0} {"step": 28478, "train_loss": 2.9151229858398438, "lr": 4.422208646161523e-05, "tps": 794924, "wall": 2347.9} {"step": 28479, "train_loss": 3.028007984161377, "lr": 4.421796239304657e-05, "tps": 793297, "wall": 2352.8} {"step": 28480, "train_loss": 2.9759676456451416, "lr": 4.421384031574633e-05, "tps": 791671, "wall": 2357.7} {"step": 28481, "train_loss": 2.94881534576416, "lr": 4.420972022976123e-05, "tps": 790054, "wall": 2362.6} {"step": 28482, "train_loss": 2.906662940979004, "lr": 4.420560213513795e-05, "tps": 788443, "wall": 2367.5} {"step": 28483, "train_loss": 3.0722389221191406, "lr": 4.420148603192308e-05, "tps": 786819, "wall": 2372.5} {"step": 28484, "train_loss": 2.9590096473693848, "lr": 4.419737192016331e-05, "tps": 785224, "wall": 2377.4} {"step": 28485, "train_loss": 2.8522205352783203, "lr": 4.41932597999052e-05, "tps": 783636, "wall": 2382.3} {"step": 28486, "train_loss": 2.947125196456909, "lr": 4.4189149671195366e-05, "tps": 782051, "wall": 2387.2} {"step": 28487, "train_loss": 2.9964053630828857, "lr": 4.418504153408038e-05, "tps": 780470, "wall": 2392.1} {"step": 28488, "train_loss": 3.0137476921081543, "lr": 4.418093538860672e-05, "tps": 778895, "wall": 2397.1} {"step": 28489, "train_loss": 3.048414468765259, "lr": 4.417683123482096e-05, "tps": 777323, "wall": 2402.0} {"step": 28490, "train_loss": 2.978095531463623, "lr": 4.417272907276955e-05, "tps": 775761, "wall": 2406.9} {"step": 28491, "train_loss": 3.0304298400878906, "lr": 4.416862890249897e-05, "tps": 774198, "wall": 2411.9} {"step": 28492, "train_loss": 2.962367057800293, "lr": 4.4164530724055706e-05, "tps": 772647, "wall": 2416.8} {"step": 28493, "train_loss": 2.963428258895874, "lr": 4.416043453748614e-05, "tps": 771099, "wall": 2421.7} {"step": 28494, "train_loss": 3.0136027336120605, "lr": 4.4156340342836666e-05, "tps": 769555, "wall": 2426.7} {"step": 28495, "train_loss": 2.9623138904571533, "lr": 4.415224814015369e-05, "tps": 767998, "wall": 2431.7} {"step": 28496, "train_loss": 3.00726318359375, "lr": 4.414815792948357e-05, "tps": 766467, "wall": 2436.6} {"step": 28497, "train_loss": 2.9611945152282715, "lr": 4.414406971087261e-05, "tps": 764941, "wall": 2441.6} {"step": 28498, "train_loss": 2.9067111015319824, "lr": 4.4139983484367166e-05, "tps": 763425, "wall": 2446.5} {"step": 28499, "train_loss": 2.955474853515625, "lr": 4.413589925001349e-05, "tps": 761913, "wall": 2451.4} {"step": 28500, "train_loss": 2.972443103790283, "lr": 4.413181700785785e-05, "tps": 760410, "wall": 2456.4} {"step": 28501, "train_loss": 3.0453526973724365, "lr": 4.4127736757946534e-05, "tps": 758841, "wall": 2461.5} {"step": 28502, "train_loss": 2.938995122909546, "lr": 4.412365850032568e-05, "tps": 757319, "wall": 2466.6} {"step": 28503, "train_loss": 2.8632452487945557, "lr": 4.411958223504159e-05, "tps": 755787, "wall": 2471.6} {"step": 28504, "train_loss": 2.9715585708618164, "lr": 4.4115507962140375e-05, "tps": 754264, "wall": 2476.7} {"step": 28505, "train_loss": 3.0069191455841064, "lr": 4.411143568166818e-05, "tps": 752772, "wall": 2481.7} {"step": 28506, "train_loss": 2.9025590419769287, "lr": 4.4107365393671174e-05, "tps": 751278, "wall": 2486.7} {"step": 28507, "train_loss": 2.881840229034424, "lr": 4.410329709819545e-05, "tps": 749783, "wall": 2491.8} {"step": 28508, "train_loss": 2.780829429626465, "lr": 4.409923079528706e-05, "tps": 748309, "wall": 2496.8} {"step": 28509, "train_loss": 3.006776809692383, "lr": 4.4095166484992144e-05, "tps": 746846, "wall": 2501.8} {"step": 28510, "train_loss": 2.993973731994629, "lr": 4.409110416735669e-05, "tps": 745392, "wall": 2506.7} {"step": 28511, "train_loss": 2.8795340061187744, "lr": 4.408704384242669e-05, "tps": 743889, "wall": 2511.9} {"step": 28512, "train_loss": 2.9297289848327637, "lr": 4.40829855102482e-05, "tps": 742422, "wall": 2516.9} {"step": 28513, "train_loss": 3.0920562744140625, "lr": 4.407892917086717e-05, "tps": 740946, "wall": 2522.0} {"step": 28514, "train_loss": 2.9479610919952393, "lr": 4.407487482432953e-05, "tps": 739510, "wall": 2527.0} {"step": 28515, "train_loss": 2.9821083545684814, "lr": 4.407082247068125e-05, "tps": 738075, "wall": 2532.0} {"step": 28516, "train_loss": 3.0919885635375977, "lr": 4.40667721099682e-05, "tps": 736649, "wall": 2537.0} {"step": 28517, "train_loss": 2.9830663204193115, "lr": 4.406272374223625e-05, "tps": 735191, "wall": 2542.1} {"step": 28518, "train_loss": 3.0001659393310547, "lr": 4.405867736753134e-05, "tps": 733736, "wall": 2547.3} {"step": 28519, "train_loss": 2.9733352661132812, "lr": 4.4054632985899206e-05, "tps": 732293, "wall": 2552.4} {"step": 28520, "train_loss": 2.929870843887329, "lr": 4.4050590597385714e-05, "tps": 730881, "wall": 2557.4} {"step": 28521, "train_loss": 2.9806177616119385, "lr": 4.404655020203666e-05, "tps": 729472, "wall": 2562.4} {"step": 28522, "train_loss": 2.9539642333984375, "lr": 4.404251179989779e-05, "tps": 728065, "wall": 2567.5} {"step": 28523, "train_loss": 3.0174825191497803, "lr": 4.403847539101487e-05, "tps": 726667, "wall": 2572.5} {"step": 28524, "train_loss": 2.9782602787017822, "lr": 4.4034440975433644e-05, "tps": 725270, "wall": 2577.5} {"step": 28525, "train_loss": 2.88784122467041, "lr": 4.403040855319976e-05, "tps": 723885, "wall": 2582.6} {"step": 28526, "train_loss": 2.8817851543426514, "lr": 4.402637812435895e-05, "tps": 722493, "wall": 2587.6} {"step": 28527, "train_loss": 2.9832284450531006, "lr": 4.402234968895683e-05, "tps": 721100, "wall": 2592.7} {"step": 28528, "train_loss": 2.87064266204834, "lr": 4.4018323247039044e-05, "tps": 719714, "wall": 2597.8} {"step": 28529, "train_loss": 2.8814845085144043, "lr": 4.401429879865124e-05, "tps": 718347, "wall": 2602.8} {"step": 28530, "train_loss": 3.0141727924346924, "lr": 4.4010276343838966e-05, "tps": 716977, "wall": 2607.9} {"step": 28531, "train_loss": 2.9331672191619873, "lr": 4.40062558826478e-05, "tps": 715606, "wall": 2613.0} {"step": 28532, "train_loss": 2.9757566452026367, "lr": 4.4002237415123304e-05, "tps": 714261, "wall": 2618.0} {"step": 28533, "train_loss": 3.042081356048584, "lr": 4.3998220941310984e-05, "tps": 712922, "wall": 2623.0} {"step": 28534, "train_loss": 2.948915481567383, "lr": 4.399420646125631e-05, "tps": 711589, "wall": 2628.0} {"step": 28535, "train_loss": 3.0051047801971436, "lr": 4.39901939750048e-05, "tps": 710271, "wall": 2633.0} {"step": 28536, "train_loss": 2.9883549213409424, "lr": 4.398618348260191e-05, "tps": 708951, "wall": 2638.0} {"step": 28537, "train_loss": 3.0075247287750244, "lr": 4.398217498409305e-05, "tps": 707644, "wall": 2642.9} {"step": 28538, "train_loss": 2.8947513103485107, "lr": 4.397816847952362e-05, "tps": 706332, "wall": 2647.9} {"step": 28539, "train_loss": 3.0197372436523438, "lr": 4.397416396893902e-05, "tps": 705027, "wall": 2652.9} {"step": 28540, "train_loss": 3.0330848693847656, "lr": 4.397016145238463e-05, "tps": 703725, "wall": 2657.9} {"step": 28541, "train_loss": 2.878079891204834, "lr": 4.3966160929905766e-05, "tps": 702432, "wall": 2662.9} {"step": 28542, "train_loss": 2.945852279663086, "lr": 4.396216240154775e-05, "tps": 701145, "wall": 2667.9} {"step": 28543, "train_loss": 2.9980130195617676, "lr": 4.39581658673559e-05, "tps": 699850, "wall": 2672.9} {"step": 28544, "train_loss": 2.936540126800537, "lr": 4.3954171327375457e-05, "tps": 698575, "wall": 2677.9} {"step": 28545, "train_loss": 3.011795997619629, "lr": 4.3950178781651685e-05, "tps": 697288, "wall": 2683.0} {"step": 28546, "train_loss": 3.057828903198242, "lr": 4.394618823022982e-05, "tps": 696018, "wall": 2687.9} {"step": 28547, "train_loss": 2.9761133193969727, "lr": 4.394219967315506e-05, "tps": 694751, "wall": 2692.9} {"step": 28548, "train_loss": 2.94724440574646, "lr": 4.393821311047255e-05, "tps": 693484, "wall": 2697.9} {"step": 28549, "train_loss": 2.8526108264923096, "lr": 4.393422854222754e-05, "tps": 692220, "wall": 2703.0} {"step": 28550, "train_loss": 2.9078121185302734, "lr": 4.3930245968465086e-05, "tps": 690961, "wall": 2708.0} {"step": 28551, "train_loss": 2.9487006664276123, "lr": 4.392626538923031e-05, "tps": 689715, "wall": 2713.0} {"step": 28552, "train_loss": 3.0084173679351807, "lr": 4.392228680456837e-05, "tps": 688471, "wall": 2718.0} {"step": 28553, "train_loss": 2.9529948234558105, "lr": 4.3918310214524284e-05, "tps": 687232, "wall": 2723.0} {"step": 28554, "train_loss": 2.903167486190796, "lr": 4.3914335619143066e-05, "tps": 685996, "wall": 2728.0} {"step": 28555, "train_loss": 2.954625368118286, "lr": 4.391036301846982e-05, "tps": 684743, "wall": 2733.1} {"step": 28556, "train_loss": 3.020927667617798, "lr": 4.390639241254949e-05, "tps": 683516, "wall": 2738.1} {"step": 28557, "train_loss": 2.8789772987365723, "lr": 4.390242380142708e-05, "tps": 682282, "wall": 2743.1} {"step": 28558, "train_loss": 2.8230435848236084, "lr": 4.389845718514754e-05, "tps": 681045, "wall": 2748.2} {"step": 28559, "train_loss": 2.981743574142456, "lr": 4.389449256375578e-05, "tps": 679809, "wall": 2753.3} {"step": 28560, "train_loss": 2.873002052307129, "lr": 4.389052993729678e-05, "tps": 678568, "wall": 2758.4} {"step": 28561, "train_loss": 2.9852614402770996, "lr": 4.388656930581535e-05, "tps": 677358, "wall": 2763.4} {"step": 28562, "train_loss": 2.950364112854004, "lr": 4.38826106693564e-05, "tps": 676164, "wall": 2768.4} {"step": 28563, "train_loss": 2.9154672622680664, "lr": 4.387865402796478e-05, "tps": 674971, "wall": 2773.4} {"step": 28564, "train_loss": 2.9867515563964844, "lr": 4.387469938168527e-05, "tps": 673771, "wall": 2778.4} {"step": 28565, "train_loss": 2.9757421016693115, "lr": 4.38707467305627e-05, "tps": 672536, "wall": 2783.6} {"step": 28566, "train_loss": 2.8548078536987305, "lr": 4.386679607464184e-05, "tps": 671333, "wall": 2788.7} {"step": 28567, "train_loss": 2.8454055786132812, "lr": 4.386284741396746e-05, "tps": 670137, "wall": 2793.8} {"step": 28568, "train_loss": 3.074291944503784, "lr": 4.385890074858424e-05, "tps": 668967, "wall": 2798.8} {"step": 28569, "train_loss": 2.907575845718384, "lr": 4.3854956078536955e-05, "tps": 667798, "wall": 2803.8} {"step": 28570, "train_loss": 3.040975570678711, "lr": 4.385101340387024e-05, "tps": 666630, "wall": 2808.8} {"step": 28571, "train_loss": 2.85870623588562, "lr": 4.384707272462877e-05, "tps": 665464, "wall": 2813.8} {"step": 28572, "train_loss": 2.873579263687134, "lr": 4.384313404085722e-05, "tps": 664300, "wall": 2818.8} {"step": 28573, "train_loss": 2.837165355682373, "lr": 4.3839197352600135e-05, "tps": 663141, "wall": 2823.9} {"step": 28574, "train_loss": 3.063094139099121, "lr": 4.383526265990218e-05, "tps": 661983, "wall": 2828.9} {"step": 28575, "train_loss": 2.9596071243286133, "lr": 4.38313299628079e-05, "tps": 660834, "wall": 2833.9} {"step": 28576, "train_loss": 2.9462368488311768, "lr": 4.382739926136183e-05, "tps": 659693, "wall": 2838.9} {"step": 28577, "train_loss": 3.0245747566223145, "lr": 4.3823470555608507e-05, "tps": 658544, "wall": 2844.0} {"step": 28578, "train_loss": 2.881758213043213, "lr": 4.3819543845592483e-05, "tps": 657407, "wall": 2849.0} {"step": 28579, "train_loss": 2.9619758129119873, "lr": 4.381561913135816e-05, "tps": 656257, "wall": 2854.1} {"step": 28580, "train_loss": 3.018179416656494, "lr": 4.381169641295004e-05, "tps": 655128, "wall": 2859.1} {"step": 28581, "train_loss": 2.980987548828125, "lr": 4.3807775690412546e-05, "tps": 654005, "wall": 2864.1} {"step": 28582, "train_loss": 3.0967960357666016, "lr": 4.380385696379013e-05, "tps": 652888, "wall": 2869.1} {"step": 28583, "train_loss": 2.9558117389678955, "lr": 4.3799940233127126e-05, "tps": 651776, "wall": 2874.1} {"step": 28584, "train_loss": 3.051985502243042, "lr": 4.379602549846793e-05, "tps": 650672, "wall": 2879.1} {"step": 28585, "train_loss": 2.933544397354126, "lr": 4.3792112759856916e-05, "tps": 649572, "wall": 2884.1} {"step": 28586, "train_loss": 2.933652877807617, "lr": 4.378820201733836e-05, "tps": 648476, "wall": 2889.0} {"step": 28587, "train_loss": 3.0206422805786133, "lr": 4.378429327095659e-05, "tps": 647350, "wall": 2894.2} {"step": 28588, "train_loss": 2.851240396499634, "lr": 4.378038652075589e-05, "tps": 646236, "wall": 2899.3} {"step": 28589, "train_loss": 2.9403955936431885, "lr": 4.377648176678049e-05, "tps": 645111, "wall": 2904.4} {"step": 28590, "train_loss": 2.944002389907837, "lr": 4.377257900907464e-05, "tps": 644002, "wall": 2909.5} {"step": 28591, "train_loss": 2.8559370040893555, "lr": 4.376867824768255e-05, "tps": 642914, "wall": 2914.5} {"step": 28592, "train_loss": 2.951169013977051, "lr": 4.3764779482648414e-05, "tps": 641834, "wall": 2919.6} {"step": 28593, "train_loss": 2.83638072013855, "lr": 4.376088271401638e-05, "tps": 640758, "wall": 2924.6} {"step": 28594, "train_loss": 3.0652759075164795, "lr": 4.375698794183061e-05, "tps": 639687, "wall": 2929.6} {"step": 28595, "train_loss": 2.978797435760498, "lr": 4.3753095166135205e-05, "tps": 638612, "wall": 2934.6} {"step": 28596, "train_loss": 2.94539737701416, "lr": 4.374920438697427e-05, "tps": 637549, "wall": 2939.6} {"step": 28597, "train_loss": 2.881032705307007, "lr": 4.37453156043919e-05, "tps": 636480, "wall": 2944.6} {"step": 28598, "train_loss": 3.002964496612549, "lr": 4.374142881843212e-05, "tps": 635418, "wall": 2949.7} {"step": 28599, "train_loss": 3.0261118412017822, "lr": 4.373754402913896e-05, "tps": 634359, "wall": 2954.7} {"step": 28600, "train_loss": 2.8433492183685303, "lr": 4.373366123655645e-05, "tps": 633294, "wall": 2959.8} {"step": 28601, "train_loss": 3.06272554397583, "lr": 4.372978044072856e-05, "tps": 632229, "wall": 2964.8} {"step": 28602, "train_loss": 2.99971342086792, "lr": 4.372590164169925e-05, "tps": 631157, "wall": 2970.0} {"step": 28603, "train_loss": 3.0276052951812744, "lr": 4.372202483951248e-05, "tps": 630095, "wall": 2975.1} {"step": 28604, "train_loss": 2.853721857070923, "lr": 4.3718150034212116e-05, "tps": 629042, "wall": 2980.2} {"step": 28605, "train_loss": 2.948432445526123, "lr": 4.371427722584212e-05, "tps": 628011, "wall": 2985.2} {"step": 28606, "train_loss": 2.9727611541748047, "lr": 4.3710406414446306e-05, "tps": 626946, "wall": 2990.3} {"step": 28607, "train_loss": 2.9530341625213623, "lr": 4.3706537600068545e-05, "tps": 625869, "wall": 2995.6} {"step": 28608, "train_loss": 2.9247612953186035, "lr": 4.3702670782752656e-05, "tps": 624803, "wall": 3000.8} {"step": 28609, "train_loss": 3.058818817138672, "lr": 4.3698805962542474e-05, "tps": 623758, "wall": 3005.9} {"step": 28610, "train_loss": 2.825211524963379, "lr": 4.3694943139481734e-05, "tps": 622733, "wall": 3011.0} {"step": 28611, "train_loss": 2.895803213119507, "lr": 4.369108231361423e-05, "tps": 621664, "wall": 3016.3} {"step": 28612, "train_loss": 2.943631649017334, "lr": 4.36872234849837e-05, "tps": 620613, "wall": 3021.5} {"step": 28613, "train_loss": 2.9848315715789795, "lr": 4.368336665363381e-05, "tps": 619582, "wall": 3026.6} {"step": 28614, "train_loss": 3.015630006790161, "lr": 4.367951181960828e-05, "tps": 618546, "wall": 3031.8} {"step": 28615, "train_loss": 2.9349539279937744, "lr": 4.3675658982950806e-05, "tps": 617523, "wall": 3036.9} {"step": 28616, "train_loss": 3.0442442893981934, "lr": 4.367180814370499e-05, "tps": 616467, "wall": 3042.2} {"step": 28617, "train_loss": 2.9979984760284424, "lr": 4.3667959301914476e-05, "tps": 615453, "wall": 3047.4} {"step": 28618, "train_loss": 2.95837140083313, "lr": 4.366411245762284e-05, "tps": 614422, "wall": 3052.6} {"step": 28619, "train_loss": 2.989677667617798, "lr": 4.3660267610873686e-05, "tps": 613380, "wall": 3057.9} {"step": 28620, "train_loss": 2.975085973739624, "lr": 4.3656424761710576e-05, "tps": 612380, "wall": 3063.0} {"step": 28621, "train_loss": 3.0077619552612305, "lr": 4.3652583910177e-05, "tps": 611389, "wall": 3068.0} {"step": 28622, "train_loss": 2.9925944805145264, "lr": 4.364874505631653e-05, "tps": 610411, "wall": 3073.1} {"step": 28623, "train_loss": 2.9372165203094482, "lr": 4.36449082001726e-05, "tps": 609418, "wall": 3078.2} {"step": 28624, "train_loss": 2.920656681060791, "lr": 4.364107334178868e-05, "tps": 608452, "wall": 3083.2} {"step": 28625, "train_loss": 2.937340259552002, "lr": 4.363724048120822e-05, "tps": 607481, "wall": 3088.2} {"step": 28626, "train_loss": 3.009058952331543, "lr": 4.3633409618474665e-05, "tps": 606430, "wall": 3093.7} {"step": 28627, "train_loss": 2.862124443054199, "lr": 4.362958075363136e-05, "tps": 605446, "wall": 3098.8} {"step": 28628, "train_loss": 3.0412583351135254, "lr": 4.362575388672172e-05, "tps": 604492, "wall": 3103.8} {"step": 28629, "train_loss": 2.9355039596557617, "lr": 4.3621929017789084e-05, "tps": 603529, "wall": 3108.9} {"step": 28630, "train_loss": 2.997293472290039, "lr": 4.361810614687675e-05, "tps": 602573, "wall": 3113.9} {"step": 28631, "train_loss": 3.0086655616760254, "lr": 4.36142852740281e-05, "tps": 601621, "wall": 3118.9} {"step": 28632, "train_loss": 2.972015380859375, "lr": 4.361046639928634e-05, "tps": 600665, "wall": 3124.0} {"step": 28633, "train_loss": 2.901460647583008, "lr": 4.360664952269475e-05, "tps": 599713, "wall": 3129.1} {"step": 28634, "train_loss": 2.9337799549102783, "lr": 4.3602834644296596e-05, "tps": 598749, "wall": 3134.2} {"step": 28635, "train_loss": 2.964704751968384, "lr": 4.359902176413506e-05, "tps": 597804, "wall": 3139.3} {"step": 28636, "train_loss": 3.0401058197021484, "lr": 4.3595210882253356e-05, "tps": 596850, "wall": 3144.4} {"step": 28637, "train_loss": 2.9848062992095947, "lr": 4.359140199869466e-05, "tps": 595900, "wall": 3149.6} {"step": 28638, "train_loss": 3.0009119510650635, "lr": 4.358759511350208e-05, "tps": 594961, "wall": 3154.6} {"step": 28639, "train_loss": 2.9153199195861816, "lr": 4.358379022671878e-05, "tps": 594024, "wall": 3159.7} {"step": 28640, "train_loss": 3.1045479774475098, "lr": 4.357998733838786e-05, "tps": 593068, "wall": 3164.9} {"step": 28641, "train_loss": 2.8843302726745605, "lr": 4.357618644855237e-05, "tps": 592132, "wall": 3170.0} {"step": 28642, "train_loss": 2.846872091293335, "lr": 4.357238755725539e-05, "tps": 591210, "wall": 3175.1} {"step": 28643, "train_loss": 2.9851536750793457, "lr": 4.356859066453994e-05, "tps": 590296, "wall": 3180.1} {"step": 28644, "train_loss": 3.001674175262451, "lr": 4.3564795770449046e-05, "tps": 589383, "wall": 3185.2} {"step": 28645, "train_loss": 2.934558629989624, "lr": 4.356100287502569e-05, "tps": 588461, "wall": 3190.3} {"step": 28646, "train_loss": 2.945208787918091, "lr": 4.355721197831285e-05, "tps": 587546, "wall": 3195.3} {"step": 28647, "train_loss": 2.923950672149658, "lr": 4.3553423080353427e-05, "tps": 586641, "wall": 3200.4} {"step": 28648, "train_loss": 3.0428948402404785, "lr": 4.35496361811904e-05, "tps": 585736, "wall": 3205.4} {"step": 28649, "train_loss": 2.966151475906372, "lr": 4.3545851280866644e-05, "tps": 584826, "wall": 3210.5} {"step": 28650, "train_loss": 2.880394697189331, "lr": 4.354206837942501e-05, "tps": 583928, "wall": 3215.6} {"step": 28651, "train_loss": 2.999213218688965, "lr": 4.35382874769084e-05, "tps": 583036, "wall": 3220.6} {"step": 28652, "train_loss": 2.951725959777832, "lr": 4.353450857335958e-05, "tps": 582147, "wall": 3225.6} {"step": 28653, "train_loss": 3.0128862857818604, "lr": 4.3530731668821414e-05, "tps": 581259, "wall": 3230.7} {"step": 28654, "train_loss": 3.0270490646362305, "lr": 4.352695676333668e-05, "tps": 580375, "wall": 3235.7} {"step": 28655, "train_loss": 3.007596015930176, "lr": 4.352318385694809e-05, "tps": 579471, "wall": 3240.9} {"step": 28656, "train_loss": 3.016998291015625, "lr": 4.351941294969845e-05, "tps": 578572, "wall": 3246.0} {"step": 28657, "train_loss": 3.003263473510742, "lr": 4.351564404163044e-05, "tps": 577672, "wall": 3251.2} {"step": 28658, "train_loss": 2.9047956466674805, "lr": 4.351187713278675e-05, "tps": 576792, "wall": 3256.3} {"step": 28659, "train_loss": 2.988186836242676, "lr": 4.350811222321009e-05, "tps": 575924, "wall": 3261.3} {"step": 28660, "train_loss": 2.8935790061950684, "lr": 4.350434931294307e-05, "tps": 575059, "wall": 3266.3} {"step": 28661, "train_loss": 2.9431724548339844, "lr": 4.3500588402028314e-05, "tps": 574190, "wall": 3271.4} {"step": 28662, "train_loss": 2.953892707824707, "lr": 4.3496829490508465e-05, "tps": 573333, "wall": 3276.4} {"step": 28663, "train_loss": 2.916018486022949, "lr": 4.3493072578426076e-05, "tps": 572479, "wall": 3281.4} {"step": 28664, "train_loss": 2.9440560340881348, "lr": 4.348931766582369e-05, "tps": 571630, "wall": 3286.4} {"step": 28665, "train_loss": 2.9448773860931396, "lr": 4.3485564752743886e-05, "tps": 570777, "wall": 3291.4} {"step": 28666, "train_loss": 2.936967372894287, "lr": 4.3481813839229134e-05, "tps": 569930, "wall": 3296.4} {"step": 28667, "train_loss": 3.0005404949188232, "lr": 4.347806492532195e-05, "tps": 569090, "wall": 3301.4} {"step": 28668, "train_loss": 3.0590531826019287, "lr": 4.34743180110648e-05, "tps": 568248, "wall": 3306.4} {"step": 28669, "train_loss": 2.9244463443756104, "lr": 4.3470573096500136e-05, "tps": 567409, "wall": 3311.4} {"step": 28670, "train_loss": 2.9001235961914062, "lr": 4.3466830181670336e-05, "tps": 566567, "wall": 3316.4} {"step": 28671, "train_loss": 2.99301815032959, "lr": 4.346308926661787e-05, "tps": 565720, "wall": 3321.5} {"step": 28672, "train_loss": 2.9504928588867188, "lr": 4.345935035138506e-05, "tps": 564884, "wall": 3326.5} {"step": 28673, "train_loss": 2.9329400062561035, "lr": 4.345561343601428e-05, "tps": 564039, "wall": 3331.6} {"step": 28674, "train_loss": 2.9972383975982666, "lr": 4.3451878520547875e-05, "tps": 563211, "wall": 3336.7} {"step": 28675, "train_loss": 2.9650983810424805, "lr": 4.3448145605028124e-05, "tps": 562390, "wall": 3341.6} {"step": 28676, "train_loss": 2.9489119052886963, "lr": 4.344441468949735e-05, "tps": 561565, "wall": 3346.7} {"step": 28677, "train_loss": 2.8791518211364746, "lr": 4.344068577399781e-05, "tps": 560746, "wall": 3351.7} {"step": 28678, "train_loss": 2.9466745853424072, "lr": 4.3436958858571694e-05, "tps": 559932, "wall": 3356.7} {"step": 28679, "train_loss": 3.020820140838623, "lr": 4.343323394326128e-05, "tps": 559117, "wall": 3361.7} {"step": 28680, "train_loss": 2.935405969619751, "lr": 4.342951102810875e-05, "tps": 558314, "wall": 3366.6} {"step": 28681, "train_loss": 3.085494041442871, "lr": 4.342579011315624e-05, "tps": 557510, "wall": 3371.6} {"step": 28682, "train_loss": 3.0189919471740723, "lr": 4.342207119844598e-05, "tps": 556709, "wall": 3376.6} {"step": 28683, "train_loss": 2.88702392578125, "lr": 4.341835428402001e-05, "tps": 555904, "wall": 3381.6} {"step": 28684, "train_loss": 2.8575644493103027, "lr": 4.3414639369920494e-05, "tps": 555106, "wall": 3386.6} {"step": 28685, "train_loss": 2.9638047218322754, "lr": 4.341092645618949e-05, "tps": 554297, "wall": 3391.6} {"step": 28686, "train_loss": 3.00506591796875, "lr": 4.3407215542869075e-05, "tps": 553483, "wall": 3396.7} {"step": 28687, "train_loss": 3.0294878482818604, "lr": 4.340350663000127e-05, "tps": 552686, "wall": 3401.7} {"step": 28688, "train_loss": 3.007986307144165, "lr": 4.3399799717628086e-05, "tps": 551885, "wall": 3406.8} {"step": 28689, "train_loss": 2.8733229637145996, "lr": 4.339609480579153e-05, "tps": 551101, "wall": 3411.8} {"step": 28690, "train_loss": 2.992055892944336, "lr": 4.339239189453357e-05, "tps": 550318, "wall": 3416.7} {"step": 28691, "train_loss": 2.8751163482666016, "lr": 4.338869098389616e-05, "tps": 549523, "wall": 3421.8} {"step": 28692, "train_loss": 3.017662763595581, "lr": 4.3384992073921186e-05, "tps": 548740, "wall": 3426.8} {"step": 28693, "train_loss": 2.9499568939208984, "lr": 4.338129516465059e-05, "tps": 547957, "wall": 3431.8} {"step": 28694, "train_loss": 2.977552890777588, "lr": 4.337760025612625e-05, "tps": 547182, "wall": 3436.8} {"step": 28695, "train_loss": 2.9472603797912598, "lr": 4.3373907348390005e-05, "tps": 546410, "wall": 3441.8} {"step": 28696, "train_loss": 2.9896531105041504, "lr": 4.337021644148367e-05, "tps": 545640, "wall": 3446.8} {"step": 28697, "train_loss": 2.934445381164551, "lr": 4.336652753544912e-05, "tps": 544860, "wall": 3451.8} {"step": 28698, "train_loss": 2.878648281097412, "lr": 4.336284063032806e-05, "tps": 544087, "wall": 3456.8} {"step": 28699, "train_loss": 3.003481388092041, "lr": 4.3359155726162315e-05, "tps": 543325, "wall": 3461.8} {"step": 28700, "train_loss": 3.000459671020508, "lr": 4.335547282299362e-05, "tps": 542556, "wall": 3466.8} {"step": 28701, "train_loss": 2.9920451641082764, "lr": 4.335179192086366e-05, "tps": 541794, "wall": 3471.8} {"step": 28702, "train_loss": 2.9983956813812256, "lr": 4.334811301981418e-05, "tps": 541037, "wall": 3476.8} {"step": 28703, "train_loss": 3.0242862701416016, "lr": 4.334443611988683e-05, "tps": 540281, "wall": 3481.8} {"step": 28704, "train_loss": 2.9405295848846436, "lr": 4.334076122112324e-05, "tps": 539531, "wall": 3486.7} {"step": 28705, "train_loss": 2.950312376022339, "lr": 4.3337088323565084e-05, "tps": 538765, "wall": 3491.8} {"step": 28706, "train_loss": 3.0469889640808105, "lr": 4.333341742725394e-05, "tps": 537996, "wall": 3496.9} {"step": 28707, "train_loss": 2.9311933517456055, "lr": 4.332974853223143e-05, "tps": 537226, "wall": 3502.1} {"step": 28708, "train_loss": 3.009934902191162, "lr": 4.332608163853906e-05, "tps": 536467, "wall": 3507.2} {"step": 28709, "train_loss": 2.8673596382141113, "lr": 4.332241674621838e-05, "tps": 535708, "wall": 3512.2} {"step": 28710, "train_loss": 2.965432643890381, "lr": 4.3318753855310954e-05, "tps": 534970, "wall": 3517.2} {"step": 28711, "train_loss": 2.9880568981170654, "lr": 4.3315092965858225e-05, "tps": 534231, "wall": 3522.2} {"step": 28712, "train_loss": 2.9802207946777344, "lr": 4.3311434077901694e-05, "tps": 533488, "wall": 3527.2} {"step": 28713, "train_loss": 2.908931016921997, "lr": 4.330777719148278e-05, "tps": 532748, "wall": 3532.2} {"step": 28714, "train_loss": 2.9879894256591797, "lr": 4.330412230664294e-05, "tps": 532007, "wall": 3537.3} {"step": 28715, "train_loss": 3.062743902206421, "lr": 4.330046942342355e-05, "tps": 531269, "wall": 3542.3} {"step": 28716, "train_loss": 3.043560028076172, "lr": 4.3296818541866e-05, "tps": 530518, "wall": 3547.5} {"step": 28717, "train_loss": 2.9019293785095215, "lr": 4.3293169662011674e-05, "tps": 529790, "wall": 3552.5} {"step": 28718, "train_loss": 2.988299608230591, "lr": 4.328952278390186e-05, "tps": 529068, "wall": 3557.4} {"step": 28719, "train_loss": 2.9084415435791016, "lr": 4.3285877907577895e-05, "tps": 528346, "wall": 3562.4} {"step": 28720, "train_loss": 2.9601516723632812, "lr": 4.328223503308106e-05, "tps": 527622, "wall": 3567.4} {"step": 28721, "train_loss": 2.9829134941101074, "lr": 4.327859416045264e-05, "tps": 526899, "wall": 3572.5} {"step": 28722, "train_loss": 2.9803528785705566, "lr": 4.3274955289733845e-05, "tps": 526180, "wall": 3577.5} {"step": 28723, "train_loss": 2.9543519020080566, "lr": 4.3271318420965945e-05, "tps": 525450, "wall": 3582.6} {"step": 28724, "train_loss": 3.0078325271606445, "lr": 4.3267683554190075e-05, "tps": 524723, "wall": 3587.6} {"step": 28725, "train_loss": 2.938516139984131, "lr": 4.326405068944748e-05, "tps": 523998, "wall": 3592.7} {"step": 28726, "train_loss": 3.0090410709381104, "lr": 4.326041982677926e-05, "tps": 523277, "wall": 3597.8} {"step": 28727, "train_loss": 2.993424415588379, "lr": 4.325679096622657e-05, "tps": 522563, "wall": 3602.8} {"step": 28728, "train_loss": 2.9611902236938477, "lr": 4.3253164107830536e-05, "tps": 521859, "wall": 3607.8} {"step": 28729, "train_loss": 3.0160255432128906, "lr": 4.324953925163218e-05, "tps": 521159, "wall": 3612.8} {"step": 28730, "train_loss": 2.9719643592834473, "lr": 4.324591639767265e-05, "tps": 520459, "wall": 3617.8} {"step": 28731, "train_loss": 2.884934902191162, "lr": 4.32422955459929e-05, "tps": 519761, "wall": 3622.8} {"step": 28732, "train_loss": 2.9661154747009277, "lr": 4.3238676696634e-05, "tps": 519062, "wall": 3627.8} {"step": 28733, "train_loss": 2.918367862701416, "lr": 4.323505984963694e-05, "tps": 518349, "wall": 3632.9} {"step": 28734, "train_loss": 2.982740879058838, "lr": 4.32314450050427e-05, "tps": 517659, "wall": 3637.9} {"step": 28735, "train_loss": 2.982564687728882, "lr": 4.3227832162892195e-05, "tps": 516969, "wall": 3642.8} {"step": 28736, "train_loss": 3.018333673477173, "lr": 4.3224221323226366e-05, "tps": 516269, "wall": 3647.9} {"step": 28737, "train_loss": 2.967885971069336, "lr": 4.3220612486086144e-05, "tps": 515582, "wall": 3652.9} {"step": 28738, "train_loss": 2.9347174167633057, "lr": 4.3217005651512356e-05, "tps": 514895, "wall": 3657.9} {"step": 28739, "train_loss": 2.949071168899536, "lr": 4.3213400819545924e-05, "tps": 514215, "wall": 3662.9} {"step": 28740, "train_loss": 2.9862782955169678, "lr": 4.320979799022764e-05, "tps": 513539, "wall": 3667.8} {"step": 28741, "train_loss": 2.8225600719451904, "lr": 4.320619716359831e-05, "tps": 512863, "wall": 3672.8} {"step": 28742, "train_loss": 2.940674304962158, "lr": 4.320259833969876e-05, "tps": 512184, "wall": 3677.8} {"step": 28743, "train_loss": 2.9866766929626465, "lr": 4.3199001518569725e-05, "tps": 511500, "wall": 3682.8} {"step": 28744, "train_loss": 2.9571590423583984, "lr": 4.319540670025199e-05, "tps": 510823, "wall": 3687.8} {"step": 28745, "train_loss": 3.0267257690429688, "lr": 4.3191813884786254e-05, "tps": 510144, "wall": 3692.9} {"step": 28746, "train_loss": 2.866832733154297, "lr": 4.318822307221321e-05, "tps": 509476, "wall": 3697.8} {"step": 28747, "train_loss": 2.944938898086548, "lr": 4.318463426257352e-05, "tps": 508803, "wall": 3702.9} {"step": 28748, "train_loss": 3.095184564590454, "lr": 4.318104745590789e-05, "tps": 508132, "wall": 3707.9} {"step": 28749, "train_loss": 2.956364870071411, "lr": 4.317746265225688e-05, "tps": 507465, "wall": 3712.9} {"step": 28750, "train_loss": 2.931941509246826, "lr": 4.3173879851661175e-05, "tps": 506798, "wall": 3717.9} {"step": 28751, "train_loss": 2.9995479583740234, "lr": 4.31702990541613e-05, "tps": 506129, "wall": 3722.9} {"step": 28752, "train_loss": 2.8836517333984375, "lr": 4.316672025979787e-05, "tps": 505467, "wall": 3728.0} {"step": 28753, "train_loss": 2.9125075340270996, "lr": 4.3163143468611374e-05, "tps": 504802, "wall": 3733.0} {"step": 28754, "train_loss": 2.913203716278076, "lr": 4.3159568680642356e-05, "tps": 504141, "wall": 3738.0} {"step": 28755, "train_loss": 2.838926315307617, "lr": 4.315599589593133e-05, "tps": 503486, "wall": 3743.0} {"step": 28756, "train_loss": 3.065814256668091, "lr": 4.315242511451874e-05, "tps": 502816, "wall": 3748.1} {"step": 28757, "train_loss": 2.9372427463531494, "lr": 4.314885633644504e-05, "tps": 502140, "wall": 3753.3} {"step": 28758, "train_loss": 2.925825357437134, "lr": 4.314528956175068e-05, "tps": 501479, "wall": 3758.4} {"step": 28759, "train_loss": 3.013449192047119, "lr": 4.3141724790476035e-05, "tps": 500829, "wall": 3763.4} {"step": 28760, "train_loss": 2.924172878265381, "lr": 4.313816202266149e-05, "tps": 500174, "wall": 3768.4} {"step": 28761, "train_loss": 2.951746940612793, "lr": 4.313460125834742e-05, "tps": 499527, "wall": 3773.5} {"step": 28762, "train_loss": 3.0316288471221924, "lr": 4.313104249757417e-05, "tps": 498881, "wall": 3778.5} {"step": 28763, "train_loss": 3.0097227096557617, "lr": 4.312748574038202e-05, "tps": 498233, "wall": 3783.5} {"step": 28764, "train_loss": 2.8450543880462646, "lr": 4.31239309868113e-05, "tps": 497586, "wall": 3788.6} {"step": 28765, "train_loss": 2.888239860534668, "lr": 4.312037823690226e-05, "tps": 496945, "wall": 3793.6} {"step": 28766, "train_loss": 2.9559357166290283, "lr": 4.3116827490695125e-05, "tps": 496303, "wall": 3798.6} {"step": 28767, "train_loss": 2.9482884407043457, "lr": 4.311327874823014e-05, "tps": 495662, "wall": 3803.7} {"step": 28768, "train_loss": 2.9339656829833984, "lr": 4.310973200954749e-05, "tps": 495020, "wall": 3808.7} {"step": 28769, "train_loss": 2.995877265930176, "lr": 4.3106187274687386e-05, "tps": 494375, "wall": 3813.8} {"step": 28770, "train_loss": 2.9132697582244873, "lr": 4.310264454368996e-05, "tps": 493739, "wall": 3818.9} {"step": 28771, "train_loss": 2.955889940261841, "lr": 4.3099103816595344e-05, "tps": 493096, "wall": 3824.0} {"step": 28772, "train_loss": 3.0211992263793945, "lr": 4.309556509344366e-05, "tps": 492453, "wall": 3829.1} {"step": 28773, "train_loss": 2.9610018730163574, "lr": 4.309202837427498e-05, "tps": 491810, "wall": 3834.3} {"step": 28774, "train_loss": 2.8790299892425537, "lr": 4.308849365912937e-05, "tps": 491182, "wall": 3839.3} {"step": 28775, "train_loss": 3.000994920730591, "lr": 4.308496094804686e-05, "tps": 490556, "wall": 3844.3} {"step": 28776, "train_loss": 3.0485520362854004, "lr": 4.3081430241067514e-05, "tps": 489931, "wall": 3849.4} {"step": 28777, "train_loss": 2.997614860534668, "lr": 4.307790153823127e-05, "tps": 489307, "wall": 3854.4} {"step": 28778, "train_loss": 3.0257668495178223, "lr": 4.307437483957813e-05, "tps": 488689, "wall": 3859.4} {"step": 28779, "train_loss": 2.8890328407287598, "lr": 4.307085014514807e-05, "tps": 488073, "wall": 3864.4} {"step": 28780, "train_loss": 2.870513439178467, "lr": 4.306732745498096e-05, "tps": 487450, "wall": 3869.5} {"step": 28781, "train_loss": 2.9303369522094727, "lr": 4.306380676911676e-05, "tps": 486822, "wall": 3874.6} {"step": 28782, "train_loss": 2.9985127449035645, "lr": 4.306028808759532e-05, "tps": 486210, "wall": 3879.6} {"step": 28783, "train_loss": 2.891111373901367, "lr": 4.305677141045649e-05, "tps": 485595, "wall": 3884.7} {"step": 28784, "train_loss": 2.985866069793701, "lr": 4.305325673774015e-05, "tps": 484978, "wall": 3889.8} {"step": 28785, "train_loss": 2.9116740226745605, "lr": 4.304974406948608e-05, "tps": 484366, "wall": 3894.8} {"step": 28786, "train_loss": 3.109431266784668, "lr": 4.304623340573409e-05, "tps": 483763, "wall": 3899.8} {"step": 28787, "train_loss": 2.925571918487549, "lr": 4.304272474652394e-05, "tps": 483162, "wall": 3904.8} {"step": 28788, "train_loss": 3.0412638187408447, "lr": 4.303921809189537e-05, "tps": 482559, "wall": 3909.8} {"step": 28789, "train_loss": 3.011486768722534, "lr": 4.303571344188813e-05, "tps": 481955, "wall": 3914.8} {"step": 28790, "train_loss": 2.9775795936584473, "lr": 4.303221079654188e-05, "tps": 481356, "wall": 3919.9} {"step": 28791, "train_loss": 3.0227138996124268, "lr": 4.302871015589632e-05, "tps": 480756, "wall": 3924.9} {"step": 28792, "train_loss": 3.0210578441619873, "lr": 4.302521151999112e-05, "tps": 480146, "wall": 3930.0} {"step": 28793, "train_loss": 2.9769859313964844, "lr": 4.302171488886589e-05, "tps": 479555, "wall": 3935.0} {"step": 28794, "train_loss": 3.0096094608306885, "lr": 4.3018220262560246e-05, "tps": 478956, "wall": 3940.0} {"step": 28795, "train_loss": 3.008051872253418, "lr": 4.301472764111379e-05, "tps": 478326, "wall": 3945.4} {"step": 28796, "train_loss": 2.9182655811309814, "lr": 4.3011237024566056e-05, "tps": 477711, "wall": 3950.6} {"step": 28797, "train_loss": 3.0634987354278564, "lr": 4.3007748412956605e-05, "tps": 477108, "wall": 3955.7} {"step": 28798, "train_loss": 2.9425554275512695, "lr": 4.300426180632498e-05, "tps": 476512, "wall": 3960.8} {"step": 28799, "train_loss": 3.02164888381958, "lr": 4.3000777204710625e-05, "tps": 475914, "wall": 3965.9} {"step": 28800, "train_loss": 2.8826985359191895, "lr": 4.299729460815305e-05, "tps": 475318, "wall": 3971.0} {"step": 28801, "train_loss": 3.024728298187256, "lr": 4.2993814016691706e-05, "tps": 474737, "wall": 3976.0} {"step": 28802, "train_loss": 2.9683070182800293, "lr": 4.299033543036601e-05, "tps": 474141, "wall": 3981.2} {"step": 28803, "train_loss": 3.0173215866088867, "lr": 4.298685884921535e-05, "tps": 473556, "wall": 3986.2} {"step": 28804, "train_loss": 3.0294103622436523, "lr": 4.298338427327916e-05, "tps": 472970, "wall": 3991.3} {"step": 28805, "train_loss": 2.93441104888916, "lr": 4.297991170259673e-05, "tps": 472390, "wall": 3996.3} {"step": 28806, "train_loss": 2.993237018585205, "lr": 4.297644113720748e-05, "tps": 471812, "wall": 4001.4} {"step": 28807, "train_loss": 2.9258580207824707, "lr": 4.2972972577150666e-05, "tps": 471237, "wall": 4006.4} {"step": 28808, "train_loss": 2.9430110454559326, "lr": 4.2969506022465576e-05, "tps": 470664, "wall": 4011.4} {"step": 28809, "train_loss": 2.956641674041748, "lr": 4.296604147319151e-05, "tps": 470092, "wall": 4016.4} {"step": 28810, "train_loss": 3.0086352825164795, "lr": 4.296257892936773e-05, "tps": 469521, "wall": 4021.4} {"step": 28811, "train_loss": 2.944063186645508, "lr": 4.2959118391033407e-05, "tps": 468953, "wall": 4026.5} {"step": 28812, "train_loss": 2.899634838104248, "lr": 4.295565985822776e-05, "tps": 468385, "wall": 4031.5} {"step": 28813, "train_loss": 2.843740940093994, "lr": 4.295220333099e-05, "tps": 467818, "wall": 4036.5} {"step": 28814, "train_loss": 2.9435060024261475, "lr": 4.294874880935923e-05, "tps": 467254, "wall": 4041.5} {"step": 28815, "train_loss": 2.9663662910461426, "lr": 4.294529629337465e-05, "tps": 466689, "wall": 4046.6} {"step": 28816, "train_loss": 2.961118221282959, "lr": 4.2941845783075305e-05, "tps": 466119, "wall": 4051.6} {"step": 28817, "train_loss": 2.991640329360962, "lr": 4.293839727850033e-05, "tps": 465557, "wall": 4056.7} {"step": 28818, "train_loss": 2.9444732666015625, "lr": 4.2934950779688744e-05, "tps": 464996, "wall": 4061.7} {"step": 28819, "train_loss": 3.019136428833008, "lr": 4.293150628667964e-05, "tps": 464436, "wall": 4066.7} {"step": 28820, "train_loss": 2.968250274658203, "lr": 4.292806379951197e-05, "tps": 463876, "wall": 4071.8} {"step": 28821, "train_loss": 3.0155797004699707, "lr": 4.292462331822483e-05, "tps": 463319, "wall": 4076.8} {"step": 28822, "train_loss": 3.029787302017212, "lr": 4.2921184842857096e-05, "tps": 462761, "wall": 4081.9} {"step": 28823, "train_loss": 3.0092883110046387, "lr": 4.291774837344776e-05, "tps": 462196, "wall": 4087.0} {"step": 28824, "train_loss": 3.1107139587402344, "lr": 4.291431391003577e-05, "tps": 461627, "wall": 4092.2} {"step": 28825, "train_loss": 3.0141661167144775, "lr": 4.291088145266001e-05, "tps": 461064, "wall": 4097.3} {"step": 28826, "train_loss": 2.874873399734497, "lr": 4.290745100135936e-05, "tps": 460506, "wall": 4102.4} {"step": 28827, "train_loss": 2.864030361175537, "lr": 4.29040225561727e-05, "tps": 459950, "wall": 4107.6} {"step": 28828, "train_loss": 3.0017778873443604, "lr": 4.290059611713883e-05, "tps": 459397, "wall": 4112.6} {"step": 28829, "train_loss": 3.075463056564331, "lr": 4.28971716842966e-05, "tps": 458849, "wall": 4117.7} {"step": 28830, "train_loss": 2.9961540699005127, "lr": 4.289374925768479e-05, "tps": 458302, "wall": 4122.8} {"step": 28831, "train_loss": 3.0183491706848145, "lr": 4.2890328837342147e-05, "tps": 457756, "wall": 4127.8} {"step": 28832, "train_loss": 2.9064483642578125, "lr": 4.288691042330747e-05, "tps": 457211, "wall": 4132.9} {"step": 28833, "train_loss": 2.9620165824890137, "lr": 4.288349401561946e-05, "tps": 456670, "wall": 4137.9} {"step": 28834, "train_loss": 3.0448150634765625, "lr": 4.288007961431676e-05, "tps": 456129, "wall": 4143.0} {"step": 28835, "train_loss": 2.9555411338806152, "lr": 4.287666721943816e-05, "tps": 455591, "wall": 4148.0} {"step": 28836, "train_loss": 2.966256618499756, "lr": 4.287325683102223e-05, "tps": 455052, "wall": 4153.1} {"step": 28837, "train_loss": 2.9209606647491455, "lr": 4.286984844910762e-05, "tps": 454515, "wall": 4158.1} {"step": 28838, "train_loss": 2.958876848220825, "lr": 4.286644207373298e-05, "tps": 453979, "wall": 4163.2} {"step": 28839, "train_loss": 3.112459659576416, "lr": 4.286303770493683e-05, "tps": 453445, "wall": 4168.2} {"step": 28840, "train_loss": 3.0016117095947266, "lr": 4.285963534275779e-05, "tps": 452907, "wall": 4173.3} {"step": 28841, "train_loss": 3.0352115631103516, "lr": 4.285623498723438e-05, "tps": 452378, "wall": 4178.3} {"step": 28842, "train_loss": 2.8772270679473877, "lr": 4.2852836638405116e-05, "tps": 451849, "wall": 4183.4} {"step": 28843, "train_loss": 2.863846778869629, "lr": 4.2849440296308516e-05, "tps": 451322, "wall": 4188.4} {"step": 28844, "train_loss": 2.953913450241089, "lr": 4.284604596098304e-05, "tps": 450789, "wall": 4193.5} {"step": 28845, "train_loss": 2.899181842803955, "lr": 4.284265363246713e-05, "tps": 450262, "wall": 4198.6} {"step": 28846, "train_loss": 2.8993897438049316, "lr": 4.2839263310799245e-05, "tps": 449737, "wall": 4203.6} {"step": 28847, "train_loss": 2.9996042251586914, "lr": 4.283587499601776e-05, "tps": 449212, "wall": 4208.7} {"step": 28848, "train_loss": 2.9850826263427734, "lr": 4.283248868816105e-05, "tps": 448693, "wall": 4213.7} {"step": 28849, "train_loss": 2.966823101043701, "lr": 4.2829104387267506e-05, "tps": 448174, "wall": 4218.7} {"step": 28850, "train_loss": 3.00549578666687, "lr": 4.282572209337546e-05, "tps": 447646, "wall": 4223.8} {"step": 28851, "train_loss": 2.88450026512146, "lr": 4.2822341806523194e-05, "tps": 447127, "wall": 4228.9} {"step": 28852, "train_loss": 2.958099126815796, "lr": 4.2818963526749044e-05, "tps": 446602, "wall": 4234.0} {"step": 28853, "train_loss": 3.0499637126922607, "lr": 4.281558725409126e-05, "tps": 446088, "wall": 4239.0} {"step": 28854, "train_loss": 3.0665555000305176, "lr": 4.2812212988588066e-05, "tps": 445575, "wall": 4244.0} {"step": 28855, "train_loss": 2.9841485023498535, "lr": 4.280884073027775e-05, "tps": 445063, "wall": 4249.1} {"step": 28856, "train_loss": 2.9614946842193604, "lr": 4.2805470479198454e-05, "tps": 444553, "wall": 4254.1} {"step": 28857, "train_loss": 3.0642173290252686, "lr": 4.2802102235388356e-05, "tps": 444043, "wall": 4259.1} {"step": 28858, "train_loss": 3.0307016372680664, "lr": 4.279873599888565e-05, "tps": 443532, "wall": 4264.2} {"step": 28859, "train_loss": 3.0466418266296387, "lr": 4.279537176972843e-05, "tps": 442996, "wall": 4269.5} {"step": 28860, "train_loss": 3.008288621902466, "lr": 4.279200954795486e-05, "tps": 442463, "wall": 4274.8} {"step": 28861, "train_loss": 2.9661262035369873, "lr": 4.278864933360297e-05, "tps": 441949, "wall": 4279.9} {"step": 28862, "train_loss": 2.899991512298584, "lr": 4.2785291126710844e-05, "tps": 441436, "wall": 4285.0} {"step": 28863, "train_loss": 2.993508815765381, "lr": 4.2781934927316543e-05, "tps": 440915, "wall": 4290.2} {"step": 28864, "train_loss": 3.0411994457244873, "lr": 4.2778580735458064e-05, "tps": 440414, "wall": 4295.3} {"step": 28865, "train_loss": 2.9290404319763184, "lr": 4.2775228551173385e-05, "tps": 439914, "wall": 4300.3} {"step": 28866, "train_loss": 3.065167188644409, "lr": 4.277187837450053e-05, "tps": 439416, "wall": 4305.3} {"step": 28867, "train_loss": 2.926318645477295, "lr": 4.276853020547744e-05, "tps": 438919, "wall": 4310.3} {"step": 28868, "train_loss": 2.9711227416992188, "lr": 4.276518404414198e-05, "tps": 438423, "wall": 4315.4} {"step": 28869, "train_loss": 2.9994442462921143, "lr": 4.276183989053215e-05, "tps": 437928, "wall": 4320.4} {"step": 28870, "train_loss": 2.966826915740967, "lr": 4.275849774468578e-05, "tps": 437433, "wall": 4325.4} {"step": 28871, "train_loss": 2.9717366695404053, "lr": 4.27551576066407e-05, "tps": 436932, "wall": 4330.5} {"step": 28872, "train_loss": 2.9758050441741943, "lr": 4.2751819476434814e-05, "tps": 436439, "wall": 4335.6} {"step": 28873, "train_loss": 2.9328773021698, "lr": 4.27484833541059e-05, "tps": 435945, "wall": 4340.7} {"step": 28874, "train_loss": 3.0380473136901855, "lr": 4.274514923969174e-05, "tps": 435451, "wall": 4345.7} {"step": 28875, "train_loss": 2.9744863510131836, "lr": 4.2741817133230156e-05, "tps": 434950, "wall": 4350.9} {"step": 28876, "train_loss": 3.003345012664795, "lr": 4.273848703475882e-05, "tps": 434461, "wall": 4355.9} {"step": 28877, "train_loss": 2.9297337532043457, "lr": 4.27351589443155e-05, "tps": 433973, "wall": 4361.0} {"step": 28878, "train_loss": 2.9749999046325684, "lr": 4.2731832861937905e-05, "tps": 433486, "wall": 4366.0} {"step": 28879, "train_loss": 2.8295159339904785, "lr": 4.272850878766369e-05, "tps": 433000, "wall": 4371.1} {"step": 28880, "train_loss": 2.9126086235046387, "lr": 4.272518672153053e-05, "tps": 432506, "wall": 4376.2} {"step": 28881, "train_loss": 3.000365734100342, "lr": 4.272186666357603e-05, "tps": 432011, "wall": 4381.4} {"step": 28882, "train_loss": 2.874558448791504, "lr": 4.27185486138378e-05, "tps": 431521, "wall": 4386.5} {"step": 28883, "train_loss": 3.012308120727539, "lr": 4.271523257235346e-05, "tps": 431040, "wall": 4391.6} {"step": 28884, "train_loss": 2.9824461936950684, "lr": 4.271191853916057e-05, "tps": 430557, "wall": 4396.6} {"step": 28885, "train_loss": 2.986029863357544, "lr": 4.270860651429662e-05, "tps": 430077, "wall": 4401.7} {"step": 28886, "train_loss": 2.94683837890625, "lr": 4.270529649779921e-05, "tps": 429593, "wall": 4406.8} {"step": 28887, "train_loss": 3.0314571857452393, "lr": 4.270198848970578e-05, "tps": 429107, "wall": 4412.0} {"step": 28888, "train_loss": 2.897996664047241, "lr": 4.26986824900538e-05, "tps": 428625, "wall": 4417.1} {"step": 28889, "train_loss": 2.899672031402588, "lr": 4.2695378498880753e-05, "tps": 428149, "wall": 4422.1} {"step": 28890, "train_loss": 2.9764492511749268, "lr": 4.269207651622403e-05, "tps": 427677, "wall": 4427.2} {"step": 28891, "train_loss": 3.15214204788208, "lr": 4.2688776542121074e-05, "tps": 427204, "wall": 4432.2} {"step": 28892, "train_loss": 2.9101319313049316, "lr": 4.268547857660925e-05, "tps": 426734, "wall": 4437.3} {"step": 28893, "train_loss": 2.935748815536499, "lr": 4.268218261972589e-05, "tps": 426264, "wall": 4442.3} {"step": 28894, "train_loss": 2.9948127269744873, "lr": 4.2678888671508404e-05, "tps": 425795, "wall": 4447.4} {"step": 28895, "train_loss": 2.929565191268921, "lr": 4.267559673199404e-05, "tps": 425327, "wall": 4452.4} {"step": 28896, "train_loss": 3.0489771366119385, "lr": 4.267230680122009e-05, "tps": 424859, "wall": 4457.5} {"step": 28897, "train_loss": 3.0882468223571777, "lr": 4.266901887922387e-05, "tps": 424388, "wall": 4462.6} {"step": 28898, "train_loss": 2.9609532356262207, "lr": 4.2665732966042575e-05, "tps": 423906, "wall": 4467.8} {"step": 28899, "train_loss": 2.9743103981018066, "lr": 4.266244906171345e-05, "tps": 423434, "wall": 4472.9} {"step": 28900, "train_loss": 2.9980154037475586, "lr": 4.265916716627372e-05, "tps": 422966, "wall": 4478.0} {"step": 28901, "train_loss": 3.0028109550476074, "lr": 4.265588727976054e-05, "tps": 422501, "wall": 4483.1} {"step": 28902, "train_loss": 3.025799036026001, "lr": 4.2652609402211024e-05, "tps": 422039, "wall": 4488.2} {"step": 28903, "train_loss": 3.023547887802124, "lr": 4.2649333533662384e-05, "tps": 421578, "wall": 4493.2} {"step": 28904, "train_loss": 3.0296831130981445, "lr": 4.264605967415167e-05, "tps": 421112, "wall": 4498.4} {"step": 28905, "train_loss": 2.971614360809326, "lr": 4.264278782371597e-05, "tps": 420652, "wall": 4503.4} {"step": 28906, "train_loss": 2.952943801879883, "lr": 4.263951798239239e-05, "tps": 420194, "wall": 4508.5} {"step": 28907, "train_loss": 2.8962759971618652, "lr": 4.2636250150217946e-05, "tps": 419738, "wall": 4513.6} {"step": 28908, "train_loss": 2.931210994720459, "lr": 4.263298432722962e-05, "tps": 419280, "wall": 4518.6} {"step": 28909, "train_loss": 2.978409767150879, "lr": 4.262972051346449e-05, "tps": 418822, "wall": 4523.7} {"step": 28910, "train_loss": 2.9430294036865234, "lr": 4.262645870895946e-05, "tps": 418365, "wall": 4528.8} {"step": 28911, "train_loss": 2.910944700241089, "lr": 4.262319891375149e-05, "tps": 417891, "wall": 4534.1} {"step": 28912, "train_loss": 2.9339025020599365, "lr": 4.261994112787755e-05, "tps": 417424, "wall": 4539.4} {"step": 28913, "train_loss": 2.984205484390259, "lr": 4.261668535137449e-05, "tps": 416962, "wall": 4544.6} {"step": 28914, "train_loss": 2.9911274909973145, "lr": 4.261343158427921e-05, "tps": 416499, "wall": 4549.8} {"step": 28915, "train_loss": 2.9273605346679688, "lr": 4.2610179826628605e-05, "tps": 416043, "wall": 4554.9} {"step": 28916, "train_loss": 2.950681209564209, "lr": 4.260693007845944e-05, "tps": 415589, "wall": 4560.0} {"step": 28917, "train_loss": 2.927361011505127, "lr": 4.26036823398086e-05, "tps": 415139, "wall": 4565.1} {"step": 28918, "train_loss": 3.023651361465454, "lr": 4.260043661071281e-05, "tps": 414685, "wall": 4570.3} {"step": 28919, "train_loss": 2.8714675903320312, "lr": 4.25971928912089e-05, "tps": 414237, "wall": 4575.4} {"step": 28920, "train_loss": 2.947577714920044, "lr": 4.259395118133358e-05, "tps": 413788, "wall": 4580.5} {"step": 28921, "train_loss": 2.9593629837036133, "lr": 4.2590711481123566e-05, "tps": 413341, "wall": 4585.6} {"step": 28922, "train_loss": 2.9031405448913574, "lr": 4.2587473790615584e-05, "tps": 412879, "wall": 4590.9} {"step": 28923, "train_loss": 2.9431049823760986, "lr": 4.258423810984631e-05, "tps": 412428, "wall": 4596.1} {"step": 28924, "train_loss": 2.9900169372558594, "lr": 4.258100443885235e-05, "tps": 411978, "wall": 4601.3} {"step": 28925, "train_loss": 3.0412745475769043, "lr": 4.2577772777670376e-05, "tps": 411534, "wall": 4606.4} {"step": 28926, "train_loss": 2.957416534423828, "lr": 4.2574543126337005e-05, "tps": 411085, "wall": 4611.6} {"step": 28927, "train_loss": 3.043548107147217, "lr": 4.25713154848888e-05, "tps": 410637, "wall": 4616.8} {"step": 28928, "train_loss": 2.849849224090576, "lr": 4.256808985336233e-05, "tps": 410188, "wall": 4622.0} {"step": 28929, "train_loss": 2.9798107147216797, "lr": 4.256486623179415e-05, "tps": 409739, "wall": 4627.2} {"step": 28930, "train_loss": 2.9838709831237793, "lr": 4.2561644620220756e-05, "tps": 409292, "wall": 4632.4} {"step": 28931, "train_loss": 2.910249710083008, "lr": 4.2558425018678646e-05, "tps": 408847, "wall": 4637.6} {"step": 28932, "train_loss": 2.927995204925537, "lr": 4.255520742720431e-05, "tps": 408403, "wall": 4642.8} {"step": 28933, "train_loss": 2.9939346313476562, "lr": 4.255199184583417e-05, "tps": 407959, "wall": 4648.1} {"step": 28934, "train_loss": 2.934965133666992, "lr": 4.2548778274604674e-05, "tps": 407515, "wall": 4653.3} {"step": 28935, "train_loss": 2.9015328884124756, "lr": 4.254556671355222e-05, "tps": 407080, "wall": 4658.4} {"step": 28936, "train_loss": 3.031451463699341, "lr": 4.2542357162713176e-05, "tps": 406644, "wall": 4663.6} {"step": 28937, "train_loss": 3.0332956314086914, "lr": 4.253914962212392e-05, "tps": 406212, "wall": 4668.7} {"step": 28938, "train_loss": 2.901381731033325, "lr": 4.2535944091820764e-05, "tps": 405780, "wall": 4673.8} {"step": 28939, "train_loss": 3.108835220336914, "lr": 4.253274057184006e-05, "tps": 405352, "wall": 4678.9} {"step": 28940, "train_loss": 3.002715587615967, "lr": 4.2529539062218046e-05, "tps": 404927, "wall": 4684.0} {"step": 28941, "train_loss": 2.9305973052978516, "lr": 4.252633956299103e-05, "tps": 404509, "wall": 4689.0} {"step": 28942, "train_loss": 2.9583187103271484, "lr": 4.2523142074195235e-05, "tps": 404087, "wall": 4694.0} {"step": 28943, "train_loss": 2.9362876415252686, "lr": 4.251994659586689e-05, "tps": 403666, "wall": 4699.1} {"step": 28944, "train_loss": 3.000005006790161, "lr": 4.2516753128042194e-05, "tps": 403252, "wall": 4704.1} {"step": 28945, "train_loss": 3.0099587440490723, "lr": 4.2513561670757306e-05, "tps": 402837, "wall": 4709.1} {"step": 28946, "train_loss": 3.0072362422943115, "lr": 4.251037222404841e-05, "tps": 402415, "wall": 4714.2} {"step": 28947, "train_loss": 2.9262499809265137, "lr": 4.25071847879516e-05, "tps": 402001, "wall": 4719.2} {"step": 28948, "train_loss": 3.064188241958618, "lr": 4.2503999362503026e-05, "tps": 401587, "wall": 4724.3} {"step": 28949, "train_loss": 2.9805736541748047, "lr": 4.250081594773875e-05, "tps": 401173, "wall": 4729.3} {"step": 28950, "train_loss": 2.9850738048553467, "lr": 4.24976345436948e-05, "tps": 400762, "wall": 4734.3} {"step": 28951, "train_loss": 3.003671646118164, "lr": 4.249445515040728e-05, "tps": 400349, "wall": 4739.4} {"step": 28952, "train_loss": 2.9174118041992188, "lr": 4.249127776791217e-05, "tps": 399941, "wall": 4744.4} {"step": 28953, "train_loss": 2.977099657058716, "lr": 4.248810239624546e-05, "tps": 399532, "wall": 4749.4} {"step": 28954, "train_loss": 2.9611282348632812, "lr": 4.248492903544313e-05, "tps": 399121, "wall": 4754.4} {"step": 28955, "train_loss": 2.877871513366699, "lr": 4.248175768554112e-05, "tps": 398713, "wall": 4759.5} {"step": 28956, "train_loss": 2.90871524810791, "lr": 4.2478588346575386e-05, "tps": 398309, "wall": 4764.5} {"step": 28957, "train_loss": 2.9030213356018066, "lr": 4.247542101858179e-05, "tps": 397899, "wall": 4769.5} {"step": 28958, "train_loss": 3.0260767936706543, "lr": 4.247225570159623e-05, "tps": 397494, "wall": 4774.6} {"step": 28959, "train_loss": 2.869823932647705, "lr": 4.246909239565458e-05, "tps": 397093, "wall": 4779.5} {"step": 28960, "train_loss": 2.9324984550476074, "lr": 4.246593110079263e-05, "tps": 396694, "wall": 4784.5} {"step": 28961, "train_loss": 2.8541762828826904, "lr": 4.246277181704622e-05, "tps": 396296, "wall": 4789.5} {"step": 28962, "train_loss": 2.901761054992676, "lr": 4.2459614544451156e-05, "tps": 395899, "wall": 4794.4} {"step": 28963, "train_loss": 2.9342782497406006, "lr": 4.2456459283043165e-05, "tps": 395503, "wall": 4799.4} {"step": 28964, "train_loss": 2.9015519618988037, "lr": 4.2453306032858006e-05, "tps": 395105, "wall": 4804.4} {"step": 28965, "train_loss": 2.9763197898864746, "lr": 4.245015479393142e-05, "tps": 394710, "wall": 4809.4} {"step": 28966, "train_loss": 2.9674739837646484, "lr": 4.244700556629907e-05, "tps": 394314, "wall": 4814.4} {"step": 28967, "train_loss": 2.9827253818511963, "lr": 4.2443858349996643e-05, "tps": 393921, "wall": 4819.4} {"step": 28968, "train_loss": 2.959872245788574, "lr": 4.244071314505981e-05, "tps": 393527, "wall": 4824.4} {"step": 28969, "train_loss": 2.9852099418640137, "lr": 4.243756995152418e-05, "tps": 393127, "wall": 4829.4} {"step": 28970, "train_loss": 2.9192721843719482, "lr": 4.243442876942535e-05, "tps": 392723, "wall": 4834.6} {"step": 28971, "train_loss": 3.0205461978912354, "lr": 4.243128959879892e-05, "tps": 392321, "wall": 4839.7} {"step": 28972, "train_loss": 2.894887924194336, "lr": 4.242815243968046e-05, "tps": 391921, "wall": 4844.8} {"step": 28973, "train_loss": 2.9989278316497803, "lr": 4.242501729210549e-05, "tps": 391529, "wall": 4849.8} {"step": 28974, "train_loss": 2.9584085941314697, "lr": 4.2421884156109545e-05, "tps": 391139, "wall": 4854.8} {"step": 28975, "train_loss": 2.936645984649658, "lr": 4.241875303172807e-05, "tps": 390746, "wall": 4859.9} {"step": 28976, "train_loss": 2.92026948928833, "lr": 4.2415623918996586e-05, "tps": 390354, "wall": 4864.9} {"step": 28977, "train_loss": 2.996544361114502, "lr": 4.2412496817950535e-05, "tps": 389965, "wall": 4869.9} {"step": 28978, "train_loss": 2.911721706390381, "lr": 4.2409371728625305e-05, "tps": 389574, "wall": 4875.0} {"step": 28979, "train_loss": 2.988039970397949, "lr": 4.240624865105632e-05, "tps": 389185, "wall": 4880.0} {"step": 28980, "train_loss": 2.914321184158325, "lr": 4.240312758527898e-05, "tps": 388800, "wall": 4885.0} {"step": 28981, "train_loss": 2.985696792602539, "lr": 4.2400008531328605e-05, "tps": 388402, "wall": 4890.2} {"step": 28982, "train_loss": 2.875358819961548, "lr": 4.239689148924054e-05, "tps": 388016, "wall": 4895.2} {"step": 28983, "train_loss": 2.9633312225341797, "lr": 4.239377645905009e-05, "tps": 387631, "wall": 4900.3} {"step": 28984, "train_loss": 2.991427183151245, "lr": 4.239066344079256e-05, "tps": 387247, "wall": 4905.3} {"step": 28985, "train_loss": 2.978095054626465, "lr": 4.23875524345032e-05, "tps": 386856, "wall": 4910.4} {"step": 28986, "train_loss": 2.859299421310425, "lr": 4.238444344021726e-05, "tps": 386460, "wall": 4915.6} {"step": 28987, "train_loss": 2.8151848316192627, "lr": 4.238133645796994e-05, "tps": 386078, "wall": 4920.7} {"step": 28988, "train_loss": 2.9614107608795166, "lr": 4.237823148779647e-05, "tps": 385699, "wall": 4925.7} {"step": 28989, "train_loss": 3.0420949459075928, "lr": 4.237512852973197e-05, "tps": 385320, "wall": 4930.7} {"step": 28990, "train_loss": 2.9404666423797607, "lr": 4.237202758381165e-05, "tps": 384940, "wall": 4935.7} {"step": 28991, "train_loss": 2.9591684341430664, "lr": 4.236892865007061e-05, "tps": 384562, "wall": 4940.7} {"step": 28992, "train_loss": 2.9803895950317383, "lr": 4.2365831728543946e-05, "tps": 384178, "wall": 4945.8} {"step": 28993, "train_loss": 2.9734230041503906, "lr": 4.236273681926675e-05, "tps": 383790, "wall": 4951.0} {"step": 28994, "train_loss": 2.9774105548858643, "lr": 4.2359643922274096e-05, "tps": 383403, "wall": 4956.2} {"step": 28995, "train_loss": 2.9562344551086426, "lr": 4.235655303760099e-05, "tps": 383016, "wall": 4961.4} {"step": 28996, "train_loss": 2.9041271209716797, "lr": 4.235346416528246e-05, "tps": 382638, "wall": 4966.4} {"step": 28997, "train_loss": 2.9540066719055176, "lr": 4.235037730535351e-05, "tps": 382262, "wall": 4971.5} {"step": 28998, "train_loss": 2.8835597038269043, "lr": 4.234729245784909e-05, "tps": 381887, "wall": 4976.5} {"step": 28999, "train_loss": 2.9043827056884766, "lr": 4.234420962280415e-05, "tps": 381512, "wall": 4981.6} {"step": 29000, "train_loss": 2.955965518951416, "lr": 4.234112880025364e-05, "tps": 381140, "wall": 4986.6, "val_loss_monitor": 3.3620908152971687} {"step": 29001, "train_loss": 2.9810922145843506, "lr": 4.2338049990232386e-05, "tps": 377055, "wall": 5040.8} {"step": 29002, "train_loss": 3.088531494140625, "lr": 4.2334973192775354e-05, "tps": 376688, "wall": 5045.9} {"step": 29003, "train_loss": 3.0276241302490234, "lr": 4.233189840791735e-05, "tps": 376296, "wall": 5051.4} {"step": 29004, "train_loss": 3.026144504547119, "lr": 4.232882563569318e-05, "tps": 375914, "wall": 5056.7} {"step": 29005, "train_loss": 2.880448341369629, "lr": 4.2325754876137726e-05, "tps": 375547, "wall": 5061.8} {"step": 29006, "train_loss": 3.0091207027435303, "lr": 4.232268612928572e-05, "tps": 375184, "wall": 5066.8} {"step": 29007, "train_loss": 3.0871400833129883, "lr": 4.2319619395171925e-05, "tps": 374816, "wall": 5072.0} {"step": 29008, "train_loss": 3.186776876449585, "lr": 4.2316554673831116e-05, "tps": 374439, "wall": 5077.3} {"step": 29009, "train_loss": 2.987001657485962, "lr": 4.231349196529797e-05, "tps": 374078, "wall": 5082.4} {"step": 29010, "train_loss": 3.0247745513916016, "lr": 4.23104312696072e-05, "tps": 373677, "wall": 5088.0} {"step": 29011, "train_loss": 3.1206154823303223, "lr": 4.230737258679349e-05, "tps": 373297, "wall": 5093.3} {"step": 29012, "train_loss": 3.0458219051361084, "lr": 4.2304315916891456e-05, "tps": 372930, "wall": 5098.5} {"step": 29013, "train_loss": 2.988593101501465, "lr": 4.230126125993575e-05, "tps": 372568, "wall": 5103.7} {"step": 29014, "train_loss": 3.076077699661255, "lr": 4.2298208615961e-05, "tps": 372202, "wall": 5108.9} {"step": 29015, "train_loss": 3.0959510803222656, "lr": 4.229515798500173e-05, "tps": 371847, "wall": 5113.9} {"step": 29016, "train_loss": 3.0601301193237305, "lr": 4.229210936709254e-05, "tps": 371490, "wall": 5119.0} {"step": 29017, "train_loss": 3.0834429264068604, "lr": 4.228906276226793e-05, "tps": 371123, "wall": 5124.2} {"step": 29018, "train_loss": 3.0055274963378906, "lr": 4.228601817056243e-05, "tps": 370753, "wall": 5129.5} {"step": 29019, "train_loss": 3.0364184379577637, "lr": 4.2282975592010544e-05, "tps": 370387, "wall": 5134.8} {"step": 29020, "train_loss": 3.0864062309265137, "lr": 4.227993502664672e-05, "tps": 370027, "wall": 5139.9} {"step": 29021, "train_loss": 3.0797531604766846, "lr": 4.2276896474505395e-05, "tps": 369674, "wall": 5145.0} {"step": 29022, "train_loss": 3.124459743499756, "lr": 4.2273859935621016e-05, "tps": 369322, "wall": 5150.1} {"step": 29023, "train_loss": 2.9525012969970703, "lr": 4.227082541002797e-05, "tps": 368972, "wall": 5155.2} {"step": 29024, "train_loss": 3.1171112060546875, "lr": 4.226779289776062e-05, "tps": 368625, "wall": 5160.2} {"step": 29025, "train_loss": 2.903323173522949, "lr": 4.226476239885332e-05, "tps": 368264, "wall": 5165.4} {"step": 29026, "train_loss": 3.0592825412750244, "lr": 4.226173391334041e-05, "tps": 367870, "wall": 5171.2} {"step": 29027, "train_loss": 3.0227980613708496, "lr": 4.2258707441256205e-05, "tps": 367520, "wall": 5176.3} {"step": 29028, "train_loss": 3.048017978668213, "lr": 4.2255682982634974e-05, "tps": 367165, "wall": 5181.4} {"step": 29029, "train_loss": 3.0739893913269043, "lr": 4.225266053751098e-05, "tps": 366806, "wall": 5186.7} {"step": 29030, "train_loss": 3.14589262008667, "lr": 4.224964010591846e-05, "tps": 366441, "wall": 5192.0} {"step": 29031, "train_loss": 2.9951558113098145, "lr": 4.224662168789164e-05, "tps": 366089, "wall": 5197.2} {"step": 29032, "train_loss": 3.057602643966675, "lr": 4.224360528346468e-05, "tps": 365742, "wall": 5202.3} {"step": 29033, "train_loss": 3.1526904106140137, "lr": 4.2240590892671804e-05, "tps": 365395, "wall": 5207.4} {"step": 29034, "train_loss": 2.9903602600097656, "lr": 4.2237578515547135e-05, "tps": 365052, "wall": 5212.5} {"step": 29035, "train_loss": 3.0828213691711426, "lr": 4.2234568152124776e-05, "tps": 364687, "wall": 5217.9} {"step": 29036, "train_loss": 3.094882011413574, "lr": 4.2231559802438857e-05, "tps": 364331, "wall": 5223.2} {"step": 29037, "train_loss": 3.0665969848632812, "lr": 4.222855346652345e-05, "tps": 363969, "wall": 5228.6} {"step": 29038, "train_loss": 3.0982069969177246, "lr": 4.2225549144412577e-05, "tps": 363589, "wall": 5234.2} {"step": 29039, "train_loss": 3.0083534717559814, "lr": 4.2222546836140344e-05, "tps": 363241, "wall": 5239.4} {"step": 29040, "train_loss": 2.974958896636963, "lr": 4.2219546541740694e-05, "tps": 362897, "wall": 5244.5} {"step": 29041, "train_loss": 3.009195327758789, "lr": 4.221654826124764e-05, "tps": 362559, "wall": 5249.6} {"step": 29042, "train_loss": 2.9583895206451416, "lr": 4.221355199469513e-05, "tps": 362226, "wall": 5254.6} {"step": 29043, "train_loss": 3.067239284515381, "lr": 4.2210557742117144e-05, "tps": 361894, "wall": 5259.6} {"step": 29044, "train_loss": 2.962372303009033, "lr": 4.2207565503547565e-05, "tps": 361561, "wall": 5264.6} {"step": 29045, "train_loss": 3.023876190185547, "lr": 4.2204575279020314e-05, "tps": 361225, "wall": 5269.7} {"step": 29046, "train_loss": 2.908994674682617, "lr": 4.220158706856923e-05, "tps": 360888, "wall": 5274.8} {"step": 29047, "train_loss": 3.076796293258667, "lr": 4.219860087222821e-05, "tps": 360556, "wall": 5279.9} {"step": 29048, "train_loss": 3.0060086250305176, "lr": 4.219561669003106e-05, "tps": 360223, "wall": 5284.9} {"step": 29049, "train_loss": 3.0285019874572754, "lr": 4.219263452201157e-05, "tps": 359890, "wall": 5290.0} {"step": 29050, "train_loss": 3.0533523559570312, "lr": 4.218965436820354e-05, "tps": 359558, "wall": 5295.1} {"step": 29051, "train_loss": 3.0661232471466064, "lr": 4.218667622864072e-05, "tps": 359222, "wall": 5300.2} {"step": 29052, "train_loss": 3.034723997116089, "lr": 4.2183700103356865e-05, "tps": 358892, "wall": 5305.3} {"step": 29053, "train_loss": 3.0881571769714355, "lr": 4.218072599238567e-05, "tps": 358548, "wall": 5310.5} {"step": 29054, "train_loss": 3.1264123916625977, "lr": 4.217775389576082e-05, "tps": 358207, "wall": 5315.8} {"step": 29055, "train_loss": 3.0218262672424316, "lr": 4.217478381351599e-05, "tps": 357881, "wall": 5320.8} {"step": 29056, "train_loss": 3.0655858516693115, "lr": 4.217181574568486e-05, "tps": 357560, "wall": 5325.8} {"step": 29057, "train_loss": 3.0459611415863037, "lr": 4.2168849692300996e-05, "tps": 357234, "wall": 5330.8} {"step": 29058, "train_loss": 3.11240291595459, "lr": 4.216588565339802e-05, "tps": 356912, "wall": 5335.8} {"step": 29059, "train_loss": 3.0710854530334473, "lr": 4.216292362900953e-05, "tps": 356589, "wall": 5340.8} {"step": 29060, "train_loss": 3.021721363067627, "lr": 4.215996361916906e-05, "tps": 356264, "wall": 5345.9} {"step": 29061, "train_loss": 2.9585580825805664, "lr": 4.215700562391012e-05, "tps": 355943, "wall": 5350.9} {"step": 29062, "train_loss": 3.0273056030273438, "lr": 4.215404964326626e-05, "tps": 355621, "wall": 5355.9} {"step": 29063, "train_loss": 2.9120028018951416, "lr": 4.215109567727093e-05, "tps": 355292, "wall": 5361.0} {"step": 29064, "train_loss": 2.9794797897338867, "lr": 4.2148143725957626e-05, "tps": 354969, "wall": 5366.1} {"step": 29065, "train_loss": 3.0482847690582275, "lr": 4.214519378935979e-05, "tps": 354637, "wall": 5371.3} {"step": 29066, "train_loss": 3.023226737976074, "lr": 4.2142245867510776e-05, "tps": 354319, "wall": 5376.3} {"step": 29067, "train_loss": 2.989797353744507, "lr": 4.213929996044405e-05, "tps": 353997, "wall": 5381.4} {"step": 29068, "train_loss": 3.1055898666381836, "lr": 4.213635606819296e-05, "tps": 353677, "wall": 5386.5} {"step": 29069, "train_loss": 3.0241594314575195, "lr": 4.2133414190790835e-05, "tps": 353360, "wall": 5391.5} {"step": 29070, "train_loss": 2.9837183952331543, "lr": 4.213047432827103e-05, "tps": 353044, "wall": 5396.5} {"step": 29071, "train_loss": 3.036717176437378, "lr": 4.212753648066684e-05, "tps": 352729, "wall": 5401.5} {"step": 29072, "train_loss": 3.0274438858032227, "lr": 4.212460064801152e-05, "tps": 352415, "wall": 5406.5} {"step": 29073, "train_loss": 3.002650260925293, "lr": 4.2121666830338355e-05, "tps": 352100, "wall": 5411.5} {"step": 29074, "train_loss": 3.024153232574463, "lr": 4.211873502768057e-05, "tps": 351788, "wall": 5416.5} {"step": 29075, "train_loss": 3.0458106994628906, "lr": 4.211580524007137e-05, "tps": 351473, "wall": 5421.5} {"step": 29076, "train_loss": 3.008924961090088, "lr": 4.211287746754398e-05, "tps": 351162, "wall": 5426.5} {"step": 29077, "train_loss": 3.086707592010498, "lr": 4.210995171013151e-05, "tps": 350848, "wall": 5431.6} {"step": 29078, "train_loss": 3.056382894515991, "lr": 4.210702796786714e-05, "tps": 350536, "wall": 5436.6} {"step": 29079, "train_loss": 3.0343141555786133, "lr": 4.210410624078397e-05, "tps": 350223, "wall": 5441.6} {"step": 29080, "train_loss": 2.972137451171875, "lr": 4.210118652891511e-05, "tps": 349912, "wall": 5446.7} {"step": 29081, "train_loss": 2.9769463539123535, "lr": 4.209826883229365e-05, "tps": 349602, "wall": 5451.7} {"step": 29082, "train_loss": 2.889554977416992, "lr": 4.209535315095262e-05, "tps": 349293, "wall": 5456.7} {"step": 29083, "train_loss": 3.062512159347534, "lr": 4.209243948492505e-05, "tps": 348985, "wall": 5461.7} {"step": 29084, "train_loss": 3.068155527114868, "lr": 4.2089527834243974e-05, "tps": 348678, "wall": 5466.7} {"step": 29085, "train_loss": 2.9657955169677734, "lr": 4.208661819894232e-05, "tps": 348367, "wall": 5471.7} {"step": 29086, "train_loss": 3.073791027069092, "lr": 4.208371057905308e-05, "tps": 348052, "wall": 5476.9} {"step": 29087, "train_loss": 3.1031508445739746, "lr": 4.208080497460921e-05, "tps": 347741, "wall": 5482.0} {"step": 29088, "train_loss": 2.9944286346435547, "lr": 4.2077901385643586e-05, "tps": 347429, "wall": 5487.1} {"step": 29089, "train_loss": 3.0429892539978027, "lr": 4.207499981218914e-05, "tps": 347117, "wall": 5492.2} {"step": 29090, "train_loss": 3.1373672485351562, "lr": 4.207210025427871e-05, "tps": 346811, "wall": 5497.2} {"step": 29091, "train_loss": 3.034928798675537, "lr": 4.206920271194516e-05, "tps": 346506, "wall": 5502.3} {"step": 29092, "train_loss": 3.1147892475128174, "lr": 4.206630718522129e-05, "tps": 346201, "wall": 5507.3} {"step": 29093, "train_loss": 3.052727699279785, "lr": 4.206341367413995e-05, "tps": 345899, "wall": 5512.3} {"step": 29094, "train_loss": 3.0876035690307617, "lr": 4.206052217873386e-05, "tps": 345599, "wall": 5517.3} {"step": 29095, "train_loss": 3.0823512077331543, "lr": 4.2057632699035816e-05, "tps": 345297, "wall": 5522.3} {"step": 29096, "train_loss": 3.0197551250457764, "lr": 4.2054745235078516e-05, "tps": 344996, "wall": 5527.3} {"step": 29097, "train_loss": 3.0333542823791504, "lr": 4.205185978689471e-05, "tps": 344695, "wall": 5532.3} {"step": 29098, "train_loss": 3.121659755706787, "lr": 4.2048976354517046e-05, "tps": 344395, "wall": 5537.3} {"step": 29099, "train_loss": 3.0230367183685303, "lr": 4.204609493797822e-05, "tps": 344096, "wall": 5542.3} {"step": 29100, "train_loss": 3.070310354232788, "lr": 4.2043215537310856e-05, "tps": 343797, "wall": 5547.3} {"step": 29101, "train_loss": 3.0423924922943115, "lr": 4.2040338152547566e-05, "tps": 343490, "wall": 5552.5} {"step": 29102, "train_loss": 2.8616931438446045, "lr": 4.203746278372096e-05, "tps": 343190, "wall": 5557.5} {"step": 29103, "train_loss": 3.004089832305908, "lr": 4.20345894308636e-05, "tps": 342890, "wall": 5562.6} {"step": 29104, "train_loss": 3.007432460784912, "lr": 4.2031718094008035e-05, "tps": 342587, "wall": 5567.7} {"step": 29105, "train_loss": 3.0497426986694336, "lr": 4.20288487731868e-05, "tps": 342294, "wall": 5572.7} {"step": 29106, "train_loss": 2.9864563941955566, "lr": 4.202598146843238e-05, "tps": 342001, "wall": 5577.6} {"step": 29107, "train_loss": 3.0124564170837402, "lr": 4.2023116179777286e-05, "tps": 341707, "wall": 5582.6} {"step": 29108, "train_loss": 2.922273635864258, "lr": 4.202025290725395e-05, "tps": 341411, "wall": 5587.6} {"step": 29109, "train_loss": 2.9471566677093506, "lr": 4.201739165089482e-05, "tps": 341113, "wall": 5592.7} {"step": 29110, "train_loss": 3.0276033878326416, "lr": 4.201453241073233e-05, "tps": 340812, "wall": 5597.9} {"step": 29111, "train_loss": 3.0460665225982666, "lr": 4.201167518679882e-05, "tps": 340516, "wall": 5602.9} {"step": 29112, "train_loss": 2.989515781402588, "lr": 4.200881997912669e-05, "tps": 340222, "wall": 5607.9} {"step": 29113, "train_loss": 2.965423107147217, "lr": 4.200596678774827e-05, "tps": 339927, "wall": 5613.0} {"step": 29114, "train_loss": 2.9895710945129395, "lr": 4.2003115612695894e-05, "tps": 339633, "wall": 5618.1} {"step": 29115, "train_loss": 3.115302085876465, "lr": 4.200026645400186e-05, "tps": 339340, "wall": 5623.1} {"step": 29116, "train_loss": 3.1494760513305664, "lr": 4.199741931169842e-05, "tps": 339047, "wall": 5628.1} {"step": 29117, "train_loss": 3.086167573928833, "lr": 4.199457418581785e-05, "tps": 338755, "wall": 5633.2} {"step": 29118, "train_loss": 3.000232458114624, "lr": 4.199173107639238e-05, "tps": 338463, "wall": 5638.3} {"step": 29119, "train_loss": 2.971544027328491, "lr": 4.198888998345421e-05, "tps": 338174, "wall": 5643.3} {"step": 29120, "train_loss": 2.9787814617156982, "lr": 4.198605090703551e-05, "tps": 337883, "wall": 5648.3} {"step": 29121, "train_loss": 3.0969643592834473, "lr": 4.1983213847168476e-05, "tps": 337593, "wall": 5653.4} {"step": 29122, "train_loss": 3.064967155456543, "lr": 4.1980378803885226e-05, "tps": 337304, "wall": 5658.4} {"step": 29123, "train_loss": 3.1277575492858887, "lr": 4.197754577721786e-05, "tps": 337016, "wall": 5663.4} {"step": 29124, "train_loss": 3.0607895851135254, "lr": 4.1974714767198494e-05, "tps": 336727, "wall": 5668.5} {"step": 29125, "train_loss": 3.123631238937378, "lr": 4.197188577385919e-05, "tps": 336437, "wall": 5673.6} {"step": 29126, "train_loss": 3.113171100616455, "lr": 4.1969058797232e-05, "tps": 336152, "wall": 5678.6} {"step": 29127, "train_loss": 3.091308355331421, "lr": 4.1966233837348937e-05, "tps": 335865, "wall": 5683.6} {"step": 29128, "train_loss": 3.0509932041168213, "lr": 4.1963410894242e-05, "tps": 335578, "wall": 5688.7} {"step": 29129, "train_loss": 2.9742236137390137, "lr": 4.196058996794319e-05, "tps": 335291, "wall": 5693.8} {"step": 29130, "train_loss": 3.0109305381774902, "lr": 4.1957771058484454e-05, "tps": 335004, "wall": 5698.8} {"step": 29131, "train_loss": 2.9831156730651855, "lr": 4.1954954165897706e-05, "tps": 334721, "wall": 5703.8} {"step": 29132, "train_loss": 3.1805224418640137, "lr": 4.195213929021487e-05, "tps": 334432, "wall": 5709.0} {"step": 29133, "train_loss": 3.057356357574463, "lr": 4.194932643146784e-05, "tps": 334142, "wall": 5714.1} {"step": 29134, "train_loss": 3.0517215728759766, "lr": 4.1946515589688464e-05, "tps": 333856, "wall": 5719.2} {"step": 29135, "train_loss": 3.162588357925415, "lr": 4.19437067649086e-05, "tps": 333572, "wall": 5724.3} {"step": 29136, "train_loss": 3.023751974105835, "lr": 4.194089995716006e-05, "tps": 333288, "wall": 5729.3} {"step": 29137, "train_loss": 3.0633254051208496, "lr": 4.193809516647461e-05, "tps": 333002, "wall": 5734.5} {"step": 29138, "train_loss": 3.042097330093384, "lr": 4.193529239288407e-05, "tps": 332720, "wall": 5739.5} {"step": 29139, "train_loss": 2.9523088932037354, "lr": 4.1932491636420184e-05, "tps": 332442, "wall": 5744.5} {"step": 29140, "train_loss": 3.015899419784546, "lr": 4.1929692897114655e-05, "tps": 332165, "wall": 5749.5} {"step": 29141, "train_loss": 3.025587558746338, "lr": 4.1926896174999205e-05, "tps": 331887, "wall": 5754.5} {"step": 29142, "train_loss": 3.0614302158355713, "lr": 4.19241014701055e-05, "tps": 331608, "wall": 5759.5} {"step": 29143, "train_loss": 2.950089454650879, "lr": 4.192130878246522e-05, "tps": 331333, "wall": 5764.5} {"step": 29144, "train_loss": 3.0350427627563477, "lr": 4.191851811210997e-05, "tps": 331057, "wall": 5769.5} {"step": 29145, "train_loss": 3.126096725463867, "lr": 4.191572945907138e-05, "tps": 330781, "wall": 5774.5} {"step": 29146, "train_loss": 3.0257914066314697, "lr": 4.191294282338107e-05, "tps": 330508, "wall": 5779.5} {"step": 29147, "train_loss": 3.023660659790039, "lr": 4.191015820507055e-05, "tps": 330233, "wall": 5784.5} {"step": 29148, "train_loss": 3.041449785232544, "lr": 4.190737560417139e-05, "tps": 329955, "wall": 5789.6} {"step": 29149, "train_loss": 3.1366772651672363, "lr": 4.1904595020715124e-05, "tps": 329677, "wall": 5794.7} {"step": 29150, "train_loss": 2.997854471206665, "lr": 4.190181645473325e-05, "tps": 329402, "wall": 5799.7} {"step": 29151, "train_loss": 3.035682201385498, "lr": 4.189903990625721e-05, "tps": 329126, "wall": 5804.8} {"step": 29152, "train_loss": 3.0483717918395996, "lr": 4.1896265375318515e-05, "tps": 328854, "wall": 5809.8} {"step": 29153, "train_loss": 3.0633885860443115, "lr": 4.1893492861948546e-05, "tps": 328583, "wall": 5814.8} {"step": 29154, "train_loss": 3.0802531242370605, "lr": 4.189072236617871e-05, "tps": 328311, "wall": 5819.8} {"step": 29155, "train_loss": 3.0554089546203613, "lr": 4.188795388804041e-05, "tps": 328040, "wall": 5824.8} {"step": 29156, "train_loss": 3.044009208679199, "lr": 4.188518742756503e-05, "tps": 327770, "wall": 5829.8} {"step": 29157, "train_loss": 3.0988926887512207, "lr": 4.1882422984783867e-05, "tps": 327500, "wall": 5834.8} {"step": 29158, "train_loss": 3.0370001792907715, "lr": 4.187966055972824e-05, "tps": 327229, "wall": 5839.8} {"step": 29159, "train_loss": 2.952711582183838, "lr": 4.187690015242946e-05, "tps": 326961, "wall": 5844.8} {"step": 29160, "train_loss": 3.0811872482299805, "lr": 4.187414176291879e-05, "tps": 326686, "wall": 5849.9} {"step": 29161, "train_loss": 2.9884352684020996, "lr": 4.18713853912275e-05, "tps": 326417, "wall": 5855.0} {"step": 29162, "train_loss": 3.1219394207000732, "lr": 4.186863103738676e-05, "tps": 326149, "wall": 5860.0} {"step": 29163, "train_loss": 3.0323033332824707, "lr": 4.186587870142783e-05, "tps": 325880, "wall": 5865.0} {"step": 29164, "train_loss": 3.0556092262268066, "lr": 4.186312838338187e-05, "tps": 325611, "wall": 5870.1} {"step": 29165, "train_loss": 3.0438597202301025, "lr": 4.186038008327999e-05, "tps": 325342, "wall": 5875.1} {"step": 29166, "train_loss": 2.9428465366363525, "lr": 4.18576338011534e-05, "tps": 325073, "wall": 5880.2} {"step": 29167, "train_loss": 3.002559185028076, "lr": 4.1854889537033154e-05, "tps": 324802, "wall": 5885.3} {"step": 29168, "train_loss": 2.9644436836242676, "lr": 4.185214729095034e-05, "tps": 324531, "wall": 5890.4} {"step": 29169, "train_loss": 3.0225954055786133, "lr": 4.1849407062936064e-05, "tps": 324259, "wall": 5895.5} {"step": 29170, "train_loss": 2.916916608810425, "lr": 4.1846668853021354e-05, "tps": 323991, "wall": 5900.6} {"step": 29171, "train_loss": 3.066603660583496, "lr": 4.184393266123719e-05, "tps": 323721, "wall": 5905.7} {"step": 29172, "train_loss": 2.98264741897583, "lr": 4.18411984876146e-05, "tps": 323448, "wall": 5910.9} {"step": 29173, "train_loss": 3.072859287261963, "lr": 4.183846633218456e-05, "tps": 323183, "wall": 5916.0} {"step": 29174, "train_loss": 3.09443998336792, "lr": 4.1835736194978014e-05, "tps": 322920, "wall": 5921.0} {"step": 29175, "train_loss": 2.9850075244903564, "lr": 4.183300807602587e-05, "tps": 322658, "wall": 5926.0} {"step": 29176, "train_loss": 3.019162654876709, "lr": 4.183028197535906e-05, "tps": 322396, "wall": 5931.0} {"step": 29177, "train_loss": 3.0161304473876953, "lr": 4.1827557893008454e-05, "tps": 322135, "wall": 5936.0} {"step": 29178, "train_loss": 3.0403480529785156, "lr": 4.182483582900493e-05, "tps": 321876, "wall": 5941.0} {"step": 29179, "train_loss": 2.98905348777771, "lr": 4.182211578337927e-05, "tps": 321616, "wall": 5946.0} {"step": 29180, "train_loss": 2.943852424621582, "lr": 4.181939775616234e-05, "tps": 321357, "wall": 5951.0} {"step": 29181, "train_loss": 3.0432138442993164, "lr": 4.181668174738492e-05, "tps": 321098, "wall": 5956.0} {"step": 29182, "train_loss": 2.9716851711273193, "lr": 4.181396775707774e-05, "tps": 320838, "wall": 5961.1} {"step": 29183, "train_loss": 3.052337169647217, "lr": 4.18112557852716e-05, "tps": 320580, "wall": 5966.1} {"step": 29184, "train_loss": 2.9397990703582764, "lr": 4.18085458319972e-05, "tps": 320314, "wall": 5971.2} {"step": 29185, "train_loss": 2.9582693576812744, "lr": 4.1805837897285216e-05, "tps": 320055, "wall": 5976.3} {"step": 29186, "train_loss": 3.106910228729248, "lr": 4.1803131981166345e-05, "tps": 319798, "wall": 5981.3} {"step": 29187, "train_loss": 3.0078492164611816, "lr": 4.180042808367124e-05, "tps": 319541, "wall": 5986.3} {"step": 29188, "train_loss": 2.9276413917541504, "lr": 4.1797726204830496e-05, "tps": 319282, "wall": 5991.3} {"step": 29189, "train_loss": 3.150722026824951, "lr": 4.179502634467479e-05, "tps": 319021, "wall": 5996.4} {"step": 29190, "train_loss": 3.093202590942383, "lr": 4.179232850323465e-05, "tps": 318763, "wall": 6001.5} {"step": 29191, "train_loss": 3.021637439727783, "lr": 4.178963268054065e-05, "tps": 318507, "wall": 6006.5} {"step": 29192, "train_loss": 2.9706614017486572, "lr": 4.178693887662334e-05, "tps": 318252, "wall": 6011.6} {"step": 29193, "train_loss": 3.033501148223877, "lr": 4.178424709151323e-05, "tps": 317999, "wall": 6016.5} {"step": 29194, "train_loss": 3.050011396408081, "lr": 4.17815573252408e-05, "tps": 317747, "wall": 6021.5} {"step": 29195, "train_loss": 3.0514090061187744, "lr": 4.177886957783652e-05, "tps": 317494, "wall": 6026.5} {"step": 29196, "train_loss": 3.0759551525115967, "lr": 4.177618384933087e-05, "tps": 317237, "wall": 6031.6} {"step": 29197, "train_loss": 3.100998878479004, "lr": 4.177350013975424e-05, "tps": 316987, "wall": 6036.6} {"step": 29198, "train_loss": 2.9992282390594482, "lr": 4.177081844913705e-05, "tps": 316735, "wall": 6041.6} {"step": 29199, "train_loss": 3.1621956825256348, "lr": 4.176813877750966e-05, "tps": 316484, "wall": 6046.6} {"step": 29200, "train_loss": 3.1034231185913086, "lr": 4.176546112490244e-05, "tps": 316234, "wall": 6051.6} {"step": 29201, "train_loss": 3.12626314163208, "lr": 4.1762785491345725e-05, "tps": 315984, "wall": 6056.6} {"step": 29202, "train_loss": 3.0230557918548584, "lr": 4.176011187686979e-05, "tps": 315733, "wall": 6061.6} {"step": 29203, "train_loss": 3.0895285606384277, "lr": 4.1757440281505e-05, "tps": 315485, "wall": 6066.6} {"step": 29204, "train_loss": 3.0958642959594727, "lr": 4.1754770705281536e-05, "tps": 315236, "wall": 6071.6} {"step": 29205, "train_loss": 3.094226837158203, "lr": 4.175210314822967e-05, "tps": 314985, "wall": 6076.6} {"step": 29206, "train_loss": 3.058908462524414, "lr": 4.1749437610379645e-05, "tps": 314733, "wall": 6081.7} {"step": 29207, "train_loss": 3.0114095211029053, "lr": 4.174677409176162e-05, "tps": 314481, "wall": 6086.8} {"step": 29208, "train_loss": 3.072462797164917, "lr": 4.1744112592405775e-05, "tps": 314225, "wall": 6091.9} {"step": 29209, "train_loss": 3.0088729858398438, "lr": 4.174145311234226e-05, "tps": 313974, "wall": 6097.0} {"step": 29210, "train_loss": 2.9618945121765137, "lr": 4.1738795651601244e-05, "tps": 313725, "wall": 6102.1} {"step": 29211, "train_loss": 3.0291836261749268, "lr": 4.173614021021275e-05, "tps": 313478, "wall": 6107.1} {"step": 29212, "train_loss": 3.0259382724761963, "lr": 4.1733486788206934e-05, "tps": 313230, "wall": 6112.1} {"step": 29213, "train_loss": 3.067143440246582, "lr": 4.173083538561381e-05, "tps": 312985, "wall": 6117.1} {"step": 29214, "train_loss": 3.0780863761901855, "lr": 4.172818600246343e-05, "tps": 312732, "wall": 6122.3} {"step": 29215, "train_loss": 3.0383641719818115, "lr": 4.172553863878581e-05, "tps": 312484, "wall": 6127.3} {"step": 29216, "train_loss": 3.0415093898773193, "lr": 4.1722893294610914e-05, "tps": 312238, "wall": 6132.4} {"step": 29217, "train_loss": 3.0759024620056152, "lr": 4.172024996996874e-05, "tps": 311991, "wall": 6137.4} {"step": 29218, "train_loss": 3.072641372680664, "lr": 4.171760866488923e-05, "tps": 311744, "wall": 6142.5} {"step": 29219, "train_loss": 2.985712766647339, "lr": 4.171496937940229e-05, "tps": 311496, "wall": 6147.6} {"step": 29220, "train_loss": 3.0102739334106445, "lr": 4.171233211353782e-05, "tps": 311251, "wall": 6152.7} {"step": 29221, "train_loss": 3.0480258464813232, "lr": 4.1709696867325696e-05, "tps": 311010, "wall": 6157.6} {"step": 29222, "train_loss": 3.0308773517608643, "lr": 4.170706364079575e-05, "tps": 310768, "wall": 6162.7} {"step": 29223, "train_loss": 3.0692403316497803, "lr": 4.170443243397787e-05, "tps": 310526, "wall": 6167.7} {"step": 29224, "train_loss": 3.0725624561309814, "lr": 4.1701803246901786e-05, "tps": 310283, "wall": 6172.7} {"step": 29225, "train_loss": 3.0787458419799805, "lr": 4.169917607959735e-05, "tps": 310040, "wall": 6177.8} {"step": 29226, "train_loss": 3.0322365760803223, "lr": 4.169655093209429e-05, "tps": 309799, "wall": 6182.8} {"step": 29227, "train_loss": 3.0456044673919678, "lr": 4.1693927804422336e-05, "tps": 309556, "wall": 6187.8} {"step": 29228, "train_loss": 3.24062180519104, "lr": 4.169130669661122e-05, "tps": 309317, "wall": 6192.8} {"step": 29229, "train_loss": 2.9769489765167236, "lr": 4.168868760869062e-05, "tps": 309077, "wall": 6197.9} {"step": 29230, "train_loss": 3.048964738845825, "lr": 4.1686070540690206e-05, "tps": 308836, "wall": 6202.9} {"step": 29231, "train_loss": 2.977170467376709, "lr": 4.1683455492639666e-05, "tps": 308598, "wall": 6207.9} {"step": 29232, "train_loss": 3.0307064056396484, "lr": 4.1680842464568566e-05, "tps": 308353, "wall": 6213.0} {"step": 29233, "train_loss": 2.926119327545166, "lr": 4.1678231456506525e-05, "tps": 308111, "wall": 6218.1} {"step": 29234, "train_loss": 2.992858648300171, "lr": 4.167562246848315e-05, "tps": 307866, "wall": 6223.3} {"step": 29235, "train_loss": 3.065622329711914, "lr": 4.167301550052794e-05, "tps": 307627, "wall": 6228.3} {"step": 29236, "train_loss": 3.050601005554199, "lr": 4.167041055267047e-05, "tps": 307390, "wall": 6233.4} {"step": 29237, "train_loss": 3.0845065116882324, "lr": 4.166780762494024e-05, "tps": 307151, "wall": 6238.4} {"step": 29238, "train_loss": 3.082130193710327, "lr": 4.166520671736672e-05, "tps": 306912, "wall": 6243.5} {"step": 29239, "train_loss": 2.9653029441833496, "lr": 4.166260782997939e-05, "tps": 306675, "wall": 6248.5} {"step": 29240, "train_loss": 3.0413951873779297, "lr": 4.166001096280771e-05, "tps": 306440, "wall": 6253.5} {"step": 29241, "train_loss": 3.037120819091797, "lr": 4.165741611588106e-05, "tps": 306205, "wall": 6258.6} {"step": 29242, "train_loss": 3.068291425704956, "lr": 4.165482328922884e-05, "tps": 305966, "wall": 6263.6} {"step": 29243, "train_loss": 3.0528998374938965, "lr": 4.165223248288042e-05, "tps": 305733, "wall": 6268.6} {"step": 29244, "train_loss": 3.0819344520568848, "lr": 4.1649643696865186e-05, "tps": 305496, "wall": 6273.7} {"step": 29245, "train_loss": 3.0139174461364746, "lr": 4.1647056931212426e-05, "tps": 305262, "wall": 6278.7} {"step": 29246, "train_loss": 3.139923095703125, "lr": 4.164447218595144e-05, "tps": 305026, "wall": 6283.8} {"step": 29247, "train_loss": 3.1696810722351074, "lr": 4.164188946111155e-05, "tps": 304793, "wall": 6288.8} {"step": 29248, "train_loss": 3.145326852798462, "lr": 4.1639308756721964e-05, "tps": 304561, "wall": 6293.8} {"step": 29249, "train_loss": 3.0968384742736816, "lr": 4.163673007281194e-05, "tps": 304325, "wall": 6298.9} {"step": 29250, "train_loss": 3.0028843879699707, "lr": 4.163415340941069e-05, "tps": 304088, "wall": 6304.1} {"step": 29251, "train_loss": 3.1151695251464844, "lr": 4.1631578766547405e-05, "tps": 303852, "wall": 6309.2} {"step": 29252, "train_loss": 3.1104671955108643, "lr": 4.1629006144251256e-05, "tps": 303620, "wall": 6314.2} {"step": 29253, "train_loss": 3.0639920234680176, "lr": 4.162643554255135e-05, "tps": 303391, "wall": 6319.2} {"step": 29254, "train_loss": 3.010634660720825, "lr": 4.162386696147683e-05, "tps": 303161, "wall": 6324.2} {"step": 29255, "train_loss": 3.0355141162872314, "lr": 4.16213004010568e-05, "tps": 302933, "wall": 6329.2} {"step": 29256, "train_loss": 2.981858968734741, "lr": 4.161873586132035e-05, "tps": 302701, "wall": 6334.2} {"step": 29257, "train_loss": 3.037888765335083, "lr": 4.161617334229649e-05, "tps": 302473, "wall": 6339.2} {"step": 29258, "train_loss": 2.9652392864227295, "lr": 4.1613612844014275e-05, "tps": 302245, "wall": 6344.2} {"step": 29259, "train_loss": 3.1352455615997314, "lr": 4.1611054366502706e-05, "tps": 302019, "wall": 6349.2} {"step": 29260, "train_loss": 3.0416178703308105, "lr": 4.160849790979077e-05, "tps": 301791, "wall": 6354.2} {"step": 29261, "train_loss": 3.048285484313965, "lr": 4.1605943473907404e-05, "tps": 301564, "wall": 6359.2} {"step": 29262, "train_loss": 3.0753390789031982, "lr": 4.160339105888157e-05, "tps": 301336, "wall": 6364.3} {"step": 29263, "train_loss": 2.9621737003326416, "lr": 4.160084066474217e-05, "tps": 301106, "wall": 6369.3} {"step": 29264, "train_loss": 3.019015312194824, "lr": 4.159829229151811e-05, "tps": 300878, "wall": 6374.4} {"step": 29265, "train_loss": 2.891934394836426, "lr": 4.159574593923824e-05, "tps": 300653, "wall": 6379.4} {"step": 29266, "train_loss": 3.047076463699341, "lr": 4.15932016079314e-05, "tps": 300426, "wall": 6384.4} {"step": 29267, "train_loss": 3.0303874015808105, "lr": 4.159065929762642e-05, "tps": 300200, "wall": 6389.4} {"step": 29268, "train_loss": 2.91451096534729, "lr": 4.1588119008352125e-05, "tps": 299968, "wall": 6394.6} {"step": 29269, "train_loss": 2.9433295726776123, "lr": 4.1585580740137277e-05, "tps": 299735, "wall": 6399.8} {"step": 29270, "train_loss": 3.105403423309326, "lr": 4.15830444930106e-05, "tps": 299504, "wall": 6404.9} {"step": 29271, "train_loss": 2.9801759719848633, "lr": 4.158051026700086e-05, "tps": 299274, "wall": 6410.1} {"step": 29272, "train_loss": 3.037627696990967, "lr": 4.1577978062136745e-05, "tps": 299046, "wall": 6415.2} {"step": 29273, "train_loss": 3.0788257122039795, "lr": 4.157544787844692e-05, "tps": 298820, "wall": 6420.2} {"step": 29274, "train_loss": 3.0696606636047363, "lr": 4.157291971596012e-05, "tps": 298595, "wall": 6425.3} {"step": 29275, "train_loss": 3.085404872894287, "lr": 4.15703935747049e-05, "tps": 298369, "wall": 6430.4} {"step": 29276, "train_loss": 3.113255739212036, "lr": 4.156786945470995e-05, "tps": 298145, "wall": 6435.4} {"step": 29277, "train_loss": 3.047520875930786, "lr": 4.15653473560038e-05, "tps": 297920, "wall": 6440.5} {"step": 29278, "train_loss": 3.1046760082244873, "lr": 4.156282727861506e-05, "tps": 297697, "wall": 6445.6} {"step": 29279, "train_loss": 2.9855737686157227, "lr": 4.156030922257228e-05, "tps": 297469, "wall": 6450.7} {"step": 29280, "train_loss": 3.1446852684020996, "lr": 4.155779318790395e-05, "tps": 297247, "wall": 6455.8} {"step": 29281, "train_loss": 2.9904050827026367, "lr": 4.1555279174638584e-05, "tps": 297024, "wall": 6460.8} {"step": 29282, "train_loss": 3.004031181335449, "lr": 4.15527671828047e-05, "tps": 296802, "wall": 6465.9} {"step": 29283, "train_loss": 3.006439447402954, "lr": 4.1550257212430696e-05, "tps": 296559, "wall": 6471.4} {"step": 29284, "train_loss": 3.067958354949951, "lr": 4.1547749263545055e-05, "tps": 296329, "wall": 6476.6} {"step": 29285, "train_loss": 2.968228578567505, "lr": 4.154524333617614e-05, "tps": 296103, "wall": 6481.8} {"step": 29286, "train_loss": 3.0686726570129395, "lr": 4.1542739430352387e-05, "tps": 295876, "wall": 6487.0} {"step": 29287, "train_loss": 3.016099214553833, "lr": 4.154023754610211e-05, "tps": 295657, "wall": 6492.0} {"step": 29288, "train_loss": 3.0239434242248535, "lr": 4.15377376834537e-05, "tps": 295425, "wall": 6497.4} {"step": 29289, "train_loss": 3.0723929405212402, "lr": 4.1535239842435444e-05, "tps": 295201, "wall": 6502.5} {"step": 29290, "train_loss": 3.0557727813720703, "lr": 4.1532744023075634e-05, "tps": 294974, "wall": 6507.7} {"step": 29291, "train_loss": 2.9996705055236816, "lr": 4.153025022540257e-05, "tps": 294751, "wall": 6512.9} {"step": 29292, "train_loss": 2.9753940105438232, "lr": 4.152775844944449e-05, "tps": 294532, "wall": 6517.9} {"step": 29293, "train_loss": 3.0582146644592285, "lr": 4.1525268695229606e-05, "tps": 294315, "wall": 6523.0} {"step": 29294, "train_loss": 3.053196907043457, "lr": 4.1522780962786146e-05, "tps": 294094, "wall": 6528.1} {"step": 29295, "train_loss": 2.9988455772399902, "lr": 4.152029525214226e-05, "tps": 293874, "wall": 6533.2} {"step": 29296, "train_loss": 3.030010461807251, "lr": 4.1517811563326134e-05, "tps": 293654, "wall": 6538.3} {"step": 29297, "train_loss": 3.041494607925415, "lr": 4.15153298963659e-05, "tps": 293435, "wall": 6543.4} {"step": 29298, "train_loss": 3.0261266231536865, "lr": 4.1512850251289654e-05, "tps": 293215, "wall": 6548.6} {"step": 29299, "train_loss": 2.9683852195739746, "lr": 4.15103726281255e-05, "tps": 292993, "wall": 6553.8} {"step": 29300, "train_loss": 3.0452637672424316, "lr": 4.1507897026901503e-05, "tps": 292774, "wall": 6558.9} {"step": 29301, "train_loss": 3.114182472229004, "lr": 4.15054234476457e-05, "tps": 292561, "wall": 6563.9} {"step": 29302, "train_loss": 2.8925838470458984, "lr": 4.1502951890386125e-05, "tps": 292339, "wall": 6569.1} {"step": 29303, "train_loss": 3.029506206512451, "lr": 4.150048235515078e-05, "tps": 292117, "wall": 6574.3} {"step": 29304, "train_loss": 3.1425585746765137, "lr": 4.14980148419676e-05, "tps": 291905, "wall": 6579.3} {"step": 29305, "train_loss": 3.0308103561401367, "lr": 4.1495549350864584e-05, "tps": 291688, "wall": 6584.4} {"step": 29306, "train_loss": 2.9818990230560303, "lr": 4.1493085881869633e-05, "tps": 291474, "wall": 6589.5} {"step": 29307, "train_loss": 3.111640453338623, "lr": 4.149062443501065e-05, "tps": 291259, "wall": 6594.6} {"step": 29308, "train_loss": 3.056462049484253, "lr": 4.148816501031555e-05, "tps": 291045, "wall": 6599.6} {"step": 29309, "train_loss": 3.0113673210144043, "lr": 4.148570760781216e-05, "tps": 290832, "wall": 6604.7} {"step": 29310, "train_loss": 3.032611846923828, "lr": 4.148325222752835e-05, "tps": 290621, "wall": 6609.7} {"step": 29311, "train_loss": 2.964524269104004, "lr": 4.14807988694919e-05, "tps": 290413, "wall": 6614.7} {"step": 29312, "train_loss": 3.0774669647216797, "lr": 4.1478347533730626e-05, "tps": 290203, "wall": 6619.7} {"step": 29313, "train_loss": 2.9905991554260254, "lr": 4.1475898220272295e-05, "tps": 289996, "wall": 6624.6} {"step": 29314, "train_loss": 3.060483694076538, "lr": 4.1473450929144645e-05, "tps": 289787, "wall": 6629.6} {"step": 29315, "train_loss": 3.146002769470215, "lr": 4.147100566037538e-05, "tps": 289579, "wall": 6634.6} {"step": 29316, "train_loss": 2.991546630859375, "lr": 4.1468562413992246e-05, "tps": 289372, "wall": 6639.6} {"step": 29317, "train_loss": 3.115490198135376, "lr": 4.1466121190022894e-05, "tps": 289165, "wall": 6644.6} {"step": 29318, "train_loss": 3.0908498764038086, "lr": 4.146368198849495e-05, "tps": 288959, "wall": 6649.6} {"step": 29319, "train_loss": 2.9668331146240234, "lr": 4.1461244809436105e-05, "tps": 288753, "wall": 6654.5} {"step": 29320, "train_loss": 3.167037010192871, "lr": 4.145880965287393e-05, "tps": 288548, "wall": 6659.5} {"step": 29321, "train_loss": 3.076453924179077, "lr": 4.145637651883602e-05, "tps": 288343, "wall": 6664.4} {"step": 29322, "train_loss": 3.0948379039764404, "lr": 4.145394540734994e-05, "tps": 288138, "wall": 6669.4} {"step": 29323, "train_loss": 3.095552444458008, "lr": 4.145151631844322e-05, "tps": 287933, "wall": 6674.4} {"step": 29324, "train_loss": 3.014326810836792, "lr": 4.144908925214336e-05, "tps": 287729, "wall": 6679.3} {"step": 29325, "train_loss": 3.0612754821777344, "lr": 4.14466642084779e-05, "tps": 287524, "wall": 6684.3} {"step": 29326, "train_loss": 3.1351990699768066, "lr": 4.144424118747429e-05, "tps": 287320, "wall": 6689.3} {"step": 29327, "train_loss": 3.0316123962402344, "lr": 4.144182018915996e-05, "tps": 287113, "wall": 6694.4} {"step": 29328, "train_loss": 3.0187597274780273, "lr": 4.1439401213562374e-05, "tps": 286911, "wall": 6699.3} {"step": 29329, "train_loss": 3.173966884613037, "lr": 4.1436984260708894e-05, "tps": 286708, "wall": 6704.3} {"step": 29330, "train_loss": 3.013091564178467, "lr": 4.143456933062691e-05, "tps": 286502, "wall": 6709.3} {"step": 29331, "train_loss": 3.129978656768799, "lr": 4.143215642334381e-05, "tps": 286299, "wall": 6714.3} {"step": 29332, "train_loss": 3.112630844116211, "lr": 4.142974553888688e-05, "tps": 286096, "wall": 6719.3} {"step": 29333, "train_loss": 3.027456045150757, "lr": 4.142733667728345e-05, "tps": 285894, "wall": 6724.3} {"step": 29334, "train_loss": 2.9793648719787598, "lr": 4.1424929838560825e-05, "tps": 285691, "wall": 6729.3} {"step": 29335, "train_loss": 2.9676454067230225, "lr": 4.1422525022746264e-05, "tps": 285490, "wall": 6734.2} {"step": 29336, "train_loss": 3.0003395080566406, "lr": 4.142012222986698e-05, "tps": 285289, "wall": 6739.2} {"step": 29337, "train_loss": 3.0598201751708984, "lr": 4.141772145995024e-05, "tps": 285088, "wall": 6744.2} {"step": 29338, "train_loss": 3.0254921913146973, "lr": 4.141532271302316e-05, "tps": 284887, "wall": 6749.2} {"step": 29339, "train_loss": 3.075505256652832, "lr": 4.141292598911301e-05, "tps": 284683, "wall": 6754.3} {"step": 29340, "train_loss": 2.9144275188446045, "lr": 4.141053128824688e-05, "tps": 284483, "wall": 6759.2} {"step": 29341, "train_loss": 3.009587287902832, "lr": 4.140813861045193e-05, "tps": 284283, "wall": 6764.2} {"step": 29342, "train_loss": 3.1515111923217773, "lr": 4.140574795575523e-05, "tps": 284074, "wall": 6769.4} {"step": 29343, "train_loss": 3.15725040435791, "lr": 4.140335932418389e-05, "tps": 283866, "wall": 6774.6} {"step": 29344, "train_loss": 2.9860246181488037, "lr": 4.140097271576494e-05, "tps": 283664, "wall": 6779.7} {"step": 29345, "train_loss": 3.019704818725586, "lr": 4.1398588130525454e-05, "tps": 283460, "wall": 6784.8} {"step": 29346, "train_loss": 3.037278890609741, "lr": 4.1396205568492406e-05, "tps": 283258, "wall": 6789.9} {"step": 29347, "train_loss": 3.1263339519500732, "lr": 4.1393825029692826e-05, "tps": 283057, "wall": 6794.9} {"step": 29348, "train_loss": 2.9930779933929443, "lr": 4.139144651415364e-05, "tps": 282857, "wall": 6800.0} {"step": 29349, "train_loss": 3.086803436279297, "lr": 4.138907002190181e-05, "tps": 282657, "wall": 6805.0} {"step": 29350, "train_loss": 2.9783921241760254, "lr": 4.138669555296426e-05, "tps": 282453, "wall": 6810.1} {"step": 29351, "train_loss": 3.1195666790008545, "lr": 4.13843231073679e-05, "tps": 282256, "wall": 6815.1} {"step": 29352, "train_loss": 3.0851621627807617, "lr": 4.1381952685139574e-05, "tps": 282058, "wall": 6820.1} {"step": 29353, "train_loss": 2.9323983192443848, "lr": 4.1379584286306144e-05, "tps": 281860, "wall": 6825.2} {"step": 29354, "train_loss": 3.1552176475524902, "lr": 4.137721791089446e-05, "tps": 281663, "wall": 6830.2} {"step": 29355, "train_loss": 3.072418689727783, "lr": 4.1374853558931306e-05, "tps": 281465, "wall": 6835.2} {"step": 29356, "train_loss": 2.9782347679138184, "lr": 4.13724912304435e-05, "tps": 281269, "wall": 6840.2} {"step": 29357, "train_loss": 2.9816854000091553, "lr": 4.1370130925457764e-05, "tps": 281074, "wall": 6845.2} {"step": 29358, "train_loss": 2.9936563968658447, "lr": 4.136777264400082e-05, "tps": 280880, "wall": 6850.1} {"step": 29359, "train_loss": 3.019068717956543, "lr": 4.1365416386099456e-05, "tps": 280685, "wall": 6855.1} {"step": 29360, "train_loss": 3.1072816848754883, "lr": 4.136306215178029e-05, "tps": 280488, "wall": 6860.2} {"step": 29361, "train_loss": 3.064704418182373, "lr": 4.136070994107003e-05, "tps": 280292, "wall": 6865.2} {"step": 29362, "train_loss": 3.0157690048217773, "lr": 4.1358359753995304e-05, "tps": 280094, "wall": 6870.3} {"step": 29363, "train_loss": 3.0579259395599365, "lr": 4.135601159058275e-05, "tps": 279900, "wall": 6875.3} {"step": 29364, "train_loss": 2.988162040710449, "lr": 4.1353665450858956e-05, "tps": 279707, "wall": 6880.3} {"step": 29365, "train_loss": 3.025073766708374, "lr": 4.135132133485051e-05, "tps": 279513, "wall": 6885.3} {"step": 29366, "train_loss": 3.071279525756836, "lr": 4.1348979242583964e-05, "tps": 279320, "wall": 6890.3} {"step": 29367, "train_loss": 3.0181236267089844, "lr": 4.1346639174085825e-05, "tps": 279125, "wall": 6895.3} {"step": 29368, "train_loss": 3.081505537033081, "lr": 4.134430112938264e-05, "tps": 278932, "wall": 6900.3} {"step": 29369, "train_loss": 3.0884056091308594, "lr": 4.134196510850087e-05, "tps": 278739, "wall": 6905.3} {"step": 29370, "train_loss": 2.9657230377197266, "lr": 4.1339631111467006e-05, "tps": 278547, "wall": 6910.3} {"step": 29371, "train_loss": 2.980710029602051, "lr": 4.1337299138307455e-05, "tps": 278356, "wall": 6915.3} {"step": 29372, "train_loss": 2.994635820388794, "lr": 4.133496918904863e-05, "tps": 278165, "wall": 6920.3} {"step": 29373, "train_loss": 3.0605340003967285, "lr": 4.133264126371694e-05, "tps": 277975, "wall": 6925.3} {"step": 29374, "train_loss": 3.073430299758911, "lr": 4.133031536233877e-05, "tps": 277782, "wall": 6930.3} {"step": 29375, "train_loss": 3.073564052581787, "lr": 4.1327991484940454e-05, "tps": 277592, "wall": 6935.3} {"step": 29376, "train_loss": 3.001495599746704, "lr": 4.1325669631548306e-05, "tps": 277401, "wall": 6940.3} {"step": 29377, "train_loss": 3.018047571182251, "lr": 4.132334980218866e-05, "tps": 277212, "wall": 6945.3} {"step": 29378, "train_loss": 3.0683982372283936, "lr": 4.1321031996887744e-05, "tps": 277023, "wall": 6950.2} {"step": 29379, "train_loss": 3.0125246047973633, "lr": 4.131871621567185e-05, "tps": 276834, "wall": 6955.2} {"step": 29380, "train_loss": 3.0685460567474365, "lr": 4.131640245856723e-05, "tps": 276643, "wall": 6960.3} {"step": 29381, "train_loss": 3.095975399017334, "lr": 4.131409072560003e-05, "tps": 276453, "wall": 6965.3} {"step": 29382, "train_loss": 3.0046205520629883, "lr": 4.1311781016796515e-05, "tps": 276264, "wall": 6970.3} {"step": 29383, "train_loss": 3.070585250854492, "lr": 4.1309473332182775e-05, "tps": 276075, "wall": 6975.3} {"step": 29384, "train_loss": 2.9826738834381104, "lr": 4.130716767178501e-05, "tps": 275887, "wall": 6980.3} {"step": 29385, "train_loss": 3.0561914443969727, "lr": 4.130486403562932e-05, "tps": 275696, "wall": 6985.4} {"step": 29386, "train_loss": 3.1020307540893555, "lr": 4.13025624237418e-05, "tps": 275502, "wall": 6990.5} {"step": 29387, "train_loss": 3.165618419647217, "lr": 4.130026283614851e-05, "tps": 275313, "wall": 6995.6} {"step": 29388, "train_loss": 3.0163350105285645, "lr": 4.1297965272875514e-05, "tps": 275126, "wall": 7000.6} {"step": 29389, "train_loss": 3.163522243499756, "lr": 4.129566973394882e-05, "tps": 274940, "wall": 7005.5} {"step": 29390, "train_loss": 3.0304503440856934, "lr": 4.129337621939446e-05, "tps": 274752, "wall": 7010.6} {"step": 29391, "train_loss": 3.04934024810791, "lr": 4.129108472923842e-05, "tps": 274564, "wall": 7015.6} {"step": 29392, "train_loss": 3.0471386909484863, "lr": 4.128879526350662e-05, "tps": 274378, "wall": 7020.6} {"step": 29393, "train_loss": 2.9998538494110107, "lr": 4.128650782222501e-05, "tps": 274191, "wall": 7025.6} {"step": 29394, "train_loss": 3.0406453609466553, "lr": 4.128422240541953e-05, "tps": 274005, "wall": 7030.6} {"step": 29395, "train_loss": 3.0646872520446777, "lr": 4.1281939013116e-05, "tps": 273819, "wall": 7035.6} {"step": 29396, "train_loss": 3.117544651031494, "lr": 4.1279657645340375e-05, "tps": 273631, "wall": 7040.7} {"step": 29397, "train_loss": 3.052213668823242, "lr": 4.127737830211847e-05, "tps": 273442, "wall": 7045.8} {"step": 29398, "train_loss": 3.024702787399292, "lr": 4.1275100983476044e-05, "tps": 273254, "wall": 7050.9} {"step": 29399, "train_loss": 3.017958879470825, "lr": 4.127282568943899e-05, "tps": 273067, "wall": 7056.0} {"step": 29400, "train_loss": 3.065072774887085, "lr": 4.127055242003301e-05, "tps": 272882, "wall": 7061.0} {"step": 29401, "train_loss": 3.0792365074157715, "lr": 4.1268281175283874e-05, "tps": 272698, "wall": 7066.0} {"step": 29402, "train_loss": 3.022798538208008, "lr": 4.126601195521734e-05, "tps": 272515, "wall": 7071.0} {"step": 29403, "train_loss": 3.093925714492798, "lr": 4.126374475985907e-05, "tps": 272329, "wall": 7076.1} {"step": 29404, "train_loss": 3.0103416442871094, "lr": 4.12614795892348e-05, "tps": 272145, "wall": 7081.1} {"step": 29405, "train_loss": 2.999375820159912, "lr": 4.125921644337012e-05, "tps": 271962, "wall": 7086.1} {"step": 29406, "train_loss": 2.980860471725464, "lr": 4.1256955322290736e-05, "tps": 271780, "wall": 7091.1} {"step": 29407, "train_loss": 2.961825370788574, "lr": 4.125469622602222e-05, "tps": 271597, "wall": 7096.1} {"step": 29408, "train_loss": 3.156345844268799, "lr": 4.1252439154590186e-05, "tps": 271415, "wall": 7101.1} {"step": 29409, "train_loss": 3.082486629486084, "lr": 4.125018410802017e-05, "tps": 271228, "wall": 7106.2} {"step": 29410, "train_loss": 3.029024600982666, "lr": 4.124793108633775e-05, "tps": 271042, "wall": 7111.3} {"step": 29411, "train_loss": 3.1331255435943604, "lr": 4.124568008956845e-05, "tps": 270859, "wall": 7116.4} {"step": 29412, "train_loss": 3.0718986988067627, "lr": 4.1243431117737726e-05, "tps": 270679, "wall": 7121.4} {"step": 29413, "train_loss": 2.9792990684509277, "lr": 4.124118417087112e-05, "tps": 270499, "wall": 7126.4} {"step": 29414, "train_loss": 3.0966649055480957, "lr": 4.1238939248994025e-05, "tps": 270320, "wall": 7131.3} {"step": 29415, "train_loss": 3.0072176456451416, "lr": 4.1236696352131905e-05, "tps": 270139, "wall": 7136.3} {"step": 29416, "train_loss": 3.04109525680542, "lr": 4.1234455480310165e-05, "tps": 269957, "wall": 7141.4} {"step": 29417, "train_loss": 3.0104963779449463, "lr": 4.1232216633554155e-05, "tps": 269772, "wall": 7146.5} {"step": 29418, "train_loss": 3.124323606491089, "lr": 4.1229979811889306e-05, "tps": 269591, "wall": 7151.6} {"step": 29419, "train_loss": 2.968057632446289, "lr": 4.122774501534089e-05, "tps": 269412, "wall": 7156.6} {"step": 29420, "train_loss": 2.9957141876220703, "lr": 4.122551224393427e-05, "tps": 269232, "wall": 7161.6} {"step": 29421, "train_loss": 3.0121817588806152, "lr": 4.122328149769472e-05, "tps": 269053, "wall": 7166.6} {"step": 29422, "train_loss": 3.042755126953125, "lr": 4.1221052776647504e-05, "tps": 268873, "wall": 7171.7} {"step": 29423, "train_loss": 2.9810922145843506, "lr": 4.121882608081786e-05, "tps": 268693, "wall": 7176.7} {"step": 29424, "train_loss": 2.9692819118499756, "lr": 4.121660141023103e-05, "tps": 268511, "wall": 7181.8} {"step": 29425, "train_loss": 3.025559425354004, "lr": 4.121437876491222e-05, "tps": 268334, "wall": 7186.8} {"step": 29426, "train_loss": 3.0127182006835938, "lr": 4.1212158144886595e-05, "tps": 268154, "wall": 7191.8} {"step": 29427, "train_loss": 2.9427270889282227, "lr": 4.1209939550179314e-05, "tps": 267973, "wall": 7197.0} {"step": 29428, "train_loss": 3.09731125831604, "lr": 4.120772298081551e-05, "tps": 267793, "wall": 7202.0} {"step": 29429, "train_loss": 3.014441728591919, "lr": 4.120550843682029e-05, "tps": 267614, "wall": 7207.1} {"step": 29430, "train_loss": 3.1062397956848145, "lr": 4.120329591821874e-05, "tps": 267436, "wall": 7212.1} {"step": 29431, "train_loss": 3.047832489013672, "lr": 4.120108542503595e-05, "tps": 267258, "wall": 7217.2} {"step": 29432, "train_loss": 3.1036312580108643, "lr": 4.1198876957296915e-05, "tps": 267071, "wall": 7222.5} {"step": 29433, "train_loss": 3.007889747619629, "lr": 4.1196670515026684e-05, "tps": 266885, "wall": 7227.8} {"step": 29434, "train_loss": 3.0970211029052734, "lr": 4.1194466098250225e-05, "tps": 266696, "wall": 7233.1} {"step": 29435, "train_loss": 3.040539264678955, "lr": 4.119226370699254e-05, "tps": 266512, "wall": 7238.4} {"step": 29436, "train_loss": 3.026258945465088, "lr": 4.119006334127857e-05, "tps": 266329, "wall": 7243.6} {"step": 29437, "train_loss": 3.0298664569854736, "lr": 4.118786500113323e-05, "tps": 266151, "wall": 7248.7} {"step": 29438, "train_loss": 3.04445743560791, "lr": 4.118566868658144e-05, "tps": 265972, "wall": 7253.8} {"step": 29439, "train_loss": 2.9618759155273438, "lr": 4.1183474397648066e-05, "tps": 265792, "wall": 7259.0} {"step": 29440, "train_loss": 3.0100364685058594, "lr": 4.118128213435795e-05, "tps": 265612, "wall": 7264.1} {"step": 29441, "train_loss": 2.8434665203094482, "lr": 4.1179091896735955e-05, "tps": 265433, "wall": 7269.3} {"step": 29442, "train_loss": 3.0482282638549805, "lr": 4.117690368480688e-05, "tps": 265255, "wall": 7274.4} {"step": 29443, "train_loss": 3.043470859527588, "lr": 4.117471749859552e-05, "tps": 265078, "wall": 7279.5} {"step": 29444, "train_loss": 2.9270589351654053, "lr": 4.117253333812663e-05, "tps": 264898, "wall": 7284.7} {"step": 29445, "train_loss": 3.055912971496582, "lr": 4.117035120342496e-05, "tps": 264718, "wall": 7289.9} {"step": 29446, "train_loss": 3.0582966804504395, "lr": 4.116817109451522e-05, "tps": 264541, "wall": 7295.0} {"step": 29447, "train_loss": 3.0739083290100098, "lr": 4.116599301142211e-05, "tps": 264363, "wall": 7300.2} {"step": 29448, "train_loss": 3.0652811527252197, "lr": 4.11638169541703e-05, "tps": 264183, "wall": 7305.4} {"step": 29449, "train_loss": 2.855668067932129, "lr": 4.116164292278446e-05, "tps": 264002, "wall": 7310.7} {"step": 29450, "train_loss": 2.961793899536133, "lr": 4.11594709172892e-05, "tps": 263820, "wall": 7316.0} {"step": 29451, "train_loss": 3.0474953651428223, "lr": 4.1157300937709145e-05, "tps": 263637, "wall": 7321.3} {"step": 29452, "train_loss": 2.9819841384887695, "lr": 4.1155132984068834e-05, "tps": 263456, "wall": 7326.6} {"step": 29453, "train_loss": 3.018883466720581, "lr": 4.1152967056392886e-05, "tps": 263277, "wall": 7331.8} {"step": 29454, "train_loss": 2.8314456939697266, "lr": 4.1150803154705764e-05, "tps": 263099, "wall": 7337.0} {"step": 29455, "train_loss": 3.0903782844543457, "lr": 4.114864127903203e-05, "tps": 262920, "wall": 7342.3} {"step": 29456, "train_loss": 2.9415712356567383, "lr": 4.114648142939619e-05, "tps": 262740, "wall": 7347.5} {"step": 29457, "train_loss": 2.9862899780273438, "lr": 4.1144323605822644e-05, "tps": 262558, "wall": 7352.9} {"step": 29458, "train_loss": 3.115694046020508, "lr": 4.11421678083359e-05, "tps": 262385, "wall": 7358.0} {"step": 29459, "train_loss": 3.1035685539245605, "lr": 4.114001403696035e-05, "tps": 262206, "wall": 7363.2} {"step": 29460, "train_loss": 3.1069533824920654, "lr": 4.1137862291720384e-05, "tps": 262030, "wall": 7368.4} {"step": 29461, "train_loss": 3.0150415897369385, "lr": 4.113571257264042e-05, "tps": 261855, "wall": 7373.6} {"step": 29462, "train_loss": 3.1223998069763184, "lr": 4.1133564879744753e-05, "tps": 261678, "wall": 7378.8} {"step": 29463, "train_loss": 2.974487066268921, "lr": 4.113141921305775e-05, "tps": 261502, "wall": 7384.1} {"step": 29464, "train_loss": 2.9837093353271484, "lr": 4.112927557260372e-05, "tps": 261326, "wall": 7389.3} {"step": 29465, "train_loss": 3.0608160495758057, "lr": 4.11271339584069e-05, "tps": 261148, "wall": 7394.6} {"step": 29466, "train_loss": 3.1013693809509277, "lr": 4.112499437049162e-05, "tps": 260969, "wall": 7399.9} {"step": 29467, "train_loss": 3.040130615234375, "lr": 4.112285680888207e-05, "tps": 260791, "wall": 7405.2} {"step": 29468, "train_loss": 3.1117777824401855, "lr": 4.1120721273602455e-05, "tps": 260613, "wall": 7410.5} {"step": 29469, "train_loss": 3.083214044570923, "lr": 4.1118587764677005e-05, "tps": 260437, "wall": 7415.8} {"step": 29470, "train_loss": 2.987039566040039, "lr": 4.111645628212986e-05, "tps": 260258, "wall": 7421.1} {"step": 29471, "train_loss": 2.9554080963134766, "lr": 4.1114326825985186e-05, "tps": 260082, "wall": 7426.4} {"step": 29472, "train_loss": 3.0254015922546387, "lr": 4.111219939626709e-05, "tps": 259907, "wall": 7431.7} {"step": 29473, "train_loss": 2.9179534912109375, "lr": 4.1110073992999686e-05, "tps": 259733, "wall": 7436.9} {"step": 29474, "train_loss": 3.0928239822387695, "lr": 4.110795061620703e-05, "tps": 259557, "wall": 7442.2} {"step": 29475, "train_loss": 3.135192394256592, "lr": 4.110582926591319e-05, "tps": 259382, "wall": 7447.4} {"step": 29476, "train_loss": 2.987196445465088, "lr": 4.1103709942142186e-05, "tps": 259211, "wall": 7452.6} {"step": 29477, "train_loss": 2.9828293323516846, "lr": 4.110159264491804e-05, "tps": 259041, "wall": 7457.8} {"step": 29478, "train_loss": 3.124655246734619, "lr": 4.109947737426475e-05, "tps": 258871, "wall": 7462.9} {"step": 29479, "train_loss": 3.11106538772583, "lr": 4.109736413020622e-05, "tps": 258700, "wall": 7468.1} {"step": 29480, "train_loss": 2.976391315460205, "lr": 4.109525291276645e-05, "tps": 258526, "wall": 7473.4} {"step": 29481, "train_loss": 3.018143653869629, "lr": 4.109314372196936e-05, "tps": 258357, "wall": 7478.5} {"step": 29482, "train_loss": 2.9878792762756348, "lr": 4.109103655783878e-05, "tps": 258188, "wall": 7483.7} {"step": 29483, "train_loss": 2.9400577545166016, "lr": 4.1088931420398624e-05, "tps": 258021, "wall": 7488.8} {"step": 29484, "train_loss": 2.950248956680298, "lr": 4.1086828309672736e-05, "tps": 257850, "wall": 7494.0} {"step": 29485, "train_loss": 3.005201816558838, "lr": 4.108472722568492e-05, "tps": 257678, "wall": 7499.2} {"step": 29486, "train_loss": 2.9918336868286133, "lr": 4.1082628168459026e-05, "tps": 257510, "wall": 7504.4} {"step": 29487, "train_loss": 2.9560129642486572, "lr": 4.108053113801877e-05, "tps": 257341, "wall": 7509.6} {"step": 29488, "train_loss": 2.9630608558654785, "lr": 4.107843613438795e-05, "tps": 257172, "wall": 7514.8} {"step": 29489, "train_loss": 3.064202070236206, "lr": 4.107634315759028e-05, "tps": 257004, "wall": 7519.9} {"step": 29490, "train_loss": 3.0763344764709473, "lr": 4.1074252207649486e-05, "tps": 256835, "wall": 7525.1} {"step": 29491, "train_loss": 3.0766797065734863, "lr": 4.107216328458922e-05, "tps": 256658, "wall": 7530.6} {"step": 29492, "train_loss": 2.9269189834594727, "lr": 4.10700763884332e-05, "tps": 256476, "wall": 7536.2} {"step": 29493, "train_loss": 3.089414119720459, "lr": 4.1067991519205016e-05, "tps": 256309, "wall": 7541.4} {"step": 29494, "train_loss": 2.951956033706665, "lr": 4.1065908676928285e-05, "tps": 256126, "wall": 7547.0} {"step": 29495, "train_loss": 3.08241868019104, "lr": 4.1063827861626646e-05, "tps": 255962, "wall": 7552.1} {"step": 29496, "train_loss": 2.9423909187316895, "lr": 4.106174907332363e-05, "tps": 255799, "wall": 7557.2} {"step": 29497, "train_loss": 3.0057454109191895, "lr": 4.1059672312042824e-05, "tps": 255633, "wall": 7562.3} {"step": 29498, "train_loss": 3.055436134338379, "lr": 4.105759757780771e-05, "tps": 255466, "wall": 7567.5} {"step": 29499, "train_loss": 3.072570562362671, "lr": 4.105552487064181e-05, "tps": 255299, "wall": 7572.7} {"step": 29500, "train_loss": 2.8806207180023193, "lr": 4.105345419056863e-05, "tps": 255138, "wall": 7577.8} {"step": 29501, "train_loss": 3.0309455394744873, "lr": 4.105138553761159e-05, "tps": 254964, "wall": 7583.2} {"step": 29502, "train_loss": 2.9692959785461426, "lr": 4.1049318911794114e-05, "tps": 254796, "wall": 7588.4} {"step": 29503, "train_loss": 3.114201068878174, "lr": 4.1047254313139654e-05, "tps": 254617, "wall": 7594.0} {"step": 29504, "train_loss": 3.021314859390259, "lr": 4.1045191741671576e-05, "tps": 254444, "wall": 7599.5} {"step": 29505, "train_loss": 2.950995922088623, "lr": 4.104313119741325e-05, "tps": 254270, "wall": 7604.9} {"step": 29506, "train_loss": 2.9134504795074463, "lr": 4.1041072680388016e-05, "tps": 254094, "wall": 7610.4} {"step": 29507, "train_loss": 3.0309247970581055, "lr": 4.103901619061918e-05, "tps": 253925, "wall": 7615.8} {"step": 29508, "train_loss": 3.031499147415161, "lr": 4.1036961728130054e-05, "tps": 253756, "wall": 7621.1} {"step": 29509, "train_loss": 3.0808773040771484, "lr": 4.1034909292943926e-05, "tps": 253587, "wall": 7626.4} {"step": 29510, "train_loss": 2.9793732166290283, "lr": 4.1032858885084e-05, "tps": 253421, "wall": 7631.7} {"step": 29511, "train_loss": 3.047863006591797, "lr": 4.103081050457355e-05, "tps": 253256, "wall": 7636.9} {"step": 29512, "train_loss": 3.0956945419311523, "lr": 4.102876415143575e-05, "tps": 253094, "wall": 7642.1} {"step": 29513, "train_loss": 3.158762216567993, "lr": 4.1026719825693805e-05, "tps": 252931, "wall": 7647.2} {"step": 29514, "train_loss": 3.055171489715576, "lr": 4.102467752737085e-05, "tps": 252763, "wall": 7652.6} {"step": 29515, "train_loss": 3.0610926151275635, "lr": 4.1022637256490023e-05, "tps": 252599, "wall": 7657.8} {"step": 29516, "train_loss": 3.0295748710632324, "lr": 4.102059901307446e-05, "tps": 252435, "wall": 7663.1} {"step": 29517, "train_loss": 3.067826509475708, "lr": 4.101856279714722e-05, "tps": 252272, "wall": 7668.3} {"step": 29518, "train_loss": 3.1139304637908936, "lr": 4.1016528608731394e-05, "tps": 252109, "wall": 7673.5} {"step": 29519, "train_loss": 2.920100212097168, "lr": 4.101449644785e-05, "tps": 251944, "wall": 7678.8} {"step": 29520, "train_loss": 3.0691206455230713, "lr": 4.1012466314526096e-05, "tps": 251782, "wall": 7684.0} {"step": 29521, "train_loss": 3.0938913822174072, "lr": 4.1010438208782624e-05, "tps": 251619, "wall": 7689.2} {"step": 29522, "train_loss": 2.9716196060180664, "lr": 4.1008412130642626e-05, "tps": 251455, "wall": 7694.5} {"step": 29523, "train_loss": 3.025082588195801, "lr": 4.100638808012899e-05, "tps": 251287, "wall": 7699.9} {"step": 29524, "train_loss": 3.1056604385375977, "lr": 4.100436605726469e-05, "tps": 251124, "wall": 7705.2} {"step": 29525, "train_loss": 2.9215519428253174, "lr": 4.100234606207261e-05, "tps": 250957, "wall": 7710.5} {"step": 29526, "train_loss": 2.891542911529541, "lr": 4.1000328094575644e-05, "tps": 250792, "wall": 7715.9} {"step": 29527, "train_loss": 2.9424099922180176, "lr": 4.0998312154796636e-05, "tps": 250627, "wall": 7721.2} {"step": 29528, "train_loss": 3.037820339202881, "lr": 4.0996298242758444e-05, "tps": 250462, "wall": 7726.6} {"step": 29529, "train_loss": 3.151980400085449, "lr": 4.099428635848387e-05, "tps": 250304, "wall": 7731.7} {"step": 29530, "train_loss": 3.078848361968994, "lr": 4.099227650199569e-05, "tps": 250145, "wall": 7736.9} {"step": 29531, "train_loss": 3.0489606857299805, "lr": 4.099026867331669e-05, "tps": 249985, "wall": 7742.1} {"step": 29532, "train_loss": 2.9807915687561035, "lr": 4.0988262872469616e-05, "tps": 249827, "wall": 7747.3} {"step": 29533, "train_loss": 3.0304808616638184, "lr": 4.098625909947717e-05, "tps": 249668, "wall": 7752.4} {"step": 29534, "train_loss": 2.9783310890197754, "lr": 4.098425735436208e-05, "tps": 249512, "wall": 7757.6} {"step": 29535, "train_loss": 3.10506534576416, "lr": 4.0982257637147e-05, "tps": 249351, "wall": 7762.8} {"step": 29536, "train_loss": 2.9695420265197754, "lr": 4.0980259947854594e-05, "tps": 249192, "wall": 7768.0} {"step": 29537, "train_loss": 3.020763874053955, "lr": 4.097826428650747e-05, "tps": 249025, "wall": 7773.5} {"step": 29538, "train_loss": 3.028866767883301, "lr": 4.097627065312829e-05, "tps": 248865, "wall": 7778.8} {"step": 29539, "train_loss": 3.0007362365722656, "lr": 4.0974279047739564e-05, "tps": 248707, "wall": 7784.0} {"step": 29540, "train_loss": 2.9536972045898438, "lr": 4.097228947036392e-05, "tps": 248548, "wall": 7789.2} {"step": 29541, "train_loss": 3.0132484436035156, "lr": 4.097030192102387e-05, "tps": 248392, "wall": 7794.4} {"step": 29542, "train_loss": 3.092088222503662, "lr": 4.0968316399741894e-05, "tps": 248236, "wall": 7799.5} {"step": 29543, "train_loss": 3.04587984085083, "lr": 4.096633290654053e-05, "tps": 248079, "wall": 7804.7} {"step": 29544, "train_loss": 3.01497745513916, "lr": 4.0964351441442235e-05, "tps": 247920, "wall": 7810.0} {"step": 29545, "train_loss": 3.0539820194244385, "lr": 4.096237200446944e-05, "tps": 247766, "wall": 7815.1} {"step": 29546, "train_loss": 2.9857985973358154, "lr": 4.09603945956446e-05, "tps": 247615, "wall": 7820.2} {"step": 29547, "train_loss": 3.079211950302124, "lr": 4.0958419214990084e-05, "tps": 247462, "wall": 7825.3} {"step": 29548, "train_loss": 3.0048677921295166, "lr": 4.095644586252829e-05, "tps": 247306, "wall": 7830.5} {"step": 29549, "train_loss": 3.0974793434143066, "lr": 4.095447453828155e-05, "tps": 247150, "wall": 7835.7} {"step": 29550, "train_loss": 3.0883822441101074, "lr": 4.0952505242272204e-05, "tps": 246995, "wall": 7840.8} {"step": 29551, "train_loss": 3.087855339050293, "lr": 4.095053797452258e-05, "tps": 246837, "wall": 7846.1} {"step": 29552, "train_loss": 3.0503458976745605, "lr": 4.094857273505496e-05, "tps": 246678, "wall": 7851.5} {"step": 29553, "train_loss": 3.0627636909484863, "lr": 4.094660952389157e-05, "tps": 246524, "wall": 7856.6} {"step": 29554, "train_loss": 3.03727388381958, "lr": 4.094464834105468e-05, "tps": 246368, "wall": 7861.9} {"step": 29555, "train_loss": 3.078474998474121, "lr": 4.094268918656652e-05, "tps": 246216, "wall": 7867.0} {"step": 29556, "train_loss": 3.140559673309326, "lr": 4.0940732060449225e-05, "tps": 246061, "wall": 7872.2} {"step": 29557, "train_loss": 3.010939359664917, "lr": 4.093877696272503e-05, "tps": 245909, "wall": 7877.4} {"step": 29558, "train_loss": 3.0405020713806152, "lr": 4.093682389341607e-05, "tps": 245756, "wall": 7882.5} {"step": 29559, "train_loss": 3.0814530849456787, "lr": 4.093487285254443e-05, "tps": 245598, "wall": 7887.9} {"step": 29560, "train_loss": 3.0060501098632812, "lr": 4.093292384013225e-05, "tps": 245443, "wall": 7893.1} {"step": 29561, "train_loss": 2.938549518585205, "lr": 4.093097685620159e-05, "tps": 245288, "wall": 7898.3} {"step": 29562, "train_loss": 3.0458996295928955, "lr": 4.092903190077452e-05, "tps": 245137, "wall": 7903.5} {"step": 29563, "train_loss": 2.975835084915161, "lr": 4.092708897387305e-05, "tps": 244984, "wall": 7908.7} {"step": 29564, "train_loss": 3.061495304107666, "lr": 4.092514807551922e-05, "tps": 244826, "wall": 7914.1} {"step": 29565, "train_loss": 3.0612740516662598, "lr": 4.092320920573499e-05, "tps": 244668, "wall": 7919.4} {"step": 29566, "train_loss": 2.954157829284668, "lr": 4.092127236454234e-05, "tps": 244512, "wall": 7924.8} {"step": 29567, "train_loss": 3.060359477996826, "lr": 4.0919337551963214e-05, "tps": 244356, "wall": 7930.1} {"step": 29568, "train_loss": 3.076561450958252, "lr": 4.09174047680195e-05, "tps": 244201, "wall": 7935.4} {"step": 29569, "train_loss": 3.0642337799072266, "lr": 4.091547401273311e-05, "tps": 244046, "wall": 7940.7} {"step": 29570, "train_loss": 2.9824299812316895, "lr": 4.091354528612592e-05, "tps": 243891, "wall": 7946.0} {"step": 29571, "train_loss": 3.048534393310547, "lr": 4.09116185882198e-05, "tps": 243736, "wall": 7951.3} {"step": 29572, "train_loss": 3.0875444412231445, "lr": 4.0909693919036535e-05, "tps": 243583, "wall": 7956.6} {"step": 29573, "train_loss": 3.0830636024475098, "lr": 4.090777127859796e-05, "tps": 243431, "wall": 7961.8} {"step": 29574, "train_loss": 3.026273727416992, "lr": 4.090585066692584e-05, "tps": 243279, "wall": 7967.1} {"step": 29575, "train_loss": 3.107926845550537, "lr": 4.090393208404191e-05, "tps": 243127, "wall": 7972.3} {"step": 29576, "train_loss": 3.1083292961120605, "lr": 4.090201552996795e-05, "tps": 242974, "wall": 7977.6} {"step": 29577, "train_loss": 3.106156349182129, "lr": 4.0900101004725625e-05, "tps": 242819, "wall": 7983.0} {"step": 29578, "train_loss": 3.072312831878662, "lr": 4.0898188508336674e-05, "tps": 242667, "wall": 7988.3} {"step": 29579, "train_loss": 3.0043249130249023, "lr": 4.08962780408227e-05, "tps": 242515, "wall": 7993.5} {"step": 29580, "train_loss": 3.0760958194732666, "lr": 4.089436960220541e-05, "tps": 242364, "wall": 7998.8} {"step": 29581, "train_loss": 3.022688388824463, "lr": 4.0892463192506364e-05, "tps": 242212, "wall": 8004.1} {"step": 29582, "train_loss": 3.0179672241210938, "lr": 4.089055881174719e-05, "tps": 242062, "wall": 8009.3} {"step": 29583, "train_loss": 3.015932559967041, "lr": 4.088865645994947e-05, "tps": 241908, "wall": 8014.7} {"step": 29584, "train_loss": 3.1099092960357666, "lr": 4.088675613713474e-05, "tps": 241760, "wall": 8019.8} {"step": 29585, "train_loss": 3.062246322631836, "lr": 4.0884857843324496e-05, "tps": 241611, "wall": 8025.1} {"step": 29586, "train_loss": 3.044206142425537, "lr": 4.08829615785403e-05, "tps": 241460, "wall": 8030.4} {"step": 29587, "train_loss": 3.1556715965270996, "lr": 4.088106734280359e-05, "tps": 241309, "wall": 8035.7} {"step": 29588, "train_loss": 3.0274271965026855, "lr": 4.087917513613586e-05, "tps": 241159, "wall": 8040.9} {"step": 29589, "train_loss": 2.989269971847534, "lr": 4.08772849585585e-05, "tps": 241009, "wall": 8046.2} {"step": 29590, "train_loss": 3.071791648864746, "lr": 4.087539681009297e-05, "tps": 240855, "wall": 8051.6} {"step": 29591, "train_loss": 3.154101848602295, "lr": 4.087351069076063e-05, "tps": 240706, "wall": 8056.9} {"step": 29592, "train_loss": 3.033421754837036, "lr": 4.087162660058284e-05, "tps": 240556, "wall": 8062.2} {"step": 29593, "train_loss": 3.0732436180114746, "lr": 4.086974453958095e-05, "tps": 240405, "wall": 8067.5} {"step": 29594, "train_loss": 3.0136427879333496, "lr": 4.086786450777629e-05, "tps": 240248, "wall": 8073.0} {"step": 29595, "train_loss": 3.0466859340667725, "lr": 4.0865986505190175e-05, "tps": 240101, "wall": 8078.3} {"step": 29596, "train_loss": 2.964402675628662, "lr": 4.0864110531843824e-05, "tps": 239941, "wall": 8083.9} {"step": 29597, "train_loss": 3.0284435749053955, "lr": 4.086223658775854e-05, "tps": 239789, "wall": 8089.3} {"step": 29598, "train_loss": 3.080448627471924, "lr": 4.0860364672955514e-05, "tps": 239640, "wall": 8094.6} {"step": 29599, "train_loss": 3.091564178466797, "lr": 4.0858494787455976e-05, "tps": 239492, "wall": 8099.9} {"step": 29600, "train_loss": 3.123934507369995, "lr": 4.08566269312811e-05, "tps": 239349, "wall": 8105.0} {"step": 29601, "train_loss": 3.025029420852661, "lr": 4.0854761104452065e-05, "tps": 239206, "wall": 8110.1} {"step": 29602, "train_loss": 3.0231165885925293, "lr": 4.085289730698996e-05, "tps": 239065, "wall": 8115.2} {"step": 29603, "train_loss": 2.988741874694824, "lr": 4.085103553891595e-05, "tps": 238924, "wall": 8120.2} {"step": 29604, "train_loss": 3.1569724082946777, "lr": 4.084917580025109e-05, "tps": 238785, "wall": 8125.3} {"step": 29605, "train_loss": 2.9763565063476562, "lr": 4.084731809101645e-05, "tps": 238643, "wall": 8130.4} {"step": 29606, "train_loss": 3.0131139755249023, "lr": 4.084546241123309e-05, "tps": 238504, "wall": 8135.4} {"step": 29607, "train_loss": 3.010061264038086, "lr": 4.0843608760922024e-05, "tps": 238366, "wall": 8140.4} {"step": 29608, "train_loss": 3.0912647247314453, "lr": 4.084175714010425e-05, "tps": 238225, "wall": 8145.4} {"step": 29609, "train_loss": 2.9869885444641113, "lr": 4.083990754880074e-05, "tps": 238083, "wall": 8150.6} {"step": 29610, "train_loss": 3.0883402824401855, "lr": 4.083805998703244e-05, "tps": 237944, "wall": 8155.6} {"step": 29611, "train_loss": 2.989126443862915, "lr": 4.083621445482031e-05, "tps": 237806, "wall": 8160.6} {"step": 29612, "train_loss": 3.032435655593872, "lr": 4.083437095218522e-05, "tps": 237667, "wall": 8165.7} {"step": 29613, "train_loss": 3.0548958778381348, "lr": 4.0832529479148085e-05, "tps": 237528, "wall": 8170.7} {"step": 29614, "train_loss": 3.018296003341675, "lr": 4.083069003572974e-05, "tps": 237390, "wall": 8175.8} {"step": 29615, "train_loss": 2.996396064758301, "lr": 4.082885262195101e-05, "tps": 237251, "wall": 8180.8} {"step": 29616, "train_loss": 2.925795316696167, "lr": 4.0827017237832764e-05, "tps": 237111, "wall": 8185.9} {"step": 29617, "train_loss": 2.986868381500244, "lr": 4.082518388339574e-05, "tps": 236970, "wall": 8191.1} {"step": 29618, "train_loss": 3.0692577362060547, "lr": 4.0823352558660745e-05, "tps": 236832, "wall": 8196.1} {"step": 29619, "train_loss": 3.0373504161834717, "lr": 4.0821523263648476e-05, "tps": 236695, "wall": 8201.2} {"step": 29620, "train_loss": 3.11446475982666, "lr": 4.081969599837973e-05, "tps": 236558, "wall": 8206.2} {"step": 29621, "train_loss": 3.0380971431732178, "lr": 4.081787076287511e-05, "tps": 236420, "wall": 8211.2} {"step": 29622, "train_loss": 2.9926376342773438, "lr": 4.081604755715537e-05, "tps": 236283, "wall": 8216.3} {"step": 29623, "train_loss": 2.994352102279663, "lr": 4.081422638124113e-05, "tps": 236146, "wall": 8221.3} {"step": 29624, "train_loss": 2.968881607055664, "lr": 4.0812407235153024e-05, "tps": 236010, "wall": 8226.4} {"step": 29625, "train_loss": 2.9157943725585938, "lr": 4.081059011891169e-05, "tps": 235874, "wall": 8231.4} {"step": 29626, "train_loss": 3.0487396717071533, "lr": 4.080877503253767e-05, "tps": 235738, "wall": 8236.4} {"step": 29627, "train_loss": 3.174222946166992, "lr": 4.0806961976051526e-05, "tps": 235601, "wall": 8241.5} {"step": 29628, "train_loss": 3.0281035900115967, "lr": 4.080515094947383e-05, "tps": 235466, "wall": 8246.4} {"step": 29629, "train_loss": 3.049549102783203, "lr": 4.0803341952825047e-05, "tps": 235328, "wall": 8251.6} {"step": 29630, "train_loss": 3.017605781555176, "lr": 4.080153498612573e-05, "tps": 235192, "wall": 8256.6} {"step": 29631, "train_loss": 3.1117124557495117, "lr": 4.0799730049396316e-05, "tps": 235057, "wall": 8261.6} {"step": 29632, "train_loss": 3.1064035892486572, "lr": 4.079792714265724e-05, "tps": 234923, "wall": 8266.6} {"step": 29633, "train_loss": 3.0518646240234375, "lr": 4.079612626592896e-05, "tps": 234789, "wall": 8271.6} {"step": 29634, "train_loss": 3.0201961994171143, "lr": 4.079432741923184e-05, "tps": 234657, "wall": 8276.6} {"step": 29635, "train_loss": 3.05867600440979, "lr": 4.079253060258629e-05, "tps": 234525, "wall": 8281.5} {"step": 29636, "train_loss": 2.8684089183807373, "lr": 4.079073581601263e-05, "tps": 234393, "wall": 8286.5} {"step": 29637, "train_loss": 3.085991859436035, "lr": 4.078894305953121e-05, "tps": 234262, "wall": 8291.4} {"step": 29638, "train_loss": 3.0068678855895996, "lr": 4.078715233316235e-05, "tps": 234129, "wall": 8296.3} {"step": 29639, "train_loss": 3.081598997116089, "lr": 4.078536363692632e-05, "tps": 233997, "wall": 8301.3} {"step": 29640, "train_loss": 3.068824291229248, "lr": 4.07835769708434e-05, "tps": 233862, "wall": 8306.4} {"step": 29641, "train_loss": 3.035982131958008, "lr": 4.078179233493379e-05, "tps": 233727, "wall": 8311.5} {"step": 29642, "train_loss": 3.078430652618408, "lr": 4.078000972921775e-05, "tps": 233595, "wall": 8316.4} {"step": 29643, "train_loss": 3.0539140701293945, "lr": 4.077822915371545e-05, "tps": 233463, "wall": 8321.4} {"step": 29644, "train_loss": 3.0650017261505127, "lr": 4.077645060844705e-05, "tps": 233332, "wall": 8326.4} {"step": 29645, "train_loss": 3.1146769523620605, "lr": 4.077467409343273e-05, "tps": 233202, "wall": 8331.3} {"step": 29646, "train_loss": 3.058471918106079, "lr": 4.07728996086926e-05, "tps": 233072, "wall": 8336.2} {"step": 29647, "train_loss": 2.9612045288085938, "lr": 4.0771127154246753e-05, "tps": 232942, "wall": 8341.2} {"step": 29648, "train_loss": 3.0856547355651855, "lr": 4.076935673011527e-05, "tps": 232812, "wall": 8346.1} {"step": 29649, "train_loss": 3.061967134475708, "lr": 4.076758833631822e-05, "tps": 232683, "wall": 8351.0} {"step": 29650, "train_loss": 3.1321678161621094, "lr": 4.076582197287562e-05, "tps": 232553, "wall": 8356.0} {"step": 29651, "train_loss": 3.1549088954925537, "lr": 4.07640576398075e-05, "tps": 232423, "wall": 8360.9} {"step": 29652, "train_loss": 3.0443081855773926, "lr": 4.076229533713381e-05, "tps": 232290, "wall": 8366.0} {"step": 29653, "train_loss": 3.0859124660491943, "lr": 4.076053506487456e-05, "tps": 232158, "wall": 8371.0} {"step": 29654, "train_loss": 3.0616328716278076, "lr": 4.075877682304964e-05, "tps": 232030, "wall": 8375.9} {"step": 29655, "train_loss": 3.047895908355713, "lr": 4.075702061167899e-05, "tps": 231902, "wall": 8380.8} {"step": 29656, "train_loss": 2.9816322326660156, "lr": 4.075526643078253e-05, "tps": 231774, "wall": 8385.7} {"step": 29657, "train_loss": 2.9589955806732178, "lr": 4.07535142803801e-05, "tps": 231647, "wall": 8390.6} {"step": 29658, "train_loss": 2.98260760307312, "lr": 4.0751764160491554e-05, "tps": 231520, "wall": 8395.5} {"step": 29659, "train_loss": 3.0060176849365234, "lr": 4.075001607113672e-05, "tps": 231393, "wall": 8400.4} {"step": 29660, "train_loss": 2.9841549396514893, "lr": 4.07482700123354e-05, "tps": 231266, "wall": 8405.3} {"step": 29661, "train_loss": 3.091954231262207, "lr": 4.074652598410739e-05, "tps": 231139, "wall": 8410.2} {"step": 29662, "train_loss": 3.103971004486084, "lr": 4.07447839864724e-05, "tps": 231012, "wall": 8415.1} {"step": 29663, "train_loss": 3.081900119781494, "lr": 4.074304401945022e-05, "tps": 230886, "wall": 8420.0} {"step": 29664, "train_loss": 3.0116419792175293, "lr": 4.0741306083060524e-05, "tps": 230760, "wall": 8424.9} {"step": 29665, "train_loss": 3.156456708908081, "lr": 4.073957017732303e-05, "tps": 230633, "wall": 8429.8} {"step": 29666, "train_loss": 3.050994634628296, "lr": 4.073783630225736e-05, "tps": 230504, "wall": 8434.8} {"step": 29667, "train_loss": 2.9748106002807617, "lr": 4.073610445788317e-05, "tps": 230378, "wall": 8439.7} {"step": 29668, "train_loss": 3.0849902629852295, "lr": 4.073437464422013e-05, "tps": 230250, "wall": 8444.7} {"step": 29669, "train_loss": 3.007678985595703, "lr": 4.0732646861287735e-05, "tps": 230121, "wall": 8449.7} {"step": 29670, "train_loss": 3.0986223220825195, "lr": 4.073092110910566e-05, "tps": 229994, "wall": 8454.6} {"step": 29671, "train_loss": 2.9970643520355225, "lr": 4.07291973876934e-05, "tps": 229870, "wall": 8459.5} {"step": 29672, "train_loss": 3.02333927154541, "lr": 4.0727475697070464e-05, "tps": 229745, "wall": 8464.4} {"step": 29673, "train_loss": 2.995577335357666, "lr": 4.072575603725642e-05, "tps": 229621, "wall": 8469.2} {"step": 29674, "train_loss": 3.0178024768829346, "lr": 4.072403840827069e-05, "tps": 229497, "wall": 8474.1} {"step": 29675, "train_loss": 3.020750045776367, "lr": 4.072232281013274e-05, "tps": 229373, "wall": 8478.9} {"step": 29676, "train_loss": 3.0959041118621826, "lr": 4.072060924286205e-05, "tps": 229248, "wall": 8483.9} {"step": 29677, "train_loss": 2.944301128387451, "lr": 4.0718897706477966e-05, "tps": 229116, "wall": 8489.0} {"step": 29678, "train_loss": 3.075453758239746, "lr": 4.071718820099991e-05, "tps": 228987, "wall": 8494.1} {"step": 29679, "train_loss": 3.009164810180664, "lr": 4.071548072644726e-05, "tps": 228860, "wall": 8499.1} {"step": 29680, "train_loss": 2.9003381729125977, "lr": 4.0713775282839346e-05, "tps": 228734, "wall": 8504.1} {"step": 29681, "train_loss": 3.0371789932250977, "lr": 4.071207187019547e-05, "tps": 228609, "wall": 8509.0} {"step": 29682, "train_loss": 3.0466156005859375, "lr": 4.0710370488534947e-05, "tps": 228482, "wall": 8514.0} {"step": 29683, "train_loss": 3.020843505859375, "lr": 4.070867113787704e-05, "tps": 228357, "wall": 8519.0} {"step": 29684, "train_loss": 2.962803840637207, "lr": 4.070697381824102e-05, "tps": 228233, "wall": 8523.9} {"step": 29685, "train_loss": 3.1182594299316406, "lr": 4.0705278529646095e-05, "tps": 228108, "wall": 8528.8} {"step": 29686, "train_loss": 3.0537991523742676, "lr": 4.070358527211147e-05, "tps": 227984, "wall": 8533.8} {"step": 29687, "train_loss": 3.079908609390259, "lr": 4.070189404565633e-05, "tps": 227860, "wall": 8538.7} {"step": 29688, "train_loss": 3.0552737712860107, "lr": 4.0700204850299856e-05, "tps": 227736, "wall": 8543.7} {"step": 29689, "train_loss": 3.048872709274292, "lr": 4.0698517686061136e-05, "tps": 227612, "wall": 8548.6} {"step": 29690, "train_loss": 3.0568461418151855, "lr": 4.069683255295932e-05, "tps": 227485, "wall": 8553.6} {"step": 29691, "train_loss": 3.0262181758880615, "lr": 4.0695149451013484e-05, "tps": 227360, "wall": 8558.6} {"step": 29692, "train_loss": 3.0719857215881348, "lr": 4.069346838024268e-05, "tps": 227237, "wall": 8563.5} {"step": 29693, "train_loss": 3.03061580657959, "lr": 4.0691789340665984e-05, "tps": 227115, "wall": 8568.4} {"step": 29694, "train_loss": 3.06205415725708, "lr": 4.069011233230239e-05, "tps": 226992, "wall": 8573.4} {"step": 29695, "train_loss": 3.072646379470825, "lr": 4.068843735517092e-05, "tps": 226869, "wall": 8578.3} {"step": 29696, "train_loss": 3.029588460922241, "lr": 4.068676440929051e-05, "tps": 226746, "wall": 8583.2} {"step": 29697, "train_loss": 3.0834498405456543, "lr": 4.068509349468015e-05, "tps": 226625, "wall": 8588.1} {"step": 29698, "train_loss": 3.121478796005249, "lr": 4.068342461135873e-05, "tps": 226503, "wall": 8593.1} {"step": 29699, "train_loss": 3.0678303241729736, "lr": 4.06817577593452e-05, "tps": 226381, "wall": 8597.9} {"step": 29700, "train_loss": 3.0346693992614746, "lr": 4.068009293865841e-05, "tps": 226260, "wall": 8602.8} {"step": 29701, "train_loss": 3.012078285217285, "lr": 4.067843014931724e-05, "tps": 226140, "wall": 8607.7} {"step": 29702, "train_loss": 3.0870437622070312, "lr": 4.0676769391340496e-05, "tps": 226017, "wall": 8612.7} {"step": 29703, "train_loss": 3.06695818901062, "lr": 4.067511066474702e-05, "tps": 225896, "wall": 8617.6} {"step": 29704, "train_loss": 3.1343448162078857, "lr": 4.0673453969555586e-05, "tps": 225775, "wall": 8622.5} {"step": 29705, "train_loss": 3.087249755859375, "lr": 4.067179930578496e-05, "tps": 225653, "wall": 8627.5} {"step": 29706, "train_loss": 3.0438387393951416, "lr": 4.06701466734539e-05, "tps": 225532, "wall": 8632.4} {"step": 29707, "train_loss": 3.001307249069214, "lr": 4.0668496072581116e-05, "tps": 225412, "wall": 8637.3} {"step": 29708, "train_loss": 3.138266086578369, "lr": 4.066684750318533e-05, "tps": 225291, "wall": 8642.2} {"step": 29709, "train_loss": 2.981490135192871, "lr": 4.0665200965285176e-05, "tps": 225172, "wall": 8647.0} {"step": 29710, "train_loss": 3.129603862762451, "lr": 4.066355645889933e-05, "tps": 225053, "wall": 8651.9} {"step": 29711, "train_loss": 3.0640358924865723, "lr": 4.066191398404642e-05, "tps": 224924, "wall": 8657.2} {"step": 29712, "train_loss": 3.0908780097961426, "lr": 4.066027354074506e-05, "tps": 224804, "wall": 8662.1} {"step": 29713, "train_loss": 3.053112745285034, "lr": 4.0658635129013824e-05, "tps": 224683, "wall": 8667.0} {"step": 29714, "train_loss": 3.084623098373413, "lr": 4.065699874887127e-05, "tps": 224562, "wall": 8672.0} {"step": 29715, "train_loss": 2.9882431030273438, "lr": 4.0655364400335925e-05, "tps": 224442, "wall": 8676.9} {"step": 29716, "train_loss": 2.99102783203125, "lr": 4.065373208342633e-05, "tps": 224322, "wall": 8681.9} {"step": 29717, "train_loss": 2.9316537380218506, "lr": 4.065210179816094e-05, "tps": 224200, "wall": 8686.9} {"step": 29718, "train_loss": 3.0657472610473633, "lr": 4.0650473544558254e-05, "tps": 224078, "wall": 8691.9} {"step": 29719, "train_loss": 3.0031094551086426, "lr": 4.0648847322636704e-05, "tps": 223957, "wall": 8696.9} {"step": 29720, "train_loss": 2.892024040222168, "lr": 4.064722313241471e-05, "tps": 223835, "wall": 8701.9} {"step": 29721, "train_loss": 3.0027875900268555, "lr": 4.064560097391069e-05, "tps": 223714, "wall": 8706.9} {"step": 29722, "train_loss": 3.0735976696014404, "lr": 4.0643980847143005e-05, "tps": 223596, "wall": 8711.8} {"step": 29723, "train_loss": 2.9467897415161133, "lr": 4.0642362752129985e-05, "tps": 223478, "wall": 8716.7} {"step": 29724, "train_loss": 3.1771535873413086, "lr": 4.0640746688889996e-05, "tps": 223360, "wall": 8721.6} {"step": 29725, "train_loss": 2.871396541595459, "lr": 4.063913265744135e-05, "tps": 223243, "wall": 8726.4} {"step": 29726, "train_loss": 3.163969039916992, "lr": 4.063752065780229e-05, "tps": 223124, "wall": 8731.4} {"step": 29727, "train_loss": 3.0303242206573486, "lr": 4.063591068999111e-05, "tps": 223005, "wall": 8736.3} {"step": 29728, "train_loss": 3.0625839233398438, "lr": 4.063430275402603e-05, "tps": 222886, "wall": 8741.3} {"step": 29729, "train_loss": 3.019361972808838, "lr": 4.063269684992527e-05, "tps": 222768, "wall": 8746.2} {"step": 29730, "train_loss": 2.9709768295288086, "lr": 4.0631092977707034e-05, "tps": 222652, "wall": 8751.1} {"step": 29731, "train_loss": 3.091925621032715, "lr": 4.0629491137389466e-05, "tps": 222534, "wall": 8756.0} {"step": 29732, "train_loss": 3.066206693649292, "lr": 4.062789132899073e-05, "tps": 222417, "wall": 8760.9} {"step": 29733, "train_loss": 3.1304450035095215, "lr": 4.062629355252895e-05, "tps": 222300, "wall": 8765.8} {"step": 29734, "train_loss": 3.082009792327881, "lr": 4.062469780802224e-05, "tps": 222184, "wall": 8770.7} {"step": 29735, "train_loss": 3.0929529666900635, "lr": 4.062310409548864e-05, "tps": 222067, "wall": 8775.6} {"step": 29736, "train_loss": 3.015489101409912, "lr": 4.062151241494621e-05, "tps": 221952, "wall": 8780.5} {"step": 29737, "train_loss": 3.026193857192993, "lr": 4.0619922766413e-05, "tps": 221836, "wall": 8785.4} {"step": 29738, "train_loss": 3.044928550720215, "lr": 4.0618335149907e-05, "tps": 221717, "wall": 8790.3} {"step": 29739, "train_loss": 3.045809268951416, "lr": 4.0616749565446216e-05, "tps": 221602, "wall": 8795.2} {"step": 29740, "train_loss": 3.0715951919555664, "lr": 4.061516601304861e-05, "tps": 221487, "wall": 8800.1} {"step": 29741, "train_loss": 3.026327133178711, "lr": 4.061358449273208e-05, "tps": 221371, "wall": 8805.0} {"step": 29742, "train_loss": 3.040224552154541, "lr": 4.061200500451458e-05, "tps": 221255, "wall": 8809.9} {"step": 29743, "train_loss": 3.0334911346435547, "lr": 4.0610427548413996e-05, "tps": 221140, "wall": 8814.8} {"step": 29744, "train_loss": 3.0357675552368164, "lr": 4.0608852124448194e-05, "tps": 221025, "wall": 8819.7} {"step": 29745, "train_loss": 3.008129119873047, "lr": 4.0607278732635015e-05, "tps": 220910, "wall": 8824.5} {"step": 29746, "train_loss": 2.9247279167175293, "lr": 4.060570737299229e-05, "tps": 220796, "wall": 8829.4} {"step": 29747, "train_loss": 3.0730438232421875, "lr": 4.060413804553782e-05, "tps": 220682, "wall": 8834.3} {"step": 29748, "train_loss": 2.922208070755005, "lr": 4.060257075028938e-05, "tps": 220567, "wall": 8839.1} {"step": 29749, "train_loss": 3.020080804824829, "lr": 4.060100548726471e-05, "tps": 220453, "wall": 8844.0} {"step": 29750, "train_loss": 3.032214403152466, "lr": 4.059944225648157e-05, "tps": 220338, "wall": 8848.9} {"step": 29751, "train_loss": 2.992940902709961, "lr": 4.059788105795765e-05, "tps": 220222, "wall": 8853.9} {"step": 29752, "train_loss": 3.0579333305358887, "lr": 4.0596321891710636e-05, "tps": 220108, "wall": 8858.8} {"step": 29753, "train_loss": 3.094343662261963, "lr": 4.0594764757758197e-05, "tps": 219993, "wall": 8863.7} {"step": 29754, "train_loss": 3.1960511207580566, "lr": 4.0593209656117956e-05, "tps": 219879, "wall": 8868.6} {"step": 29755, "train_loss": 3.093003749847412, "lr": 4.0591656586807566e-05, "tps": 219765, "wall": 8873.5} {"step": 29756, "train_loss": 2.9893248081207275, "lr": 4.059010554984458e-05, "tps": 219651, "wall": 8878.4} {"step": 29757, "train_loss": 3.042320489883423, "lr": 4.0588556545246586e-05, "tps": 219538, "wall": 8883.3} {"step": 29758, "train_loss": 3.0283684730529785, "lr": 4.058700957303112e-05, "tps": 219424, "wall": 8888.2} {"step": 29759, "train_loss": 3.0755414962768555, "lr": 4.0585464633215744e-05, "tps": 219311, "wall": 8893.1} {"step": 29760, "train_loss": 3.0333218574523926, "lr": 4.05839217258179e-05, "tps": 219198, "wall": 8897.9} {"step": 29761, "train_loss": 3.1098930835723877, "lr": 4.058238085085511e-05, "tps": 219079, "wall": 8903.1} {"step": 29762, "train_loss": 2.982219934463501, "lr": 4.058084200834482e-05, "tps": 218963, "wall": 8908.1} {"step": 29763, "train_loss": 3.0568957328796387, "lr": 4.057930519830445e-05, "tps": 218846, "wall": 8913.2} {"step": 29764, "train_loss": 3.0185818672180176, "lr": 4.057777042075142e-05, "tps": 218731, "wall": 8918.2} {"step": 29765, "train_loss": 3.017266035079956, "lr": 4.057623767570312e-05, "tps": 218612, "wall": 8923.3} {"step": 29766, "train_loss": 3.113147497177124, "lr": 4.057470696317689e-05, "tps": 218491, "wall": 8928.5} {"step": 29767, "train_loss": 3.0844974517822266, "lr": 4.05731782831901e-05, "tps": 218378, "wall": 8933.5} {"step": 29768, "train_loss": 3.0411508083343506, "lr": 4.0571651635760036e-05, "tps": 218260, "wall": 8938.6} {"step": 29769, "train_loss": 3.135603666305542, "lr": 4.0570127020904035e-05, "tps": 218145, "wall": 8943.6} {"step": 29770, "train_loss": 3.0804696083068848, "lr": 4.0568604438639326e-05, "tps": 218032, "wall": 8948.5} {"step": 29771, "train_loss": 2.9048571586608887, "lr": 4.056708388898318e-05, "tps": 217921, "wall": 8953.4} {"step": 29772, "train_loss": 2.9697346687316895, "lr": 4.056556537195282e-05, "tps": 217808, "wall": 8958.4} {"step": 29773, "train_loss": 3.1107122898101807, "lr": 4.056404888756544e-05, "tps": 217692, "wall": 8963.4} {"step": 29774, "train_loss": 2.972618341445923, "lr": 4.05625344358382e-05, "tps": 217580, "wall": 8968.3} {"step": 29775, "train_loss": 3.0748088359832764, "lr": 4.0561022016788295e-05, "tps": 217469, "wall": 8973.2} {"step": 29776, "train_loss": 2.946721076965332, "lr": 4.0559511630432854e-05, "tps": 217358, "wall": 8978.1} {"step": 29777, "train_loss": 3.034592390060425, "lr": 4.055800327678894e-05, "tps": 217246, "wall": 8983.0} {"step": 29778, "train_loss": 3.043456554412842, "lr": 4.05564969558737e-05, "tps": 217136, "wall": 8987.9} {"step": 29779, "train_loss": 2.940638542175293, "lr": 4.055499266770415e-05, "tps": 217026, "wall": 8992.7} {"step": 29780, "train_loss": 2.9784293174743652, "lr": 4.055349041229736e-05, "tps": 216916, "wall": 8997.6} {"step": 29781, "train_loss": 3.1205081939697266, "lr": 4.0551990189670335e-05, "tps": 216807, "wall": 9002.4} {"step": 29782, "train_loss": 3.0429329872131348, "lr": 4.0550491999840076e-05, "tps": 216697, "wall": 9007.3} {"step": 29783, "train_loss": 3.171099901199341, "lr": 4.054899584282356e-05, "tps": 216588, "wall": 9012.1} {"step": 29784, "train_loss": 3.069276809692383, "lr": 4.054750171863773e-05, "tps": 216478, "wall": 9017.0} {"step": 29785, "train_loss": 3.0679454803466797, "lr": 4.054600962729948e-05, "tps": 216368, "wall": 9021.9} {"step": 29786, "train_loss": 2.905393600463867, "lr": 4.054451956882577e-05, "tps": 216257, "wall": 9026.8} {"step": 29787, "train_loss": 3.1058712005615234, "lr": 4.0543031543233453e-05, "tps": 216147, "wall": 9031.7} {"step": 29788, "train_loss": 3.058076858520508, "lr": 4.054154555053936e-05, "tps": 216037, "wall": 9036.6} {"step": 29789, "train_loss": 3.103909730911255, "lr": 4.054006159076036e-05, "tps": 215927, "wall": 9041.5} {"step": 29790, "train_loss": 2.997805595397949, "lr": 4.053857966391324e-05, "tps": 215812, "wall": 9046.7} {"step": 29791, "train_loss": 3.072517156600952, "lr": 4.0537099770014815e-05, "tps": 215697, "wall": 9051.8} {"step": 29792, "train_loss": 3.0526044368743896, "lr": 4.053562190908182e-05, "tps": 215587, "wall": 9056.7} {"step": 29793, "train_loss": 3.0046746730804443, "lr": 4.053414608113102e-05, "tps": 215477, "wall": 9061.7} {"step": 29794, "train_loss": 3.082674980163574, "lr": 4.0532672286179116e-05, "tps": 215364, "wall": 9066.7} {"step": 29795, "train_loss": 3.1261937618255615, "lr": 4.0531200524242795e-05, "tps": 215254, "wall": 9071.6} {"step": 29796, "train_loss": 3.002673625946045, "lr": 4.052973079533878e-05, "tps": 215142, "wall": 9076.7} {"step": 29797, "train_loss": 3.0299463272094727, "lr": 4.052826309948364e-05, "tps": 215030, "wall": 9081.7} {"step": 29798, "train_loss": 2.938382863998413, "lr": 4.052679743669407e-05, "tps": 214921, "wall": 9086.6} {"step": 29799, "train_loss": 3.0063722133636475, "lr": 4.052533380698664e-05, "tps": 214812, "wall": 9091.5} {"step": 29800, "train_loss": 2.962390422821045, "lr": 4.0523872210377956e-05, "tps": 214704, "wall": 9096.4} {"step": 29801, "train_loss": 3.004241466522217, "lr": 4.052241264688455e-05, "tps": 214594, "wall": 9101.3} {"step": 29802, "train_loss": 3.10103440284729, "lr": 4.0520955116522945e-05, "tps": 214486, "wall": 9106.3} {"step": 29803, "train_loss": 2.979477643966675, "lr": 4.051949961930969e-05, "tps": 214375, "wall": 9111.3} {"step": 29804, "train_loss": 3.0658390522003174, "lr": 4.0518046155261234e-05, "tps": 214266, "wall": 9116.2} {"step": 29805, "train_loss": 3.0319149494171143, "lr": 4.051659472439408e-05, "tps": 214156, "wall": 9121.2} {"step": 29806, "train_loss": 3.065746784210205, "lr": 4.0515145326724634e-05, "tps": 214047, "wall": 9126.2} {"step": 29807, "train_loss": 3.0597848892211914, "lr": 4.051369796226935e-05, "tps": 213938, "wall": 9131.1} {"step": 29808, "train_loss": 2.9678597450256348, "lr": 4.0512252631044584e-05, "tps": 213831, "wall": 9136.0} {"step": 29809, "train_loss": 3.065002918243408, "lr": 4.0510809333066755e-05, "tps": 213723, "wall": 9140.9} {"step": 29810, "train_loss": 3.0071918964385986, "lr": 4.050936806835218e-05, "tps": 213615, "wall": 9145.8} {"step": 29811, "train_loss": 3.182762384414673, "lr": 4.050792883691719e-05, "tps": 213506, "wall": 9150.8} {"step": 29812, "train_loss": 3.071655511856079, "lr": 4.050649163877809e-05, "tps": 213399, "wall": 9155.7} {"step": 29813, "train_loss": 2.9771175384521484, "lr": 4.050505647395115e-05, "tps": 213293, "wall": 9160.6} {"step": 29814, "train_loss": 2.9509031772613525, "lr": 4.0503623342452655e-05, "tps": 213188, "wall": 9165.4} {"step": 29815, "train_loss": 3.076857566833496, "lr": 4.0502192244298835e-05, "tps": 213083, "wall": 9170.2} {"step": 29816, "train_loss": 3.0944862365722656, "lr": 4.0500763179505874e-05, "tps": 212977, "wall": 9175.1} {"step": 29817, "train_loss": 3.130908966064453, "lr": 4.049933614809e-05, "tps": 212872, "wall": 9179.9} {"step": 29818, "train_loss": 3.1473631858825684, "lr": 4.049791115006734e-05, "tps": 212767, "wall": 9184.8} {"step": 29819, "train_loss": 2.993865489959717, "lr": 4.049648818545406e-05, "tps": 212662, "wall": 9189.6} {"step": 29820, "train_loss": 3.1270625591278076, "lr": 4.049506725426627e-05, "tps": 212557, "wall": 9194.5} {"step": 29821, "train_loss": 3.0988690853118896, "lr": 4.049364835652007e-05, "tps": 212452, "wall": 9199.3} {"step": 29822, "train_loss": 3.0121660232543945, "lr": 4.049223149223154e-05, "tps": 212348, "wall": 9204.1} {"step": 29823, "train_loss": 3.0246214866638184, "lr": 4.049081666141671e-05, "tps": 212244, "wall": 9208.9} {"step": 29824, "train_loss": 3.005855083465576, "lr": 4.0489403864091615e-05, "tps": 212138, "wall": 9213.8} {"step": 29825, "train_loss": 2.988110065460205, "lr": 4.048799310027228e-05, "tps": 212032, "wall": 9218.7} {"step": 29826, "train_loss": 3.0827996730804443, "lr": 4.048658436997466e-05, "tps": 211927, "wall": 9223.6} {"step": 29827, "train_loss": 2.984111785888672, "lr": 4.0485177673214726e-05, "tps": 211823, "wall": 9228.5} {"step": 29828, "train_loss": 2.893598794937134, "lr": 4.048377301000841e-05, "tps": 211720, "wall": 9233.3} {"step": 29829, "train_loss": 3.032684326171875, "lr": 4.048237038037164e-05, "tps": 211616, "wall": 9238.1} {"step": 29830, "train_loss": 3.0497710704803467, "lr": 4.048096978432028e-05, "tps": 211513, "wall": 9242.9} {"step": 29831, "train_loss": 2.912203550338745, "lr": 4.047957122187021e-05, "tps": 211410, "wall": 9247.7} {"step": 29832, "train_loss": 3.047001838684082, "lr": 4.047817469303725e-05, "tps": 211306, "wall": 9252.6} {"step": 29833, "train_loss": 3.1343600749969482, "lr": 4.047678019783726e-05, "tps": 211201, "wall": 9257.5} {"step": 29834, "train_loss": 3.0819668769836426, "lr": 4.0475387736286e-05, "tps": 211096, "wall": 9262.4} {"step": 29835, "train_loss": 3.0773777961730957, "lr": 4.047399730839927e-05, "tps": 210991, "wall": 9267.3} {"step": 29836, "train_loss": 3.1263866424560547, "lr": 4.0472608914192805e-05, "tps": 210886, "wall": 9272.3} {"step": 29837, "train_loss": 2.987849712371826, "lr": 4.047122255368235e-05, "tps": 210783, "wall": 9277.1} {"step": 29838, "train_loss": 3.1236844062805176, "lr": 4.04698382268836e-05, "tps": 210679, "wall": 9282.0} {"step": 29839, "train_loss": 2.985091209411621, "lr": 4.0468455933812216e-05, "tps": 210577, "wall": 9286.8} {"step": 29840, "train_loss": 2.9796767234802246, "lr": 4.046707567448388e-05, "tps": 210474, "wall": 9291.7} {"step": 29841, "train_loss": 3.0916872024536133, "lr": 4.0465697448914234e-05, "tps": 210371, "wall": 9296.5} {"step": 29842, "train_loss": 3.121199131011963, "lr": 4.046432125711887e-05, "tps": 210269, "wall": 9301.4} {"step": 29843, "train_loss": 3.022204637527466, "lr": 4.046294709911341e-05, "tps": 210167, "wall": 9306.2} {"step": 29844, "train_loss": 2.990804672241211, "lr": 4.046157497491337e-05, "tps": 210065, "wall": 9311.0} {"step": 29845, "train_loss": 3.1118574142456055, "lr": 4.0460204884534335e-05, "tps": 209962, "wall": 9315.9} {"step": 29846, "train_loss": 3.1286892890930176, "lr": 4.045883682799181e-05, "tps": 209860, "wall": 9320.7} {"step": 29847, "train_loss": 3.0500736236572266, "lr": 4.045747080530131e-05, "tps": 209758, "wall": 9325.6} {"step": 29848, "train_loss": 3.0494213104248047, "lr": 4.045610681647826e-05, "tps": 209655, "wall": 9330.5} {"step": 29849, "train_loss": 2.977027177810669, "lr": 4.045474486153817e-05, "tps": 209554, "wall": 9335.3} {"step": 29850, "train_loss": 3.010817766189575, "lr": 4.045338494049643e-05, "tps": 209452, "wall": 9340.1} {"step": 29851, "train_loss": 3.0809054374694824, "lr": 4.0452027053368475e-05, "tps": 209349, "wall": 9345.1} {"step": 29852, "train_loss": 3.022411346435547, "lr": 4.045067120016966e-05, "tps": 209245, "wall": 9350.0} {"step": 29853, "train_loss": 3.062467098236084, "lr": 4.044931738091534e-05, "tps": 209141, "wall": 9355.0} {"step": 29854, "train_loss": 2.987186908721924, "lr": 4.04479655956209e-05, "tps": 209039, "wall": 9359.8} {"step": 29855, "train_loss": 3.1057491302490234, "lr": 4.0446615844301586e-05, "tps": 208937, "wall": 9364.7} {"step": 29856, "train_loss": 3.154754161834717, "lr": 4.044526812697275e-05, "tps": 208836, "wall": 9369.6} {"step": 29857, "train_loss": 2.921607494354248, "lr": 4.0443922443649614e-05, "tps": 208735, "wall": 9374.4} {"step": 29858, "train_loss": 2.970337152481079, "lr": 4.044257879434743e-05, "tps": 208633, "wall": 9379.3} {"step": 29859, "train_loss": 3.113898515701294, "lr": 4.044123717908145e-05, "tps": 208529, "wall": 9384.3} {"step": 29860, "train_loss": 2.9547500610351562, "lr": 4.043989759786684e-05, "tps": 208425, "wall": 9389.3} {"step": 29861, "train_loss": 3.1031970977783203, "lr": 4.0438560050718774e-05, "tps": 208320, "wall": 9394.4} {"step": 29862, "train_loss": 3.0358142852783203, "lr": 4.043722453765242e-05, "tps": 208216, "wall": 9399.3} {"step": 29863, "train_loss": 3.0586354732513428, "lr": 4.0435891058682896e-05, "tps": 208113, "wall": 9404.3} {"step": 29864, "train_loss": 3.0490169525146484, "lr": 4.043455961382533e-05, "tps": 208009, "wall": 9409.3} {"step": 29865, "train_loss": 3.010234832763672, "lr": 4.043323020309477e-05, "tps": 207906, "wall": 9414.3} {"step": 29866, "train_loss": 2.9687814712524414, "lr": 4.043190282650631e-05, "tps": 207803, "wall": 9419.3} {"step": 29867, "train_loss": 2.9970040321350098, "lr": 4.043057748407494e-05, "tps": 207702, "wall": 9424.2} {"step": 29868, "train_loss": 3.091759204864502, "lr": 4.042925417581573e-05, "tps": 207601, "wall": 9429.1} {"step": 29869, "train_loss": 2.972425699234009, "lr": 4.042793290174364e-05, "tps": 207500, "wall": 9434.0} {"step": 29870, "train_loss": 3.0333480834960938, "lr": 4.042661366187364e-05, "tps": 207400, "wall": 9438.9} {"step": 29871, "train_loss": 3.035416603088379, "lr": 4.042529645622066e-05, "tps": 207298, "wall": 9443.8} {"step": 29872, "train_loss": 2.9573686122894287, "lr": 4.0423981284799635e-05, "tps": 207192, "wall": 9449.0} {"step": 29873, "train_loss": 2.9862477779388428, "lr": 4.042266814762548e-05, "tps": 207089, "wall": 9454.0} {"step": 29874, "train_loss": 2.9819254875183105, "lr": 4.042135704471306e-05, "tps": 206985, "wall": 9459.1} {"step": 29875, "train_loss": 3.1045608520507812, "lr": 4.042004797607721e-05, "tps": 206884, "wall": 9464.0} {"step": 29876, "train_loss": 2.9927680492401123, "lr": 4.041874094173277e-05, "tps": 206783, "wall": 9468.9} {"step": 29877, "train_loss": 3.115039110183716, "lr": 4.041743594169456e-05, "tps": 206682, "wall": 9473.9} {"step": 29878, "train_loss": 3.085998058319092, "lr": 4.041613297597734e-05, "tps": 206581, "wall": 9478.8} {"step": 29879, "train_loss": 3.0392370223999023, "lr": 4.041483204459588e-05, "tps": 206477, "wall": 9483.9} {"step": 29880, "train_loss": 3.064809560775757, "lr": 4.041353314756493e-05, "tps": 206376, "wall": 9488.9} {"step": 29881, "train_loss": 3.1780827045440674, "lr": 4.041223628489919e-05, "tps": 206274, "wall": 9493.9} {"step": 29882, "train_loss": 3.0088658332824707, "lr": 4.041094145661334e-05, "tps": 206173, "wall": 9498.8} {"step": 29883, "train_loss": 3.061495304107666, "lr": 4.040964866272208e-05, "tps": 206072, "wall": 9503.8} {"step": 29884, "train_loss": 3.059921979904175, "lr": 4.040835790324002e-05, "tps": 205974, "wall": 9508.7} {"step": 29885, "train_loss": 3.2056522369384766, "lr": 4.040706917818179e-05, "tps": 205862, "wall": 9514.2} {"step": 29886, "train_loss": 3.010529041290283, "lr": 4.040578248756203e-05, "tps": 205755, "wall": 9519.4} {"step": 29887, "train_loss": 3.066211700439453, "lr": 4.0404497831395236e-05, "tps": 205635, "wall": 9525.3} {"step": 29888, "train_loss": 3.12479305267334, "lr": 4.040321520969603e-05, "tps": 205531, "wall": 9530.5} {"step": 29889, "train_loss": 3.0520007610321045, "lr": 4.040193462247892e-05, "tps": 205432, "wall": 9535.4} {"step": 29890, "train_loss": 3.0331239700317383, "lr": 4.040065606975841e-05, "tps": 205334, "wall": 9540.2} {"step": 29891, "train_loss": 2.93497896194458, "lr": 4.039937955154899e-05, "tps": 205237, "wall": 9545.1} {"step": 29892, "train_loss": 3.0761871337890625, "lr": 4.03981050678651e-05, "tps": 205140, "wall": 9549.9} {"step": 29893, "train_loss": 3.055478572845459, "lr": 4.039683261872121e-05, "tps": 205041, "wall": 9554.8} {"step": 29894, "train_loss": 3.1011435985565186, "lr": 4.03955622041317e-05, "tps": 204943, "wall": 9559.7} {"step": 29895, "train_loss": 3.065415143966675, "lr": 4.039429382411099e-05, "tps": 204844, "wall": 9564.6} {"step": 29896, "train_loss": 3.184605360031128, "lr": 4.039302747867344e-05, "tps": 204744, "wall": 9569.6} {"step": 29897, "train_loss": 3.0818607807159424, "lr": 4.039176316783337e-05, "tps": 204639, "wall": 9574.9} {"step": 29898, "train_loss": 2.9869601726531982, "lr": 4.0390500891605134e-05, "tps": 204539, "wall": 9579.8} {"step": 29899, "train_loss": 3.1337625980377197, "lr": 4.038924065000302e-05, "tps": 204442, "wall": 9584.7} {"step": 29900, "train_loss": 3.0772857666015625, "lr": 4.038798244304132e-05, "tps": 204346, "wall": 9589.6} {"step": 29901, "train_loss": 2.9594383239746094, "lr": 4.038672627073425e-05, "tps": 204250, "wall": 9594.4} {"step": 29902, "train_loss": 3.039888858795166, "lr": 4.038547213309607e-05, "tps": 204155, "wall": 9599.2} {"step": 29903, "train_loss": 3.130734443664551, "lr": 4.038422003014097e-05, "tps": 204052, "wall": 9604.4} {"step": 29904, "train_loss": 3.032290458679199, "lr": 4.038296996188316e-05, "tps": 203951, "wall": 9609.4} {"step": 29905, "train_loss": 3.0295939445495605, "lr": 4.038172192833677e-05, "tps": 203850, "wall": 9614.5} {"step": 29906, "train_loss": 2.978489398956299, "lr": 4.0380475929515954e-05, "tps": 203748, "wall": 9619.6} {"step": 29907, "train_loss": 3.0397589206695557, "lr": 4.037923196543483e-05, "tps": 203654, "wall": 9624.4} {"step": 29908, "train_loss": 3.0427751541137695, "lr": 4.0377990036107474e-05, "tps": 203559, "wall": 9629.2} {"step": 29909, "train_loss": 3.125675916671753, "lr": 4.0376750141547966e-05, "tps": 203463, "wall": 9634.1} {"step": 29910, "train_loss": 3.0290489196777344, "lr": 4.037551228177037e-05, "tps": 203368, "wall": 9638.9} {"step": 29911, "train_loss": 2.9777908325195312, "lr": 4.037427645678866e-05, "tps": 203273, "wall": 9643.7} {"step": 29912, "train_loss": 3.038466215133667, "lr": 4.037304266661689e-05, "tps": 203178, "wall": 9648.5} {"step": 29913, "train_loss": 3.159173011779785, "lr": 4.037181091126899e-05, "tps": 203084, "wall": 9653.3} {"step": 29914, "train_loss": 3.0066089630126953, "lr": 4.0370581190758925e-05, "tps": 202990, "wall": 9658.1} {"step": 29915, "train_loss": 3.0650715827941895, "lr": 4.036935350510065e-05, "tps": 202895, "wall": 9663.0} {"step": 29916, "train_loss": 2.9903290271759033, "lr": 4.036812785430806e-05, "tps": 202801, "wall": 9667.8} {"step": 29917, "train_loss": 2.996596574783325, "lr": 4.036690423839502e-05, "tps": 202704, "wall": 9672.7} {"step": 29918, "train_loss": 3.0117363929748535, "lr": 4.036568265737542e-05, "tps": 202604, "wall": 9677.8} {"step": 29919, "train_loss": 2.9413061141967773, "lr": 4.036446311126309e-05, "tps": 202504, "wall": 9683.0} {"step": 29920, "train_loss": 3.034289836883545, "lr": 4.036324560007184e-05, "tps": 202406, "wall": 9687.9} {"step": 29921, "train_loss": 3.0425989627838135, "lr": 4.036203012381546e-05, "tps": 202308, "wall": 9693.0} {"step": 29922, "train_loss": 3.0615074634552, "lr": 4.0360816682507706e-05, "tps": 202214, "wall": 9697.8} {"step": 29923, "train_loss": 3.008556365966797, "lr": 4.0359605276162346e-05, "tps": 202116, "wall": 9702.8} {"step": 29924, "train_loss": 2.9862866401672363, "lr": 4.03583959047931e-05, "tps": 202018, "wall": 9707.8} {"step": 29925, "train_loss": 2.935631275177002, "lr": 4.0357188568413664e-05, "tps": 201916, "wall": 9713.1} {"step": 29926, "train_loss": 2.9737823009490967, "lr": 4.03559832670377e-05, "tps": 201820, "wall": 9718.0} {"step": 29927, "train_loss": 2.9938554763793945, "lr": 4.0354780000678894e-05, "tps": 201724, "wall": 9723.0} {"step": 29928, "train_loss": 3.020953416824341, "lr": 4.0353578769350864e-05, "tps": 201629, "wall": 9727.9} {"step": 29929, "train_loss": 3.089581251144409, "lr": 4.035237957306719e-05, "tps": 201536, "wall": 9732.7} {"step": 29930, "train_loss": 3.1019604206085205, "lr": 4.03511824118415e-05, "tps": 201443, "wall": 9737.5} {"step": 29931, "train_loss": 3.0060434341430664, "lr": 4.0349987285687316e-05, "tps": 201350, "wall": 9742.3} {"step": 29932, "train_loss": 3.003157377243042, "lr": 4.034879419461822e-05, "tps": 201257, "wall": 9747.2} {"step": 29933, "train_loss": 3.0280637741088867, "lr": 4.034760313864767e-05, "tps": 201162, "wall": 9752.1} {"step": 29934, "train_loss": 3.1455979347229004, "lr": 4.034641411778921e-05, "tps": 201069, "wall": 9756.9} {"step": 29935, "train_loss": 3.064080238342285, "lr": 4.034522713205629e-05, "tps": 200977, "wall": 9761.7} {"step": 29936, "train_loss": 3.003793954849243, "lr": 4.034404218146234e-05, "tps": 200885, "wall": 9766.5} {"step": 29937, "train_loss": 3.097569465637207, "lr": 4.034285926602082e-05, "tps": 200793, "wall": 9771.3} {"step": 29938, "train_loss": 3.0654361248016357, "lr": 4.03416783857451e-05, "tps": 200700, "wall": 9776.1} {"step": 29939, "train_loss": 3.0851874351501465, "lr": 4.034049954064858e-05, "tps": 200608, "wall": 9781.0} {"step": 29940, "train_loss": 3.055737018585205, "lr": 4.0339322730744575e-05, "tps": 200516, "wall": 9785.8} {"step": 29941, "train_loss": 2.9518208503723145, "lr": 4.0338147956046455e-05, "tps": 200424, "wall": 9790.6} {"step": 29942, "train_loss": 3.0155484676361084, "lr": 4.033697521656753e-05, "tps": 200332, "wall": 9795.5} {"step": 29943, "train_loss": 3.0242509841918945, "lr": 4.033580451232104e-05, "tps": 200238, "wall": 9800.4} {"step": 29944, "train_loss": 2.991314172744751, "lr": 4.033463584332029e-05, "tps": 200146, "wall": 9805.2} {"step": 29945, "train_loss": 2.981041431427002, "lr": 4.0333469209578514e-05, "tps": 200053, "wall": 9810.1} {"step": 29946, "train_loss": 3.0089759826660156, "lr": 4.033230461110892e-05, "tps": 199962, "wall": 9814.9} {"step": 29947, "train_loss": 2.964911699295044, "lr": 4.0331142047924676e-05, "tps": 199869, "wall": 9819.8} {"step": 29948, "train_loss": 3.0782017707824707, "lr": 4.0329981520038985e-05, "tps": 199775, "wall": 9824.7} {"step": 29949, "train_loss": 3.022239923477173, "lr": 4.0328823027465e-05, "tps": 199683, "wall": 9829.6} {"step": 29950, "train_loss": 3.0885605812072754, "lr": 4.032766657021581e-05, "tps": 199591, "wall": 9834.4} {"step": 29951, "train_loss": 3.0028152465820312, "lr": 4.032651214830453e-05, "tps": 199497, "wall": 9839.4} {"step": 29952, "train_loss": 3.0654051303863525, "lr": 4.032535976174425e-05, "tps": 199404, "wall": 9844.3} {"step": 29953, "train_loss": 2.937927722930908, "lr": 4.032420941054801e-05, "tps": 199312, "wall": 9849.2} {"step": 29954, "train_loss": 3.039966106414795, "lr": 4.032306109472886e-05, "tps": 199221, "wall": 9854.0} {"step": 29955, "train_loss": 2.976818084716797, "lr": 4.032191481429978e-05, "tps": 199130, "wall": 9858.8} {"step": 29956, "train_loss": 3.0358147621154785, "lr": 4.032077056927377e-05, "tps": 199035, "wall": 9863.9} {"step": 29957, "train_loss": 3.0045032501220703, "lr": 4.03196283596638e-05, "tps": 198942, "wall": 9868.8} {"step": 29958, "train_loss": 3.051987886428833, "lr": 4.031848818548279e-05, "tps": 198847, "wall": 9873.8} {"step": 29959, "train_loss": 3.0085532665252686, "lr": 4.0317350046743674e-05, "tps": 198753, "wall": 9878.8} {"step": 29960, "train_loss": 3.078394889831543, "lr": 4.031621394345932e-05, "tps": 198655, "wall": 9884.1} {"step": 29961, "train_loss": 3.0572919845581055, "lr": 4.031507987564263e-05, "tps": 198560, "wall": 9889.1} {"step": 29962, "train_loss": 3.1512575149536133, "lr": 4.031394784330644e-05, "tps": 198463, "wall": 9894.3} {"step": 29963, "train_loss": 2.9815149307250977, "lr": 4.031281784646356e-05, "tps": 198368, "wall": 9899.3} {"step": 29964, "train_loss": 3.0450291633605957, "lr": 4.031168988512681e-05, "tps": 198274, "wall": 9904.4} {"step": 29965, "train_loss": 3.015460729598999, "lr": 4.031056395930895e-05, "tps": 198182, "wall": 9909.3} {"step": 29966, "train_loss": 3.0670101642608643, "lr": 4.030944006902275e-05, "tps": 198090, "wall": 9914.2} {"step": 29967, "train_loss": 3.0707194805145264, "lr": 4.030831821428093e-05, "tps": 197997, "wall": 9919.3} {"step": 29968, "train_loss": 2.934967041015625, "lr": 4.030719839509621e-05, "tps": 197900, "wall": 9924.4} {"step": 29969, "train_loss": 3.0258140563964844, "lr": 4.030608061148124e-05, "tps": 197806, "wall": 9929.5} {"step": 29970, "train_loss": 2.960571765899658, "lr": 4.030496486344873e-05, "tps": 197713, "wall": 9934.5} {"step": 29971, "train_loss": 3.1140878200531006, "lr": 4.03038511510113e-05, "tps": 197618, "wall": 9939.6} {"step": 29972, "train_loss": 2.972693920135498, "lr": 4.030273947418157e-05, "tps": 197525, "wall": 9944.6} {"step": 29973, "train_loss": 3.161741018295288, "lr": 4.030162983297213e-05, "tps": 197430, "wall": 9949.7} {"step": 29974, "train_loss": 3.068915843963623, "lr": 4.030052222739554e-05, "tps": 197336, "wall": 9954.8} {"step": 29975, "train_loss": 3.0453217029571533, "lr": 4.029941665746436e-05, "tps": 197247, "wall": 9959.6} {"step": 29976, "train_loss": 3.051130533218384, "lr": 4.029831312319111e-05, "tps": 197157, "wall": 9964.5} {"step": 29977, "train_loss": 2.9800307750701904, "lr": 4.029721162458828e-05, "tps": 197067, "wall": 9969.4} {"step": 29978, "train_loss": 3.119074821472168, "lr": 4.0296112161668376e-05, "tps": 196975, "wall": 9974.4} {"step": 29979, "train_loss": 2.9856276512145996, "lr": 4.029501473444383e-05, "tps": 196882, "wall": 9979.4} {"step": 29980, "train_loss": 3.0722270011901855, "lr": 4.029391934292707e-05, "tps": 196790, "wall": 9984.4} {"step": 29981, "train_loss": 3.0085816383361816, "lr": 4.029282598713051e-05, "tps": 196699, "wall": 9989.3} {"step": 29982, "train_loss": 3.082167148590088, "lr": 4.029173466706655e-05, "tps": 196609, "wall": 9994.3} {"step": 29983, "train_loss": 3.0229127407073975, "lr": 4.029064538274755e-05, "tps": 196518, "wall": 9999.2} {"step": 29984, "train_loss": 3.001378297805786, "lr": 4.028955813418583e-05, "tps": 196427, "wall": 10004.2} {"step": 29985, "train_loss": 2.966434955596924, "lr": 4.0288472921393715e-05, "tps": 196337, "wall": 10009.1} {"step": 29986, "train_loss": 3.0976357460021973, "lr": 4.028738974438349e-05, "tps": 196246, "wall": 10014.1} {"step": 29987, "train_loss": 3.0912210941314697, "lr": 4.028630860316746e-05, "tps": 196157, "wall": 10019.0} {"step": 29988, "train_loss": 3.12016224861145, "lr": 4.0285229497757845e-05, "tps": 196067, "wall": 10023.9} {"step": 29989, "train_loss": 3.09987735748291, "lr": 4.028415242816685e-05, "tps": 195978, "wall": 10028.8} {"step": 29990, "train_loss": 2.971353530883789, "lr": 4.028307739440672e-05, "tps": 195888, "wall": 10033.7} {"step": 29991, "train_loss": 3.067042827606201, "lr": 4.028200439648963e-05, "tps": 195799, "wall": 10038.6} {"step": 29992, "train_loss": 2.9869985580444336, "lr": 4.028093343442767e-05, "tps": 195709, "wall": 10043.6} {"step": 29993, "train_loss": 3.0746254920959473, "lr": 4.027986450823306e-05, "tps": 195620, "wall": 10048.4} {"step": 29994, "train_loss": 3.0061087608337402, "lr": 4.027879761791784e-05, "tps": 195531, "wall": 10053.4} {"step": 29995, "train_loss": 2.995401620864868, "lr": 4.027773276349414e-05, "tps": 195438, "wall": 10058.5} {"step": 29996, "train_loss": 3.1112914085388184, "lr": 4.0276669944974014e-05, "tps": 195349, "wall": 10063.4} {"step": 29997, "train_loss": 2.9776346683502197, "lr": 4.0275609162369476e-05, "tps": 195263, "wall": 10068.2} {"step": 29998, "train_loss": 3.142609119415283, "lr": 4.0274550415692544e-05, "tps": 195171, "wall": 10073.3} {"step": 29999, "train_loss": 3.0610766410827637, "lr": 4.027349370495525e-05, "tps": 195081, "wall": 10078.2} {"step": 30000, "train_loss": 3.0661492347717285, "lr": 4.027243903016954e-05, "tps": 194993, "wall": 10083.1, "val_loss_monitor": 3.342864080973755, "val_loss_full": 3.361604109595712} {"step": 30001, "train_loss": 2.965359687805176, "lr": 4.027138639134738e-05, "tps": 191726, "wall": 10255.3} {"step": 30002, "train_loss": 2.987990140914917, "lr": 4.0270335788500655e-05, "tps": 191640, "wall": 10260.3} {"step": 30003, "train_loss": 2.9448697566986084, "lr": 4.02692872216413e-05, "tps": 191554, "wall": 10265.2} {"step": 30004, "train_loss": 3.052778720855713, "lr": 4.026824069078117e-05, "tps": 191470, "wall": 10270.0} {"step": 30005, "train_loss": 2.986929178237915, "lr": 4.026719619593215e-05, "tps": 191387, "wall": 10274.8} {"step": 30006, "train_loss": 3.1454455852508545, "lr": 4.026615373710603e-05, "tps": 191303, "wall": 10279.7} {"step": 30007, "train_loss": 3.1401660442352295, "lr": 4.026511331431467e-05, "tps": 191220, "wall": 10284.5} {"step": 30008, "train_loss": 3.0773978233337402, "lr": 4.0264074927569824e-05, "tps": 191137, "wall": 10289.3} {"step": 30009, "train_loss": 3.069671869277954, "lr": 4.0263038576883255e-05, "tps": 191053, "wall": 10294.1} {"step": 30010, "train_loss": 2.9451048374176025, "lr": 4.026200426226672e-05, "tps": 190970, "wall": 10299.0} {"step": 30011, "train_loss": 3.0854086875915527, "lr": 4.026097198373191e-05, "tps": 190887, "wall": 10303.8} {"step": 30012, "train_loss": 2.854264259338379, "lr": 4.025994174129053e-05, "tps": 190804, "wall": 10308.6} {"step": 30013, "train_loss": 3.0273756980895996, "lr": 4.025891353495426e-05, "tps": 190722, "wall": 10313.4} {"step": 30014, "train_loss": 3.021714687347412, "lr": 4.0257887364734756e-05, "tps": 190639, "wall": 10318.2} {"step": 30015, "train_loss": 2.9857981204986572, "lr": 4.025686323064361e-05, "tps": 190557, "wall": 10323.0} {"step": 30016, "train_loss": 2.9668726921081543, "lr": 4.025584113269245e-05, "tps": 190474, "wall": 10327.8} {"step": 30017, "train_loss": 2.9899802207946777, "lr": 4.0254821070892846e-05, "tps": 190392, "wall": 10332.6} {"step": 30018, "train_loss": 2.9771084785461426, "lr": 4.025380304525633e-05, "tps": 190310, "wall": 10337.4} {"step": 30019, "train_loss": 3.0637197494506836, "lr": 4.0252787055794494e-05, "tps": 190228, "wall": 10342.3} {"step": 30020, "train_loss": 3.0580837726593018, "lr": 4.025177310251879e-05, "tps": 190146, "wall": 10347.1} {"step": 30021, "train_loss": 3.198465347290039, "lr": 4.0250761185440724e-05, "tps": 190063, "wall": 10351.9} {"step": 30022, "train_loss": 3.065298080444336, "lr": 4.024975130457177e-05, "tps": 189981, "wall": 10356.7} {"step": 30023, "train_loss": 3.18422269821167, "lr": 4.024874345992333e-05, "tps": 189899, "wall": 10361.5} {"step": 30024, "train_loss": 3.052855968475342, "lr": 4.0247737651506876e-05, "tps": 189818, "wall": 10366.3} {"step": 30025, "train_loss": 3.0628857612609863, "lr": 4.024673387933378e-05, "tps": 189736, "wall": 10371.1} {"step": 30026, "train_loss": 3.107403516769409, "lr": 4.0245732143415384e-05, "tps": 189655, "wall": 10375.9} {"step": 30027, "train_loss": 2.9907758235931396, "lr": 4.024473244376307e-05, "tps": 189574, "wall": 10380.7} {"step": 30028, "train_loss": 3.027163028717041, "lr": 4.024373478038815e-05, "tps": 189493, "wall": 10385.5} {"step": 30029, "train_loss": 3.0443034172058105, "lr": 4.024273915330193e-05, "tps": 189412, "wall": 10390.3} {"step": 30030, "train_loss": 3.0090677738189697, "lr": 4.0241745562515686e-05, "tps": 189330, "wall": 10395.1} {"step": 30031, "train_loss": 3.023563861846924, "lr": 4.024075400804066e-05, "tps": 189249, "wall": 10399.9} {"step": 30032, "train_loss": 3.1605591773986816, "lr": 4.023976448988811e-05, "tps": 189168, "wall": 10404.7} {"step": 30033, "train_loss": 3.0479977130889893, "lr": 4.023877700806923e-05, "tps": 189086, "wall": 10409.5} {"step": 30034, "train_loss": 2.9717135429382324, "lr": 4.023779156259521e-05, "tps": 189004, "wall": 10414.4} {"step": 30035, "train_loss": 3.051496744155884, "lr": 4.023680815347721e-05, "tps": 188923, "wall": 10419.3} {"step": 30036, "train_loss": 3.0771090984344482, "lr": 4.0235826780726364e-05, "tps": 188842, "wall": 10424.1} {"step": 30037, "train_loss": 2.9473583698272705, "lr": 4.023484744435383e-05, "tps": 188761, "wall": 10428.9} {"step": 30038, "train_loss": 3.0475778579711914, "lr": 4.0233870144370626e-05, "tps": 188679, "wall": 10433.8} {"step": 30039, "train_loss": 3.0136115550994873, "lr": 4.02328948807879e-05, "tps": 188597, "wall": 10438.6} {"step": 30040, "train_loss": 2.999390125274658, "lr": 4.023192165361665e-05, "tps": 188515, "wall": 10443.5} {"step": 30041, "train_loss": 3.041649580001831, "lr": 4.023095046286792e-05, "tps": 188434, "wall": 10448.4} {"step": 30042, "train_loss": 2.9717931747436523, "lr": 4.02299813085527e-05, "tps": 188353, "wall": 10453.2} {"step": 30043, "train_loss": 3.0547661781311035, "lr": 4.0229014190682e-05, "tps": 188272, "wall": 10458.0} {"step": 30044, "train_loss": 2.961475372314453, "lr": 4.022804910926673e-05, "tps": 188192, "wall": 10462.9} {"step": 30045, "train_loss": 3.0544071197509766, "lr": 4.022708606431784e-05, "tps": 188111, "wall": 10467.7} {"step": 30046, "train_loss": 3.066498041152954, "lr": 4.0226125055846264e-05, "tps": 188030, "wall": 10472.5} {"step": 30047, "train_loss": 2.991997718811035, "lr": 4.0225166083862865e-05, "tps": 187950, "wall": 10477.4} {"step": 30048, "train_loss": 3.036458730697632, "lr": 4.0224209148378514e-05, "tps": 187870, "wall": 10482.2} {"step": 30049, "train_loss": 3.06124210357666, "lr": 4.022325424940403e-05, "tps": 187790, "wall": 10487.0} {"step": 30050, "train_loss": 2.9715490341186523, "lr": 4.022230138695026e-05, "tps": 187711, "wall": 10491.8} {"step": 30051, "train_loss": 3.1471991539001465, "lr": 4.022135056102798e-05, "tps": 187631, "wall": 10496.6} {"step": 30052, "train_loss": 3.0367307662963867, "lr": 4.022040177164798e-05, "tps": 187550, "wall": 10501.5} {"step": 30053, "train_loss": 2.9959254264831543, "lr": 4.0219455018820984e-05, "tps": 187469, "wall": 10506.4} {"step": 30054, "train_loss": 3.08317232131958, "lr": 4.0218510302557724e-05, "tps": 187389, "wall": 10511.2} {"step": 30055, "train_loss": 3.049808979034424, "lr": 4.021756762286891e-05, "tps": 187308, "wall": 10516.1} {"step": 30056, "train_loss": 3.0892982482910156, "lr": 4.021662697976523e-05, "tps": 187227, "wall": 10521.0} {"step": 30057, "train_loss": 2.910073757171631, "lr": 4.021568837325729e-05, "tps": 187145, "wall": 10525.9} {"step": 30058, "train_loss": 3.0403666496276855, "lr": 4.02147518033558e-05, "tps": 187063, "wall": 10530.9} {"step": 30059, "train_loss": 3.127413749694824, "lr": 4.0213817270071296e-05, "tps": 186983, "wall": 10535.7} {"step": 30060, "train_loss": 3.0134119987487793, "lr": 4.0212884773414405e-05, "tps": 186904, "wall": 10540.6} {"step": 30061, "train_loss": 3.1347246170043945, "lr": 4.0211954313395693e-05, "tps": 186825, "wall": 10545.4} {"step": 30062, "train_loss": 2.9536542892456055, "lr": 4.021102589002567e-05, "tps": 186746, "wall": 10550.2} {"step": 30063, "train_loss": 3.0584957599639893, "lr": 4.021009950331489e-05, "tps": 186668, "wall": 10555.0} {"step": 30064, "train_loss": 3.059514045715332, "lr": 4.020917515327382e-05, "tps": 186589, "wall": 10559.8} {"step": 30065, "train_loss": 2.955991744995117, "lr": 4.020825283991295e-05, "tps": 186510, "wall": 10564.6} {"step": 30066, "train_loss": 3.1201603412628174, "lr": 4.020733256324271e-05, "tps": 186432, "wall": 10569.4} {"step": 30067, "train_loss": 3.06002140045166, "lr": 4.020641432327352e-05, "tps": 186353, "wall": 10574.2} {"step": 30068, "train_loss": 3.098942756652832, "lr": 4.020549812001582e-05, "tps": 186275, "wall": 10578.9} {"step": 30069, "train_loss": 2.983865261077881, "lr": 4.020458395347995e-05, "tps": 186197, "wall": 10583.7} {"step": 30070, "train_loss": 3.107557773590088, "lr": 4.020367182367629e-05, "tps": 186119, "wall": 10588.5} {"step": 30071, "train_loss": 3.0938525199890137, "lr": 4.0202761730615154e-05, "tps": 186040, "wall": 10593.4} {"step": 30072, "train_loss": 3.025184154510498, "lr": 4.0201853674306866e-05, "tps": 185961, "wall": 10598.3} {"step": 30073, "train_loss": 3.0404391288757324, "lr": 4.02009476547617e-05, "tps": 185883, "wall": 10603.1} {"step": 30074, "train_loss": 3.0882012844085693, "lr": 4.0200043671989915e-05, "tps": 185804, "wall": 10607.9} {"step": 30075, "train_loss": 2.9959332942962646, "lr": 4.019914172600178e-05, "tps": 185726, "wall": 10612.7} {"step": 30076, "train_loss": 3.0286343097686768, "lr": 4.01982418168075e-05, "tps": 185647, "wall": 10617.6} {"step": 30077, "train_loss": 2.9970717430114746, "lr": 4.019734394441724e-05, "tps": 185568, "wall": 10622.5} {"step": 30078, "train_loss": 3.196105480194092, "lr": 4.0196448108841225e-05, "tps": 185490, "wall": 10627.3} {"step": 30079, "train_loss": 3.0118470191955566, "lr": 4.019555431008955e-05, "tps": 185412, "wall": 10632.1} {"step": 30080, "train_loss": 2.993898868560791, "lr": 4.019466254817236e-05, "tps": 185334, "wall": 10636.9} {"step": 30081, "train_loss": 3.0461809635162354, "lr": 4.0193772823099785e-05, "tps": 185256, "wall": 10641.8} {"step": 30082, "train_loss": 2.9797773361206055, "lr": 4.019288513488185e-05, "tps": 185178, "wall": 10646.6} {"step": 30083, "train_loss": 2.9537758827209473, "lr": 4.019199948352866e-05, "tps": 185100, "wall": 10651.4} {"step": 30084, "train_loss": 3.0876359939575195, "lr": 4.019111586905021e-05, "tps": 185023, "wall": 10656.2} {"step": 30085, "train_loss": 3.0285117626190186, "lr": 4.019023429145655e-05, "tps": 184946, "wall": 10661.0} {"step": 30086, "train_loss": 3.033207654953003, "lr": 4.018935475075764e-05, "tps": 184869, "wall": 10665.8} {"step": 30087, "train_loss": 2.917966842651367, "lr": 4.018847724696343e-05, "tps": 184792, "wall": 10670.6} {"step": 30088, "train_loss": 3.0982611179351807, "lr": 4.0187601780083874e-05, "tps": 184715, "wall": 10675.4} {"step": 30089, "train_loss": 3.145188570022583, "lr": 4.018672835012891e-05, "tps": 184638, "wall": 10680.2} {"step": 30090, "train_loss": 3.0101513862609863, "lr": 4.018585695710841e-05, "tps": 184562, "wall": 10685.0} {"step": 30091, "train_loss": 3.0237488746643066, "lr": 4.0184987601032245e-05, "tps": 184485, "wall": 10689.8} {"step": 30092, "train_loss": 3.1617860794067383, "lr": 4.0184120281910266e-05, "tps": 184407, "wall": 10694.7} {"step": 30093, "train_loss": 3.0218048095703125, "lr": 4.0183254999752316e-05, "tps": 184328, "wall": 10699.6} {"step": 30094, "train_loss": 3.062666416168213, "lr": 4.018239175456816e-05, "tps": 184250, "wall": 10704.5} {"step": 30095, "train_loss": 3.0774998664855957, "lr": 4.018153054636761e-05, "tps": 184172, "wall": 10709.4} {"step": 30096, "train_loss": 3.0974578857421875, "lr": 4.018067137516043e-05, "tps": 184094, "wall": 10714.2} {"step": 30097, "train_loss": 3.0299887657165527, "lr": 4.01798142409563e-05, "tps": 184017, "wall": 10719.1} {"step": 30098, "train_loss": 3.0615944862365723, "lr": 4.017895914376498e-05, "tps": 183941, "wall": 10723.9} {"step": 30099, "train_loss": 2.9694066047668457, "lr": 4.017810608359614e-05, "tps": 183865, "wall": 10728.7} {"step": 30100, "train_loss": 3.046046257019043, "lr": 4.017725506045944e-05, "tps": 183789, "wall": 10733.5} {"step": 30101, "train_loss": 3.0333499908447266, "lr": 4.017640607436451e-05, "tps": 183713, "wall": 10738.3} {"step": 30102, "train_loss": 3.098310947418213, "lr": 4.0175559125320994e-05, "tps": 183636, "wall": 10743.1} {"step": 30103, "train_loss": 3.068375587463379, "lr": 4.017471421333845e-05, "tps": 183560, "wall": 10747.9} {"step": 30104, "train_loss": 3.0168676376342773, "lr": 4.017387133842651e-05, "tps": 183484, "wall": 10752.7} {"step": 30105, "train_loss": 3.0687270164489746, "lr": 4.017303050059465e-05, "tps": 183407, "wall": 10757.6} {"step": 30106, "train_loss": 3.021777391433716, "lr": 4.0172191699852445e-05, "tps": 183331, "wall": 10762.4} {"step": 30107, "train_loss": 2.925750255584717, "lr": 4.017135493620939e-05, "tps": 183255, "wall": 10767.2} {"step": 30108, "train_loss": 2.9405815601348877, "lr": 4.0170520209674935e-05, "tps": 183179, "wall": 10772.1} {"step": 30109, "train_loss": 3.0532925128936768, "lr": 4.016968752025856e-05, "tps": 183103, "wall": 10776.9} {"step": 30110, "train_loss": 3.0865392684936523, "lr": 4.0168856867969705e-05, "tps": 183025, "wall": 10781.9} {"step": 30111, "train_loss": 2.98762583732605, "lr": 4.0168028252817755e-05, "tps": 182947, "wall": 10786.8} {"step": 30112, "train_loss": 3.0303478240966797, "lr": 4.016720167481213e-05, "tps": 182870, "wall": 10791.7} {"step": 30113, "train_loss": 3.0775938034057617, "lr": 4.016637713396215e-05, "tps": 182794, "wall": 10796.6} {"step": 30114, "train_loss": 3.0072858333587646, "lr": 4.016555463027719e-05, "tps": 182718, "wall": 10801.4} {"step": 30115, "train_loss": 3.115044593811035, "lr": 4.016473416376654e-05, "tps": 182641, "wall": 10806.3} {"step": 30116, "train_loss": 2.9585490226745605, "lr": 4.0163915734439525e-05, "tps": 182565, "wall": 10811.2} {"step": 30117, "train_loss": 3.0331475734710693, "lr": 4.0163099342305413e-05, "tps": 182488, "wall": 10816.1} {"step": 30118, "train_loss": 3.1752467155456543, "lr": 4.016228498737343e-05, "tps": 182412, "wall": 10821.0} {"step": 30119, "train_loss": 2.9651129245758057, "lr": 4.01614726696528e-05, "tps": 182335, "wall": 10825.9} {"step": 30120, "train_loss": 3.113152027130127, "lr": 4.016066238915274e-05, "tps": 182257, "wall": 10830.9} {"step": 30121, "train_loss": 3.050172805786133, "lr": 4.015985414588245e-05, "tps": 182181, "wall": 10835.8} {"step": 30122, "train_loss": 2.930166721343994, "lr": 4.0159047939851036e-05, "tps": 182104, "wall": 10840.7} {"step": 30123, "train_loss": 3.0332517623901367, "lr": 4.0158243771067647e-05, "tps": 182029, "wall": 10845.5} {"step": 30124, "train_loss": 3.022357940673828, "lr": 4.0157441639541434e-05, "tps": 181953, "wall": 10850.4} {"step": 30125, "train_loss": 3.0331668853759766, "lr": 4.0156641545281424e-05, "tps": 181878, "wall": 10855.3} {"step": 30126, "train_loss": 3.0269792079925537, "lr": 4.015584348829673e-05, "tps": 181801, "wall": 10860.2} {"step": 30127, "train_loss": 3.0370545387268066, "lr": 4.015504746859635e-05, "tps": 181725, "wall": 10865.1} {"step": 30128, "train_loss": 3.0487852096557617, "lr": 4.015425348618933e-05, "tps": 181649, "wall": 10870.0} {"step": 30129, "train_loss": 2.9918274879455566, "lr": 4.015346154108468e-05, "tps": 181574, "wall": 10874.8} {"step": 30130, "train_loss": 3.0727791786193848, "lr": 4.0152671633291325e-05, "tps": 181499, "wall": 10879.7} {"step": 30131, "train_loss": 3.110647439956665, "lr": 4.015188376281822e-05, "tps": 181424, "wall": 10884.6} {"step": 30132, "train_loss": 3.04587721824646, "lr": 4.015109792967433e-05, "tps": 181350, "wall": 10889.4} {"step": 30133, "train_loss": 2.946550130844116, "lr": 4.015031413386853e-05, "tps": 181275, "wall": 10894.3} {"step": 30134, "train_loss": 2.9899797439575195, "lr": 4.014953237540968e-05, "tps": 181199, "wall": 10899.2} {"step": 30135, "train_loss": 3.084533929824829, "lr": 4.014875265430667e-05, "tps": 181125, "wall": 10904.0} {"step": 30136, "train_loss": 3.056093215942383, "lr": 4.014797497056832e-05, "tps": 181052, "wall": 10908.8} {"step": 30137, "train_loss": 3.148139715194702, "lr": 4.014719932420345e-05, "tps": 180979, "wall": 10913.5} {"step": 30138, "train_loss": 3.1252059936523438, "lr": 4.014642571522081e-05, "tps": 180904, "wall": 10918.4} {"step": 30139, "train_loss": 3.0481951236724854, "lr": 4.014565414362922e-05, "tps": 180830, "wall": 10923.2} {"step": 30140, "train_loss": 2.9791250228881836, "lr": 4.014488460943737e-05, "tps": 180756, "wall": 10928.1} {"step": 30141, "train_loss": 2.997082233428955, "lr": 4.0144117112654e-05, "tps": 180683, "wall": 10932.9} {"step": 30142, "train_loss": 3.059051513671875, "lr": 4.0143351653287806e-05, "tps": 180609, "wall": 10937.7} {"step": 30143, "train_loss": 2.9822795391082764, "lr": 4.0142588231347444e-05, "tps": 180537, "wall": 10942.4} {"step": 30144, "train_loss": 3.0725977420806885, "lr": 4.0141826846841586e-05, "tps": 180463, "wall": 10947.2} {"step": 30145, "train_loss": 3.0188586711883545, "lr": 4.014106749977883e-05, "tps": 180390, "wall": 10952.1} {"step": 30146, "train_loss": 3.0767226219177246, "lr": 4.0140310190167814e-05, "tps": 180316, "wall": 10956.9} {"step": 30147, "train_loss": 3.1979598999023438, "lr": 4.013955491801708e-05, "tps": 180242, "wall": 10961.8} {"step": 30148, "train_loss": 3.089155912399292, "lr": 4.01388016833352e-05, "tps": 180169, "wall": 10966.6} {"step": 30149, "train_loss": 3.0089430809020996, "lr": 4.0138050486130705e-05, "tps": 180096, "wall": 10971.4} {"step": 30150, "train_loss": 3.019942283630371, "lr": 4.0137301326412104e-05, "tps": 180023, "wall": 10976.2} {"step": 30151, "train_loss": 2.9552834033966064, "lr": 4.0136554204187875e-05, "tps": 179951, "wall": 10981.0} {"step": 30152, "train_loss": 3.1148438453674316, "lr": 4.01358091194665e-05, "tps": 179879, "wall": 10985.7} {"step": 30153, "train_loss": 3.0639455318450928, "lr": 4.013506607225642e-05, "tps": 179807, "wall": 10990.5} {"step": 30154, "train_loss": 3.1054677963256836, "lr": 4.013432506256602e-05, "tps": 179734, "wall": 10995.3} {"step": 30155, "train_loss": 3.010267972946167, "lr": 4.0133586090403725e-05, "tps": 179662, "wall": 11000.1} {"step": 30156, "train_loss": 3.0739426612854004, "lr": 4.01328491557779e-05, "tps": 179585, "wall": 11005.2} {"step": 30157, "train_loss": 3.0537567138671875, "lr": 4.013211425869689e-05, "tps": 179509, "wall": 11010.2} {"step": 30158, "train_loss": 2.9535722732543945, "lr": 4.0131381399169035e-05, "tps": 179437, "wall": 11015.0} {"step": 30159, "train_loss": 3.088991165161133, "lr": 4.013065057720259e-05, "tps": 179365, "wall": 11019.8} {"step": 30160, "train_loss": 3.018155336380005, "lr": 4.012992179280587e-05, "tps": 179293, "wall": 11024.6} {"step": 30161, "train_loss": 3.1213059425354004, "lr": 4.012919504598715e-05, "tps": 179221, "wall": 11029.3} {"step": 30162, "train_loss": 3.0483946800231934, "lr": 4.012847033675462e-05, "tps": 179149, "wall": 11034.1} {"step": 30163, "train_loss": 3.0292296409606934, "lr": 4.0127747665116536e-05, "tps": 179077, "wall": 11039.0} {"step": 30164, "train_loss": 3.046330451965332, "lr": 4.012702703108103e-05, "tps": 179004, "wall": 11043.8} {"step": 30165, "train_loss": 3.030851125717163, "lr": 4.012630843465631e-05, "tps": 178932, "wall": 11048.6} {"step": 30166, "train_loss": 3.0601840019226074, "lr": 4.0125591875850495e-05, "tps": 178861, "wall": 11053.4} {"step": 30167, "train_loss": 2.983120918273926, "lr": 4.012487735467169e-05, "tps": 178790, "wall": 11058.1} {"step": 30168, "train_loss": 3.0175976753234863, "lr": 4.0124164871128025e-05, "tps": 178719, "wall": 11062.9} {"step": 30169, "train_loss": 2.9871439933776855, "lr": 4.012345442522754e-05, "tps": 178647, "wall": 11067.7} {"step": 30170, "train_loss": 2.9423394203186035, "lr": 4.0122746016978295e-05, "tps": 178574, "wall": 11072.6} {"step": 30171, "train_loss": 3.0907585620880127, "lr": 4.012203964638832e-05, "tps": 178502, "wall": 11077.4} {"step": 30172, "train_loss": 3.049140214920044, "lr": 4.012133531346561e-05, "tps": 178429, "wall": 11082.3} {"step": 30173, "train_loss": 2.9614977836608887, "lr": 4.0120633018218154e-05, "tps": 178357, "wall": 11087.2} {"step": 30174, "train_loss": 3.0969486236572266, "lr": 4.011993276065388e-05, "tps": 178285, "wall": 11092.0} {"step": 30175, "train_loss": 2.956181287765503, "lr": 4.0119234540780745e-05, "tps": 178214, "wall": 11096.8} {"step": 30176, "train_loss": 3.071131706237793, "lr": 4.011853835860665e-05, "tps": 178143, "wall": 11101.6} {"step": 30177, "train_loss": 3.0781586170196533, "lr": 4.011784421413951e-05, "tps": 178072, "wall": 11106.4} {"step": 30178, "train_loss": 3.0240609645843506, "lr": 4.011715210738713e-05, "tps": 178001, "wall": 11111.2} {"step": 30179, "train_loss": 3.0860517024993896, "lr": 4.0116462038357396e-05, "tps": 177931, "wall": 11115.9} {"step": 30180, "train_loss": 3.030211925506592, "lr": 4.0115774007058104e-05, "tps": 177861, "wall": 11120.7} {"step": 30181, "train_loss": 2.9597368240356445, "lr": 4.011508801349707e-05, "tps": 177791, "wall": 11125.5} {"step": 30182, "train_loss": 3.0142269134521484, "lr": 4.011440405768202e-05, "tps": 177719, "wall": 11130.3} {"step": 30183, "train_loss": 2.9663662910461426, "lr": 4.0113722139620766e-05, "tps": 177649, "wall": 11135.1} {"step": 30184, "train_loss": 3.0870816707611084, "lr": 4.011304225932099e-05, "tps": 177579, "wall": 11139.9} {"step": 30185, "train_loss": 3.106674909591675, "lr": 4.01123644167904e-05, "tps": 177508, "wall": 11144.7} {"step": 30186, "train_loss": 3.05745267868042, "lr": 4.0111688612036685e-05, "tps": 177438, "wall": 11149.4} {"step": 30187, "train_loss": 2.9442718029022217, "lr": 4.0111014845067466e-05, "tps": 177368, "wall": 11154.2} {"step": 30188, "train_loss": 3.056082010269165, "lr": 4.011034311589042e-05, "tps": 177297, "wall": 11159.0} {"step": 30189, "train_loss": 3.1017098426818848, "lr": 4.010967342451315e-05, "tps": 177226, "wall": 11163.9} {"step": 30190, "train_loss": 3.0531671047210693, "lr": 4.010900577094322e-05, "tps": 177155, "wall": 11168.7} {"step": 30191, "train_loss": 3.018717050552368, "lr": 4.0108340155188206e-05, "tps": 177083, "wall": 11173.6} {"step": 30192, "train_loss": 3.0712313652038574, "lr": 4.010767657725567e-05, "tps": 177013, "wall": 11178.4} {"step": 30193, "train_loss": 3.0810317993164062, "lr": 4.010701503715307e-05, "tps": 176943, "wall": 11183.2} {"step": 30194, "train_loss": 3.0739569664001465, "lr": 4.010635553488795e-05, "tps": 176872, "wall": 11188.0} {"step": 30195, "train_loss": 3.0088093280792236, "lr": 4.010569807046776e-05, "tps": 176802, "wall": 11192.9} {"step": 30196, "train_loss": 3.0269644260406494, "lr": 4.0105042643899964e-05, "tps": 176732, "wall": 11197.7} {"step": 30197, "train_loss": 3.088233470916748, "lr": 4.0104389255191964e-05, "tps": 176663, "wall": 11202.4} {"step": 30198, "train_loss": 2.98279070854187, "lr": 4.01037379043512e-05, "tps": 176593, "wall": 11207.2} {"step": 30199, "train_loss": 3.1166720390319824, "lr": 4.0103088591385007e-05, "tps": 176524, "wall": 11212.0} {"step": 30200, "train_loss": 2.9739952087402344, "lr": 4.0102441316300754e-05, "tps": 176455, "wall": 11216.7} {"step": 30201, "train_loss": 3.012748956680298, "lr": 4.010179607910578e-05, "tps": 176386, "wall": 11221.5} {"step": 30202, "train_loss": 3.1032793521881104, "lr": 4.01011528798074e-05, "tps": 176316, "wall": 11226.3} {"step": 30203, "train_loss": 3.0594027042388916, "lr": 4.01005117184129e-05, "tps": 176247, "wall": 11231.1} {"step": 30204, "train_loss": 3.0513923168182373, "lr": 4.009987259492953e-05, "tps": 176178, "wall": 11235.9} {"step": 30205, "train_loss": 3.0488133430480957, "lr": 4.009923550936452e-05, "tps": 176109, "wall": 11240.6} {"step": 30206, "train_loss": 3.034115791320801, "lr": 4.009860046172513e-05, "tps": 176040, "wall": 11245.4} {"step": 30207, "train_loss": 3.0153868198394775, "lr": 4.00979674520185e-05, "tps": 175970, "wall": 11250.3} {"step": 30208, "train_loss": 3.001079797744751, "lr": 4.009733648025184e-05, "tps": 175901, "wall": 11255.1} {"step": 30209, "train_loss": 3.0310616493225098, "lr": 4.0096707546432275e-05, "tps": 175832, "wall": 11259.8} {"step": 30210, "train_loss": 3.017704725265503, "lr": 4.009608065056696e-05, "tps": 175763, "wall": 11264.6} {"step": 30211, "train_loss": 3.0090794563293457, "lr": 4.009545579266296e-05, "tps": 175692, "wall": 11269.5} {"step": 30212, "train_loss": 3.054290533065796, "lr": 4.0094832972727373e-05, "tps": 175621, "wall": 11274.5} {"step": 30213, "train_loss": 3.1045663356781006, "lr": 4.009421219076724e-05, "tps": 175550, "wall": 11279.4} {"step": 30214, "train_loss": 2.9640254974365234, "lr": 4.0093593446789625e-05, "tps": 175481, "wall": 11284.2} {"step": 30215, "train_loss": 3.001887559890747, "lr": 4.009297674080151e-05, "tps": 175412, "wall": 11289.0} {"step": 30216, "train_loss": 3.0728116035461426, "lr": 4.009236207280988e-05, "tps": 175344, "wall": 11293.8} {"step": 30217, "train_loss": 2.9940850734710693, "lr": 4.0091749442821705e-05, "tps": 175275, "wall": 11298.6} {"step": 30218, "train_loss": 3.0410523414611816, "lr": 4.009113885084392e-05, "tps": 175207, "wall": 11303.3} {"step": 30219, "train_loss": 2.9835128784179688, "lr": 4.009053029688346e-05, "tps": 175138, "wall": 11308.2} {"step": 30220, "train_loss": 3.002289056777954, "lr": 4.00899237809472e-05, "tps": 175068, "wall": 11313.1} {"step": 30221, "train_loss": 3.130488872528076, "lr": 4.0089319303042016e-05, "tps": 174999, "wall": 11317.9} {"step": 30222, "train_loss": 2.970918893814087, "lr": 4.0088716863174764e-05, "tps": 174930, "wall": 11322.8} {"step": 30223, "train_loss": 2.873194932937622, "lr": 4.008811646135224e-05, "tps": 174861, "wall": 11327.6} {"step": 30224, "train_loss": 2.975250244140625, "lr": 4.008751809758129e-05, "tps": 174791, "wall": 11332.5} {"step": 30225, "train_loss": 3.036487102508545, "lr": 4.008692177186866e-05, "tps": 174722, "wall": 11337.4} {"step": 30226, "train_loss": 3.0985512733459473, "lr": 4.0086327484221106e-05, "tps": 174653, "wall": 11342.2} {"step": 30227, "train_loss": 2.9795544147491455, "lr": 4.008573523464537e-05, "tps": 174584, "wall": 11347.1} {"step": 30228, "train_loss": 3.1578145027160645, "lr": 4.0085145023148174e-05, "tps": 174514, "wall": 11352.0} {"step": 30229, "train_loss": 3.003877878189087, "lr": 4.008455684973615e-05, "tps": 174441, "wall": 11357.1} {"step": 30230, "train_loss": 2.967423439025879, "lr": 4.008397071441604e-05, "tps": 174371, "wall": 11362.1} {"step": 30231, "train_loss": 3.006709575653076, "lr": 4.008338661719443e-05, "tps": 174299, "wall": 11367.1} {"step": 30232, "train_loss": 2.899299144744873, "lr": 4.008280455807794e-05, "tps": 174229, "wall": 11372.1} {"step": 30233, "train_loss": 2.9160780906677246, "lr": 4.008222453707318e-05, "tps": 174161, "wall": 11376.9} {"step": 30234, "train_loss": 3.104470729827881, "lr": 4.008164655418673e-05, "tps": 174092, "wall": 11381.8} {"step": 30235, "train_loss": 3.0866799354553223, "lr": 4.0081070609425104e-05, "tps": 174023, "wall": 11386.7} {"step": 30236, "train_loss": 2.9954450130462646, "lr": 4.008049670279484e-05, "tps": 173955, "wall": 11391.5} {"step": 30237, "train_loss": 3.0928070545196533, "lr": 4.007992483430244e-05, "tps": 173887, "wall": 11396.3} {"step": 30238, "train_loss": 3.0788686275482178, "lr": 4.0079355003954395e-05, "tps": 173815, "wall": 11401.4} {"step": 30239, "train_loss": 3.1149420738220215, "lr": 4.007878721175716e-05, "tps": 173748, "wall": 11406.2} {"step": 30240, "train_loss": 3.1008827686309814, "lr": 4.007822145771714e-05, "tps": 173680, "wall": 11411.0} {"step": 30241, "train_loss": 3.039271354675293, "lr": 4.0077657741840766e-05, "tps": 173613, "wall": 11415.8} {"step": 30242, "train_loss": 3.06917142868042, "lr": 4.007709606413442e-05, "tps": 173543, "wall": 11420.8} {"step": 30243, "train_loss": 3.0826501846313477, "lr": 4.0076536424604464e-05, "tps": 173473, "wall": 11425.8} {"step": 30244, "train_loss": 3.0561742782592773, "lr": 4.007597882325722e-05, "tps": 173402, "wall": 11430.8} {"step": 30245, "train_loss": 2.9802918434143066, "lr": 4.0075423260099046e-05, "tps": 173333, "wall": 11435.8} {"step": 30246, "train_loss": 3.0267395973205566, "lr": 4.00748697351362e-05, "tps": 173259, "wall": 11441.1} {"step": 30247, "train_loss": 3.0951485633850098, "lr": 4.007431824837496e-05, "tps": 173190, "wall": 11445.9} {"step": 30248, "train_loss": 3.0276997089385986, "lr": 4.007376879982159e-05, "tps": 173122, "wall": 11450.8} {"step": 30249, "train_loss": 3.086681842803955, "lr": 4.007322138948229e-05, "tps": 173055, "wall": 11455.7} {"step": 30250, "train_loss": 3.009361743927002, "lr": 4.007267601736329e-05, "tps": 172988, "wall": 11460.5} {"step": 30251, "train_loss": 3.057875394821167, "lr": 4.007213268347073e-05, "tps": 172920, "wall": 11465.3} {"step": 30252, "train_loss": 2.8796653747558594, "lr": 4.007159138781079e-05, "tps": 172853, "wall": 11470.2} {"step": 30253, "train_loss": 3.001314640045166, "lr": 4.0071052130389594e-05, "tps": 172785, "wall": 11475.0} {"step": 30254, "train_loss": 3.113089084625244, "lr": 4.007051491121325e-05, "tps": 172716, "wall": 11480.0} {"step": 30255, "train_loss": 3.1104578971862793, "lr": 4.0069979730287857e-05, "tps": 172645, "wall": 11485.1} {"step": 30256, "train_loss": 3.0807180404663086, "lr": 4.006944658761946e-05, "tps": 172573, "wall": 11490.3} {"step": 30257, "train_loss": 2.939875602722168, "lr": 4.006891548321411e-05, "tps": 172504, "wall": 11495.3} {"step": 30258, "train_loss": 3.0971455574035645, "lr": 4.006838641707782e-05, "tps": 172436, "wall": 11500.2} {"step": 30259, "train_loss": 3.0687220096588135, "lr": 4.006785938921657e-05, "tps": 172364, "wall": 11505.4} {"step": 30260, "train_loss": 2.907663583755493, "lr": 4.0067334399636367e-05, "tps": 172295, "wall": 11510.4} {"step": 30261, "train_loss": 2.9980359077453613, "lr": 4.0066811448343115e-05, "tps": 172227, "wall": 11515.3} {"step": 30262, "train_loss": 3.0611891746520996, "lr": 4.006629053534276e-05, "tps": 172160, "wall": 11520.2} {"step": 30263, "train_loss": 3.039638042449951, "lr": 4.006577166064122e-05, "tps": 172092, "wall": 11525.1} {"step": 30264, "train_loss": 3.1648855209350586, "lr": 4.006525482424434e-05, "tps": 172023, "wall": 11530.1} {"step": 30265, "train_loss": 3.0464980602264404, "lr": 4.0064740026157975e-05, "tps": 171955, "wall": 11535.1} {"step": 30266, "train_loss": 2.984870433807373, "lr": 4.0064227266387995e-05, "tps": 171888, "wall": 11539.9} {"step": 30267, "train_loss": 3.0593905448913574, "lr": 4.006371654494016e-05, "tps": 171822, "wall": 11544.7} {"step": 30268, "train_loss": 3.087161064147949, "lr": 4.006320786182027e-05, "tps": 171757, "wall": 11549.5} {"step": 30269, "train_loss": 3.037288188934326, "lr": 4.006270121703413e-05, "tps": 171691, "wall": 11554.3} {"step": 30270, "train_loss": 3.125908136367798, "lr": 4.006219661058742e-05, "tps": 171626, "wall": 11559.1} {"step": 30271, "train_loss": 3.0882835388183594, "lr": 4.0061694042485885e-05, "tps": 171560, "wall": 11563.9} {"step": 30272, "train_loss": 2.9602251052856445, "lr": 4.0061193512735216e-05, "tps": 171495, "wall": 11568.6} {"step": 30273, "train_loss": 3.0678887367248535, "lr": 4.006069502134108e-05, "tps": 171430, "wall": 11573.4} {"step": 30274, "train_loss": 3.066643238067627, "lr": 4.0060198568309134e-05, "tps": 171366, "wall": 11578.1} {"step": 30275, "train_loss": 2.9720890522003174, "lr": 4.005970415364498e-05, "tps": 171300, "wall": 11583.0} {"step": 30276, "train_loss": 2.9715020656585693, "lr": 4.005921177735424e-05, "tps": 171233, "wall": 11587.9} {"step": 30277, "train_loss": 3.0621514320373535, "lr": 4.005872143944249e-05, "tps": 171167, "wall": 11592.7} {"step": 30278, "train_loss": 2.973895788192749, "lr": 4.005823313991526e-05, "tps": 171101, "wall": 11597.6} {"step": 30279, "train_loss": 3.112550973892212, "lr": 4.005774687877812e-05, "tps": 171036, "wall": 11602.4} {"step": 30280, "train_loss": 3.037348985671997, "lr": 4.0057262656036534e-05, "tps": 170971, "wall": 11607.2} {"step": 30281, "train_loss": 2.972740650177002, "lr": 4.0056780471696044e-05, "tps": 170906, "wall": 11612.0} {"step": 30282, "train_loss": 3.0394346714019775, "lr": 4.005630032576205e-05, "tps": 170840, "wall": 11616.8} {"step": 30283, "train_loss": 3.0337541103363037, "lr": 4.0055822218240035e-05, "tps": 170774, "wall": 11621.7} {"step": 30284, "train_loss": 2.9884912967681885, "lr": 4.00553461491354e-05, "tps": 170707, "wall": 11626.6} {"step": 30285, "train_loss": 3.108879327774048, "lr": 4.005487211845354e-05, "tps": 170642, "wall": 11631.5} {"step": 30286, "train_loss": 3.0649662017822266, "lr": 4.005440012619981e-05, "tps": 170576, "wall": 11636.3} {"step": 30287, "train_loss": 2.9955687522888184, "lr": 4.0053930172379595e-05, "tps": 170511, "wall": 11641.2} {"step": 30288, "train_loss": 3.0961642265319824, "lr": 4.005346225699817e-05, "tps": 170445, "wall": 11646.0} {"step": 30289, "train_loss": 2.9708566665649414, "lr": 4.0052996380060864e-05, "tps": 170379, "wall": 11651.0} {"step": 30290, "train_loss": 2.931976556777954, "lr": 4.005253254157296e-05, "tps": 170315, "wall": 11655.7} {"step": 30291, "train_loss": 2.9730119705200195, "lr": 4.00520707415397e-05, "tps": 170249, "wall": 11660.6} {"step": 30292, "train_loss": 3.0814435482025146, "lr": 4.005161097996632e-05, "tps": 170185, "wall": 11665.4} {"step": 30293, "train_loss": 3.008424758911133, "lr": 4.0051153256858e-05, "tps": 170119, "wall": 11670.3} {"step": 30294, "train_loss": 3.0459353923797607, "lr": 4.005069757221998e-05, "tps": 170054, "wall": 11675.2} {"step": 30295, "train_loss": 3.0722246170043945, "lr": 4.005024392605738e-05, "tps": 169989, "wall": 11680.0} {"step": 30296, "train_loss": 3.0339484214782715, "lr": 4.0049792318375353e-05, "tps": 169923, "wall": 11685.0} {"step": 30297, "train_loss": 3.0775160789489746, "lr": 4.004934274917902e-05, "tps": 169858, "wall": 11689.8} {"step": 30298, "train_loss": 3.066096067428589, "lr": 4.004889521847347e-05, "tps": 169793, "wall": 11694.6} {"step": 30299, "train_loss": 3.091895818710327, "lr": 4.004844972626377e-05, "tps": 169729, "wall": 11699.5} {"step": 30300, "train_loss": 3.058640718460083, "lr": 4.004800627255496e-05, "tps": 169664, "wall": 11704.3} {"step": 30301, "train_loss": 3.012017250061035, "lr": 4.0047564857352066e-05, "tps": 169599, "wall": 11709.2} {"step": 30302, "train_loss": 2.9481897354125977, "lr": 4.0047125480660094e-05, "tps": 169535, "wall": 11714.0} {"step": 30303, "train_loss": 3.0350589752197266, "lr": 4.004668814248404e-05, "tps": 169471, "wall": 11718.8} {"step": 30304, "train_loss": 2.9769396781921387, "lr": 4.0046252842828816e-05, "tps": 169406, "wall": 11723.7} {"step": 30305, "train_loss": 3.078644037246704, "lr": 4.004581958169938e-05, "tps": 169340, "wall": 11728.6} {"step": 30306, "train_loss": 3.0465006828308105, "lr": 4.0045388359100636e-05, "tps": 169273, "wall": 11733.7} {"step": 30307, "train_loss": 3.0428504943847656, "lr": 4.004495917503747e-05, "tps": 169209, "wall": 11738.5} {"step": 30308, "train_loss": 3.0193214416503906, "lr": 4.0044532029514734e-05, "tps": 169141, "wall": 11743.6} {"step": 30309, "train_loss": 3.134701728820801, "lr": 4.0044106922537276e-05, "tps": 169076, "wall": 11748.5} {"step": 30310, "train_loss": 2.9815850257873535, "lr": 4.0043683854109925e-05, "tps": 169012, "wall": 11753.3} {"step": 30311, "train_loss": 3.0195016860961914, "lr": 4.004326282423744e-05, "tps": 168949, "wall": 11758.1} {"step": 30312, "train_loss": 3.0183639526367188, "lr": 4.004284383292464e-05, "tps": 168885, "wall": 11763.0} {"step": 30313, "train_loss": 3.0486645698547363, "lr": 4.004242688017621e-05, "tps": 168821, "wall": 11767.8} {"step": 30314, "train_loss": 3.0393121242523193, "lr": 4.004201196599691e-05, "tps": 168757, "wall": 11772.6} {"step": 30315, "train_loss": 3.0607986450195312, "lr": 4.004159909039143e-05, "tps": 168694, "wall": 11777.5} {"step": 30316, "train_loss": 3.1123805046081543, "lr": 4.004118825336447e-05, "tps": 168630, "wall": 11782.3} {"step": 30317, "train_loss": 3.020989418029785, "lr": 4.0040779454920654e-05, "tps": 168566, "wall": 11787.2} {"step": 30318, "train_loss": 3.1127827167510986, "lr": 4.004037269506462e-05, "tps": 168501, "wall": 11792.1} {"step": 30319, "train_loss": 3.065492630004883, "lr": 4.0039967973800975e-05, "tps": 168436, "wall": 11797.0} {"step": 30320, "train_loss": 2.965916872024536, "lr": 4.0039565291134324e-05, "tps": 168371, "wall": 11802.0} {"step": 30321, "train_loss": 3.003669500350952, "lr": 4.00391646470692e-05, "tps": 168305, "wall": 11807.0} {"step": 30322, "train_loss": 3.093367576599121, "lr": 4.003876604161016e-05, "tps": 168240, "wall": 11812.0} {"step": 30323, "train_loss": 3.016838788986206, "lr": 4.00383694747617e-05, "tps": 168175, "wall": 11816.9} {"step": 30324, "train_loss": 3.04111909866333, "lr": 4.003797494652836e-05, "tps": 168111, "wall": 11821.8} {"step": 30325, "train_loss": 3.04433274269104, "lr": 4.0037582456914544e-05, "tps": 168047, "wall": 11826.7} {"step": 30326, "train_loss": 3.078033924102783, "lr": 4.0037192005924746e-05, "tps": 167983, "wall": 11831.6} {"step": 30327, "train_loss": 2.9875030517578125, "lr": 4.0036803593563356e-05, "tps": 167919, "wall": 11836.5} {"step": 30328, "train_loss": 3.041343927383423, "lr": 4.00364172198348e-05, "tps": 167855, "wall": 11841.4} {"step": 30329, "train_loss": 3.1217052936553955, "lr": 4.0036032884743445e-05, "tps": 167790, "wall": 11846.4} {"step": 30330, "train_loss": 3.02972149848938, "lr": 4.003565058829365e-05, "tps": 167724, "wall": 11851.4} {"step": 30331, "train_loss": 2.985111951828003, "lr": 4.003527033048975e-05, "tps": 167660, "wall": 11856.4} {"step": 30332, "train_loss": 3.055665969848633, "lr": 4.003489211133603e-05, "tps": 167595, "wall": 11861.3} {"step": 30333, "train_loss": 2.9949498176574707, "lr": 4.00345159308368e-05, "tps": 167531, "wall": 11866.3} {"step": 30334, "train_loss": 2.9942381381988525, "lr": 4.003414178899629e-05, "tps": 167467, "wall": 11871.1} {"step": 30335, "train_loss": 2.9709577560424805, "lr": 4.003376968581878e-05, "tps": 167404, "wall": 11876.0} {"step": 30336, "train_loss": 3.0154595375061035, "lr": 4.0033399621308444e-05, "tps": 167340, "wall": 11881.0} {"step": 30337, "train_loss": 3.05588436126709, "lr": 4.00330315954695e-05, "tps": 167277, "wall": 11885.9} {"step": 30338, "train_loss": 3.045830249786377, "lr": 4.003266560830611e-05, "tps": 167213, "wall": 11890.8} {"step": 30339, "train_loss": 3.0762743949890137, "lr": 4.003230165982241e-05, "tps": 167149, "wall": 11895.7} {"step": 30340, "train_loss": 3.1040754318237305, "lr": 4.003193975002255e-05, "tps": 167086, "wall": 11900.6} {"step": 30341, "train_loss": 2.9696590900421143, "lr": 4.003157987891062e-05, "tps": 167023, "wall": 11905.5} {"step": 30342, "train_loss": 3.0014514923095703, "lr": 4.003122204649066e-05, "tps": 166960, "wall": 11910.4} {"step": 30343, "train_loss": 3.0361008644104004, "lr": 4.003086625276678e-05, "tps": 166897, "wall": 11915.2} {"step": 30344, "train_loss": 3.0826807022094727, "lr": 4.003051249774297e-05, "tps": 166835, "wall": 11920.1} {"step": 30345, "train_loss": 3.1098217964172363, "lr": 4.003016078142325e-05, "tps": 166772, "wall": 11924.9} {"step": 30346, "train_loss": 3.063511848449707, "lr": 4.002981110381161e-05, "tps": 166711, "wall": 11929.7} {"step": 30347, "train_loss": 2.9830687046051025, "lr": 4.0029463464912e-05, "tps": 166649, "wall": 11934.6} {"step": 30348, "train_loss": 3.0866899490356445, "lr": 4.002911786472837e-05, "tps": 166587, "wall": 11939.4} {"step": 30349, "train_loss": 3.0563173294067383, "lr": 4.002877430326463e-05, "tps": 166524, "wall": 11944.3} {"step": 30350, "train_loss": 3.019455909729004, "lr": 4.0028432780524664e-05, "tps": 166462, "wall": 11949.2} {"step": 30351, "train_loss": 2.991917371749878, "lr": 4.0028093296512345e-05, "tps": 166400, "wall": 11954.0} {"step": 30352, "train_loss": 3.066948652267456, "lr": 4.002775585123153e-05, "tps": 166338, "wall": 11958.8} {"step": 30353, "train_loss": 2.9863598346710205, "lr": 4.0027420444686026e-05, "tps": 166275, "wall": 11963.8} {"step": 30354, "train_loss": 3.0606460571289062, "lr": 4.002708707687965e-05, "tps": 166212, "wall": 11968.7} {"step": 30355, "train_loss": 3.0402894020080566, "lr": 4.002675574781616e-05, "tps": 166150, "wall": 11973.6} {"step": 30356, "train_loss": 3.064549207687378, "lr": 4.0026426457499325e-05, "tps": 166089, "wall": 11978.4} {"step": 30357, "train_loss": 2.9730377197265625, "lr": 4.002609920593286e-05, "tps": 166026, "wall": 11983.3} {"step": 30358, "train_loss": 3.0473055839538574, "lr": 4.002577399312049e-05, "tps": 165965, "wall": 11988.1} {"step": 30359, "train_loss": 2.935936212539673, "lr": 4.0025450819065866e-05, "tps": 165904, "wall": 11992.9} {"step": 30360, "train_loss": 3.133406162261963, "lr": 4.002512968377269e-05, "tps": 165842, "wall": 11997.7} {"step": 30361, "train_loss": 2.9529337882995605, "lr": 4.0024810587244565e-05, "tps": 165781, "wall": 12002.6} {"step": 30362, "train_loss": 2.9954075813293457, "lr": 4.0024493529485144e-05, "tps": 165720, "wall": 12007.4} {"step": 30363, "train_loss": 2.993211269378662, "lr": 4.0024178510497984e-05, "tps": 165660, "wall": 12012.1} {"step": 30364, "train_loss": 3.0834014415740967, "lr": 4.0023865530286676e-05, "tps": 165600, "wall": 12016.9} {"step": 30365, "train_loss": 3.0073633193969727, "lr": 4.002355458885476e-05, "tps": 165539, "wall": 12021.7} {"step": 30366, "train_loss": 3.043168306350708, "lr": 4.0023245686205734e-05, "tps": 165478, "wall": 12026.6} {"step": 30367, "train_loss": 3.1421945095062256, "lr": 4.002293882234311e-05, "tps": 165415, "wall": 12031.5} {"step": 30368, "train_loss": 3.0319221019744873, "lr": 4.002263399727041e-05, "tps": 165354, "wall": 12036.3} {"step": 30369, "train_loss": 2.9790921211242676, "lr": 4.002233121099102e-05, "tps": 165292, "wall": 12041.2} {"step": 30370, "train_loss": 2.9656496047973633, "lr": 4.00220304635084e-05, "tps": 165231, "wall": 12046.1} {"step": 30371, "train_loss": 3.1235859394073486, "lr": 4.002173175482597e-05, "tps": 165171, "wall": 12050.9} {"step": 30372, "train_loss": 3.103994131088257, "lr": 4.002143508494709e-05, "tps": 165109, "wall": 12055.8} {"step": 30373, "train_loss": 3.1457130908966064, "lr": 4.0021140453875135e-05, "tps": 165049, "wall": 12060.6} {"step": 30374, "train_loss": 2.9598145484924316, "lr": 4.002084786161343e-05, "tps": 164988, "wall": 12065.4} {"step": 30375, "train_loss": 3.090592622756958, "lr": 4.002055730816529e-05, "tps": 164928, "wall": 12070.2} {"step": 30376, "train_loss": 2.9564549922943115, "lr": 4.002026879353403e-05, "tps": 164867, "wall": 12075.1} {"step": 30377, "train_loss": 3.0628116130828857, "lr": 4.0019982317722896e-05, "tps": 164806, "wall": 12079.9} {"step": 30378, "train_loss": 3.0684359073638916, "lr": 4.001969788073513e-05, "tps": 164746, "wall": 12084.7} {"step": 30379, "train_loss": 2.979851722717285, "lr": 4.0019415482573975e-05, "tps": 164686, "wall": 12089.6} {"step": 30380, "train_loss": 3.0612759590148926, "lr": 4.001913512324262e-05, "tps": 164624, "wall": 12094.5} {"step": 30381, "train_loss": 3.124624490737915, "lr": 4.0018856802744234e-05, "tps": 164563, "wall": 12099.4} {"step": 30382, "train_loss": 3.1169090270996094, "lr": 4.0018580521081986e-05, "tps": 164503, "wall": 12104.2} {"step": 30383, "train_loss": 3.078479290008545, "lr": 4.0018306278258976e-05, "tps": 164435, "wall": 12109.6} {"step": 30384, "train_loss": 3.1167564392089844, "lr": 4.001803407427834e-05, "tps": 164372, "wall": 12114.6} {"step": 30385, "train_loss": 3.0767006874084473, "lr": 4.0017763909143136e-05, "tps": 164308, "wall": 12119.8} {"step": 30386, "train_loss": 3.1174468994140625, "lr": 4.001749578285646e-05, "tps": 164245, "wall": 12124.8} {"step": 30387, "train_loss": 3.005268096923828, "lr": 4.001722969542132e-05, "tps": 164184, "wall": 12129.7} {"step": 30388, "train_loss": 3.035245895385742, "lr": 4.001696564684074e-05, "tps": 164123, "wall": 12134.6} {"step": 30389, "train_loss": 3.0487406253814697, "lr": 4.0016703637117706e-05, "tps": 164063, "wall": 12139.4} {"step": 30390, "train_loss": 3.0565176010131836, "lr": 4.001644366625521e-05, "tps": 164003, "wall": 12144.3} {"step": 30391, "train_loss": 3.1296868324279785, "lr": 4.0016185734256145e-05, "tps": 163943, "wall": 12149.1} {"step": 30392, "train_loss": 3.1650304794311523, "lr": 4.001592984112348e-05, "tps": 163882, "wall": 12154.0} {"step": 30393, "train_loss": 3.03177809715271, "lr": 4.001567598686009e-05, "tps": 163822, "wall": 12158.9} {"step": 30394, "train_loss": 2.943244218826294, "lr": 4.001542417146887e-05, "tps": 163763, "wall": 12163.7} {"step": 30395, "train_loss": 3.1299948692321777, "lr": 4.001517439495266e-05, "tps": 163703, "wall": 12168.5} {"step": 30396, "train_loss": 2.9775519371032715, "lr": 4.00149266573143e-05, "tps": 163644, "wall": 12173.3} {"step": 30397, "train_loss": 3.06284761428833, "lr": 4.001468095855658e-05, "tps": 163585, "wall": 12178.2} {"step": 30398, "train_loss": 3.0136547088623047, "lr": 4.0014437298682285e-05, "tps": 163525, "wall": 12183.0} {"step": 30399, "train_loss": 2.9278323650360107, "lr": 4.001419567769418e-05, "tps": 163466, "wall": 12187.8} {"step": 30400, "train_loss": 2.9762563705444336, "lr": 4.001395609559502e-05, "tps": 163408, "wall": 12192.5} {"step": 30401, "train_loss": 3.130873203277588, "lr": 4.0013718552387504e-05, "tps": 163349, "wall": 12197.3} {"step": 30402, "train_loss": 3.0684399604797363, "lr": 4.001348304807431e-05, "tps": 163291, "wall": 12202.1} {"step": 30403, "train_loss": 3.066837787628174, "lr": 4.001324958265811e-05, "tps": 163233, "wall": 12206.8} {"step": 30404, "train_loss": 2.9929559230804443, "lr": 4.001301815614156e-05, "tps": 163174, "wall": 12211.6} {"step": 30405, "train_loss": 3.167327404022217, "lr": 4.0012788768527275e-05, "tps": 163115, "wall": 12216.4} {"step": 30406, "train_loss": 3.008485794067383, "lr": 4.001256141981788e-05, "tps": 163057, "wall": 12221.2} {"step": 30407, "train_loss": 3.084296941757202, "lr": 4.00123361100159e-05, "tps": 162999, "wall": 12225.9} {"step": 30408, "train_loss": 3.0952718257904053, "lr": 4.0012112839123925e-05, "tps": 162940, "wall": 12230.7} {"step": 30409, "train_loss": 3.092616558074951, "lr": 4.0011891607144466e-05, "tps": 162883, "wall": 12235.5} {"step": 30410, "train_loss": 3.039768695831299, "lr": 4.001167241408003e-05, "tps": 162825, "wall": 12240.2} {"step": 30411, "train_loss": 3.0363245010375977, "lr": 4.0011455259933126e-05, "tps": 162767, "wall": 12245.0} {"step": 30412, "train_loss": 2.920300006866455, "lr": 4.001124014470618e-05, "tps": 162709, "wall": 12249.7} {"step": 30413, "train_loss": 2.9057610034942627, "lr": 4.001102706840166e-05, "tps": 162651, "wall": 12254.5} {"step": 30414, "train_loss": 3.009049892425537, "lr": 4.001081603102195e-05, "tps": 162588, "wall": 12259.6} {"step": 30415, "train_loss": 3.1598575115203857, "lr": 4.001060703256944e-05, "tps": 162526, "wall": 12264.7} {"step": 30416, "train_loss": 3.088501453399658, "lr": 4.001040007304652e-05, "tps": 162466, "wall": 12269.7} {"step": 30417, "train_loss": 3.0286524295806885, "lr": 4.001019515245553e-05, "tps": 162407, "wall": 12274.5} {"step": 30418, "train_loss": 3.0530543327331543, "lr": 4.000999227079879e-05, "tps": 162348, "wall": 12279.4} {"step": 30419, "train_loss": 2.9461045265197754, "lr": 4.00097914280786e-05, "tps": 162290, "wall": 12284.2} {"step": 30420, "train_loss": 2.9751181602478027, "lr": 4.000959262429722e-05, "tps": 162230, "wall": 12289.1} {"step": 30421, "train_loss": 3.0382580757141113, "lr": 4.00093958594569e-05, "tps": 162170, "wall": 12294.1} {"step": 30422, "train_loss": 3.1270194053649902, "lr": 4.000920113355989e-05, "tps": 162111, "wall": 12299.0} {"step": 30423, "train_loss": 3.2025532722473145, "lr": 4.00090084466084e-05, "tps": 162052, "wall": 12303.8} {"step": 30424, "train_loss": 3.093676805496216, "lr": 4.000881779860459e-05, "tps": 161993, "wall": 12308.7} {"step": 30425, "train_loss": 3.0365142822265625, "lr": 4.000862918955062e-05, "tps": 161935, "wall": 12313.5} {"step": 30426, "train_loss": 3.033524990081787, "lr": 4.000844261944865e-05, "tps": 161877, "wall": 12318.4} {"step": 30427, "train_loss": 3.1084890365600586, "lr": 4.0008258088300765e-05, "tps": 161818, "wall": 12323.2} {"step": 30428, "train_loss": 3.10453462600708, "lr": 4.000807559610909e-05, "tps": 161760, "wall": 12328.1} {"step": 30429, "train_loss": 3.047912359237671, "lr": 4.0007895142875654e-05, "tps": 161702, "wall": 12332.9} {"step": 30430, "train_loss": 2.9782676696777344, "lr": 4.000771672860254e-05, "tps": 161645, "wall": 12337.7} {"step": 30431, "train_loss": 3.0626559257507324, "lr": 4.0007540353291725e-05, "tps": 161588, "wall": 12342.4} {"step": 30432, "train_loss": 3.036329507827759, "lr": 4.000736601694524e-05, "tps": 161531, "wall": 12347.2} {"step": 30433, "train_loss": 3.0919880867004395, "lr": 4.000719371956506e-05, "tps": 161474, "wall": 12351.9} {"step": 30434, "train_loss": 3.016855239868164, "lr": 4.000702346115311e-05, "tps": 161417, "wall": 12356.7} {"step": 30435, "train_loss": 3.109455108642578, "lr": 4.0006855241711336e-05, "tps": 161360, "wall": 12361.4} {"step": 30436, "train_loss": 2.88580584526062, "lr": 4.000668906124165e-05, "tps": 161304, "wall": 12366.2} {"step": 30437, "train_loss": 3.0318167209625244, "lr": 4.000652491974594e-05, "tps": 161247, "wall": 12370.9} {"step": 30438, "train_loss": 3.102515697479248, "lr": 4.000636281722603e-05, "tps": 161191, "wall": 12375.7} {"step": 30439, "train_loss": 3.0691463947296143, "lr": 4.0006202753683786e-05, "tps": 161133, "wall": 12380.5} {"step": 30440, "train_loss": 2.9780197143554688, "lr": 4.000604472912103e-05, "tps": 161075, "wall": 12385.4} {"step": 30441, "train_loss": 3.1036345958709717, "lr": 4.0005888743539524e-05, "tps": 161017, "wall": 12390.2} {"step": 30442, "train_loss": 2.998466968536377, "lr": 4.0005734796941054e-05, "tps": 160960, "wall": 12395.0} {"step": 30443, "train_loss": 3.042135238647461, "lr": 4.000558288932734e-05, "tps": 160903, "wall": 12399.8} {"step": 30444, "train_loss": 3.1262741088867188, "lr": 4.0005433020700156e-05, "tps": 160847, "wall": 12404.6} {"step": 30445, "train_loss": 2.991091012954712, "lr": 4.000528519106112e-05, "tps": 160790, "wall": 12409.4} {"step": 30446, "train_loss": 3.0981616973876953, "lr": 4.000513940041199e-05, "tps": 160732, "wall": 12414.3} {"step": 30447, "train_loss": 3.0640511512756348, "lr": 4.000499564875435e-05, "tps": 160674, "wall": 12419.1} {"step": 30448, "train_loss": 3.0774242877960205, "lr": 4.000485393608987e-05, "tps": 160617, "wall": 12424.0} {"step": 30449, "train_loss": 3.131938934326172, "lr": 4.000471426242014e-05, "tps": 160560, "wall": 12428.8} {"step": 30450, "train_loss": 2.9548630714416504, "lr": 4.000457662774676e-05, "tps": 160503, "wall": 12433.6} {"step": 30451, "train_loss": 3.042539119720459, "lr": 4.0004441032071254e-05, "tps": 160445, "wall": 12438.5} {"step": 30452, "train_loss": 2.9998779296875, "lr": 4.000430747539517e-05, "tps": 160388, "wall": 12443.3} {"step": 30453, "train_loss": 3.0339269638061523, "lr": 4.0004175957720045e-05, "tps": 160331, "wall": 12448.2} {"step": 30454, "train_loss": 3.0985374450683594, "lr": 4.000404647904736e-05, "tps": 160274, "wall": 12453.0} {"step": 30455, "train_loss": 3.0029489994049072, "lr": 4.0003919039378565e-05, "tps": 160217, "wall": 12457.8} {"step": 30456, "train_loss": 3.042940855026245, "lr": 4.000379363871509e-05, "tps": 160161, "wall": 12462.6} {"step": 30457, "train_loss": 3.0219218730926514, "lr": 4.00036702770584e-05, "tps": 160105, "wall": 12467.4} {"step": 30458, "train_loss": 3.1270179748535156, "lr": 4.000354895440987e-05, "tps": 160048, "wall": 12472.2} {"step": 30459, "train_loss": 3.1580135822296143, "lr": 4.000342967077089e-05, "tps": 159990, "wall": 12477.2} {"step": 30460, "train_loss": 2.9730777740478516, "lr": 4.000331242614278e-05, "tps": 159933, "wall": 12482.0} {"step": 30461, "train_loss": 3.0271780490875244, "lr": 4.000319722052687e-05, "tps": 159876, "wall": 12486.9} {"step": 30462, "train_loss": 3.0072238445281982, "lr": 4.000308405392451e-05, "tps": 159820, "wall": 12491.7} {"step": 30463, "train_loss": 2.970524787902832, "lr": 4.0002972926336935e-05, "tps": 159764, "wall": 12496.4} {"step": 30464, "train_loss": 3.0879616737365723, "lr": 4.000286383776541e-05, "tps": 159708, "wall": 12501.3} {"step": 30465, "train_loss": 3.122713088989258, "lr": 4.0002756788211194e-05, "tps": 159652, "wall": 12506.0} {"step": 30466, "train_loss": 3.0515096187591553, "lr": 4.0002651777675486e-05, "tps": 159595, "wall": 12510.9} {"step": 30467, "train_loss": 3.0096869468688965, "lr": 4.0002548806159474e-05, "tps": 159540, "wall": 12515.7} {"step": 30468, "train_loss": 3.0625741481781006, "lr": 4.000244787366433e-05, "tps": 159484, "wall": 12520.4} {"step": 30469, "train_loss": 3.0940418243408203, "lr": 4.00023489801912e-05, "tps": 159429, "wall": 12525.2} {"step": 30470, "train_loss": 3.1147522926330566, "lr": 4.000225212574118e-05, "tps": 159372, "wall": 12530.1} {"step": 30471, "train_loss": 3.1306610107421875, "lr": 4.0002157310315416e-05, "tps": 159316, "wall": 12534.9} {"step": 30472, "train_loss": 3.141986846923828, "lr": 4.000206453391493e-05, "tps": 159260, "wall": 12539.7} {"step": 30473, "train_loss": 3.0338141918182373, "lr": 4.000197379654079e-05, "tps": 159205, "wall": 12544.4} {"step": 30474, "train_loss": 3.0993497371673584, "lr": 4.000188509819402e-05, "tps": 159149, "wall": 12549.3} {"step": 30475, "train_loss": 3.0422303676605225, "lr": 4.000179843887566e-05, "tps": 159094, "wall": 12554.0} {"step": 30476, "train_loss": 3.057429790496826, "lr": 4.000171381858665e-05, "tps": 159038, "wall": 12558.8} {"step": 30477, "train_loss": 3.1031007766723633, "lr": 4.000163123732798e-05, "tps": 158983, "wall": 12563.6} {"step": 30478, "train_loss": 3.145796775817871, "lr": 4.0001550695100556e-05, "tps": 158928, "wall": 12568.4} {"step": 30479, "train_loss": 3.070509910583496, "lr": 4.000147219190531e-05, "tps": 158872, "wall": 12573.2} {"step": 30480, "train_loss": 3.0271177291870117, "lr": 4.000139572774311e-05, "tps": 158817, "wall": 12578.0} {"step": 30481, "train_loss": 3.097539186477661, "lr": 4.000132130261485e-05, "tps": 158761, "wall": 12582.8} {"step": 30482, "train_loss": 3.0350546836853027, "lr": 4.0001248916521345e-05, "tps": 158706, "wall": 12587.6} {"step": 30483, "train_loss": 3.011876344680786, "lr": 4.000117856946345e-05, "tps": 158651, "wall": 12592.4} {"step": 30484, "train_loss": 2.9080686569213867, "lr": 4.000111026144193e-05, "tps": 158596, "wall": 12597.1} {"step": 30485, "train_loss": 3.064901351928711, "lr": 4.0001043992457564e-05, "tps": 158542, "wall": 12601.9} {"step": 30486, "train_loss": 3.085399627685547, "lr": 4.000097976251113e-05, "tps": 158487, "wall": 12606.6} {"step": 30487, "train_loss": 3.0274248123168945, "lr": 4.0000917571603323e-05, "tps": 158432, "wall": 12611.4} {"step": 30488, "train_loss": 3.0799453258514404, "lr": 4.000085741973485e-05, "tps": 158377, "wall": 12616.2} {"step": 30489, "train_loss": 2.9328010082244873, "lr": 4.0000799306906426e-05, "tps": 158323, "wall": 12621.0} {"step": 30490, "train_loss": 2.9063756465911865, "lr": 4.0000743233118675e-05, "tps": 158268, "wall": 12625.8} {"step": 30491, "train_loss": 3.041369915008545, "lr": 4.000068919837224e-05, "tps": 158212, "wall": 12630.6} {"step": 30492, "train_loss": 3.012627124786377, "lr": 4.0000637202667736e-05, "tps": 158158, "wall": 12635.4} {"step": 30493, "train_loss": 3.0451626777648926, "lr": 4.0000587246005746e-05, "tps": 158103, "wall": 12640.2} {"step": 30494, "train_loss": 3.0793864727020264, "lr": 4.000053932838683e-05, "tps": 158047, "wall": 12645.0} {"step": 30495, "train_loss": 3.0142662525177, "lr": 4.000049344981158e-05, "tps": 157993, "wall": 12649.8} {"step": 30496, "train_loss": 2.9919352531433105, "lr": 4.000044961028045e-05, "tps": 157938, "wall": 12654.6} {"step": 30497, "train_loss": 2.957829236984253, "lr": 4.000040780979396e-05, "tps": 157881, "wall": 12659.6} {"step": 30498, "train_loss": 3.053130626678467, "lr": 4.00003680483526e-05, "tps": 157826, "wall": 12664.4} {"step": 30499, "train_loss": 3.071575403213501, "lr": 4.000033032595682e-05, "tps": 157772, "wall": 12669.2} {"step": 30500, "train_loss": 3.081479072570801, "lr": 4.0000294642607015e-05, "tps": 157718, "wall": 12674.0} {"step": 30501, "train_loss": 2.9868319034576416, "lr": 4.0000260998303614e-05, "tps": 157659, "wall": 12679.1} {"step": 30502, "train_loss": 3.088554859161377, "lr": 4.0000229393047e-05, "tps": 157605, "wall": 12683.8} {"step": 30503, "train_loss": 3.0695605278015137, "lr": 4.000019982683752e-05, "tps": 157551, "wall": 12688.6} {"step": 30504, "train_loss": 3.054373264312744, "lr": 4.0000172299675534e-05, "tps": 157496, "wall": 12693.4} {"step": 30505, "train_loss": 3.030207872390747, "lr": 4.000014681156131e-05, "tps": 157442, "wall": 12698.2} {"step": 30506, "train_loss": 3.104281425476074, "lr": 4.000012336249516e-05, "tps": 157387, "wall": 12703.0} {"step": 30507, "train_loss": 3.012972116470337, "lr": 4.000010195247737e-05, "tps": 157333, "wall": 12707.8} {"step": 30508, "train_loss": 2.9450035095214844, "lr": 4.0000082581508157e-05, "tps": 157279, "wall": 12712.6} {"step": 30509, "train_loss": 3.126145601272583, "lr": 4.000006524958774e-05, "tps": 157224, "wall": 12717.5} {"step": 30510, "train_loss": 3.037003517150879, "lr": 4.0000049956716305e-05, "tps": 157170, "wall": 12722.3} {"step": 30511, "train_loss": 2.959573268890381, "lr": 4.0000036702894064e-05, "tps": 157116, "wall": 12727.1} {"step": 30512, "train_loss": 3.0732247829437256, "lr": 4.000002548812116e-05, "tps": 157062, "wall": 12731.9} {"step": 30513, "train_loss": 2.9723379611968994, "lr": 4.000001631239768e-05, "tps": 157007, "wall": 12736.8} {"step": 30514, "train_loss": 2.9487931728363037, "lr": 4.000000917572376e-05, "tps": 156953, "wall": 12741.5} {"step": 30515, "train_loss": 3.0730490684509277, "lr": 4.000000407809946e-05, "tps": 156898, "wall": 12746.5} {"step": 30516, "train_loss": 3.070194721221924, "lr": 4.000000101952487e-05, "tps": 156843, "wall": 12751.3}