{"num_parameters": 101202432, "trainable_parameters": 101202432, "step": 0} {"train_info/time_between_train_steps": 2.2874653339385986, "step": 0} {"info/global_step": 1, "train_info/time_within_train_step": 4.370887994766235, "step": 1} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4102.23583984375, "train_info/memory_reserved": 4326.0, "train_info/memory_max_reserved": 4326.0, "_timestamp": 1746322980, "_runtime": 28}, "step": 1} {"logs": {"train/loss": 10.0531, "train/learning_rate": 2e-06, "train/epoch": 0.0, "_timestamp": 1746322980, "_runtime": 28}, "step": 1} {"train_info/time_between_train_steps": 0.025208473205566406, "step": 1} {"info/global_step": 2, "train_info/time_within_train_step": 2.2994558811187744, "step": 2} {"train_info/time_between_train_steps": 0.003510713577270508, "step": 2} {"info/global_step": 3, "train_info/time_within_train_step": 2.302712917327881, "step": 3} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 3} {"info/global_step": 4, "train_info/time_within_train_step": 2.293229818344116, "step": 4} {"train_info/time_between_train_steps": 0.0034265518188476562, "step": 4} {"info/global_step": 5, "train_info/time_within_train_step": 2.2989914417266846, "step": 5} {"train_info/time_between_train_steps": 0.004563093185424805, "step": 5} {"info/global_step": 6, "train_info/time_within_train_step": 2.299325942993164, "step": 6} {"train_info/time_between_train_steps": 0.0036742687225341797, "step": 6} {"info/global_step": 7, "train_info/time_within_train_step": 2.3062801361083984, "step": 7} {"train_info/time_between_train_steps": 0.0036928653717041016, "step": 7} {"info/global_step": 8, "train_info/time_within_train_step": 2.3086934089660645, "step": 8} {"train_info/time_between_train_steps": 0.0035958290100097656, "step": 8} {"info/global_step": 9, "train_info/time_within_train_step": 2.3105013370513916, "step": 9} {"train_info/time_between_train_steps": 0.0037245750427246094, "step": 9} {"info/global_step": 10, "train_info/time_within_train_step": 2.3270211219787598, "step": 10} {"train_info/time_between_train_steps": 0.0037012100219726562, "step": 10} {"info/global_step": 11, "train_info/time_within_train_step": 2.4864230155944824, "step": 11} {"train_info/time_between_train_steps": 0.003731250762939453, "step": 11} {"info/global_step": 12, "train_info/time_within_train_step": 2.547574758529663, "step": 12} {"train_info/time_between_train_steps": 0.0037653446197509766, "step": 12} {"info/global_step": 13, "train_info/time_within_train_step": 2.520684003829956, "step": 13} {"train_info/time_between_train_steps": 0.003732442855834961, "step": 13} {"info/global_step": 14, "train_info/time_within_train_step": 2.519615888595581, "step": 14} {"train_info/time_between_train_steps": 0.0037126541137695312, "step": 14} {"info/global_step": 15, "train_info/time_within_train_step": 2.5200939178466797, "step": 15} {"train_info/time_between_train_steps": 0.003756999969482422, "step": 15} {"info/global_step": 16, "train_info/time_within_train_step": 2.5301010608673096, "step": 16} {"train_info/time_between_train_steps": 0.0037369728088378906, "step": 16} {"info/global_step": 17, "train_info/time_within_train_step": 2.519375801086426, "step": 17} {"train_info/time_between_train_steps": 0.003694772720336914, "step": 17} {"info/global_step": 18, "train_info/time_within_train_step": 2.519749164581299, "step": 18} {"train_info/time_between_train_steps": 0.003719806671142578, "step": 18} {"info/global_step": 19, "train_info/time_within_train_step": 2.5195486545562744, "step": 19} {"train_info/time_between_train_steps": 0.0037734508514404297, "step": 19} {"info/global_step": 20, "train_info/time_within_train_step": 2.520442008972168, "step": 20} {"train_info/time_between_train_steps": 0.0037572383880615234, "step": 20} {"info/global_step": 21, "train_info/time_within_train_step": 2.521270990371704, "step": 21} {"train_info/time_between_train_steps": 0.003737211227416992, "step": 21} {"info/global_step": 22, "train_info/time_within_train_step": 2.522109270095825, "step": 22} {"train_info/time_between_train_steps": 0.003749370574951172, "step": 22} {"info/global_step": 23, "train_info/time_within_train_step": 2.522087335586548, "step": 23} {"train_info/time_between_train_steps": 0.0037016868591308594, "step": 23} {"info/global_step": 24, "train_info/time_within_train_step": 2.5217015743255615, "step": 24} {"train_info/time_between_train_steps": 0.0038077831268310547, "step": 24} {"info/global_step": 25, "train_info/time_within_train_step": 2.5222175121307373, "step": 25} {"train_info/time_between_train_steps": 0.003705739974975586, "step": 25} {"info/global_step": 26, "train_info/time_within_train_step": 2.5226261615753174, "step": 26} {"train_info/time_between_train_steps": 0.0037584304809570312, "step": 26} {"info/global_step": 27, "train_info/time_within_train_step": 2.5228137969970703, "step": 27} {"train_info/time_between_train_steps": 0.003702878952026367, "step": 27} {"info/global_step": 28, "train_info/time_within_train_step": 2.9534709453582764, "step": 28} {"train_info/time_between_train_steps": 0.003467082977294922, "step": 28} {"info/global_step": 29, "train_info/time_within_train_step": 2.5223050117492676, "step": 29} {"train_info/time_between_train_steps": 0.0034036636352539062, "step": 29} {"info/global_step": 30, "train_info/time_within_train_step": 2.5219831466674805, "step": 30} {"train_info/time_between_train_steps": 0.003394603729248047, "step": 30} {"info/global_step": 31, "train_info/time_within_train_step": 2.522393226623535, "step": 31} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 31} {"info/global_step": 32, "train_info/time_within_train_step": 2.521488904953003, "step": 32} {"train_info/time_between_train_steps": 0.0033659934997558594, "step": 32} {"info/global_step": 33, "train_info/time_within_train_step": 2.5216476917266846, "step": 33} {"train_info/time_between_train_steps": 0.003518819808959961, "step": 33} {"info/global_step": 34, "train_info/time_within_train_step": 2.5223817825317383, "step": 34} {"train_info/time_between_train_steps": 0.0036563873291015625, "step": 34} {"info/global_step": 35, "train_info/time_within_train_step": 2.5226545333862305, "step": 35} {"train_info/time_between_train_steps": 0.003658294677734375, "step": 35} {"info/global_step": 36, "train_info/time_within_train_step": 2.5224242210388184, "step": 36} {"train_info/time_between_train_steps": 0.003720521926879883, "step": 36} {"info/global_step": 37, "train_info/time_within_train_step": 2.52205491065979, "step": 37} {"train_info/time_between_train_steps": 0.003746509552001953, "step": 37} {"info/global_step": 38, "train_info/time_within_train_step": 2.522636651992798, "step": 38} {"train_info/time_between_train_steps": 0.0037412643432617188, "step": 38} {"info/global_step": 39, "train_info/time_within_train_step": 2.522510051727295, "step": 39} {"train_info/time_between_train_steps": 0.003762483596801758, "step": 39} {"info/global_step": 40, "train_info/time_within_train_step": 2.5215072631835938, "step": 40} {"train_info/time_between_train_steps": 0.0037288665771484375, "step": 40} {"info/global_step": 41, "train_info/time_within_train_step": 2.5220484733581543, "step": 41} {"train_info/time_between_train_steps": 0.0037097930908203125, "step": 41} {"info/global_step": 42, "train_info/time_within_train_step": 2.5220093727111816, "step": 42} {"train_info/time_between_train_steps": 0.003750324249267578, "step": 42} {"info/global_step": 43, "train_info/time_within_train_step": 2.5221545696258545, "step": 43} {"train_info/time_between_train_steps": 0.003803253173828125, "step": 43} {"info/global_step": 44, "train_info/time_within_train_step": 2.522836685180664, "step": 44} {"train_info/time_between_train_steps": 0.003786325454711914, "step": 44} {"info/global_step": 45, "train_info/time_within_train_step": 2.522571325302124, "step": 45} {"train_info/time_between_train_steps": 0.0037627220153808594, "step": 45} {"info/global_step": 46, "train_info/time_within_train_step": 2.5226144790649414, "step": 46} {"train_info/time_between_train_steps": 0.0037975311279296875, "step": 46} {"info/global_step": 47, "train_info/time_within_train_step": 2.523247480392456, "step": 47} {"train_info/time_between_train_steps": 0.0037555694580078125, "step": 47} {"info/global_step": 48, "train_info/time_within_train_step": 2.522368907928467, "step": 48} {"train_info/time_between_train_steps": 0.0037488937377929688, "step": 48} {"info/global_step": 49, "train_info/time_within_train_step": 2.522357702255249, "step": 49} {"train_info/time_between_train_steps": 0.0037474632263183594, "step": 49} {"info/global_step": 50, "train_info/time_within_train_step": 2.5226569175720215, "step": 50} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746323103, "_runtime": 151}, "step": 50} {"logs": {"train/loss": 8.1884, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 0.02, "_timestamp": 1746323103, "_runtime": 151}, "step": 50} {"train_info/time_between_train_steps": 0.02520442008972168, "step": 50} {"info/global_step": 51, "train_info/time_within_train_step": 2.522599935531616, "step": 51} {"train_info/time_between_train_steps": 0.0037832260131835938, "step": 51} {"info/global_step": 52, "train_info/time_within_train_step": 2.5226352214813232, "step": 52} {"train_info/time_between_train_steps": 0.0037457942962646484, "step": 52} {"info/global_step": 53, "train_info/time_within_train_step": 2.5220775604248047, "step": 53} {"train_info/time_between_train_steps": 0.0037164688110351562, "step": 53} {"info/global_step": 54, "train_info/time_within_train_step": 2.522451400756836, "step": 54} {"train_info/time_between_train_steps": 0.003714323043823242, "step": 54} {"info/global_step": 55, "train_info/time_within_train_step": 2.5220537185668945, "step": 55} {"train_info/time_between_train_steps": 0.0037691593170166016, "step": 55} {"info/global_step": 56, "train_info/time_within_train_step": 2.522096872329712, "step": 56} {"train_info/time_between_train_steps": 0.0037283897399902344, "step": 56} {"info/global_step": 57, "train_info/time_within_train_step": 2.5216946601867676, "step": 57} {"train_info/time_between_train_steps": 0.003724813461303711, "step": 57} {"info/global_step": 58, "train_info/time_within_train_step": 2.5211470127105713, "step": 58} {"train_info/time_between_train_steps": 0.003915071487426758, "step": 58} {"info/global_step": 59, "train_info/time_within_train_step": 2.5221686363220215, "step": 59} {"train_info/time_between_train_steps": 0.0036835670471191406, "step": 59} {"info/global_step": 60, "train_info/time_within_train_step": 2.5217032432556152, "step": 60} {"train_info/time_between_train_steps": 0.0036194324493408203, "step": 60} {"info/global_step": 61, "train_info/time_within_train_step": 2.5220389366149902, "step": 61} {"train_info/time_between_train_steps": 0.003676176071166992, "step": 61} {"info/global_step": 62, "train_info/time_within_train_step": 2.52211856842041, "step": 62} {"train_info/time_between_train_steps": 0.0038759708404541016, "step": 62} {"info/global_step": 63, "train_info/time_within_train_step": 2.68934965133667, "step": 63} {"train_info/time_between_train_steps": 0.00354766845703125, "step": 63} {"info/global_step": 64, "train_info/time_within_train_step": 2.5216610431671143, "step": 64} {"train_info/time_between_train_steps": 0.0035142898559570312, "step": 64} {"info/global_step": 65, "train_info/time_within_train_step": 2.521653413772583, "step": 65} {"train_info/time_between_train_steps": 0.0035474300384521484, "step": 65} {"info/global_step": 66, "train_info/time_within_train_step": 2.5214507579803467, "step": 66} {"train_info/time_between_train_steps": 0.0037088394165039062, "step": 66} {"info/global_step": 67, "train_info/time_within_train_step": 2.522336483001709, "step": 67} {"train_info/time_between_train_steps": 0.003522157669067383, "step": 67} {"info/global_step": 68, "train_info/time_within_train_step": 2.5219643115997314, "step": 68} {"train_info/time_between_train_steps": 0.0037364959716796875, "step": 68} {"info/global_step": 69, "train_info/time_within_train_step": 2.52180552482605, "step": 69} {"train_info/time_between_train_steps": 0.003668546676635742, "step": 69} {"info/global_step": 70, "train_info/time_within_train_step": 2.522061824798584, "step": 70} {"train_info/time_between_train_steps": 0.0035462379455566406, "step": 70} {"info/global_step": 71, "train_info/time_within_train_step": 2.521113634109497, "step": 71} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 71} {"info/global_step": 72, "train_info/time_within_train_step": 2.5216588973999023, "step": 72} {"train_info/time_between_train_steps": 0.0035943984985351562, "step": 72} {"info/global_step": 73, "train_info/time_within_train_step": 2.5211598873138428, "step": 73} {"train_info/time_between_train_steps": 0.0035483837127685547, "step": 73} {"info/global_step": 74, "train_info/time_within_train_step": 2.521911144256592, "step": 74} {"train_info/time_between_train_steps": 0.0036606788635253906, "step": 74} {"info/global_step": 75, "train_info/time_within_train_step": 2.5219759941101074, "step": 75} {"train_info/time_between_train_steps": 0.003560781478881836, "step": 75} {"info/global_step": 76, "train_info/time_within_train_step": 2.5220727920532227, "step": 76} {"train_info/time_between_train_steps": 0.003736257553100586, "step": 76} {"info/global_step": 77, "train_info/time_within_train_step": 2.540330171585083, "step": 77} {"train_info/time_between_train_steps": 0.0035545825958251953, "step": 77} {"info/global_step": 78, "train_info/time_within_train_step": 2.5209412574768066, "step": 78} {"train_info/time_between_train_steps": 0.003728628158569336, "step": 78} {"info/global_step": 79, "train_info/time_within_train_step": 2.5209927558898926, "step": 79} {"train_info/time_between_train_steps": 0.0037384033203125, "step": 79} {"info/global_step": 80, "train_info/time_within_train_step": 2.8283796310424805, "step": 80} {"train_info/time_between_train_steps": 0.003410816192626953, "step": 80} {"info/global_step": 81, "train_info/time_within_train_step": 2.5216708183288574, "step": 81} {"train_info/time_between_train_steps": 0.003474712371826172, "step": 81} {"info/global_step": 82, "train_info/time_within_train_step": 2.521535634994507, "step": 82} {"train_info/time_between_train_steps": 0.003470897674560547, "step": 82} {"info/global_step": 83, "train_info/time_within_train_step": 2.5220680236816406, "step": 83} {"train_info/time_between_train_steps": 0.0035583972930908203, "step": 83} {"info/global_step": 84, "train_info/time_within_train_step": 2.52215576171875, "step": 84} {"train_info/time_between_train_steps": 0.003561735153198242, "step": 84} {"info/global_step": 85, "train_info/time_within_train_step": 2.5221495628356934, "step": 85} {"train_info/time_between_train_steps": 0.003367185592651367, "step": 85} {"info/global_step": 86, "train_info/time_within_train_step": 2.5205066204071045, "step": 86} {"train_info/time_between_train_steps": 0.003476381301879883, "step": 86} {"info/global_step": 87, "train_info/time_within_train_step": 2.5212621688842773, "step": 87} {"train_info/time_between_train_steps": 0.003520965576171875, "step": 87} {"info/global_step": 88, "train_info/time_within_train_step": 2.520899772644043, "step": 88} {"train_info/time_between_train_steps": 0.0034444332122802734, "step": 88} {"info/global_step": 89, "train_info/time_within_train_step": 2.521538496017456, "step": 89} {"train_info/time_between_train_steps": 0.003596067428588867, "step": 89} {"info/global_step": 90, "train_info/time_within_train_step": 2.5214016437530518, "step": 90} {"train_info/time_between_train_steps": 0.003434419631958008, "step": 90} {"info/global_step": 91, "train_info/time_within_train_step": 2.5215938091278076, "step": 91} {"train_info/time_between_train_steps": 0.003593921661376953, "step": 91} {"info/global_step": 92, "train_info/time_within_train_step": 2.5218024253845215, "step": 92} {"train_info/time_between_train_steps": 0.0035088062286376953, "step": 92} {"info/global_step": 93, "train_info/time_within_train_step": 2.5211181640625, "step": 93} {"train_info/time_between_train_steps": 0.003475666046142578, "step": 93} {"info/global_step": 94, "train_info/time_within_train_step": 2.5216779708862305, "step": 94} {"train_info/time_between_train_steps": 0.00350189208984375, "step": 94} {"info/global_step": 95, "train_info/time_within_train_step": 2.521334648132324, "step": 95} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 95} {"info/global_step": 96, "train_info/time_within_train_step": 2.521273136138916, "step": 96} {"train_info/time_between_train_steps": 0.0033473968505859375, "step": 96} {"info/global_step": 97, "train_info/time_within_train_step": 2.523043632507324, "step": 97} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 97} {"info/global_step": 98, "train_info/time_within_train_step": 2.522120714187622, "step": 98} {"train_info/time_between_train_steps": 0.0034575462341308594, "step": 98} {"info/global_step": 99, "train_info/time_within_train_step": 2.5222649574279785, "step": 99} {"train_info/time_between_train_steps": 0.0033833980560302734, "step": 99} {"info/global_step": 100, "train_info/time_within_train_step": 2.5217466354370117, "step": 100} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746323231, "_runtime": 279}, "step": 100} {"logs": {"train/loss": 6.8871, "train/learning_rate": 0.00019999999999999998, "train/epoch": 0.03, "_timestamp": 1746323231, "_runtime": 279}, "step": 100} {"train_info/time_between_train_steps": 11.968169927597046, "step": 100} {"info/global_step": 101, "train_info/time_within_train_step": 2.3345983028411865, "step": 101} {"train_info/time_between_train_steps": 0.004128217697143555, "step": 101} {"info/global_step": 102, "train_info/time_within_train_step": 2.3800740242004395, "step": 102} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 102} {"info/global_step": 103, "train_info/time_within_train_step": 2.517500877380371, "step": 103} {"train_info/time_between_train_steps": 0.0034172534942626953, "step": 103} {"info/global_step": 104, "train_info/time_within_train_step": 2.5191383361816406, "step": 104} {"train_info/time_between_train_steps": 0.0033833980560302734, "step": 104} {"info/global_step": 105, "train_info/time_within_train_step": 2.5204591751098633, "step": 105} {"train_info/time_between_train_steps": 0.003496408462524414, "step": 105} {"info/global_step": 106, "train_info/time_within_train_step": 2.5202486515045166, "step": 106} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 106} {"info/global_step": 107, "train_info/time_within_train_step": 2.5201752185821533, "step": 107} {"train_info/time_between_train_steps": 0.003408670425415039, "step": 107} {"info/global_step": 108, "train_info/time_within_train_step": 2.5209267139434814, "step": 108} {"train_info/time_between_train_steps": 0.003398895263671875, "step": 108} {"info/global_step": 109, "train_info/time_within_train_step": 2.522080898284912, "step": 109} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 109} {"info/global_step": 110, "train_info/time_within_train_step": 2.5206234455108643, "step": 110} {"train_info/time_between_train_steps": 0.0034286975860595703, "step": 110} {"info/global_step": 111, "train_info/time_within_train_step": 2.5213515758514404, "step": 111} {"train_info/time_between_train_steps": 0.0033745765686035156, "step": 111} {"info/global_step": 112, "train_info/time_within_train_step": 2.520214319229126, "step": 112} {"train_info/time_between_train_steps": 0.0033791065216064453, "step": 112} {"info/global_step": 113, "train_info/time_within_train_step": 2.5217132568359375, "step": 113} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 113} {"info/global_step": 114, "train_info/time_within_train_step": 2.523029088973999, "step": 114} {"train_info/time_between_train_steps": 0.0033826828002929688, "step": 114} {"info/global_step": 115, "train_info/time_within_train_step": 2.5259552001953125, "step": 115} {"train_info/time_between_train_steps": 0.0033791065216064453, "step": 115} {"info/global_step": 116, "train_info/time_within_train_step": 2.520925521850586, "step": 116} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 116} {"info/global_step": 117, "train_info/time_within_train_step": 2.5212295055389404, "step": 117} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 117} {"info/global_step": 118, "train_info/time_within_train_step": 2.521973133087158, "step": 118} {"train_info/time_between_train_steps": 0.0034170150756835938, "step": 118} {"info/global_step": 119, "train_info/time_within_train_step": 2.5219709873199463, "step": 119} {"train_info/time_between_train_steps": 0.0033693313598632812, "step": 119} {"info/global_step": 120, "train_info/time_within_train_step": 2.5214476585388184, "step": 120} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 120} {"info/global_step": 121, "train_info/time_within_train_step": 2.5215768814086914, "step": 121} {"train_info/time_between_train_steps": 0.0033745765686035156, "step": 121} {"info/global_step": 122, "train_info/time_within_train_step": 2.527139663696289, "step": 122} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 122} {"info/global_step": 123, "train_info/time_within_train_step": 2.522484540939331, "step": 123} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 123} {"info/global_step": 124, "train_info/time_within_train_step": 2.5220532417297363, "step": 124} {"train_info/time_between_train_steps": 0.0034477710723876953, "step": 124} {"info/global_step": 125, "train_info/time_within_train_step": 2.522108554840088, "step": 125} {"train_info/time_between_train_steps": 0.12131762504577637, "step": 125} {"info/global_step": 126, "train_info/time_within_train_step": 2.522745370864868, "step": 126} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 126} {"info/global_step": 127, "train_info/time_within_train_step": 2.5230047702789307, "step": 127} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 127} {"info/global_step": 128, "train_info/time_within_train_step": 2.5236310958862305, "step": 128} {"train_info/time_between_train_steps": 0.0034551620483398438, "step": 128} {"info/global_step": 129, "train_info/time_within_train_step": 2.523022174835205, "step": 129} {"train_info/time_between_train_steps": 0.0034186840057373047, "step": 129} {"info/global_step": 130, "train_info/time_within_train_step": 2.52293062210083, "step": 130} {"train_info/time_between_train_steps": 0.0034618377685546875, "step": 130} {"info/global_step": 131, "train_info/time_within_train_step": 2.5228729248046875, "step": 131} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 131} {"info/global_step": 132, "train_info/time_within_train_step": 2.5226590633392334, "step": 132} {"train_info/time_between_train_steps": 0.003441333770751953, "step": 132} {"info/global_step": 133, "train_info/time_within_train_step": 2.522136926651001, "step": 133} {"train_info/time_between_train_steps": 0.003454923629760742, "step": 133} {"info/global_step": 134, "train_info/time_within_train_step": 2.522639751434326, "step": 134} {"train_info/time_between_train_steps": 0.0034492015838623047, "step": 134} {"info/global_step": 135, "train_info/time_within_train_step": 2.522784948348999, "step": 135} {"train_info/time_between_train_steps": 0.003930807113647461, "step": 135} {"info/global_step": 136, "train_info/time_within_train_step": 2.5225441455841064, "step": 136} {"train_info/time_between_train_steps": 0.003425121307373047, "step": 136} {"info/global_step": 137, "train_info/time_within_train_step": 2.5217056274414062, "step": 137} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 137} {"info/global_step": 138, "train_info/time_within_train_step": 2.521742820739746, "step": 138} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 138} {"info/global_step": 139, "train_info/time_within_train_step": 2.5213463306427, "step": 139} {"train_info/time_between_train_steps": 0.0033888816833496094, "step": 139} {"info/global_step": 140, "train_info/time_within_train_step": 2.5214521884918213, "step": 140} {"train_info/time_between_train_steps": 0.0033915042877197266, "step": 140} {"info/global_step": 141, "train_info/time_within_train_step": 2.5213754177093506, "step": 141} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 141} {"info/global_step": 142, "train_info/time_within_train_step": 2.521947145462036, "step": 142} {"train_info/time_between_train_steps": 0.00341796875, "step": 142} {"info/global_step": 143, "train_info/time_within_train_step": 2.522090196609497, "step": 143} {"train_info/time_between_train_steps": 0.0033876895904541016, "step": 143} {"info/global_step": 144, "train_info/time_within_train_step": 2.521819591522217, "step": 144} {"train_info/time_between_train_steps": 0.0033884048461914062, "step": 144} {"info/global_step": 145, "train_info/time_within_train_step": 2.521908760070801, "step": 145} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 145} {"info/global_step": 146, "train_info/time_within_train_step": 2.5215139389038086, "step": 146} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 146} {"info/global_step": 147, "train_info/time_within_train_step": 2.5227138996124268, "step": 147} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 147} {"info/global_step": 148, "train_info/time_within_train_step": 2.5235435962677, "step": 148} {"train_info/time_between_train_steps": 0.0034759044647216797, "step": 148} {"info/global_step": 149, "train_info/time_within_train_step": 2.5235328674316406, "step": 149} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 149} {"info/global_step": 150, "train_info/time_within_train_step": 2.7448995113372803, "step": 150} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746323371, "_runtime": 419}, "step": 150} {"logs": {"train/loss": 6.4996, "train/learning_rate": 0.0003, "train/epoch": 0.05, "_timestamp": 1746323371, "_runtime": 419}, "step": 150} {"train_info/time_between_train_steps": 0.024142980575561523, "step": 150} {"info/global_step": 151, "train_info/time_within_train_step": 2.5225160121917725, "step": 151} {"train_info/time_between_train_steps": 0.0034401416778564453, "step": 151} {"info/global_step": 152, "train_info/time_within_train_step": 2.523012638092041, "step": 152} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 152} {"info/global_step": 153, "train_info/time_within_train_step": 2.5235040187835693, "step": 153} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 153} {"info/global_step": 154, "train_info/time_within_train_step": 2.5224740505218506, "step": 154} {"train_info/time_between_train_steps": 0.0034537315368652344, "step": 154} {"info/global_step": 155, "train_info/time_within_train_step": 2.522291421890259, "step": 155} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 155} {"info/global_step": 156, "train_info/time_within_train_step": 2.522435426712036, "step": 156} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 156} {"info/global_step": 157, "train_info/time_within_train_step": 2.5223770141601562, "step": 157} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 157} {"info/global_step": 158, "train_info/time_within_train_step": 2.5223591327667236, "step": 158} {"train_info/time_between_train_steps": 0.0034270286560058594, "step": 158} {"info/global_step": 159, "train_info/time_within_train_step": 2.5220439434051514, "step": 159} {"train_info/time_between_train_steps": 0.0034313201904296875, "step": 159} {"info/global_step": 160, "train_info/time_within_train_step": 2.522718667984009, "step": 160} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 160} {"info/global_step": 161, "train_info/time_within_train_step": 2.5226263999938965, "step": 161} {"train_info/time_between_train_steps": 0.003415822982788086, "step": 161} {"info/global_step": 162, "train_info/time_within_train_step": 2.52761173248291, "step": 162} {"train_info/time_between_train_steps": 0.0034515857696533203, "step": 162} {"info/global_step": 163, "train_info/time_within_train_step": 2.5235352516174316, "step": 163} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 163} {"info/global_step": 164, "train_info/time_within_train_step": 2.5239644050598145, "step": 164} {"train_info/time_between_train_steps": 0.0034224987030029297, "step": 164} {"info/global_step": 165, "train_info/time_within_train_step": 2.522728204727173, "step": 165} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 165} {"info/global_step": 166, "train_info/time_within_train_step": 2.5230607986450195, "step": 166} {"train_info/time_between_train_steps": 0.0034189224243164062, "step": 166} {"info/global_step": 167, "train_info/time_within_train_step": 2.522721767425537, "step": 167} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 167} {"info/global_step": 168, "train_info/time_within_train_step": 2.5506036281585693, "step": 168} {"train_info/time_between_train_steps": 0.0034322738647460938, "step": 168} {"info/global_step": 169, "train_info/time_within_train_step": 2.5274624824523926, "step": 169} {"train_info/time_between_train_steps": 0.0034019947052001953, "step": 169} {"info/global_step": 170, "train_info/time_within_train_step": 2.5224931240081787, "step": 170} {"train_info/time_between_train_steps": 0.0035066604614257812, "step": 170} {"info/global_step": 171, "train_info/time_within_train_step": 2.5230555534362793, "step": 171} {"train_info/time_between_train_steps": 0.0035233497619628906, "step": 171} {"info/global_step": 172, "train_info/time_within_train_step": 2.5233230590820312, "step": 172} {"train_info/time_between_train_steps": 0.0034682750701904297, "step": 172} {"info/global_step": 173, "train_info/time_within_train_step": 2.5217154026031494, "step": 173} {"train_info/time_between_train_steps": 0.004011869430541992, "step": 173} {"info/global_step": 174, "train_info/time_within_train_step": 2.522369623184204, "step": 174} {"train_info/time_between_train_steps": 0.0033957958221435547, "step": 174} {"info/global_step": 175, "train_info/time_within_train_step": 2.521757125854492, "step": 175} {"train_info/time_between_train_steps": 0.00342559814453125, "step": 175} {"info/global_step": 176, "train_info/time_within_train_step": 2.5221402645111084, "step": 176} {"train_info/time_between_train_steps": 0.0033826828002929688, "step": 176} {"info/global_step": 177, "train_info/time_within_train_step": 2.5220634937286377, "step": 177} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 177} {"info/global_step": 178, "train_info/time_within_train_step": 2.5216426849365234, "step": 178} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 178} {"info/global_step": 179, "train_info/time_within_train_step": 2.521963357925415, "step": 179} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 179} {"info/global_step": 180, "train_info/time_within_train_step": 2.522103786468506, "step": 180} {"train_info/time_between_train_steps": 0.0034263134002685547, "step": 180} {"info/global_step": 181, "train_info/time_within_train_step": 2.52236008644104, "step": 181} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 181} {"info/global_step": 182, "train_info/time_within_train_step": 2.521904468536377, "step": 182} {"train_info/time_between_train_steps": 0.0033876895904541016, "step": 182} {"info/global_step": 183, "train_info/time_within_train_step": 2.52241587638855, "step": 183} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 183} {"info/global_step": 184, "train_info/time_within_train_step": 2.521949291229248, "step": 184} {"train_info/time_between_train_steps": 0.003431558609008789, "step": 184} {"info/global_step": 185, "train_info/time_within_train_step": 2.52097487449646, "step": 185} {"train_info/time_between_train_steps": 0.0033855438232421875, "step": 185} {"info/global_step": 186, "train_info/time_within_train_step": 2.5212409496307373, "step": 186} {"train_info/time_between_train_steps": 0.003406524658203125, "step": 186} {"info/global_step": 187, "train_info/time_within_train_step": 2.521451950073242, "step": 187} {"train_info/time_between_train_steps": 0.0034270286560058594, "step": 187} {"info/global_step": 188, "train_info/time_within_train_step": 2.639439821243286, "step": 188} {"train_info/time_between_train_steps": 0.003461122512817383, "step": 188} {"info/global_step": 189, "train_info/time_within_train_step": 2.520801305770874, "step": 189} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 189} {"info/global_step": 190, "train_info/time_within_train_step": 2.5207507610321045, "step": 190} {"train_info/time_between_train_steps": 0.0034122467041015625, "step": 190} {"info/global_step": 191, "train_info/time_within_train_step": 2.5217502117156982, "step": 191} {"train_info/time_between_train_steps": 0.003477811813354492, "step": 191} {"info/global_step": 192, "train_info/time_within_train_step": 2.5209643840789795, "step": 192} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 192} {"info/global_step": 193, "train_info/time_within_train_step": 2.520848512649536, "step": 193} {"train_info/time_between_train_steps": 0.0034360885620117188, "step": 193} {"info/global_step": 194, "train_info/time_within_train_step": 2.524360418319702, "step": 194} {"train_info/time_between_train_steps": 0.0035686492919921875, "step": 194} {"info/global_step": 195, "train_info/time_within_train_step": 2.522603988647461, "step": 195} {"train_info/time_between_train_steps": 0.003624439239501953, "step": 195} {"info/global_step": 196, "train_info/time_within_train_step": 2.5235579013824463, "step": 196} {"train_info/time_between_train_steps": 0.003863096237182617, "step": 196} {"info/global_step": 197, "train_info/time_within_train_step": 2.5235848426818848, "step": 197} {"train_info/time_between_train_steps": 0.0038771629333496094, "step": 197} {"info/global_step": 198, "train_info/time_within_train_step": 2.523902177810669, "step": 198} {"train_info/time_between_train_steps": 0.0037810802459716797, "step": 198} {"info/global_step": 199, "train_info/time_within_train_step": 2.524005174636841, "step": 199} {"train_info/time_between_train_steps": 0.003936290740966797, "step": 199} {"info/global_step": 200, "train_info/time_within_train_step": 2.5244295597076416, "step": 200} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746323498, "_runtime": 546}, "step": 200} {"logs": {"train/loss": 6.2131, "train/learning_rate": 0.00039999999999999996, "train/epoch": 0.07, "_timestamp": 1746323498, "_runtime": 546}, "step": 200} {"train_info/time_between_train_steps": 19.618163347244263, "step": 200} {"info/global_step": 201, "train_info/time_within_train_step": 2.3299717903137207, "step": 201} {"train_info/time_between_train_steps": 0.003771543502807617, "step": 201} {"info/global_step": 202, "train_info/time_within_train_step": 2.3154046535491943, "step": 202} {"train_info/time_between_train_steps": 0.003784656524658203, "step": 202} {"info/global_step": 203, "train_info/time_within_train_step": 2.4724183082580566, "step": 203} {"train_info/time_between_train_steps": 0.0038061141967773438, "step": 203} {"info/global_step": 204, "train_info/time_within_train_step": 2.5216610431671143, "step": 204} {"train_info/time_between_train_steps": 0.003774881362915039, "step": 204} {"info/global_step": 205, "train_info/time_within_train_step": 2.521230459213257, "step": 205} {"train_info/time_between_train_steps": 0.003906965255737305, "step": 205} {"info/global_step": 206, "train_info/time_within_train_step": 2.5236499309539795, "step": 206} {"train_info/time_between_train_steps": 0.003916740417480469, "step": 206} {"info/global_step": 207, "train_info/time_within_train_step": 2.524911642074585, "step": 207} {"train_info/time_between_train_steps": 0.0038728713989257812, "step": 207} {"info/global_step": 208, "train_info/time_within_train_step": 2.524350166320801, "step": 208} {"train_info/time_between_train_steps": 0.003813505172729492, "step": 208} {"info/global_step": 209, "train_info/time_within_train_step": 2.525172472000122, "step": 209} {"train_info/time_between_train_steps": 0.0038704872131347656, "step": 209} {"info/global_step": 210, "train_info/time_within_train_step": 2.5253076553344727, "step": 210} {"train_info/time_between_train_steps": 0.0038361549377441406, "step": 210} {"info/global_step": 211, "train_info/time_within_train_step": 2.5249674320220947, "step": 211} {"train_info/time_between_train_steps": 0.0038039684295654297, "step": 211} {"info/global_step": 212, "train_info/time_within_train_step": 2.525318145751953, "step": 212} {"train_info/time_between_train_steps": 0.0038988590240478516, "step": 212} {"info/global_step": 213, "train_info/time_within_train_step": 2.525144577026367, "step": 213} {"train_info/time_between_train_steps": 0.00377655029296875, "step": 213} {"info/global_step": 214, "train_info/time_within_train_step": 2.5263869762420654, "step": 214} {"train_info/time_between_train_steps": 0.0038013458251953125, "step": 214} {"info/global_step": 215, "train_info/time_within_train_step": 2.899940013885498, "step": 215} {"train_info/time_between_train_steps": 0.003627300262451172, "step": 215} {"info/global_step": 216, "train_info/time_within_train_step": 2.523030996322632, "step": 216} {"train_info/time_between_train_steps": 0.003648996353149414, "step": 216} {"info/global_step": 217, "train_info/time_within_train_step": 2.523030996322632, "step": 217} {"train_info/time_between_train_steps": 0.0035283565521240234, "step": 217} {"info/global_step": 218, "train_info/time_within_train_step": 2.522610664367676, "step": 218} {"train_info/time_between_train_steps": 0.0035643577575683594, "step": 218} {"info/global_step": 219, "train_info/time_within_train_step": 2.5515999794006348, "step": 219} {"train_info/time_between_train_steps": 0.0037050247192382812, "step": 219} {"info/global_step": 220, "train_info/time_within_train_step": 2.5254135131835938, "step": 220} {"train_info/time_between_train_steps": 0.0038161277770996094, "step": 220} {"info/global_step": 221, "train_info/time_within_train_step": 2.5238444805145264, "step": 221} {"train_info/time_between_train_steps": 0.0038602352142333984, "step": 221} {"info/global_step": 222, "train_info/time_within_train_step": 2.5243215560913086, "step": 222} {"train_info/time_between_train_steps": 0.004054069519042969, "step": 222} {"info/global_step": 223, "train_info/time_within_train_step": 2.5237603187561035, "step": 223} {"train_info/time_between_train_steps": 0.0038001537322998047, "step": 223} {"info/global_step": 224, "train_info/time_within_train_step": 2.5244557857513428, "step": 224} {"train_info/time_between_train_steps": 0.003945827484130859, "step": 224} {"info/global_step": 225, "train_info/time_within_train_step": 2.5243802070617676, "step": 225} {"train_info/time_between_train_steps": 0.003985881805419922, "step": 225} {"info/global_step": 226, "train_info/time_within_train_step": 2.524604082107544, "step": 226} {"train_info/time_between_train_steps": 0.003870248794555664, "step": 226} {"info/global_step": 227, "train_info/time_within_train_step": 2.524416923522949, "step": 227} {"train_info/time_between_train_steps": 0.0038003921508789062, "step": 227} {"info/global_step": 228, "train_info/time_within_train_step": 2.5244998931884766, "step": 228} {"train_info/time_between_train_steps": 0.0038194656372070312, "step": 228} {"info/global_step": 229, "train_info/time_within_train_step": 2.524038076400757, "step": 229} {"train_info/time_between_train_steps": 0.003709554672241211, "step": 229} {"info/global_step": 230, "train_info/time_within_train_step": 2.524322509765625, "step": 230} {"train_info/time_between_train_steps": 0.003979682922363281, "step": 230} {"info/global_step": 231, "train_info/time_within_train_step": 2.5248055458068848, "step": 231} {"train_info/time_between_train_steps": 0.0037047863006591797, "step": 231} {"info/global_step": 232, "train_info/time_within_train_step": 2.524268388748169, "step": 232} {"train_info/time_between_train_steps": 0.003883838653564453, "step": 232} {"info/global_step": 233, "train_info/time_within_train_step": 2.5247786045074463, "step": 233} {"train_info/time_between_train_steps": 0.0038628578186035156, "step": 233} {"info/global_step": 234, "train_info/time_within_train_step": 2.525088310241699, "step": 234} {"train_info/time_between_train_steps": 0.0036644935607910156, "step": 234} {"info/global_step": 235, "train_info/time_within_train_step": 2.5238280296325684, "step": 235} {"train_info/time_between_train_steps": 0.0037207603454589844, "step": 235} {"info/global_step": 236, "train_info/time_within_train_step": 2.5235114097595215, "step": 236} {"train_info/time_between_train_steps": 0.003918170928955078, "step": 236} {"info/global_step": 237, "train_info/time_within_train_step": 2.5242648124694824, "step": 237} {"train_info/time_between_train_steps": 0.003656148910522461, "step": 237} {"info/global_step": 238, "train_info/time_within_train_step": 2.523367166519165, "step": 238} {"train_info/time_between_train_steps": 0.0036890506744384766, "step": 238} {"info/global_step": 239, "train_info/time_within_train_step": 2.5239813327789307, "step": 239} {"train_info/time_between_train_steps": 0.003716707229614258, "step": 239} {"info/global_step": 240, "train_info/time_within_train_step": 2.5247251987457275, "step": 240} {"train_info/time_between_train_steps": 0.0036818981170654297, "step": 240} {"info/global_step": 241, "train_info/time_within_train_step": 2.5235254764556885, "step": 241} {"train_info/time_between_train_steps": 0.003709077835083008, "step": 241} {"info/global_step": 242, "train_info/time_within_train_step": 2.5247256755828857, "step": 242} {"train_info/time_between_train_steps": 0.003658771514892578, "step": 242} {"info/global_step": 243, "train_info/time_within_train_step": 2.5230188369750977, "step": 243} {"train_info/time_between_train_steps": 0.003709077835083008, "step": 243} {"info/global_step": 244, "train_info/time_within_train_step": 2.524432897567749, "step": 244} {"train_info/time_between_train_steps": 0.003735065460205078, "step": 244} {"info/global_step": 245, "train_info/time_within_train_step": 2.5242271423339844, "step": 245} {"train_info/time_between_train_steps": 0.0037386417388916016, "step": 245} {"info/global_step": 246, "train_info/time_within_train_step": 2.524707078933716, "step": 246} {"train_info/time_between_train_steps": 0.0038106441497802734, "step": 246} {"info/global_step": 247, "train_info/time_within_train_step": 2.5237855911254883, "step": 247} {"train_info/time_between_train_steps": 0.003844738006591797, "step": 247} {"info/global_step": 248, "train_info/time_within_train_step": 2.524634599685669, "step": 248} {"train_info/time_between_train_steps": 0.0037751197814941406, "step": 248} {"info/global_step": 249, "train_info/time_within_train_step": 2.524965763092041, "step": 249} {"train_info/time_between_train_steps": 0.0037593841552734375, "step": 249} {"info/global_step": 250, "train_info/time_within_train_step": 3.142120599746704, "step": 250} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746323646, "_runtime": 694}, "step": 250} {"logs": {"train/loss": 5.9876, "train/learning_rate": 0.0005, "train/epoch": 0.08, "_timestamp": 1746323646, "_runtime": 694}, "step": 250} {"train_info/time_between_train_steps": 0.21280217170715332, "step": 250} {"info/global_step": 251, "train_info/time_within_train_step": 2.524301052093506, "step": 251} {"train_info/time_between_train_steps": 0.0036416053771972656, "step": 251} {"info/global_step": 252, "train_info/time_within_train_step": 2.524177312850952, "step": 252} {"train_info/time_between_train_steps": 0.003667116165161133, "step": 252} {"info/global_step": 253, "train_info/time_within_train_step": 2.5230350494384766, "step": 253} {"train_info/time_between_train_steps": 0.003559112548828125, "step": 253} {"info/global_step": 254, "train_info/time_within_train_step": 2.523852825164795, "step": 254} {"train_info/time_between_train_steps": 0.0036020278930664062, "step": 254} {"info/global_step": 255, "train_info/time_within_train_step": 2.5238828659057617, "step": 255} {"train_info/time_between_train_steps": 0.003725290298461914, "step": 255} {"info/global_step": 256, "train_info/time_within_train_step": 2.523322820663452, "step": 256} {"train_info/time_between_train_steps": 0.003898143768310547, "step": 256} {"info/global_step": 257, "train_info/time_within_train_step": 2.524163007736206, "step": 257} {"train_info/time_between_train_steps": 0.003802776336669922, "step": 257} {"info/global_step": 258, "train_info/time_within_train_step": 2.5241587162017822, "step": 258} {"train_info/time_between_train_steps": 0.0038776397705078125, "step": 258} {"info/global_step": 259, "train_info/time_within_train_step": 2.5248935222625732, "step": 259} {"train_info/time_between_train_steps": 0.0038306713104248047, "step": 259} {"info/global_step": 260, "train_info/time_within_train_step": 2.5250275135040283, "step": 260} {"train_info/time_between_train_steps": 0.0038475990295410156, "step": 260} {"info/global_step": 261, "train_info/time_within_train_step": 2.5245702266693115, "step": 261} {"train_info/time_between_train_steps": 0.0037894248962402344, "step": 261} {"info/global_step": 262, "train_info/time_within_train_step": 2.52486515045166, "step": 262} {"train_info/time_between_train_steps": 0.0037539005279541016, "step": 262} {"info/global_step": 263, "train_info/time_within_train_step": 2.524618148803711, "step": 263} {"train_info/time_between_train_steps": 0.003765106201171875, "step": 263} {"info/global_step": 264, "train_info/time_within_train_step": 2.523280382156372, "step": 264} {"train_info/time_between_train_steps": 0.003768444061279297, "step": 264} {"info/global_step": 265, "train_info/time_within_train_step": 2.5237059593200684, "step": 265} {"train_info/time_between_train_steps": 0.0037224292755126953, "step": 265} {"info/global_step": 266, "train_info/time_within_train_step": 2.523789882659912, "step": 266} {"train_info/time_between_train_steps": 0.0037810802459716797, "step": 266} {"info/global_step": 267, "train_info/time_within_train_step": 2.523987293243408, "step": 267} {"train_info/time_between_train_steps": 0.003743410110473633, "step": 267} {"info/global_step": 268, "train_info/time_within_train_step": 2.525658130645752, "step": 268} {"train_info/time_between_train_steps": 0.00382232666015625, "step": 268} {"info/global_step": 269, "train_info/time_within_train_step": 2.5247206687927246, "step": 269} {"train_info/time_between_train_steps": 0.0037555694580078125, "step": 269} {"info/global_step": 270, "train_info/time_within_train_step": 2.5237152576446533, "step": 270} {"train_info/time_between_train_steps": 0.0037806034088134766, "step": 270} {"info/global_step": 271, "train_info/time_within_train_step": 2.523876905441284, "step": 271} {"train_info/time_between_train_steps": 0.0037522315979003906, "step": 271} {"info/global_step": 272, "train_info/time_within_train_step": 2.524204730987549, "step": 272} {"train_info/time_between_train_steps": 0.003756999969482422, "step": 272} {"info/global_step": 273, "train_info/time_within_train_step": 2.5236282348632812, "step": 273} {"train_info/time_between_train_steps": 0.0037660598754882812, "step": 273} {"info/global_step": 274, "train_info/time_within_train_step": 2.5236215591430664, "step": 274} {"train_info/time_between_train_steps": 0.00370025634765625, "step": 274} {"info/global_step": 275, "train_info/time_within_train_step": 2.523756265640259, "step": 275} {"train_info/time_between_train_steps": 0.0037865638732910156, "step": 275} {"info/global_step": 276, "train_info/time_within_train_step": 2.5261354446411133, "step": 276} {"train_info/time_between_train_steps": 0.003972053527832031, "step": 276} {"info/global_step": 277, "train_info/time_within_train_step": 2.5252583026885986, "step": 277} {"train_info/time_between_train_steps": 0.0037670135498046875, "step": 277} {"info/global_step": 278, "train_info/time_within_train_step": 2.524000883102417, "step": 278} {"train_info/time_between_train_steps": 0.0037856101989746094, "step": 278} {"info/global_step": 279, "train_info/time_within_train_step": 2.5250163078308105, "step": 279} {"train_info/time_between_train_steps": 0.003875255584716797, "step": 279} {"info/global_step": 280, "train_info/time_within_train_step": 2.5252842903137207, "step": 280} {"train_info/time_between_train_steps": 0.003914594650268555, "step": 280} {"info/global_step": 281, "train_info/time_within_train_step": 2.524594783782959, "step": 281} {"train_info/time_between_train_steps": 0.0038001537322998047, "step": 281} {"info/global_step": 282, "train_info/time_within_train_step": 2.5244786739349365, "step": 282} {"train_info/time_between_train_steps": 0.003852367401123047, "step": 282} {"info/global_step": 283, "train_info/time_within_train_step": 2.5246975421905518, "step": 283} {"train_info/time_between_train_steps": 0.0040705204010009766, "step": 283} {"info/global_step": 284, "train_info/time_within_train_step": 2.5250680446624756, "step": 284} {"train_info/time_between_train_steps": 0.003815889358520508, "step": 284} {"info/global_step": 285, "train_info/time_within_train_step": 2.5240557193756104, "step": 285} {"train_info/time_between_train_steps": 0.0037360191345214844, "step": 285} {"info/global_step": 286, "train_info/time_within_train_step": 2.5222997665405273, "step": 286} {"train_info/time_between_train_steps": 0.003786802291870117, "step": 286} {"info/global_step": 287, "train_info/time_within_train_step": 2.5222740173339844, "step": 287} {"train_info/time_between_train_steps": 0.003977060317993164, "step": 287} {"info/global_step": 288, "train_info/time_within_train_step": 2.5222764015197754, "step": 288} {"train_info/time_between_train_steps": 0.0036649703979492188, "step": 288} {"info/global_step": 289, "train_info/time_within_train_step": 2.522500514984131, "step": 289} {"train_info/time_between_train_steps": 0.0040090084075927734, "step": 289} {"info/global_step": 290, "train_info/time_within_train_step": 2.5224978923797607, "step": 290} {"train_info/time_between_train_steps": 0.0039005279541015625, "step": 290} {"info/global_step": 291, "train_info/time_within_train_step": 2.522103786468506, "step": 291} {"train_info/time_between_train_steps": 0.0038976669311523438, "step": 291} {"info/global_step": 292, "train_info/time_within_train_step": 2.5226998329162598, "step": 292} {"train_info/time_between_train_steps": 0.0037271976470947266, "step": 292} {"info/global_step": 293, "train_info/time_within_train_step": 2.5236730575561523, "step": 293} {"train_info/time_between_train_steps": 0.0038957595825195312, "step": 293} {"info/global_step": 294, "train_info/time_within_train_step": 2.523916721343994, "step": 294} {"train_info/time_between_train_steps": 0.003855466842651367, "step": 294} {"info/global_step": 295, "train_info/time_within_train_step": 2.523303508758545, "step": 295} {"train_info/time_between_train_steps": 0.0037736892700195312, "step": 295} {"info/global_step": 296, "train_info/time_within_train_step": 2.523552894592285, "step": 296} {"train_info/time_between_train_steps": 0.0037729740142822266, "step": 296} {"info/global_step": 297, "train_info/time_within_train_step": 2.523563861846924, "step": 297} {"train_info/time_between_train_steps": 0.003693819046020508, "step": 297} {"info/global_step": 298, "train_info/time_within_train_step": 2.884357213973999, "step": 298} {"train_info/time_between_train_steps": 0.0036835670471191406, "step": 298} {"info/global_step": 299, "train_info/time_within_train_step": 2.5215721130371094, "step": 299} {"train_info/time_between_train_steps": 0.0037322044372558594, "step": 299} {"info/global_step": 300, "train_info/time_within_train_step": 2.522324323654175, "step": 300} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746323774, "_runtime": 822}, "step": 300} {"logs": {"train/loss": 5.835, "train/learning_rate": 0.0006, "train/epoch": 0.1, "_timestamp": 1746323774, "_runtime": 822}, "step": 300} {"train_info/time_between_train_steps": 19.073710203170776, "step": 300} {"info/global_step": 301, "train_info/time_within_train_step": 2.336406707763672, "step": 301} {"train_info/time_between_train_steps": 0.0037734508514404297, "step": 301} {"info/global_step": 302, "train_info/time_within_train_step": 2.321387767791748, "step": 302} {"train_info/time_between_train_steps": 0.003672361373901367, "step": 302} {"info/global_step": 303, "train_info/time_within_train_step": 2.4726767539978027, "step": 303} {"train_info/time_between_train_steps": 0.0037889480590820312, "step": 303} {"info/global_step": 304, "train_info/time_within_train_step": 2.5208568572998047, "step": 304} {"train_info/time_between_train_steps": 0.003899097442626953, "step": 304} {"info/global_step": 305, "train_info/time_within_train_step": 2.5204052925109863, "step": 305} {"train_info/time_between_train_steps": 0.003655672073364258, "step": 305} {"info/global_step": 306, "train_info/time_within_train_step": 2.522019624710083, "step": 306} {"train_info/time_between_train_steps": 0.0036847591400146484, "step": 306} {"info/global_step": 307, "train_info/time_within_train_step": 2.5218231678009033, "step": 307} {"train_info/time_between_train_steps": 0.003803730010986328, "step": 307} {"info/global_step": 308, "train_info/time_within_train_step": 2.522517442703247, "step": 308} {"train_info/time_between_train_steps": 0.003908395767211914, "step": 308} {"info/global_step": 309, "train_info/time_within_train_step": 2.5218894481658936, "step": 309} {"train_info/time_between_train_steps": 0.0038843154907226562, "step": 309} {"info/global_step": 310, "train_info/time_within_train_step": 2.5231244564056396, "step": 310} {"train_info/time_between_train_steps": 0.0036458969116210938, "step": 310} {"info/global_step": 311, "train_info/time_within_train_step": 2.522054433822632, "step": 311} {"train_info/time_between_train_steps": 0.0038712024688720703, "step": 311} {"info/global_step": 312, "train_info/time_within_train_step": 2.5271148681640625, "step": 312} {"train_info/time_between_train_steps": 0.003654003143310547, "step": 312} {"info/global_step": 313, "train_info/time_within_train_step": 2.692605972290039, "step": 313} {"train_info/time_between_train_steps": 0.0035059452056884766, "step": 313} {"info/global_step": 314, "train_info/time_within_train_step": 2.522874593734741, "step": 314} {"train_info/time_between_train_steps": 0.0035495758056640625, "step": 314} {"info/global_step": 315, "train_info/time_within_train_step": 2.522003412246704, "step": 315} {"train_info/time_between_train_steps": 0.003480672836303711, "step": 315} {"info/global_step": 316, "train_info/time_within_train_step": 2.5221848487854004, "step": 316} {"train_info/time_between_train_steps": 0.0034666061401367188, "step": 316} {"info/global_step": 317, "train_info/time_within_train_step": 2.523045063018799, "step": 317} {"train_info/time_between_train_steps": 0.0034923553466796875, "step": 317} {"info/global_step": 318, "train_info/time_within_train_step": 2.523045301437378, "step": 318} {"train_info/time_between_train_steps": 0.003675222396850586, "step": 318} {"info/global_step": 319, "train_info/time_within_train_step": 2.522102117538452, "step": 319} {"train_info/time_between_train_steps": 0.003462553024291992, "step": 319} {"info/global_step": 320, "train_info/time_within_train_step": 2.522675037384033, "step": 320} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 320} {"info/global_step": 321, "train_info/time_within_train_step": 2.522710084915161, "step": 321} {"train_info/time_between_train_steps": 0.0034894943237304688, "step": 321} {"info/global_step": 322, "train_info/time_within_train_step": 2.523216485977173, "step": 322} {"train_info/time_between_train_steps": 0.003527402877807617, "step": 322} {"info/global_step": 323, "train_info/time_within_train_step": 2.5232489109039307, "step": 323} {"train_info/time_between_train_steps": 0.003652811050415039, "step": 323} {"info/global_step": 324, "train_info/time_within_train_step": 2.5227887630462646, "step": 324} {"train_info/time_between_train_steps": 0.003606081008911133, "step": 324} {"info/global_step": 325, "train_info/time_within_train_step": 2.5226683616638184, "step": 325} {"train_info/time_between_train_steps": 0.0034453868865966797, "step": 325} {"info/global_step": 326, "train_info/time_within_train_step": 2.5222008228302, "step": 326} {"train_info/time_between_train_steps": 0.003499269485473633, "step": 326} {"info/global_step": 327, "train_info/time_within_train_step": 2.5213842391967773, "step": 327} {"train_info/time_between_train_steps": 0.003389596939086914, "step": 327} {"info/global_step": 328, "train_info/time_within_train_step": 2.5223517417907715, "step": 328} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 328} {"info/global_step": 329, "train_info/time_within_train_step": 2.522203207015991, "step": 329} {"train_info/time_between_train_steps": 0.0035109519958496094, "step": 329} {"info/global_step": 330, "train_info/time_within_train_step": 2.5219438076019287, "step": 330} {"train_info/time_between_train_steps": 0.003520965576171875, "step": 330} {"info/global_step": 331, "train_info/time_within_train_step": 2.5219619274139404, "step": 331} {"train_info/time_between_train_steps": 0.0037016868591308594, "step": 331} {"info/global_step": 332, "train_info/time_within_train_step": 2.5234296321868896, "step": 332} {"train_info/time_between_train_steps": 0.0034744739532470703, "step": 332} {"info/global_step": 333, "train_info/time_within_train_step": 2.522382974624634, "step": 333} {"train_info/time_between_train_steps": 0.0034360885620117188, "step": 333} {"info/global_step": 334, "train_info/time_within_train_step": 2.521559238433838, "step": 334} {"train_info/time_between_train_steps": 0.003596782684326172, "step": 334} {"info/global_step": 335, "train_info/time_within_train_step": 2.5225086212158203, "step": 335} {"train_info/time_between_train_steps": 0.0034737586975097656, "step": 335} {"info/global_step": 336, "train_info/time_within_train_step": 2.5225014686584473, "step": 336} {"train_info/time_between_train_steps": 0.003461599349975586, "step": 336} {"info/global_step": 337, "train_info/time_within_train_step": 2.8239541053771973, "step": 337} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 337} {"info/global_step": 338, "train_info/time_within_train_step": 2.52305006980896, "step": 338} {"train_info/time_between_train_steps": 0.003388643264770508, "step": 338} {"info/global_step": 339, "train_info/time_within_train_step": 2.52294921875, "step": 339} {"train_info/time_between_train_steps": 0.0036916732788085938, "step": 339} {"info/global_step": 340, "train_info/time_within_train_step": 2.522212028503418, "step": 340} {"train_info/time_between_train_steps": 0.00391077995300293, "step": 340} {"info/global_step": 341, "train_info/time_within_train_step": 2.5219123363494873, "step": 341} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 341} {"info/global_step": 342, "train_info/time_within_train_step": 2.522087574005127, "step": 342} {"train_info/time_between_train_steps": 0.003391265869140625, "step": 342} {"info/global_step": 343, "train_info/time_within_train_step": 2.522874355316162, "step": 343} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 343} {"info/global_step": 344, "train_info/time_within_train_step": 2.5219295024871826, "step": 344} {"train_info/time_between_train_steps": 0.0033926963806152344, "step": 344} {"info/global_step": 345, "train_info/time_within_train_step": 2.521507740020752, "step": 345} {"train_info/time_between_train_steps": 0.003660917282104492, "step": 345} {"info/global_step": 346, "train_info/time_within_train_step": 2.5222158432006836, "step": 346} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 346} {"info/global_step": 347, "train_info/time_within_train_step": 2.521900177001953, "step": 347} {"train_info/time_between_train_steps": 0.0033855438232421875, "step": 347} {"info/global_step": 348, "train_info/time_within_train_step": 2.52116060256958, "step": 348} {"train_info/time_between_train_steps": 0.003465414047241211, "step": 348} {"info/global_step": 349, "train_info/time_within_train_step": 2.522576093673706, "step": 349} {"train_info/time_between_train_steps": 0.003501415252685547, "step": 349} {"info/global_step": 350, "train_info/time_within_train_step": 2.522343397140503, "step": 350} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746323920, "_runtime": 968}, "step": 350} {"logs": {"train/loss": 5.6973, "train/learning_rate": 0.0005888888888888889, "train/epoch": 0.12, "_timestamp": 1746323920, "_runtime": 968}, "step": 350} {"train_info/time_between_train_steps": 0.024235248565673828, "step": 350} {"info/global_step": 351, "train_info/time_within_train_step": 2.5215933322906494, "step": 351} {"train_info/time_between_train_steps": 0.0035691261291503906, "step": 351} {"info/global_step": 352, "train_info/time_within_train_step": 2.522514581680298, "step": 352} {"train_info/time_between_train_steps": 0.003429889678955078, "step": 352} {"info/global_step": 353, "train_info/time_within_train_step": 2.52190899848938, "step": 353} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 353} {"info/global_step": 354, "train_info/time_within_train_step": 2.523010730743408, "step": 354} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 354} {"info/global_step": 355, "train_info/time_within_train_step": 2.522369384765625, "step": 355} {"train_info/time_between_train_steps": 0.003424406051635742, "step": 355} {"info/global_step": 356, "train_info/time_within_train_step": 2.522033452987671, "step": 356} {"train_info/time_between_train_steps": 0.0034134387969970703, "step": 356} {"info/global_step": 357, "train_info/time_within_train_step": 2.5226690769195557, "step": 357} {"train_info/time_between_train_steps": 0.0034568309783935547, "step": 357} {"info/global_step": 358, "train_info/time_within_train_step": 2.5219497680664062, "step": 358} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 358} {"info/global_step": 359, "train_info/time_within_train_step": 2.5232932567596436, "step": 359} {"train_info/time_between_train_steps": 0.0035817623138427734, "step": 359} {"info/global_step": 360, "train_info/time_within_train_step": 2.5234131813049316, "step": 360} {"train_info/time_between_train_steps": 0.00354766845703125, "step": 360} {"info/global_step": 361, "train_info/time_within_train_step": 2.5228869915008545, "step": 361} {"train_info/time_between_train_steps": 0.003501415252685547, "step": 361} {"info/global_step": 362, "train_info/time_within_train_step": 2.523489236831665, "step": 362} {"train_info/time_between_train_steps": 0.00344085693359375, "step": 362} {"info/global_step": 363, "train_info/time_within_train_step": 2.521601915359497, "step": 363} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 363} {"info/global_step": 364, "train_info/time_within_train_step": 2.5224575996398926, "step": 364} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 364} {"info/global_step": 365, "train_info/time_within_train_step": 2.521223306655884, "step": 365} {"train_info/time_between_train_steps": 0.0033998489379882812, "step": 365} {"info/global_step": 366, "train_info/time_within_train_step": 2.526271343231201, "step": 366} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 366} {"info/global_step": 367, "train_info/time_within_train_step": 2.5218636989593506, "step": 367} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 367} {"info/global_step": 368, "train_info/time_within_train_step": 2.521629571914673, "step": 368} {"train_info/time_between_train_steps": 0.0033767223358154297, "step": 368} {"info/global_step": 369, "train_info/time_within_train_step": 2.52167010307312, "step": 369} {"train_info/time_between_train_steps": 0.003390789031982422, "step": 369} {"info/global_step": 370, "train_info/time_within_train_step": 2.521542549133301, "step": 370} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 370} {"info/global_step": 371, "train_info/time_within_train_step": 2.5493998527526855, "step": 371} {"train_info/time_between_train_steps": 0.0034513473510742188, "step": 371} {"info/global_step": 372, "train_info/time_within_train_step": 2.5218284130096436, "step": 372} {"train_info/time_between_train_steps": 0.0034859180450439453, "step": 372} {"info/global_step": 373, "train_info/time_within_train_step": 2.522090435028076, "step": 373} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 373} {"info/global_step": 374, "train_info/time_within_train_step": 2.522092342376709, "step": 374} {"train_info/time_between_train_steps": 0.003498554229736328, "step": 374} {"info/global_step": 375, "train_info/time_within_train_step": 2.521374225616455, "step": 375} {"train_info/time_between_train_steps": 0.12241077423095703, "step": 375} {"info/global_step": 376, "train_info/time_within_train_step": 2.5219123363494873, "step": 376} {"train_info/time_between_train_steps": 0.0033736228942871094, "step": 376} {"info/global_step": 377, "train_info/time_within_train_step": 2.521848678588867, "step": 377} {"train_info/time_between_train_steps": 0.0034792423248291016, "step": 377} {"info/global_step": 378, "train_info/time_within_train_step": 2.5212059020996094, "step": 378} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 378} {"info/global_step": 379, "train_info/time_within_train_step": 2.5215439796447754, "step": 379} {"train_info/time_between_train_steps": 0.0035238265991210938, "step": 379} {"info/global_step": 380, "train_info/time_within_train_step": 2.5211410522460938, "step": 380} {"train_info/time_between_train_steps": 0.0036559104919433594, "step": 380} {"info/global_step": 381, "train_info/time_within_train_step": 2.521637201309204, "step": 381} {"train_info/time_between_train_steps": 0.003469705581665039, "step": 381} {"info/global_step": 382, "train_info/time_within_train_step": 2.5215201377868652, "step": 382} {"train_info/time_between_train_steps": 0.0034248828887939453, "step": 382} {"info/global_step": 383, "train_info/time_within_train_step": 2.5217316150665283, "step": 383} {"train_info/time_between_train_steps": 0.0033845901489257812, "step": 383} {"info/global_step": 384, "train_info/time_within_train_step": 2.521836519241333, "step": 384} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 384} {"info/global_step": 385, "train_info/time_within_train_step": 2.5226151943206787, "step": 385} {"train_info/time_between_train_steps": 0.0035600662231445312, "step": 385} {"info/global_step": 386, "train_info/time_within_train_step": 2.521529197692871, "step": 386} {"train_info/time_between_train_steps": 0.003470897674560547, "step": 386} {"info/global_step": 387, "train_info/time_within_train_step": 2.5207297801971436, "step": 387} {"train_info/time_between_train_steps": 0.003451824188232422, "step": 387} {"info/global_step": 388, "train_info/time_within_train_step": 2.5216896533966064, "step": 388} {"train_info/time_between_train_steps": 0.0033736228942871094, "step": 388} {"info/global_step": 389, "train_info/time_within_train_step": 2.5216541290283203, "step": 389} {"train_info/time_between_train_steps": 0.003641843795776367, "step": 389} {"info/global_step": 390, "train_info/time_within_train_step": 2.521697521209717, "step": 390} {"train_info/time_between_train_steps": 0.003402233123779297, "step": 390} {"info/global_step": 391, "train_info/time_within_train_step": 2.5223500728607178, "step": 391} {"train_info/time_between_train_steps": 0.0035448074340820312, "step": 391} {"info/global_step": 392, "train_info/time_within_train_step": 2.5219056606292725, "step": 392} {"train_info/time_between_train_steps": 0.00354766845703125, "step": 392} {"info/global_step": 393, "train_info/time_within_train_step": 2.522228479385376, "step": 393} {"train_info/time_between_train_steps": 0.0035195350646972656, "step": 393} {"info/global_step": 394, "train_info/time_within_train_step": 2.52215313911438, "step": 394} {"train_info/time_between_train_steps": 0.0034542083740234375, "step": 394} {"info/global_step": 395, "train_info/time_within_train_step": 2.5230071544647217, "step": 395} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 395} {"info/global_step": 396, "train_info/time_within_train_step": 2.5220909118652344, "step": 396} {"train_info/time_between_train_steps": 0.0033626556396484375, "step": 396} {"info/global_step": 397, "train_info/time_within_train_step": 2.522087335586548, "step": 397} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 397} {"info/global_step": 398, "train_info/time_within_train_step": 2.5222244262695312, "step": 398} {"train_info/time_between_train_steps": 0.003481149673461914, "step": 398} {"info/global_step": 399, "train_info/time_within_train_step": 2.5226707458496094, "step": 399} {"train_info/time_between_train_steps": 0.003576040267944336, "step": 399} {"info/global_step": 400, "train_info/time_within_train_step": 2.5508289337158203, "step": 400} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746324048, "_runtime": 1096}, "step": 400} {"logs": {"train/loss": 5.5651, "train/learning_rate": 0.0005777777777777776, "train/epoch": 0.13, "_timestamp": 1746324048, "_runtime": 1096}, "step": 400} {"train_info/time_between_train_steps": 12.375494480133057, "step": 400} {"info/global_step": 401, "train_info/time_within_train_step": 2.3301568031311035, "step": 401} {"train_info/time_between_train_steps": 0.0036525726318359375, "step": 401} {"info/global_step": 402, "train_info/time_within_train_step": 2.3298850059509277, "step": 402} {"train_info/time_between_train_steps": 0.003495931625366211, "step": 402} {"info/global_step": 403, "train_info/time_within_train_step": 2.5068163871765137, "step": 403} {"train_info/time_between_train_steps": 0.0035746097564697266, "step": 403} {"info/global_step": 404, "train_info/time_within_train_step": 2.520017623901367, "step": 404} {"train_info/time_between_train_steps": 0.0033953189849853516, "step": 404} {"info/global_step": 405, "train_info/time_within_train_step": 2.5205633640289307, "step": 405} {"train_info/time_between_train_steps": 0.00359344482421875, "step": 405} {"info/global_step": 406, "train_info/time_within_train_step": 2.521210193634033, "step": 406} {"train_info/time_between_train_steps": 0.0034682750701904297, "step": 406} {"info/global_step": 407, "train_info/time_within_train_step": 2.521876573562622, "step": 407} {"train_info/time_between_train_steps": 0.003437519073486328, "step": 407} {"info/global_step": 408, "train_info/time_within_train_step": 2.521500825881958, "step": 408} {"train_info/time_between_train_steps": 0.0034990310668945312, "step": 408} {"info/global_step": 409, "train_info/time_within_train_step": 2.5221478939056396, "step": 409} {"train_info/time_between_train_steps": 0.0034978389739990234, "step": 409} {"info/global_step": 410, "train_info/time_within_train_step": 2.7668018341064453, "step": 410} {"train_info/time_between_train_steps": 0.0034036636352539062, "step": 410} {"info/global_step": 411, "train_info/time_within_train_step": 2.522148370742798, "step": 411} {"train_info/time_between_train_steps": 0.003492116928100586, "step": 411} {"info/global_step": 412, "train_info/time_within_train_step": 2.5222408771514893, "step": 412} {"train_info/time_between_train_steps": 0.0034837722778320312, "step": 412} {"info/global_step": 413, "train_info/time_within_train_step": 2.52190899848938, "step": 413} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 413} {"info/global_step": 414, "train_info/time_within_train_step": 2.523120403289795, "step": 414} {"train_info/time_between_train_steps": 0.0034487247467041016, "step": 414} {"info/global_step": 415, "train_info/time_within_train_step": 2.5226900577545166, "step": 415} {"train_info/time_between_train_steps": 0.0034079551696777344, "step": 415} {"info/global_step": 416, "train_info/time_within_train_step": 2.527520179748535, "step": 416} {"train_info/time_between_train_steps": 0.0033948421478271484, "step": 416} {"info/global_step": 417, "train_info/time_within_train_step": 2.522738456726074, "step": 417} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 417} {"info/global_step": 418, "train_info/time_within_train_step": 2.523081064224243, "step": 418} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 418} {"info/global_step": 419, "train_info/time_within_train_step": 2.522747278213501, "step": 419} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 419} {"info/global_step": 420, "train_info/time_within_train_step": 2.5225272178649902, "step": 420} {"train_info/time_between_train_steps": 0.0034122467041015625, "step": 420} {"info/global_step": 421, "train_info/time_within_train_step": 2.522280216217041, "step": 421} {"train_info/time_between_train_steps": 0.003421306610107422, "step": 421} {"info/global_step": 422, "train_info/time_within_train_step": 2.5229642391204834, "step": 422} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 422} {"info/global_step": 423, "train_info/time_within_train_step": 2.5227231979370117, "step": 423} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 423} {"info/global_step": 424, "train_info/time_within_train_step": 2.5223309993743896, "step": 424} {"train_info/time_between_train_steps": 0.003953218460083008, "step": 424} {"info/global_step": 425, "train_info/time_within_train_step": 2.522677421569824, "step": 425} {"train_info/time_between_train_steps": 0.0033960342407226562, "step": 425} {"info/global_step": 426, "train_info/time_within_train_step": 2.5229294300079346, "step": 426} {"train_info/time_between_train_steps": 0.00339508056640625, "step": 426} {"info/global_step": 427, "train_info/time_within_train_step": 2.523292303085327, "step": 427} {"train_info/time_between_train_steps": 0.003415346145629883, "step": 427} {"info/global_step": 428, "train_info/time_within_train_step": 2.5230448246002197, "step": 428} {"train_info/time_between_train_steps": 0.003412008285522461, "step": 428} {"info/global_step": 429, "train_info/time_within_train_step": 2.522562026977539, "step": 429} {"train_info/time_between_train_steps": 0.003428220748901367, "step": 429} {"info/global_step": 430, "train_info/time_within_train_step": 2.5220675468444824, "step": 430} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 430} {"info/global_step": 431, "train_info/time_within_train_step": 2.52236270904541, "step": 431} {"train_info/time_between_train_steps": 0.003431558609008789, "step": 431} {"info/global_step": 432, "train_info/time_within_train_step": 2.5222463607788086, "step": 432} {"train_info/time_between_train_steps": 0.0034003257751464844, "step": 432} {"info/global_step": 433, "train_info/time_within_train_step": 2.522416353225708, "step": 433} {"train_info/time_between_train_steps": 0.0033881664276123047, "step": 433} {"info/global_step": 434, "train_info/time_within_train_step": 2.5223805904388428, "step": 434} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 434} {"info/global_step": 435, "train_info/time_within_train_step": 2.5226705074310303, "step": 435} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 435} {"info/global_step": 436, "train_info/time_within_train_step": 2.52197265625, "step": 436} {"train_info/time_between_train_steps": 0.003437519073486328, "step": 436} {"info/global_step": 437, "train_info/time_within_train_step": 2.5226340293884277, "step": 437} {"train_info/time_between_train_steps": 0.0033791065216064453, "step": 437} {"info/global_step": 438, "train_info/time_within_train_step": 2.6424031257629395, "step": 438} {"train_info/time_between_train_steps": 0.0034422874450683594, "step": 438} {"info/global_step": 439, "train_info/time_within_train_step": 2.522759199142456, "step": 439} {"train_info/time_between_train_steps": 0.003402233123779297, "step": 439} {"info/global_step": 440, "train_info/time_within_train_step": 2.52189302444458, "step": 440} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 440} {"info/global_step": 441, "train_info/time_within_train_step": 2.5225706100463867, "step": 441} {"train_info/time_between_train_steps": 0.003452777862548828, "step": 441} {"info/global_step": 442, "train_info/time_within_train_step": 2.5227503776550293, "step": 442} {"train_info/time_between_train_steps": 0.003459930419921875, "step": 442} {"info/global_step": 443, "train_info/time_within_train_step": 2.5224180221557617, "step": 443} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 443} {"info/global_step": 444, "train_info/time_within_train_step": 2.5228323936462402, "step": 444} {"train_info/time_between_train_steps": 0.003407001495361328, "step": 444} {"info/global_step": 445, "train_info/time_within_train_step": 2.5231056213378906, "step": 445} {"train_info/time_between_train_steps": 0.0034971237182617188, "step": 445} {"info/global_step": 446, "train_info/time_within_train_step": 2.5230298042297363, "step": 446} {"train_info/time_between_train_steps": 0.0034952163696289062, "step": 446} {"info/global_step": 447, "train_info/time_within_train_step": 2.5239410400390625, "step": 447} {"train_info/time_between_train_steps": 0.003491640090942383, "step": 447} {"info/global_step": 448, "train_info/time_within_train_step": 2.5237393379211426, "step": 448} {"train_info/time_between_train_steps": 0.0038950443267822266, "step": 448} {"info/global_step": 449, "train_info/time_within_train_step": 2.5297725200653076, "step": 449} {"train_info/time_between_train_steps": 0.003912448883056641, "step": 449} {"info/global_step": 450, "train_info/time_within_train_step": 2.524444341659546, "step": 450} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746324187, "_runtime": 1235}, "step": 450} {"logs": {"train/loss": 5.4644, "train/learning_rate": 0.0005666666666666666, "train/epoch": 0.15, "_timestamp": 1746324187, "_runtime": 1235}, "step": 450} {"train_info/time_between_train_steps": 0.025624752044677734, "step": 450} {"info/global_step": 451, "train_info/time_within_train_step": 2.5246708393096924, "step": 451} {"train_info/time_between_train_steps": 0.003803730010986328, "step": 451} {"info/global_step": 452, "train_info/time_within_train_step": 2.523423671722412, "step": 452} {"train_info/time_between_train_steps": 0.0038466453552246094, "step": 452} {"info/global_step": 453, "train_info/time_within_train_step": 2.5240705013275146, "step": 453} {"train_info/time_between_train_steps": 0.0037488937377929688, "step": 453} {"info/global_step": 454, "train_info/time_within_train_step": 2.5241641998291016, "step": 454} {"train_info/time_between_train_steps": 0.00385284423828125, "step": 454} {"info/global_step": 455, "train_info/time_within_train_step": 2.5235393047332764, "step": 455} {"train_info/time_between_train_steps": 0.003786802291870117, "step": 455} {"info/global_step": 456, "train_info/time_within_train_step": 2.5237467288970947, "step": 456} {"train_info/time_between_train_steps": 0.0038459300994873047, "step": 456} {"info/global_step": 457, "train_info/time_within_train_step": 2.523952007293701, "step": 457} {"train_info/time_between_train_steps": 0.003805875778198242, "step": 457} {"info/global_step": 458, "train_info/time_within_train_step": 2.523721933364868, "step": 458} {"train_info/time_between_train_steps": 0.003833770751953125, "step": 458} {"info/global_step": 459, "train_info/time_within_train_step": 2.523637533187866, "step": 459} {"train_info/time_between_train_steps": 0.0037419795989990234, "step": 459} {"info/global_step": 460, "train_info/time_within_train_step": 2.5236406326293945, "step": 460} {"train_info/time_between_train_steps": 0.00389862060546875, "step": 460} {"info/global_step": 461, "train_info/time_within_train_step": 2.5522494316101074, "step": 461} {"train_info/time_between_train_steps": 0.003888368606567383, "step": 461} {"info/global_step": 462, "train_info/time_within_train_step": 2.5252673625946045, "step": 462} {"train_info/time_between_train_steps": 0.0038847923278808594, "step": 462} {"info/global_step": 463, "train_info/time_within_train_step": 2.524930953979492, "step": 463} {"train_info/time_between_train_steps": 0.0038678646087646484, "step": 463} {"info/global_step": 464, "train_info/time_within_train_step": 2.5245063304901123, "step": 464} {"train_info/time_between_train_steps": 0.003861665725708008, "step": 464} {"info/global_step": 465, "train_info/time_within_train_step": 2.5240769386291504, "step": 465} {"train_info/time_between_train_steps": 0.0038907527923583984, "step": 465} {"info/global_step": 466, "train_info/time_within_train_step": 2.553179979324341, "step": 466} {"train_info/time_between_train_steps": 0.0038797855377197266, "step": 466} {"info/global_step": 467, "train_info/time_within_train_step": 2.5250742435455322, "step": 467} {"train_info/time_between_train_steps": 0.003877878189086914, "step": 467} {"info/global_step": 468, "train_info/time_within_train_step": 2.5233194828033447, "step": 468} {"train_info/time_between_train_steps": 0.0039501190185546875, "step": 468} {"info/global_step": 469, "train_info/time_within_train_step": 2.5242257118225098, "step": 469} {"train_info/time_between_train_steps": 0.003880739212036133, "step": 469} {"info/global_step": 470, "train_info/time_within_train_step": 2.5245397090911865, "step": 470} {"train_info/time_between_train_steps": 0.0038106441497802734, "step": 470} {"info/global_step": 471, "train_info/time_within_train_step": 2.525977373123169, "step": 471} {"train_info/time_between_train_steps": 0.003836393356323242, "step": 471} {"info/global_step": 472, "train_info/time_within_train_step": 2.5241453647613525, "step": 472} {"train_info/time_between_train_steps": 0.003828763961791992, "step": 472} {"info/global_step": 473, "train_info/time_within_train_step": 2.5250184535980225, "step": 473} {"train_info/time_between_train_steps": 0.003907918930053711, "step": 473} {"info/global_step": 474, "train_info/time_within_train_step": 2.530330181121826, "step": 474} {"train_info/time_between_train_steps": 0.003978252410888672, "step": 474} {"info/global_step": 475, "train_info/time_within_train_step": 2.5257935523986816, "step": 475} {"train_info/time_between_train_steps": 0.003951549530029297, "step": 475} {"info/global_step": 476, "train_info/time_within_train_step": 2.5246527194976807, "step": 476} {"train_info/time_between_train_steps": 0.0039064884185791016, "step": 476} {"info/global_step": 477, "train_info/time_within_train_step": 2.5248043537139893, "step": 477} {"train_info/time_between_train_steps": 0.003851652145385742, "step": 477} {"info/global_step": 478, "train_info/time_within_train_step": 2.5255134105682373, "step": 478} {"train_info/time_between_train_steps": 0.003903627395629883, "step": 478} {"info/global_step": 479, "train_info/time_within_train_step": 2.5533156394958496, "step": 479} {"train_info/time_between_train_steps": 0.0039327144622802734, "step": 479} {"info/global_step": 480, "train_info/time_within_train_step": 2.5236639976501465, "step": 480} {"train_info/time_between_train_steps": 0.0038559436798095703, "step": 480} {"info/global_step": 481, "train_info/time_within_train_step": 2.5245556831359863, "step": 481} {"train_info/time_between_train_steps": 0.0038537979125976562, "step": 481} {"info/global_step": 482, "train_info/time_within_train_step": 2.5244219303131104, "step": 482} {"train_info/time_between_train_steps": 0.0037822723388671875, "step": 482} {"info/global_step": 483, "train_info/time_within_train_step": 2.5240840911865234, "step": 483} {"train_info/time_between_train_steps": 0.003842592239379883, "step": 483} {"info/global_step": 484, "train_info/time_within_train_step": 2.5247550010681152, "step": 484} {"train_info/time_between_train_steps": 0.0038433074951171875, "step": 484} {"info/global_step": 485, "train_info/time_within_train_step": 2.5246307849884033, "step": 485} {"train_info/time_between_train_steps": 0.003849029541015625, "step": 485} {"info/global_step": 486, "train_info/time_within_train_step": 2.5233311653137207, "step": 486} {"train_info/time_between_train_steps": 0.0037550926208496094, "step": 486} {"info/global_step": 487, "train_info/time_within_train_step": 2.5234546661376953, "step": 487} {"train_info/time_between_train_steps": 0.0038444995880126953, "step": 487} {"info/global_step": 488, "train_info/time_within_train_step": 2.523893356323242, "step": 488} {"train_info/time_between_train_steps": 0.0037848949432373047, "step": 488} {"info/global_step": 489, "train_info/time_within_train_step": 2.5232231616973877, "step": 489} {"train_info/time_between_train_steps": 0.003769397735595703, "step": 489} {"info/global_step": 490, "train_info/time_within_train_step": 2.523625135421753, "step": 490} {"train_info/time_between_train_steps": 0.0037920475006103516, "step": 490} {"info/global_step": 491, "train_info/time_within_train_step": 2.5236566066741943, "step": 491} {"train_info/time_between_train_steps": 0.0037882328033447266, "step": 491} {"info/global_step": 492, "train_info/time_within_train_step": 2.5238430500030518, "step": 492} {"train_info/time_between_train_steps": 0.0038166046142578125, "step": 492} {"info/global_step": 493, "train_info/time_within_train_step": 2.524174928665161, "step": 493} {"train_info/time_between_train_steps": 0.0037870407104492188, "step": 493} {"info/global_step": 494, "train_info/time_within_train_step": 2.5239789485931396, "step": 494} {"train_info/time_between_train_steps": 0.003785848617553711, "step": 494} {"info/global_step": 495, "train_info/time_within_train_step": 2.9027528762817383, "step": 495} {"train_info/time_between_train_steps": 0.0034456253051757812, "step": 495} {"info/global_step": 496, "train_info/time_within_train_step": 2.52811861038208, "step": 496} {"train_info/time_between_train_steps": 0.0034453868865966797, "step": 496} {"info/global_step": 497, "train_info/time_within_train_step": 2.5224804878234863, "step": 497} {"train_info/time_between_train_steps": 0.003428936004638672, "step": 497} {"info/global_step": 498, "train_info/time_within_train_step": 2.523005485534668, "step": 498} {"train_info/time_between_train_steps": 0.003454923629760742, "step": 498} {"info/global_step": 499, "train_info/time_within_train_step": 2.5219967365264893, "step": 499} {"train_info/time_between_train_steps": 0.003433704376220703, "step": 499} {"info/global_step": 500, "train_info/time_within_train_step": 2.975844383239746, "step": 500} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746324316, "_runtime": 1364}, "step": 500} {"logs": {"train/loss": 5.3743, "train/learning_rate": 0.0005555555555555556, "train/epoch": 0.17, "_timestamp": 1746324316, "_runtime": 1364}, "step": 500} {"train_info/time_between_train_steps": 13.403280973434448, "step": 500} {"info/global_step": 501, "train_info/time_within_train_step": 2.3313546180725098, "step": 501} {"train_info/time_between_train_steps": 0.003486156463623047, "step": 501} {"info/global_step": 502, "train_info/time_within_train_step": 2.3330931663513184, "step": 502} {"train_info/time_between_train_steps": 0.003570556640625, "step": 502} {"info/global_step": 503, "train_info/time_within_train_step": 2.5114622116088867, "step": 503} {"train_info/time_between_train_steps": 0.003454923629760742, "step": 503} {"info/global_step": 504, "train_info/time_within_train_step": 2.52030348777771, "step": 504} {"train_info/time_between_train_steps": 0.0034995079040527344, "step": 504} {"info/global_step": 505, "train_info/time_within_train_step": 2.519641399383545, "step": 505} {"train_info/time_between_train_steps": 0.0034308433532714844, "step": 505} {"info/global_step": 506, "train_info/time_within_train_step": 2.5212180614471436, "step": 506} {"train_info/time_between_train_steps": 0.003432750701904297, "step": 506} {"info/global_step": 507, "train_info/time_within_train_step": 2.5218522548675537, "step": 507} {"train_info/time_between_train_steps": 0.0034279823303222656, "step": 507} {"info/global_step": 508, "train_info/time_within_train_step": 2.5208098888397217, "step": 508} {"train_info/time_between_train_steps": 0.0034308433532714844, "step": 508} {"info/global_step": 509, "train_info/time_within_train_step": 2.522218704223633, "step": 509} {"train_info/time_between_train_steps": 0.003468751907348633, "step": 509} {"info/global_step": 510, "train_info/time_within_train_step": 2.5231168270111084, "step": 510} {"train_info/time_between_train_steps": 0.0034787654876708984, "step": 510} {"info/global_step": 511, "train_info/time_within_train_step": 2.5213470458984375, "step": 511} {"train_info/time_between_train_steps": 0.0034868717193603516, "step": 511} {"info/global_step": 512, "train_info/time_within_train_step": 2.521531820297241, "step": 512} {"train_info/time_between_train_steps": 0.0035037994384765625, "step": 512} {"info/global_step": 513, "train_info/time_within_train_step": 2.5232791900634766, "step": 513} {"train_info/time_between_train_steps": 0.003508329391479492, "step": 513} {"info/global_step": 514, "train_info/time_within_train_step": 2.521775007247925, "step": 514} {"train_info/time_between_train_steps": 0.0034770965576171875, "step": 514} {"info/global_step": 515, "train_info/time_within_train_step": 2.522627115249634, "step": 515} {"train_info/time_between_train_steps": 0.003670930862426758, "step": 515} {"info/global_step": 516, "train_info/time_within_train_step": 2.5267701148986816, "step": 516} {"train_info/time_between_train_steps": 0.003594636917114258, "step": 516} {"info/global_step": 517, "train_info/time_within_train_step": 2.522854804992676, "step": 517} {"train_info/time_between_train_steps": 0.0038928985595703125, "step": 517} {"info/global_step": 518, "train_info/time_within_train_step": 2.523772716522217, "step": 518} {"train_info/time_between_train_steps": 0.0037992000579833984, "step": 518} {"info/global_step": 519, "train_info/time_within_train_step": 2.5240724086761475, "step": 519} {"train_info/time_between_train_steps": 0.003829479217529297, "step": 519} {"info/global_step": 520, "train_info/time_within_train_step": 2.5242204666137695, "step": 520} {"train_info/time_between_train_steps": 0.0037734508514404297, "step": 520} {"info/global_step": 521, "train_info/time_within_train_step": 2.5243892669677734, "step": 521} {"train_info/time_between_train_steps": 0.0038356781005859375, "step": 521} {"info/global_step": 522, "train_info/time_within_train_step": 2.5244529247283936, "step": 522} {"train_info/time_between_train_steps": 0.0038101673126220703, "step": 522} {"info/global_step": 523, "train_info/time_within_train_step": 2.5245156288146973, "step": 523} {"train_info/time_between_train_steps": 0.0037689208984375, "step": 523} {"info/global_step": 524, "train_info/time_within_train_step": 2.5245163440704346, "step": 524} {"train_info/time_between_train_steps": 0.0037496089935302734, "step": 524} {"info/global_step": 525, "train_info/time_within_train_step": 2.5252013206481934, "step": 525} {"train_info/time_between_train_steps": 0.0038340091705322266, "step": 525} {"info/global_step": 526, "train_info/time_within_train_step": 2.5243616104125977, "step": 526} {"train_info/time_between_train_steps": 0.0038144588470458984, "step": 526} {"info/global_step": 527, "train_info/time_within_train_step": 2.5250566005706787, "step": 527} {"train_info/time_between_train_steps": 0.003785371780395508, "step": 527} {"info/global_step": 528, "train_info/time_within_train_step": 2.5244178771972656, "step": 528} {"train_info/time_between_train_steps": 0.0037031173706054688, "step": 528} {"info/global_step": 529, "train_info/time_within_train_step": 2.5242106914520264, "step": 529} {"train_info/time_between_train_steps": 0.0037636756896972656, "step": 529} {"info/global_step": 530, "train_info/time_within_train_step": 2.5240769386291504, "step": 530} {"train_info/time_between_train_steps": 0.003752470016479492, "step": 530} {"info/global_step": 531, "train_info/time_within_train_step": 2.5241312980651855, "step": 531} {"train_info/time_between_train_steps": 0.003780841827392578, "step": 531} {"info/global_step": 532, "train_info/time_within_train_step": 2.5235743522644043, "step": 532} {"train_info/time_between_train_steps": 0.0037288665771484375, "step": 532} {"info/global_step": 533, "train_info/time_within_train_step": 2.5237836837768555, "step": 533} {"train_info/time_between_train_steps": 0.0038099288940429688, "step": 533} {"info/global_step": 534, "train_info/time_within_train_step": 2.5239756107330322, "step": 534} {"train_info/time_between_train_steps": 0.0037636756896972656, "step": 534} {"info/global_step": 535, "train_info/time_within_train_step": 2.523123264312744, "step": 535} {"train_info/time_between_train_steps": 0.003710031509399414, "step": 535} {"info/global_step": 536, "train_info/time_within_train_step": 2.523421049118042, "step": 536} {"train_info/time_between_train_steps": 0.003737926483154297, "step": 536} {"info/global_step": 537, "train_info/time_within_train_step": 2.522994041442871, "step": 537} {"train_info/time_between_train_steps": 0.0037755966186523438, "step": 537} {"info/global_step": 538, "train_info/time_within_train_step": 2.5282883644104004, "step": 538} {"train_info/time_between_train_steps": 0.003713369369506836, "step": 538} {"info/global_step": 539, "train_info/time_within_train_step": 2.523958444595337, "step": 539} {"train_info/time_between_train_steps": 0.003782987594604492, "step": 539} {"info/global_step": 540, "train_info/time_within_train_step": 2.524038791656494, "step": 540} {"train_info/time_between_train_steps": 0.0037925243377685547, "step": 540} {"info/global_step": 541, "train_info/time_within_train_step": 2.524040937423706, "step": 541} {"train_info/time_between_train_steps": 0.0036814212799072266, "step": 541} {"info/global_step": 542, "train_info/time_within_train_step": 2.523993968963623, "step": 542} {"train_info/time_between_train_steps": 0.0037064552307128906, "step": 542} {"info/global_step": 543, "train_info/time_within_train_step": 2.5231707096099854, "step": 543} {"train_info/time_between_train_steps": 0.003747224807739258, "step": 543} {"info/global_step": 544, "train_info/time_within_train_step": 2.523578405380249, "step": 544} {"train_info/time_between_train_steps": 0.0038013458251953125, "step": 544} {"info/global_step": 545, "train_info/time_within_train_step": 2.5237414836883545, "step": 545} {"train_info/time_between_train_steps": 0.0038187503814697266, "step": 545} {"info/global_step": 546, "train_info/time_within_train_step": 2.5237090587615967, "step": 546} {"train_info/time_between_train_steps": 0.003710031509399414, "step": 546} {"info/global_step": 547, "train_info/time_within_train_step": 2.523878335952759, "step": 547} {"train_info/time_between_train_steps": 0.0037698745727539062, "step": 547} {"info/global_step": 548, "train_info/time_within_train_step": 2.8945693969726562, "step": 548} {"train_info/time_between_train_steps": 0.0034637451171875, "step": 548} {"info/global_step": 549, "train_info/time_within_train_step": 2.522585868835449, "step": 549} {"train_info/time_between_train_steps": 0.003518342971801758, "step": 549} {"info/global_step": 550, "train_info/time_within_train_step": 2.5230469703674316, "step": 550} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746324457, "_runtime": 1505}, "step": 550} {"logs": {"train/loss": 5.2917, "train/learning_rate": 0.0005444444444444444, "train/epoch": 0.18, "_timestamp": 1746324457, "_runtime": 1505}, "step": 550} {"train_info/time_between_train_steps": 0.06485295295715332, "step": 550} {"info/global_step": 551, "train_info/time_within_train_step": 2.5227835178375244, "step": 551} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 551} {"info/global_step": 552, "train_info/time_within_train_step": 2.5277183055877686, "step": 552} {"train_info/time_between_train_steps": 0.003448009490966797, "step": 552} {"info/global_step": 553, "train_info/time_within_train_step": 2.5225424766540527, "step": 553} {"train_info/time_between_train_steps": 0.003451824188232422, "step": 553} {"info/global_step": 554, "train_info/time_within_train_step": 2.5225307941436768, "step": 554} {"train_info/time_between_train_steps": 0.003442049026489258, "step": 554} {"info/global_step": 555, "train_info/time_within_train_step": 2.549462080001831, "step": 555} {"train_info/time_between_train_steps": 0.003477811813354492, "step": 555} {"info/global_step": 556, "train_info/time_within_train_step": 2.5222699642181396, "step": 556} {"train_info/time_between_train_steps": 0.0034406185150146484, "step": 556} {"info/global_step": 557, "train_info/time_within_train_step": 2.5221283435821533, "step": 557} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 557} {"info/global_step": 558, "train_info/time_within_train_step": 2.521928071975708, "step": 558} {"train_info/time_between_train_steps": 0.003466367721557617, "step": 558} {"info/global_step": 559, "train_info/time_within_train_step": 2.522578716278076, "step": 559} {"train_info/time_between_train_steps": 0.0034351348876953125, "step": 559} {"info/global_step": 560, "train_info/time_within_train_step": 2.522857904434204, "step": 560} {"train_info/time_between_train_steps": 0.003469228744506836, "step": 560} {"info/global_step": 561, "train_info/time_within_train_step": 2.5227019786834717, "step": 561} {"train_info/time_between_train_steps": 0.0035126209259033203, "step": 561} {"info/global_step": 562, "train_info/time_within_train_step": 2.5225796699523926, "step": 562} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 562} {"info/global_step": 563, "train_info/time_within_train_step": 2.577678918838501, "step": 563} {"train_info/time_between_train_steps": 0.003443479537963867, "step": 563} {"info/global_step": 564, "train_info/time_within_train_step": 2.5222086906433105, "step": 564} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 564} {"info/global_step": 565, "train_info/time_within_train_step": 2.522620439529419, "step": 565} {"train_info/time_between_train_steps": 0.003465890884399414, "step": 565} {"info/global_step": 566, "train_info/time_within_train_step": 2.5219593048095703, "step": 566} {"train_info/time_between_train_steps": 0.003464221954345703, "step": 566} {"info/global_step": 567, "train_info/time_within_train_step": 2.5227956771850586, "step": 567} {"train_info/time_between_train_steps": 0.003459930419921875, "step": 567} {"info/global_step": 568, "train_info/time_within_train_step": 2.522613286972046, "step": 568} {"train_info/time_between_train_steps": 0.0034258365631103516, "step": 568} {"info/global_step": 569, "train_info/time_within_train_step": 2.5229012966156006, "step": 569} {"train_info/time_between_train_steps": 0.003465890884399414, "step": 569} {"info/global_step": 570, "train_info/time_within_train_step": 2.5222575664520264, "step": 570} {"train_info/time_between_train_steps": 0.0034456253051757812, "step": 570} {"info/global_step": 571, "train_info/time_within_train_step": 2.5219807624816895, "step": 571} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 571} {"info/global_step": 572, "train_info/time_within_train_step": 2.522012948989868, "step": 572} {"train_info/time_between_train_steps": 0.00344085693359375, "step": 572} {"info/global_step": 573, "train_info/time_within_train_step": 2.522221565246582, "step": 573} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 573} {"info/global_step": 574, "train_info/time_within_train_step": 2.521700859069824, "step": 574} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 574} {"info/global_step": 575, "train_info/time_within_train_step": 2.5213019847869873, "step": 575} {"train_info/time_between_train_steps": 0.0034470558166503906, "step": 575} {"info/global_step": 576, "train_info/time_within_train_step": 2.522062063217163, "step": 576} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 576} {"info/global_step": 577, "train_info/time_within_train_step": 2.521270513534546, "step": 577} {"train_info/time_between_train_steps": 0.0034673213958740234, "step": 577} {"info/global_step": 578, "train_info/time_within_train_step": 2.5214574337005615, "step": 578} {"train_info/time_between_train_steps": 0.0034487247467041016, "step": 578} {"info/global_step": 579, "train_info/time_within_train_step": 2.5221290588378906, "step": 579} {"train_info/time_between_train_steps": 0.0034570693969726562, "step": 579} {"info/global_step": 580, "train_info/time_within_train_step": 2.5350794792175293, "step": 580} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 580} {"info/global_step": 581, "train_info/time_within_train_step": 2.521446466445923, "step": 581} {"train_info/time_between_train_steps": 0.003094911575317383, "step": 581} {"info/global_step": 582, "train_info/time_within_train_step": 2.5204579830169678, "step": 582} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 582} {"info/global_step": 583, "train_info/time_within_train_step": 2.5211355686187744, "step": 583} {"train_info/time_between_train_steps": 0.003098011016845703, "step": 583} {"info/global_step": 584, "train_info/time_within_train_step": 2.521472930908203, "step": 584} {"train_info/time_between_train_steps": 0.003076791763305664, "step": 584} {"info/global_step": 585, "train_info/time_within_train_step": 2.5208899974823, "step": 585} {"train_info/time_between_train_steps": 0.0030901432037353516, "step": 585} {"info/global_step": 586, "train_info/time_within_train_step": 2.7408204078674316, "step": 586} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 586} {"info/global_step": 587, "train_info/time_within_train_step": 2.5212786197662354, "step": 587} {"train_info/time_between_train_steps": 0.0030944347381591797, "step": 587} {"info/global_step": 588, "train_info/time_within_train_step": 2.521353006362915, "step": 588} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 588} {"info/global_step": 589, "train_info/time_within_train_step": 2.520940065383911, "step": 589} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 589} {"info/global_step": 590, "train_info/time_within_train_step": 2.5213119983673096, "step": 590} {"train_info/time_between_train_steps": 0.0030841827392578125, "step": 590} {"info/global_step": 591, "train_info/time_within_train_step": 2.5204973220825195, "step": 591} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 591} {"info/global_step": 592, "train_info/time_within_train_step": 2.5200035572052, "step": 592} {"train_info/time_between_train_steps": 0.003098726272583008, "step": 592} {"info/global_step": 593, "train_info/time_within_train_step": 2.5211424827575684, "step": 593} {"train_info/time_between_train_steps": 0.003103017807006836, "step": 593} {"info/global_step": 594, "train_info/time_within_train_step": 2.5204226970672607, "step": 594} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 594} {"info/global_step": 595, "train_info/time_within_train_step": 2.52064847946167, "step": 595} {"train_info/time_between_train_steps": 0.003664255142211914, "step": 595} {"info/global_step": 596, "train_info/time_within_train_step": 2.520282030105591, "step": 596} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 596} {"info/global_step": 597, "train_info/time_within_train_step": 2.521310806274414, "step": 597} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 597} {"info/global_step": 598, "train_info/time_within_train_step": 2.521867513656616, "step": 598} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 598} {"info/global_step": 599, "train_info/time_within_train_step": 2.5218851566314697, "step": 599} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 599} {"info/global_step": 600, "train_info/time_within_train_step": 2.5215816497802734, "step": 600} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746324584, "_runtime": 1632}, "step": 600} {"logs": {"train/loss": 5.2139, "train/learning_rate": 0.0005333333333333333, "train/epoch": 0.2, "_timestamp": 1746324584, "_runtime": 1632}, "step": 600} {"train_info/time_between_train_steps": 12.653228998184204, "step": 600} {"info/global_step": 601, "train_info/time_within_train_step": 2.3294525146484375, "step": 601} {"train_info/time_between_train_steps": 0.0031290054321289062, "step": 601} {"info/global_step": 602, "train_info/time_within_train_step": 2.330402374267578, "step": 602} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 602} {"info/global_step": 603, "train_info/time_within_train_step": 2.5066606998443604, "step": 603} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 603} {"info/global_step": 604, "train_info/time_within_train_step": 2.5186500549316406, "step": 604} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 604} {"info/global_step": 605, "train_info/time_within_train_step": 2.518693208694458, "step": 605} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 605} {"info/global_step": 606, "train_info/time_within_train_step": 2.519540548324585, "step": 606} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 606} {"info/global_step": 607, "train_info/time_within_train_step": 2.520509719848633, "step": 607} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 607} {"info/global_step": 608, "train_info/time_within_train_step": 2.5212159156799316, "step": 608} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 608} {"info/global_step": 609, "train_info/time_within_train_step": 2.52087664604187, "step": 609} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 609} {"info/global_step": 610, "train_info/time_within_train_step": 2.521387815475464, "step": 610} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 610} {"info/global_step": 611, "train_info/time_within_train_step": 2.5210304260253906, "step": 611} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 611} {"info/global_step": 612, "train_info/time_within_train_step": 2.5206971168518066, "step": 612} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 612} {"info/global_step": 613, "train_info/time_within_train_step": 2.5207273960113525, "step": 613} {"train_info/time_between_train_steps": 0.003143310546875, "step": 613} {"info/global_step": 614, "train_info/time_within_train_step": 2.5204691886901855, "step": 614} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 614} {"info/global_step": 615, "train_info/time_within_train_step": 2.520939350128174, "step": 615} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 615} {"info/global_step": 616, "train_info/time_within_train_step": 2.54892897605896, "step": 616} {"train_info/time_between_train_steps": 0.003239870071411133, "step": 616} {"info/global_step": 617, "train_info/time_within_train_step": 2.5208542346954346, "step": 617} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 617} {"info/global_step": 618, "train_info/time_within_train_step": 2.5251128673553467, "step": 618} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 618} {"info/global_step": 619, "train_info/time_within_train_step": 2.5208098888397217, "step": 619} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 619} {"info/global_step": 620, "train_info/time_within_train_step": 2.5214903354644775, "step": 620} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 620} {"info/global_step": 621, "train_info/time_within_train_step": 2.52160906791687, "step": 621} {"train_info/time_between_train_steps": 0.003260374069213867, "step": 621} {"info/global_step": 622, "train_info/time_within_train_step": 2.5216073989868164, "step": 622} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 622} {"info/global_step": 623, "train_info/time_within_train_step": 2.522278070449829, "step": 623} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 623} {"info/global_step": 624, "train_info/time_within_train_step": 2.521916151046753, "step": 624} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 624} {"info/global_step": 625, "train_info/time_within_train_step": 2.5219497680664062, "step": 625} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 625} {"info/global_step": 626, "train_info/time_within_train_step": 2.5223283767700195, "step": 626} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 626} {"info/global_step": 627, "train_info/time_within_train_step": 2.5223019123077393, "step": 627} {"train_info/time_between_train_steps": 0.0034096240997314453, "step": 627} {"info/global_step": 628, "train_info/time_within_train_step": 2.5224413871765137, "step": 628} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 628} {"info/global_step": 629, "train_info/time_within_train_step": 2.5225765705108643, "step": 629} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 629} {"info/global_step": 630, "train_info/time_within_train_step": 2.522252082824707, "step": 630} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 630} {"info/global_step": 631, "train_info/time_within_train_step": 2.52134370803833, "step": 631} {"train_info/time_between_train_steps": 0.003402233123779297, "step": 631} {"info/global_step": 632, "train_info/time_within_train_step": 2.5212528705596924, "step": 632} {"train_info/time_between_train_steps": 0.0033614635467529297, "step": 632} {"info/global_step": 633, "train_info/time_within_train_step": 2.522352695465088, "step": 633} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 633} {"info/global_step": 634, "train_info/time_within_train_step": 2.521481513977051, "step": 634} {"train_info/time_between_train_steps": 0.0034389495849609375, "step": 634} {"info/global_step": 635, "train_info/time_within_train_step": 2.522646427154541, "step": 635} {"train_info/time_between_train_steps": 0.003399372100830078, "step": 635} {"info/global_step": 636, "train_info/time_within_train_step": 2.522125244140625, "step": 636} {"train_info/time_between_train_steps": 0.0035142898559570312, "step": 636} {"info/global_step": 637, "train_info/time_within_train_step": 2.522063970565796, "step": 637} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 637} {"info/global_step": 638, "train_info/time_within_train_step": 2.5228025913238525, "step": 638} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 638} {"info/global_step": 639, "train_info/time_within_train_step": 2.5224759578704834, "step": 639} {"train_info/time_between_train_steps": 0.0034034252166748047, "step": 639} {"info/global_step": 640, "train_info/time_within_train_step": 2.523540735244751, "step": 640} {"train_info/time_between_train_steps": 0.0034341812133789062, "step": 640} {"info/global_step": 641, "train_info/time_within_train_step": 2.5233078002929688, "step": 641} {"train_info/time_between_train_steps": 0.003587484359741211, "step": 641} {"info/global_step": 642, "train_info/time_within_train_step": 2.5227246284484863, "step": 642} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 642} {"info/global_step": 643, "train_info/time_within_train_step": 2.5222904682159424, "step": 643} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 643} {"info/global_step": 644, "train_info/time_within_train_step": 2.5220413208007812, "step": 644} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 644} {"info/global_step": 645, "train_info/time_within_train_step": 2.522017240524292, "step": 645} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 645} {"info/global_step": 646, "train_info/time_within_train_step": 2.5214807987213135, "step": 646} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 646} {"info/global_step": 647, "train_info/time_within_train_step": 2.5209038257598877, "step": 647} {"train_info/time_between_train_steps": 0.0033462047576904297, "step": 647} {"info/global_step": 648, "train_info/time_within_train_step": 2.5211257934570312, "step": 648} {"train_info/time_between_train_steps": 0.0034406185150146484, "step": 648} {"info/global_step": 649, "train_info/time_within_train_step": 2.5213916301727295, "step": 649} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 649} {"info/global_step": 650, "train_info/time_within_train_step": 2.819995403289795, "step": 650} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746324724, "_runtime": 1772}, "step": 650} {"logs": {"train/loss": 5.1432, "train/learning_rate": 0.0005222222222222222, "train/epoch": 0.22, "_timestamp": 1746324724, "_runtime": 1772}, "step": 650} {"train_info/time_between_train_steps": 0.024602890014648438, "step": 650} {"info/global_step": 651, "train_info/time_within_train_step": 2.5198898315429688, "step": 651} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 651} {"info/global_step": 652, "train_info/time_within_train_step": 2.520486354827881, "step": 652} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 652} {"info/global_step": 653, "train_info/time_within_train_step": 2.520179271697998, "step": 653} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 653} {"info/global_step": 654, "train_info/time_within_train_step": 2.5217912197113037, "step": 654} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 654} {"info/global_step": 655, "train_info/time_within_train_step": 2.521674871444702, "step": 655} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 655} {"info/global_step": 656, "train_info/time_within_train_step": 2.5211286544799805, "step": 656} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 656} {"info/global_step": 657, "train_info/time_within_train_step": 2.5221970081329346, "step": 657} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 657} {"info/global_step": 658, "train_info/time_within_train_step": 2.5207407474517822, "step": 658} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 658} {"info/global_step": 659, "train_info/time_within_train_step": 2.521404266357422, "step": 659} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 659} {"info/global_step": 660, "train_info/time_within_train_step": 2.522160053253174, "step": 660} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 660} {"info/global_step": 661, "train_info/time_within_train_step": 2.520700454711914, "step": 661} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 661} {"info/global_step": 662, "train_info/time_within_train_step": 2.5208311080932617, "step": 662} {"train_info/time_between_train_steps": 0.003099679946899414, "step": 662} {"info/global_step": 663, "train_info/time_within_train_step": 2.5206892490386963, "step": 663} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 663} {"info/global_step": 664, "train_info/time_within_train_step": 2.521000385284424, "step": 664} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 664} {"info/global_step": 665, "train_info/time_within_train_step": 2.5198750495910645, "step": 665} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 665} {"info/global_step": 666, "train_info/time_within_train_step": 2.52004075050354, "step": 666} {"train_info/time_between_train_steps": 0.0033903121948242188, "step": 666} {"info/global_step": 667, "train_info/time_within_train_step": 2.51993465423584, "step": 667} {"train_info/time_between_train_steps": 0.0030851364135742188, "step": 667} {"info/global_step": 668, "train_info/time_within_train_step": 2.520941972732544, "step": 668} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 668} {"info/global_step": 669, "train_info/time_within_train_step": 2.5196263790130615, "step": 669} {"train_info/time_between_train_steps": 0.0030760765075683594, "step": 669} {"info/global_step": 670, "train_info/time_within_train_step": 2.519979953765869, "step": 670} {"train_info/time_between_train_steps": 0.0033550262451171875, "step": 670} {"info/global_step": 671, "train_info/time_within_train_step": 2.520914316177368, "step": 671} {"train_info/time_between_train_steps": 0.003118753433227539, "step": 671} {"info/global_step": 672, "train_info/time_within_train_step": 2.5211782455444336, "step": 672} {"train_info/time_between_train_steps": 0.0030832290649414062, "step": 672} {"info/global_step": 673, "train_info/time_within_train_step": 2.520153284072876, "step": 673} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 673} {"info/global_step": 674, "train_info/time_within_train_step": 2.520785093307495, "step": 674} {"train_info/time_between_train_steps": 0.003328084945678711, "step": 674} {"info/global_step": 675, "train_info/time_within_train_step": 2.526200532913208, "step": 675} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 675} {"info/global_step": 676, "train_info/time_within_train_step": 2.520750045776367, "step": 676} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 676} {"info/global_step": 677, "train_info/time_within_train_step": 2.5199739933013916, "step": 677} {"train_info/time_between_train_steps": 0.0032639503479003906, "step": 677} {"info/global_step": 678, "train_info/time_within_train_step": 2.5205764770507812, "step": 678} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 678} {"info/global_step": 679, "train_info/time_within_train_step": 2.5203442573547363, "step": 679} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 679} {"info/global_step": 680, "train_info/time_within_train_step": 2.519502878189087, "step": 680} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 680} {"info/global_step": 681, "train_info/time_within_train_step": 2.519566297531128, "step": 681} {"train_info/time_between_train_steps": 0.0033600330352783203, "step": 681} {"info/global_step": 682, "train_info/time_within_train_step": 2.5196304321289062, "step": 682} {"train_info/time_between_train_steps": 0.003092050552368164, "step": 682} {"info/global_step": 683, "train_info/time_within_train_step": 2.518918514251709, "step": 683} {"train_info/time_between_train_steps": 0.003074169158935547, "step": 683} {"info/global_step": 684, "train_info/time_within_train_step": 2.518986940383911, "step": 684} {"train_info/time_between_train_steps": 0.0030853748321533203, "step": 684} {"info/global_step": 685, "train_info/time_within_train_step": 2.519676685333252, "step": 685} {"train_info/time_between_train_steps": 0.0030815601348876953, "step": 685} {"info/global_step": 686, "train_info/time_within_train_step": 2.5193800926208496, "step": 686} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 686} {"info/global_step": 687, "train_info/time_within_train_step": 2.5197479724884033, "step": 687} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 687} {"info/global_step": 688, "train_info/time_within_train_step": 2.5197958946228027, "step": 688} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 688} {"info/global_step": 689, "train_info/time_within_train_step": 2.520174741744995, "step": 689} {"train_info/time_between_train_steps": 0.0030951499938964844, "step": 689} {"info/global_step": 690, "train_info/time_within_train_step": 2.5208346843719482, "step": 690} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 690} {"info/global_step": 691, "train_info/time_within_train_step": 2.521648645401001, "step": 691} {"train_info/time_between_train_steps": 0.003362417221069336, "step": 691} {"info/global_step": 692, "train_info/time_within_train_step": 2.520724296569824, "step": 692} {"train_info/time_between_train_steps": 0.003078937530517578, "step": 692} {"info/global_step": 693, "train_info/time_within_train_step": 2.5219295024871826, "step": 693} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 693} {"info/global_step": 694, "train_info/time_within_train_step": 2.5204250812530518, "step": 694} {"train_info/time_between_train_steps": 0.0032892227172851562, "step": 694} {"info/global_step": 695, "train_info/time_within_train_step": 2.5203933715820312, "step": 695} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 695} {"info/global_step": 696, "train_info/time_within_train_step": 2.5196356773376465, "step": 696} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 696} {"info/global_step": 697, "train_info/time_within_train_step": 2.519928216934204, "step": 697} {"train_info/time_between_train_steps": 0.0030558109283447266, "step": 697} {"info/global_step": 698, "train_info/time_within_train_step": 2.5195088386535645, "step": 698} {"train_info/time_between_train_steps": 0.003331899642944336, "step": 698} {"info/global_step": 699, "train_info/time_within_train_step": 2.5207693576812744, "step": 699} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 699} {"info/global_step": 700, "train_info/time_within_train_step": 2.5200486183166504, "step": 700} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746324851, "_runtime": 1899}, "step": 700} {"logs": {"train/loss": 5.0765, "train/learning_rate": 0.0005111111111111111, "train/epoch": 0.23, "_timestamp": 1746324851, "_runtime": 1899}, "step": 700} {"train_info/time_between_train_steps": 12.128132581710815, "step": 700} {"info/global_step": 701, "train_info/time_within_train_step": 2.337769031524658, "step": 701} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 701} {"info/global_step": 702, "train_info/time_within_train_step": 2.3370370864868164, "step": 702} {"train_info/time_between_train_steps": 0.00311279296875, "step": 702} {"info/global_step": 703, "train_info/time_within_train_step": 2.5102927684783936, "step": 703} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 703} {"info/global_step": 704, "train_info/time_within_train_step": 2.5157763957977295, "step": 704} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 704} {"info/global_step": 705, "train_info/time_within_train_step": 2.517871379852295, "step": 705} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 705} {"info/global_step": 706, "train_info/time_within_train_step": 2.673532009124756, "step": 706} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 706} {"info/global_step": 707, "train_info/time_within_train_step": 2.521697521209717, "step": 707} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 707} {"info/global_step": 708, "train_info/time_within_train_step": 2.522876024246216, "step": 708} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 708} {"info/global_step": 709, "train_info/time_within_train_step": 2.5224852561950684, "step": 709} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 709} {"info/global_step": 710, "train_info/time_within_train_step": 2.522963523864746, "step": 710} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 710} {"info/global_step": 711, "train_info/time_within_train_step": 2.519965648651123, "step": 711} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 711} {"info/global_step": 712, "train_info/time_within_train_step": 2.520127534866333, "step": 712} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 712} {"info/global_step": 713, "train_info/time_within_train_step": 2.519498348236084, "step": 713} {"train_info/time_between_train_steps": 0.0030798912048339844, "step": 713} {"info/global_step": 714, "train_info/time_within_train_step": 2.520510673522949, "step": 714} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 714} {"info/global_step": 715, "train_info/time_within_train_step": 2.5191915035247803, "step": 715} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 715} {"info/global_step": 716, "train_info/time_within_train_step": 2.519347906112671, "step": 716} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 716} {"info/global_step": 717, "train_info/time_within_train_step": 2.519174575805664, "step": 717} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 717} {"info/global_step": 718, "train_info/time_within_train_step": 2.520014762878418, "step": 718} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 718} {"info/global_step": 719, "train_info/time_within_train_step": 2.5202677249908447, "step": 719} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 719} {"info/global_step": 720, "train_info/time_within_train_step": 2.5198068618774414, "step": 720} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 720} {"info/global_step": 721, "train_info/time_within_train_step": 2.521104097366333, "step": 721} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 721} {"info/global_step": 722, "train_info/time_within_train_step": 2.520742177963257, "step": 722} {"train_info/time_between_train_steps": 0.0034253597259521484, "step": 722} {"info/global_step": 723, "train_info/time_within_train_step": 2.521240472793579, "step": 723} {"train_info/time_between_train_steps": 0.0033721923828125, "step": 723} {"info/global_step": 724, "train_info/time_within_train_step": 2.522505283355713, "step": 724} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 724} {"info/global_step": 725, "train_info/time_within_train_step": 2.521416664123535, "step": 725} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 725} {"info/global_step": 726, "train_info/time_within_train_step": 2.5206446647644043, "step": 726} {"train_info/time_between_train_steps": 0.003511190414428711, "step": 726} {"info/global_step": 727, "train_info/time_within_train_step": 2.521573305130005, "step": 727} {"train_info/time_between_train_steps": 0.0035886764526367188, "step": 727} {"info/global_step": 728, "train_info/time_within_train_step": 2.5219199657440186, "step": 728} {"train_info/time_between_train_steps": 0.003663778305053711, "step": 728} {"info/global_step": 729, "train_info/time_within_train_step": 2.5220582485198975, "step": 729} {"train_info/time_between_train_steps": 0.0036001205444335938, "step": 729} {"info/global_step": 730, "train_info/time_within_train_step": 2.521350860595703, "step": 730} {"train_info/time_between_train_steps": 0.0034949779510498047, "step": 730} {"info/global_step": 731, "train_info/time_within_train_step": 2.5218160152435303, "step": 731} {"train_info/time_between_train_steps": 0.0035300254821777344, "step": 731} {"info/global_step": 732, "train_info/time_within_train_step": 2.5213232040405273, "step": 732} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 732} {"info/global_step": 733, "train_info/time_within_train_step": 2.5210189819335938, "step": 733} {"train_info/time_between_train_steps": 0.003658294677734375, "step": 733} {"info/global_step": 734, "train_info/time_within_train_step": 2.5211808681488037, "step": 734} {"train_info/time_between_train_steps": 0.0034885406494140625, "step": 734} {"info/global_step": 735, "train_info/time_within_train_step": 2.5215516090393066, "step": 735} {"train_info/time_between_train_steps": 0.0034456253051757812, "step": 735} {"info/global_step": 736, "train_info/time_within_train_step": 2.5211143493652344, "step": 736} {"train_info/time_between_train_steps": 0.003448009490966797, "step": 736} {"info/global_step": 737, "train_info/time_within_train_step": 2.5208160877227783, "step": 737} {"train_info/time_between_train_steps": 0.0034325122833251953, "step": 737} {"info/global_step": 738, "train_info/time_within_train_step": 2.5201644897460938, "step": 738} {"train_info/time_between_train_steps": 0.0033431053161621094, "step": 738} {"info/global_step": 739, "train_info/time_within_train_step": 2.521408796310425, "step": 739} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 739} {"info/global_step": 740, "train_info/time_within_train_step": 2.5210204124450684, "step": 740} {"train_info/time_between_train_steps": 0.0034072399139404297, "step": 740} {"info/global_step": 741, "train_info/time_within_train_step": 2.520876169204712, "step": 741} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 741} {"info/global_step": 742, "train_info/time_within_train_step": 2.5222091674804688, "step": 742} {"train_info/time_between_train_steps": 0.003589153289794922, "step": 742} {"info/global_step": 743, "train_info/time_within_train_step": 2.522040843963623, "step": 743} {"train_info/time_between_train_steps": 0.0035495758056640625, "step": 743} {"info/global_step": 744, "train_info/time_within_train_step": 2.5222272872924805, "step": 744} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 744} {"info/global_step": 745, "train_info/time_within_train_step": 2.52311372756958, "step": 745} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 745} {"info/global_step": 746, "train_info/time_within_train_step": 2.5219531059265137, "step": 746} {"train_info/time_between_train_steps": 0.0035240650177001953, "step": 746} {"info/global_step": 747, "train_info/time_within_train_step": 2.5231270790100098, "step": 747} {"train_info/time_between_train_steps": 0.003428936004638672, "step": 747} {"info/global_step": 748, "train_info/time_within_train_step": 2.521650791168213, "step": 748} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 748} {"info/global_step": 749, "train_info/time_within_train_step": 2.521786689758301, "step": 749} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 749} {"info/global_step": 750, "train_info/time_within_train_step": 2.9744699001312256, "step": 750} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746324991, "_runtime": 2039}, "step": 750} {"logs": {"train/loss": 4.9792, "train/learning_rate": 0.0005, "train/epoch": 0.25, "_timestamp": 1746324991, "_runtime": 2039}, "step": 750} {"train_info/time_between_train_steps": 0.025217533111572266, "step": 750} {"info/global_step": 751, "train_info/time_within_train_step": 2.543236494064331, "step": 751} {"train_info/time_between_train_steps": 0.003426074981689453, "step": 751} {"info/global_step": 752, "train_info/time_within_train_step": 2.5206427574157715, "step": 752} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 752} {"info/global_step": 753, "train_info/time_within_train_step": 2.5479660034179688, "step": 753} {"train_info/time_between_train_steps": 0.003433704376220703, "step": 753} {"info/global_step": 754, "train_info/time_within_train_step": 2.5212767124176025, "step": 754} {"train_info/time_between_train_steps": 0.003405332565307617, "step": 754} {"info/global_step": 755, "train_info/time_within_train_step": 2.5206336975097656, "step": 755} {"train_info/time_between_train_steps": 0.0034296512603759766, "step": 755} {"info/global_step": 756, "train_info/time_within_train_step": 2.521250009536743, "step": 756} {"train_info/time_between_train_steps": 0.0034961700439453125, "step": 756} {"info/global_step": 757, "train_info/time_within_train_step": 2.5209226608276367, "step": 757} {"train_info/time_between_train_steps": 0.0034139156341552734, "step": 757} {"info/global_step": 758, "train_info/time_within_train_step": 2.5223093032836914, "step": 758} {"train_info/time_between_train_steps": 0.0036437511444091797, "step": 758} {"info/global_step": 759, "train_info/time_within_train_step": 2.521434783935547, "step": 759} {"train_info/time_between_train_steps": 0.003513813018798828, "step": 759} {"info/global_step": 760, "train_info/time_within_train_step": 2.5213100910186768, "step": 760} {"train_info/time_between_train_steps": 0.003433704376220703, "step": 760} {"info/global_step": 761, "train_info/time_within_train_step": 2.741584062576294, "step": 761} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 761} {"info/global_step": 762, "train_info/time_within_train_step": 2.5211281776428223, "step": 762} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 762} {"info/global_step": 763, "train_info/time_within_train_step": 2.520481824874878, "step": 763} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 763} {"info/global_step": 764, "train_info/time_within_train_step": 2.5209014415740967, "step": 764} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 764} {"info/global_step": 765, "train_info/time_within_train_step": 2.520413398742676, "step": 765} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 765} {"info/global_step": 766, "train_info/time_within_train_step": 2.5203685760498047, "step": 766} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 766} {"info/global_step": 767, "train_info/time_within_train_step": 2.5199453830718994, "step": 767} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 767} {"info/global_step": 768, "train_info/time_within_train_step": 2.5204458236694336, "step": 768} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 768} {"info/global_step": 769, "train_info/time_within_train_step": 2.5201046466827393, "step": 769} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 769} {"info/global_step": 770, "train_info/time_within_train_step": 2.519838571548462, "step": 770} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 770} {"info/global_step": 771, "train_info/time_within_train_step": 2.5195202827453613, "step": 771} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 771} {"info/global_step": 772, "train_info/time_within_train_step": 2.519559144973755, "step": 772} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 772} {"info/global_step": 773, "train_info/time_within_train_step": 2.52002215385437, "step": 773} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 773} {"info/global_step": 774, "train_info/time_within_train_step": 2.5200278759002686, "step": 774} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 774} {"info/global_step": 775, "train_info/time_within_train_step": 2.5192248821258545, "step": 775} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 775} {"info/global_step": 776, "train_info/time_within_train_step": 2.5203943252563477, "step": 776} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 776} {"info/global_step": 777, "train_info/time_within_train_step": 2.520123243331909, "step": 777} {"train_info/time_between_train_steps": 0.0032355785369873047, "step": 777} {"info/global_step": 778, "train_info/time_within_train_step": 2.5205371379852295, "step": 778} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 778} {"info/global_step": 779, "train_info/time_within_train_step": 2.5195412635803223, "step": 779} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 779} {"info/global_step": 780, "train_info/time_within_train_step": 2.5207273960113525, "step": 780} {"train_info/time_between_train_steps": 0.0033254623413085938, "step": 780} {"info/global_step": 781, "train_info/time_within_train_step": 2.519894599914551, "step": 781} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 781} {"info/global_step": 782, "train_info/time_within_train_step": 2.519904136657715, "step": 782} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 782} {"info/global_step": 783, "train_info/time_within_train_step": 2.521388530731201, "step": 783} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 783} {"info/global_step": 784, "train_info/time_within_train_step": 2.5198886394500732, "step": 784} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 784} {"info/global_step": 785, "train_info/time_within_train_step": 2.520186424255371, "step": 785} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 785} {"info/global_step": 786, "train_info/time_within_train_step": 2.519806385040283, "step": 786} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 786} {"info/global_step": 787, "train_info/time_within_train_step": 2.519331932067871, "step": 787} {"train_info/time_between_train_steps": 0.003387451171875, "step": 787} {"info/global_step": 788, "train_info/time_within_train_step": 2.5194344520568848, "step": 788} {"train_info/time_between_train_steps": 0.0033278465270996094, "step": 788} {"info/global_step": 789, "train_info/time_within_train_step": 2.5205886363983154, "step": 789} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 789} {"info/global_step": 790, "train_info/time_within_train_step": 2.520921230316162, "step": 790} {"train_info/time_between_train_steps": 0.003499269485473633, "step": 790} {"info/global_step": 791, "train_info/time_within_train_step": 2.521622896194458, "step": 791} {"train_info/time_between_train_steps": 0.003798961639404297, "step": 791} {"info/global_step": 792, "train_info/time_within_train_step": 2.5208401679992676, "step": 792} {"train_info/time_between_train_steps": 0.003757476806640625, "step": 792} {"info/global_step": 793, "train_info/time_within_train_step": 2.5209743976593018, "step": 793} {"train_info/time_between_train_steps": 0.0036118030548095703, "step": 793} {"info/global_step": 794, "train_info/time_within_train_step": 2.5209462642669678, "step": 794} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 794} {"info/global_step": 795, "train_info/time_within_train_step": 2.52130126953125, "step": 795} {"train_info/time_between_train_steps": 0.0034821033477783203, "step": 795} {"info/global_step": 796, "train_info/time_within_train_step": 2.5213725566864014, "step": 796} {"train_info/time_between_train_steps": 0.003589630126953125, "step": 796} {"info/global_step": 797, "train_info/time_within_train_step": 2.521454334259033, "step": 797} {"train_info/time_between_train_steps": 0.0034894943237304688, "step": 797} {"info/global_step": 798, "train_info/time_within_train_step": 2.521998167037964, "step": 798} {"train_info/time_between_train_steps": 0.00362396240234375, "step": 798} {"info/global_step": 799, "train_info/time_within_train_step": 2.5212745666503906, "step": 799} {"train_info/time_between_train_steps": 0.003442525863647461, "step": 799} {"info/global_step": 800, "train_info/time_within_train_step": 2.522099018096924, "step": 800} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746325118, "_runtime": 2166}, "step": 800} {"logs": {"train/loss": 4.9118, "train/learning_rate": 0.0004888888888888889, "train/epoch": 0.27, "_timestamp": 1746325118, "_runtime": 2166}, "step": 800} {"train_info/time_between_train_steps": 21.95136284828186, "step": 800} {"info/global_step": 801, "train_info/time_within_train_step": 2.334594488143921, "step": 801} {"train_info/time_between_train_steps": 0.0033757686614990234, "step": 801} {"info/global_step": 802, "train_info/time_within_train_step": 2.3161370754241943, "step": 802} {"train_info/time_between_train_steps": 0.0034952163696289062, "step": 802} {"info/global_step": 803, "train_info/time_within_train_step": 2.4544384479522705, "step": 803} {"train_info/time_between_train_steps": 0.00337982177734375, "step": 803} {"info/global_step": 804, "train_info/time_within_train_step": 2.5174036026000977, "step": 804} {"train_info/time_between_train_steps": 0.0035953521728515625, "step": 804} {"info/global_step": 805, "train_info/time_within_train_step": 2.5183703899383545, "step": 805} {"train_info/time_between_train_steps": 0.0035033226013183594, "step": 805} {"info/global_step": 806, "train_info/time_within_train_step": 2.5193817615509033, "step": 806} {"train_info/time_between_train_steps": 0.003446340560913086, "step": 806} {"info/global_step": 807, "train_info/time_within_train_step": 2.5207178592681885, "step": 807} {"train_info/time_between_train_steps": 0.003642559051513672, "step": 807} {"info/global_step": 808, "train_info/time_within_train_step": 2.5213842391967773, "step": 808} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 808} {"info/global_step": 809, "train_info/time_within_train_step": 2.5216052532196045, "step": 809} {"train_info/time_between_train_steps": 0.0034668445587158203, "step": 809} {"info/global_step": 810, "train_info/time_within_train_step": 2.5216574668884277, "step": 810} {"train_info/time_between_train_steps": 0.0036516189575195312, "step": 810} {"info/global_step": 811, "train_info/time_within_train_step": 2.521458864212036, "step": 811} {"train_info/time_between_train_steps": 0.0036308765411376953, "step": 811} {"info/global_step": 812, "train_info/time_within_train_step": 2.5222225189208984, "step": 812} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 812} {"info/global_step": 813, "train_info/time_within_train_step": 2.522125244140625, "step": 813} {"train_info/time_between_train_steps": 0.0034933090209960938, "step": 813} {"info/global_step": 814, "train_info/time_within_train_step": 2.5221786499023438, "step": 814} {"train_info/time_between_train_steps": 0.0034928321838378906, "step": 814} {"info/global_step": 815, "train_info/time_within_train_step": 2.5222465991973877, "step": 815} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 815} {"info/global_step": 816, "train_info/time_within_train_step": 2.5225861072540283, "step": 816} {"train_info/time_between_train_steps": 0.0035567283630371094, "step": 816} {"info/global_step": 817, "train_info/time_within_train_step": 2.521775484085083, "step": 817} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 817} {"info/global_step": 818, "train_info/time_within_train_step": 2.521639347076416, "step": 818} {"train_info/time_between_train_steps": 0.00350189208984375, "step": 818} {"info/global_step": 819, "train_info/time_within_train_step": 2.5217854976654053, "step": 819} {"train_info/time_between_train_steps": 0.003571033477783203, "step": 819} {"info/global_step": 820, "train_info/time_within_train_step": 2.522043228149414, "step": 820} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 820} {"info/global_step": 821, "train_info/time_within_train_step": 2.5225062370300293, "step": 821} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 821} {"info/global_step": 822, "train_info/time_within_train_step": 2.6352157592773438, "step": 822} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 822} {"info/global_step": 823, "train_info/time_within_train_step": 2.521648406982422, "step": 823} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 823} {"info/global_step": 824, "train_info/time_within_train_step": 2.520535945892334, "step": 824} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 824} {"info/global_step": 825, "train_info/time_within_train_step": 2.520784616470337, "step": 825} {"train_info/time_between_train_steps": 0.0031185150146484375, "step": 825} {"info/global_step": 826, "train_info/time_within_train_step": 2.520001173019409, "step": 826} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 826} {"info/global_step": 827, "train_info/time_within_train_step": 2.5208210945129395, "step": 827} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 827} {"info/global_step": 828, "train_info/time_within_train_step": 2.5210020542144775, "step": 828} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 828} {"info/global_step": 829, "train_info/time_within_train_step": 2.5212085247039795, "step": 829} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 829} {"info/global_step": 830, "train_info/time_within_train_step": 2.5214004516601562, "step": 830} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 830} {"info/global_step": 831, "train_info/time_within_train_step": 2.5203492641448975, "step": 831} {"train_info/time_between_train_steps": 0.0036547183990478516, "step": 831} {"info/global_step": 832, "train_info/time_within_train_step": 2.521136522293091, "step": 832} {"train_info/time_between_train_steps": 0.003216266632080078, "step": 832} {"info/global_step": 833, "train_info/time_within_train_step": 2.5207953453063965, "step": 833} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 833} {"info/global_step": 834, "train_info/time_within_train_step": 2.520374298095703, "step": 834} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 834} {"info/global_step": 835, "train_info/time_within_train_step": 2.5205893516540527, "step": 835} {"train_info/time_between_train_steps": 0.00312042236328125, "step": 835} {"info/global_step": 836, "train_info/time_within_train_step": 2.519838809967041, "step": 836} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 836} {"info/global_step": 837, "train_info/time_within_train_step": 2.5203733444213867, "step": 837} {"train_info/time_between_train_steps": 0.0030908584594726562, "step": 837} {"info/global_step": 838, "train_info/time_within_train_step": 2.521439790725708, "step": 838} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 838} {"info/global_step": 839, "train_info/time_within_train_step": 2.5203354358673096, "step": 839} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 839} {"info/global_step": 840, "train_info/time_within_train_step": 2.5212390422821045, "step": 840} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 840} {"info/global_step": 841, "train_info/time_within_train_step": 2.521178722381592, "step": 841} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 841} {"info/global_step": 842, "train_info/time_within_train_step": 2.5209784507751465, "step": 842} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 842} {"info/global_step": 843, "train_info/time_within_train_step": 2.520843982696533, "step": 843} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 843} {"info/global_step": 844, "train_info/time_within_train_step": 2.521014451980591, "step": 844} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 844} {"info/global_step": 845, "train_info/time_within_train_step": 2.5211286544799805, "step": 845} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 845} {"info/global_step": 846, "train_info/time_within_train_step": 2.5210812091827393, "step": 846} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 846} {"info/global_step": 847, "train_info/time_within_train_step": 2.5215773582458496, "step": 847} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 847} {"info/global_step": 848, "train_info/time_within_train_step": 2.5216152667999268, "step": 848} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 848} {"info/global_step": 849, "train_info/time_within_train_step": 2.5213232040405273, "step": 849} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 849} {"info/global_step": 850, "train_info/time_within_train_step": 2.5208189487457275, "step": 850} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5070.0, "train_info/memory_max_reserved": 5070.0, "_timestamp": 1746325267, "_runtime": 2315}, "step": 850} {"logs": {"train/loss": 4.8467, "train/learning_rate": 0.0004777777777777777, "train/epoch": 0.28, "_timestamp": 1746325267, "_runtime": 2315}, "step": 850} {"train_info/time_between_train_steps": 0.024692058563232422, "step": 850} {"info/global_step": 851, "train_info/time_within_train_step": 2.5257086753845215, "step": 851} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 851} {"info/global_step": 852, "train_info/time_within_train_step": 2.520880937576294, "step": 852} {"train_info/time_between_train_steps": 0.003368854522705078, "step": 852} {"info/global_step": 853, "train_info/time_within_train_step": 2.520700693130493, "step": 853} {"train_info/time_between_train_steps": 0.00331878662109375, "step": 853} {"info/global_step": 854, "train_info/time_within_train_step": 2.5209622383117676, "step": 854} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 854} {"info/global_step": 855, "train_info/time_within_train_step": 2.520382881164551, "step": 855} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 855} {"info/global_step": 856, "train_info/time_within_train_step": 2.5212509632110596, "step": 856} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 856} {"info/global_step": 857, "train_info/time_within_train_step": 2.5202693939208984, "step": 857} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 857} {"info/global_step": 858, "train_info/time_within_train_step": 2.5255188941955566, "step": 858} {"train_info/time_between_train_steps": 0.0031211376190185547, "step": 858} {"info/global_step": 859, "train_info/time_within_train_step": 2.520399570465088, "step": 859} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 859} {"info/global_step": 860, "train_info/time_within_train_step": 2.520501136779785, "step": 860} {"train_info/time_between_train_steps": 0.003459453582763672, "step": 860} {"info/global_step": 861, "train_info/time_within_train_step": 2.54876708984375, "step": 861} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 861} {"info/global_step": 862, "train_info/time_within_train_step": 2.52178955078125, "step": 862} {"train_info/time_between_train_steps": 0.003462553024291992, "step": 862} {"info/global_step": 863, "train_info/time_within_train_step": 2.52120041847229, "step": 863} {"train_info/time_between_train_steps": 0.0036568641662597656, "step": 863} {"info/global_step": 864, "train_info/time_within_train_step": 2.5215234756469727, "step": 864} {"train_info/time_between_train_steps": 0.0035643577575683594, "step": 864} {"info/global_step": 865, "train_info/time_within_train_step": 2.549617290496826, "step": 865} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 865} {"info/global_step": 866, "train_info/time_within_train_step": 2.5220158100128174, "step": 866} {"train_info/time_between_train_steps": 0.003373384475708008, "step": 866} {"info/global_step": 867, "train_info/time_within_train_step": 2.5213208198547363, "step": 867} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 867} {"info/global_step": 868, "train_info/time_within_train_step": 2.5216615200042725, "step": 868} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 868} {"info/global_step": 869, "train_info/time_within_train_step": 2.522401809692383, "step": 869} {"train_info/time_between_train_steps": 0.003367900848388672, "step": 869} {"info/global_step": 870, "train_info/time_within_train_step": 2.522559404373169, "step": 870} {"train_info/time_between_train_steps": 0.003426790237426758, "step": 870} {"info/global_step": 871, "train_info/time_within_train_step": 2.522686004638672, "step": 871} {"train_info/time_between_train_steps": 0.003419160842895508, "step": 871} {"info/global_step": 872, "train_info/time_within_train_step": 2.521017551422119, "step": 872} {"train_info/time_between_train_steps": 0.003475189208984375, "step": 872} {"info/global_step": 873, "train_info/time_within_train_step": 2.576873540878296, "step": 873} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 873} {"info/global_step": 874, "train_info/time_within_train_step": 2.5212080478668213, "step": 874} {"train_info/time_between_train_steps": 0.0035696029663085938, "step": 874} {"info/global_step": 875, "train_info/time_within_train_step": 2.521868944168091, "step": 875} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 875} {"info/global_step": 876, "train_info/time_within_train_step": 2.521635055541992, "step": 876} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 876} {"info/global_step": 877, "train_info/time_within_train_step": 2.5216567516326904, "step": 877} {"train_info/time_between_train_steps": 0.0034987926483154297, "step": 877} {"info/global_step": 878, "train_info/time_within_train_step": 2.5268735885620117, "step": 878} {"train_info/time_between_train_steps": 0.0035402774810791016, "step": 878} {"info/global_step": 879, "train_info/time_within_train_step": 2.5208959579467773, "step": 879} {"train_info/time_between_train_steps": 0.003480672836303711, "step": 879} {"info/global_step": 880, "train_info/time_within_train_step": 2.521329879760742, "step": 880} {"train_info/time_between_train_steps": 0.003312349319458008, "step": 880} {"info/global_step": 881, "train_info/time_within_train_step": 2.5216639041900635, "step": 881} {"train_info/time_between_train_steps": 0.003495454788208008, "step": 881} {"info/global_step": 882, "train_info/time_within_train_step": 2.5219318866729736, "step": 882} {"train_info/time_between_train_steps": 0.003631114959716797, "step": 882} {"info/global_step": 883, "train_info/time_within_train_step": 2.522848606109619, "step": 883} {"train_info/time_between_train_steps": 0.003473520278930664, "step": 883} {"info/global_step": 884, "train_info/time_within_train_step": 2.5219733715057373, "step": 884} {"train_info/time_between_train_steps": 0.0034682750701904297, "step": 884} {"info/global_step": 885, "train_info/time_within_train_step": 2.522407293319702, "step": 885} {"train_info/time_between_train_steps": 0.003796815872192383, "step": 885} {"info/global_step": 886, "train_info/time_within_train_step": 2.5220160484313965, "step": 886} {"train_info/time_between_train_steps": 0.003846406936645508, "step": 886} {"info/global_step": 887, "train_info/time_within_train_step": 2.523120641708374, "step": 887} {"train_info/time_between_train_steps": 0.0038022994995117188, "step": 887} {"info/global_step": 888, "train_info/time_within_train_step": 2.5227670669555664, "step": 888} {"train_info/time_between_train_steps": 0.003816366195678711, "step": 888} {"info/global_step": 889, "train_info/time_within_train_step": 2.523268938064575, "step": 889} {"train_info/time_between_train_steps": 0.0040090084075927734, "step": 889} {"info/global_step": 890, "train_info/time_within_train_step": 2.524066686630249, "step": 890} {"train_info/time_between_train_steps": 0.003973245620727539, "step": 890} {"info/global_step": 891, "train_info/time_within_train_step": 2.52457857131958, "step": 891} {"train_info/time_between_train_steps": 0.004522800445556641, "step": 891} {"info/global_step": 892, "train_info/time_within_train_step": 2.5249056816101074, "step": 892} {"train_info/time_between_train_steps": 0.004862070083618164, "step": 892} {"train_info/time_between_train_steps": 3.0042684078216553, "step": 892} {"info/global_step": 893, "train_info/time_within_train_step": 2.5204007625579834, "step": 893} {"train_info/time_between_train_steps": 0.0033712387084960938, "step": 893} {"info/global_step": 894, "train_info/time_within_train_step": 2.5202314853668213, "step": 894} {"train_info/time_between_train_steps": 0.003343343734741211, "step": 894} {"info/global_step": 895, "train_info/time_within_train_step": 2.5224249362945557, "step": 895} {"train_info/time_between_train_steps": 0.0035958290100097656, "step": 895} {"info/global_step": 896, "train_info/time_within_train_step": 2.521430730819702, "step": 896} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 896} {"info/global_step": 897, "train_info/time_within_train_step": 2.5202748775482178, "step": 897} {"train_info/time_between_train_steps": 0.0036177635192871094, "step": 897} {"info/global_step": 898, "train_info/time_within_train_step": 2.5214765071868896, "step": 898} {"train_info/time_between_train_steps": 0.0038738250732421875, "step": 898} {"info/global_step": 899, "train_info/time_within_train_step": 2.521899461746216, "step": 899} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 899} {"info/global_step": 900, "train_info/time_within_train_step": 2.5207266807556152, "step": 900} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5092.0, "train_info/memory_max_reserved": 5092.0, "_timestamp": 1746325398, "_runtime": 2446}, "step": 900} {"logs": {"train/loss": 4.837, "train/learning_rate": 0.0004666666666666666, "train/epoch": 1.0, "_timestamp": 1746325398, "_runtime": 2446}, "step": 900} {"train_info/time_between_train_steps": 13.043952703475952, "step": 900} {"info/global_step": 901, "train_info/time_within_train_step": 2.3294894695281982, "step": 901} {"train_info/time_between_train_steps": 0.003628969192504883, "step": 901} {"info/global_step": 902, "train_info/time_within_train_step": 2.3227179050445557, "step": 902} {"train_info/time_between_train_steps": 0.0036268234252929688, "step": 902} {"info/global_step": 903, "train_info/time_within_train_step": 2.504082202911377, "step": 903} {"train_info/time_between_train_steps": 0.0036323070526123047, "step": 903} {"info/global_step": 904, "train_info/time_within_train_step": 2.519988775253296, "step": 904} {"train_info/time_between_train_steps": 0.0036149024963378906, "step": 904} {"info/global_step": 905, "train_info/time_within_train_step": 2.5202975273132324, "step": 905} {"train_info/time_between_train_steps": 0.0036089420318603516, "step": 905} {"info/global_step": 906, "train_info/time_within_train_step": 2.521516799926758, "step": 906} {"train_info/time_between_train_steps": 0.003647327423095703, "step": 906} {"info/global_step": 907, "train_info/time_within_train_step": 2.523155689239502, "step": 907} {"train_info/time_between_train_steps": 0.003655672073364258, "step": 907} {"info/global_step": 908, "train_info/time_within_train_step": 2.5237514972686768, "step": 908} {"train_info/time_between_train_steps": 0.0036139488220214844, "step": 908} {"info/global_step": 909, "train_info/time_within_train_step": 2.5234298706054688, "step": 909} {"train_info/time_between_train_steps": 0.0036363601684570312, "step": 909} {"info/global_step": 910, "train_info/time_within_train_step": 2.5235159397125244, "step": 910} {"train_info/time_between_train_steps": 0.0036745071411132812, "step": 910} {"info/global_step": 911, "train_info/time_within_train_step": 2.523144006729126, "step": 911} {"train_info/time_between_train_steps": 0.0036613941192626953, "step": 911} {"info/global_step": 912, "train_info/time_within_train_step": 2.5229103565216064, "step": 912} {"train_info/time_between_train_steps": 0.003687143325805664, "step": 912} {"info/global_step": 913, "train_info/time_within_train_step": 2.5227270126342773, "step": 913} {"train_info/time_between_train_steps": 0.003543853759765625, "step": 913} {"info/global_step": 914, "train_info/time_within_train_step": 2.5232133865356445, "step": 914} {"train_info/time_between_train_steps": 0.003641366958618164, "step": 914} {"info/global_step": 915, "train_info/time_within_train_step": 2.5238163471221924, "step": 915} {"train_info/time_between_train_steps": 0.003659486770629883, "step": 915} {"info/global_step": 916, "train_info/time_within_train_step": 2.523562431335449, "step": 916} {"train_info/time_between_train_steps": 0.003647327423095703, "step": 916} {"info/global_step": 917, "train_info/time_within_train_step": 2.5235273838043213, "step": 917} {"train_info/time_between_train_steps": 0.0035996437072753906, "step": 917} {"info/global_step": 918, "train_info/time_within_train_step": 2.5226056575775146, "step": 918} {"train_info/time_between_train_steps": 0.0036754608154296875, "step": 918} {"info/global_step": 919, "train_info/time_within_train_step": 2.5230343341827393, "step": 919} {"train_info/time_between_train_steps": 0.0036115646362304688, "step": 919} {"info/global_step": 920, "train_info/time_within_train_step": 2.5252625942230225, "step": 920} {"train_info/time_between_train_steps": 0.003925323486328125, "step": 920} {"info/global_step": 921, "train_info/time_within_train_step": 2.5245416164398193, "step": 921} {"train_info/time_between_train_steps": 0.003704071044921875, "step": 921} {"info/global_step": 922, "train_info/time_within_train_step": 2.523984670639038, "step": 922} {"train_info/time_between_train_steps": 0.003715991973876953, "step": 922} {"info/global_step": 923, "train_info/time_within_train_step": 2.524901866912842, "step": 923} {"train_info/time_between_train_steps": 0.003612995147705078, "step": 923} {"info/global_step": 924, "train_info/time_within_train_step": 2.5248448848724365, "step": 924} {"train_info/time_between_train_steps": 0.003607511520385742, "step": 924} {"info/global_step": 925, "train_info/time_within_train_step": 2.524221658706665, "step": 925} {"train_info/time_between_train_steps": 0.0036475658416748047, "step": 925} {"info/global_step": 926, "train_info/time_within_train_step": 2.525052070617676, "step": 926} {"train_info/time_between_train_steps": 0.0038347244262695312, "step": 926} {"info/global_step": 927, "train_info/time_within_train_step": 2.5247082710266113, "step": 927} {"train_info/time_between_train_steps": 0.003656148910522461, "step": 927} {"info/global_step": 928, "train_info/time_within_train_step": 2.5244553089141846, "step": 928} {"train_info/time_between_train_steps": 0.0036318302154541016, "step": 928} {"info/global_step": 929, "train_info/time_within_train_step": 2.528839111328125, "step": 929} {"train_info/time_between_train_steps": 0.003679037094116211, "step": 929} {"info/global_step": 930, "train_info/time_within_train_step": 2.523617744445801, "step": 930} {"train_info/time_between_train_steps": 0.003628969192504883, "step": 930} {"info/global_step": 931, "train_info/time_within_train_step": 2.5235986709594727, "step": 931} {"train_info/time_between_train_steps": 0.0036818981170654297, "step": 931} {"info/global_step": 932, "train_info/time_within_train_step": 2.524009943008423, "step": 932} {"train_info/time_between_train_steps": 0.003677845001220703, "step": 932} {"info/global_step": 933, "train_info/time_within_train_step": 2.5238845348358154, "step": 933} {"train_info/time_between_train_steps": 0.003698587417602539, "step": 933} {"info/global_step": 934, "train_info/time_within_train_step": 2.523798942565918, "step": 934} {"train_info/time_between_train_steps": 0.0036983489990234375, "step": 934} {"info/global_step": 935, "train_info/time_within_train_step": 2.5234453678131104, "step": 935} {"train_info/time_between_train_steps": 0.0037360191345214844, "step": 935} {"info/global_step": 936, "train_info/time_within_train_step": 2.5232760906219482, "step": 936} {"train_info/time_between_train_steps": 0.0037260055541992188, "step": 936} {"info/global_step": 937, "train_info/time_within_train_step": 2.524505376815796, "step": 937} {"train_info/time_between_train_steps": 0.0037713050842285156, "step": 937} {"info/global_step": 938, "train_info/time_within_train_step": 2.5235841274261475, "step": 938} {"train_info/time_between_train_steps": 0.0036880970001220703, "step": 938} {"info/global_step": 939, "train_info/time_within_train_step": 2.5234599113464355, "step": 939} {"train_info/time_between_train_steps": 0.003676176071166992, "step": 939} {"info/global_step": 940, "train_info/time_within_train_step": 2.523275375366211, "step": 940} {"train_info/time_between_train_steps": 0.0036826133728027344, "step": 940} {"info/global_step": 941, "train_info/time_within_train_step": 2.523489475250244, "step": 941} {"train_info/time_between_train_steps": 0.0036933422088623047, "step": 941} {"info/global_step": 942, "train_info/time_within_train_step": 2.5233824253082275, "step": 942} {"train_info/time_between_train_steps": 0.0036783218383789062, "step": 942} {"info/global_step": 943, "train_info/time_within_train_step": 2.5231196880340576, "step": 943} {"train_info/time_between_train_steps": 0.003675222396850586, "step": 943} {"info/global_step": 944, "train_info/time_within_train_step": 2.52394962310791, "step": 944} {"train_info/time_between_train_steps": 0.003714323043823242, "step": 944} {"info/global_step": 945, "train_info/time_within_train_step": 2.5232319831848145, "step": 945} {"train_info/time_between_train_steps": 0.003704547882080078, "step": 945} {"info/global_step": 946, "train_info/time_within_train_step": 2.523623466491699, "step": 946} {"train_info/time_between_train_steps": 0.0036771297454833984, "step": 946} {"info/global_step": 947, "train_info/time_within_train_step": 2.5229742527008057, "step": 947} {"train_info/time_between_train_steps": 0.0036079883575439453, "step": 947} {"info/global_step": 948, "train_info/time_within_train_step": 2.867797613143921, "step": 948} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 948} {"info/global_step": 949, "train_info/time_within_train_step": 2.5215964317321777, "step": 949} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 949} {"info/global_step": 950, "train_info/time_within_train_step": 2.5223941802978516, "step": 950} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5092.0, "train_info/memory_max_reserved": 5092.0, "_timestamp": 1746325538, "_runtime": 2586}, "step": 950} {"logs": {"train/loss": 4.7469, "train/learning_rate": 0.00045555555555555556, "train/epoch": 1.02, "_timestamp": 1746325538, "_runtime": 2586}, "step": 950} {"train_info/time_between_train_steps": 0.02413344383239746, "step": 950} {"info/global_step": 951, "train_info/time_within_train_step": 2.5222601890563965, "step": 951} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 951} {"info/global_step": 952, "train_info/time_within_train_step": 2.5228688716888428, "step": 952} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 952} {"info/global_step": 953, "train_info/time_within_train_step": 2.5219316482543945, "step": 953} {"train_info/time_between_train_steps": 0.0033991336822509766, "step": 953} {"info/global_step": 954, "train_info/time_within_train_step": 2.522200345993042, "step": 954} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 954} {"info/global_step": 955, "train_info/time_within_train_step": 2.6565909385681152, "step": 955} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 955} {"info/global_step": 956, "train_info/time_within_train_step": 2.5222294330596924, "step": 956} {"train_info/time_between_train_steps": 0.0034470558166503906, "step": 956} {"info/global_step": 957, "train_info/time_within_train_step": 2.523439884185791, "step": 957} {"train_info/time_between_train_steps": 0.003397226333618164, "step": 957} {"info/global_step": 958, "train_info/time_within_train_step": 2.5227277278900146, "step": 958} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 958} {"info/global_step": 959, "train_info/time_within_train_step": 2.522677421569824, "step": 959} {"train_info/time_between_train_steps": 0.0033783912658691406, "step": 959} {"info/global_step": 960, "train_info/time_within_train_step": 2.522594690322876, "step": 960} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 960} {"info/global_step": 961, "train_info/time_within_train_step": 2.522477388381958, "step": 961} {"train_info/time_between_train_steps": 0.003403902053833008, "step": 961} {"info/global_step": 962, "train_info/time_within_train_step": 2.5228464603424072, "step": 962} {"train_info/time_between_train_steps": 0.0033905506134033203, "step": 962} {"info/global_step": 963, "train_info/time_within_train_step": 2.5224459171295166, "step": 963} {"train_info/time_between_train_steps": 0.003406047821044922, "step": 963} {"info/global_step": 964, "train_info/time_within_train_step": 2.5228569507598877, "step": 964} {"train_info/time_between_train_steps": 0.003393411636352539, "step": 964} {"info/global_step": 965, "train_info/time_within_train_step": 2.521987199783325, "step": 965} {"train_info/time_between_train_steps": 0.003412485122680664, "step": 965} {"info/global_step": 966, "train_info/time_within_train_step": 2.522273540496826, "step": 966} {"train_info/time_between_train_steps": 0.0034418106079101562, "step": 966} {"info/global_step": 967, "train_info/time_within_train_step": 2.522395372390747, "step": 967} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 967} {"info/global_step": 968, "train_info/time_within_train_step": 2.5272655487060547, "step": 968} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 968} {"info/global_step": 969, "train_info/time_within_train_step": 2.522475481033325, "step": 969} {"train_info/time_between_train_steps": 0.0033707618713378906, "step": 969} {"info/global_step": 970, "train_info/time_within_train_step": 2.526576519012451, "step": 970} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 970} {"info/global_step": 971, "train_info/time_within_train_step": 2.521970272064209, "step": 971} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 971} {"info/global_step": 972, "train_info/time_within_train_step": 2.5218753814697266, "step": 972} {"train_info/time_between_train_steps": 0.0033750534057617188, "step": 972} {"info/global_step": 973, "train_info/time_within_train_step": 2.5491297245025635, "step": 973} {"train_info/time_between_train_steps": 0.003377676010131836, "step": 973} {"info/global_step": 974, "train_info/time_within_train_step": 2.5219101905822754, "step": 974} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 974} {"info/global_step": 975, "train_info/time_within_train_step": 2.5206525325775146, "step": 975} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 975} {"info/global_step": 976, "train_info/time_within_train_step": 2.525909423828125, "step": 976} {"train_info/time_between_train_steps": 0.003367185592651367, "step": 976} {"info/global_step": 977, "train_info/time_within_train_step": 2.5484492778778076, "step": 977} {"train_info/time_between_train_steps": 0.0033576488494873047, "step": 977} {"info/global_step": 978, "train_info/time_within_train_step": 2.522214889526367, "step": 978} {"train_info/time_between_train_steps": 0.003409862518310547, "step": 978} {"info/global_step": 979, "train_info/time_within_train_step": 2.5221705436706543, "step": 979} {"train_info/time_between_train_steps": 0.003363370895385742, "step": 979} {"info/global_step": 980, "train_info/time_within_train_step": 2.521895170211792, "step": 980} {"train_info/time_between_train_steps": 0.003484010696411133, "step": 980} {"info/global_step": 981, "train_info/time_within_train_step": 2.523141384124756, "step": 981} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 981} {"info/global_step": 982, "train_info/time_within_train_step": 2.5226593017578125, "step": 982} {"train_info/time_between_train_steps": 0.0034079551696777344, "step": 982} {"info/global_step": 983, "train_info/time_within_train_step": 2.5227019786834717, "step": 983} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 983} {"info/global_step": 984, "train_info/time_within_train_step": 2.523195266723633, "step": 984} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 984} {"info/global_step": 985, "train_info/time_within_train_step": 2.5233447551727295, "step": 985} {"train_info/time_between_train_steps": 0.0034089088439941406, "step": 985} {"info/global_step": 986, "train_info/time_within_train_step": 2.5242197513580322, "step": 986} {"train_info/time_between_train_steps": 0.003401517868041992, "step": 986} {"info/global_step": 987, "train_info/time_within_train_step": 2.5236518383026123, "step": 987} {"train_info/time_between_train_steps": 0.0033888816833496094, "step": 987} {"info/global_step": 988, "train_info/time_within_train_step": 2.522191047668457, "step": 988} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 988} {"info/global_step": 989, "train_info/time_within_train_step": 2.5222301483154297, "step": 989} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 989} {"info/global_step": 990, "train_info/time_within_train_step": 2.52189564704895, "step": 990} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 990} {"info/global_step": 991, "train_info/time_within_train_step": 2.5213778018951416, "step": 991} {"train_info/time_between_train_steps": 0.003372669219970703, "step": 991} {"info/global_step": 992, "train_info/time_within_train_step": 2.5215964317321777, "step": 992} {"train_info/time_between_train_steps": 0.0034017562866210938, "step": 992} {"info/global_step": 993, "train_info/time_within_train_step": 2.5220961570739746, "step": 993} {"train_info/time_between_train_steps": 0.0034220218658447266, "step": 993} {"info/global_step": 994, "train_info/time_within_train_step": 2.5210459232330322, "step": 994} {"train_info/time_between_train_steps": 0.003367900848388672, "step": 994} {"info/global_step": 995, "train_info/time_within_train_step": 2.522768259048462, "step": 995} {"train_info/time_between_train_steps": 0.0034918785095214844, "step": 995} {"info/global_step": 996, "train_info/time_within_train_step": 2.522245168685913, "step": 996} {"train_info/time_between_train_steps": 0.0034627914428710938, "step": 996} {"info/global_step": 997, "train_info/time_within_train_step": 2.5229947566986084, "step": 997} {"train_info/time_between_train_steps": 0.0034530162811279297, "step": 997} {"info/global_step": 998, "train_info/time_within_train_step": 2.523062229156494, "step": 998} {"train_info/time_between_train_steps": 0.0034499168395996094, "step": 998} {"info/global_step": 999, "train_info/time_within_train_step": 2.5224969387054443, "step": 999} {"train_info/time_between_train_steps": 0.003439188003540039, "step": 999} {"info/global_step": 1000, "train_info/time_within_train_step": 3.041003465652466, "step": 1000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 5092.0, "train_info/memory_max_reserved": 5092.0, "_timestamp": 1746325666, "_runtime": 2714}, "step": 1000} {"logs": {"train/loss": 4.6924, "train/learning_rate": 0.00044444444444444436, "train/epoch": 1.04, "_timestamp": 1746325666, "_runtime": 2714}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746325672, "_runtime": 2720}, "step": 1000} {"logs": {"eval/loss": 5.0328216552734375, "eval/runtime": 5.46, "eval/samples_per_second": 36.63, "eval/steps_per_second": 1.282, "train/epoch": 1.04, "_timestamp": 1746325672, "_runtime": 2720}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746325672, "_runtime": 2720}, "step": 1000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 5.0328216552734375, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 153.36514631671417, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.46, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.63, "train/epoch": 1.04, "_timestamp": 1746325672, "_runtime": 2720}, "step": 1000} {"train_info/time_between_train_steps": 18.772645235061646, "step": 1000} {"info/global_step": 1001, "train_info/time_within_train_step": 2.3297016620635986, "step": 1001} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 1001} {"info/global_step": 1002, "train_info/time_within_train_step": 2.3374555110931396, "step": 1002} {"train_info/time_between_train_steps": 0.003525257110595703, "step": 1002} {"info/global_step": 1003, "train_info/time_within_train_step": 2.509312391281128, "step": 1003} {"train_info/time_between_train_steps": 0.003461599349975586, "step": 1003} {"info/global_step": 1004, "train_info/time_within_train_step": 2.519646644592285, "step": 1004} {"train_info/time_between_train_steps": 0.003523111343383789, "step": 1004} {"info/global_step": 1005, "train_info/time_within_train_step": 2.5197606086730957, "step": 1005} {"train_info/time_between_train_steps": 0.0034999847412109375, "step": 1005} {"info/global_step": 1006, "train_info/time_within_train_step": 2.5212602615356445, "step": 1006} {"train_info/time_between_train_steps": 0.0036678314208984375, "step": 1006} {"info/global_step": 1007, "train_info/time_within_train_step": 2.5221107006073, "step": 1007} {"train_info/time_between_train_steps": 0.0035979747772216797, "step": 1007} {"info/global_step": 1008, "train_info/time_within_train_step": 2.5220816135406494, "step": 1008} {"train_info/time_between_train_steps": 0.0036177635192871094, "step": 1008} {"info/global_step": 1009, "train_info/time_within_train_step": 2.521883249282837, "step": 1009} {"train_info/time_between_train_steps": 0.003587484359741211, "step": 1009} {"info/global_step": 1010, "train_info/time_within_train_step": 2.522122859954834, "step": 1010} {"train_info/time_between_train_steps": 0.0037527084350585938, "step": 1010} {"info/global_step": 1011, "train_info/time_within_train_step": 2.5224380493164062, "step": 1011} {"train_info/time_between_train_steps": 0.0036559104919433594, "step": 1011} {"info/global_step": 1012, "train_info/time_within_train_step": 2.523387908935547, "step": 1012} {"train_info/time_between_train_steps": 0.0036067962646484375, "step": 1012} {"info/global_step": 1013, "train_info/time_within_train_step": 2.5232350826263428, "step": 1013} {"train_info/time_between_train_steps": 0.003610372543334961, "step": 1013} {"info/global_step": 1014, "train_info/time_within_train_step": 2.5224952697753906, "step": 1014} {"train_info/time_between_train_steps": 0.0036377906799316406, "step": 1014} {"info/global_step": 1015, "train_info/time_within_train_step": 2.523561716079712, "step": 1015} {"train_info/time_between_train_steps": 0.0035817623138427734, "step": 1015} {"info/global_step": 1016, "train_info/time_within_train_step": 2.5275955200195312, "step": 1016} {"train_info/time_between_train_steps": 0.0036101341247558594, "step": 1016} {"info/global_step": 1017, "train_info/time_within_train_step": 2.5503273010253906, "step": 1017} {"train_info/time_between_train_steps": 0.16461586952209473, "step": 1017} {"info/global_step": 1018, "train_info/time_within_train_step": 2.5231611728668213, "step": 1018} {"train_info/time_between_train_steps": 0.0035469532012939453, "step": 1018} {"info/global_step": 1019, "train_info/time_within_train_step": 2.52201509475708, "step": 1019} {"train_info/time_between_train_steps": 0.0034537315368652344, "step": 1019} {"info/global_step": 1020, "train_info/time_within_train_step": 2.5221023559570312, "step": 1020} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 1020} {"info/global_step": 1021, "train_info/time_within_train_step": 2.522566795349121, "step": 1021} {"train_info/time_between_train_steps": 0.003515481948852539, "step": 1021} {"info/global_step": 1022, "train_info/time_within_train_step": 2.5229315757751465, "step": 1022} {"train_info/time_between_train_steps": 0.0035169124603271484, "step": 1022} {"info/global_step": 1023, "train_info/time_within_train_step": 2.522723436355591, "step": 1023} {"train_info/time_between_train_steps": 0.0035021305084228516, "step": 1023} {"info/global_step": 1024, "train_info/time_within_train_step": 2.522808074951172, "step": 1024} {"train_info/time_between_train_steps": 0.003499746322631836, "step": 1024} {"info/global_step": 1025, "train_info/time_within_train_step": 2.5230586528778076, "step": 1025} {"train_info/time_between_train_steps": 0.0034973621368408203, "step": 1025} {"info/global_step": 1026, "train_info/time_within_train_step": 2.5228030681610107, "step": 1026} {"train_info/time_between_train_steps": 0.0035386085510253906, "step": 1026} {"info/global_step": 1027, "train_info/time_within_train_step": 2.5236923694610596, "step": 1027} {"train_info/time_between_train_steps": 0.00350189208984375, "step": 1027} {"info/global_step": 1028, "train_info/time_within_train_step": 2.523979663848877, "step": 1028} {"train_info/time_between_train_steps": 0.003506898880004883, "step": 1028} {"info/global_step": 1029, "train_info/time_within_train_step": 2.5237796306610107, "step": 1029} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 1029} {"info/global_step": 1030, "train_info/time_within_train_step": 2.523308515548706, "step": 1030} {"train_info/time_between_train_steps": 0.0035147666931152344, "step": 1030} {"info/global_step": 1031, "train_info/time_within_train_step": 2.523705005645752, "step": 1031} {"train_info/time_between_train_steps": 0.003513336181640625, "step": 1031} {"info/global_step": 1032, "train_info/time_within_train_step": 2.5235226154327393, "step": 1032} {"train_info/time_between_train_steps": 0.0035490989685058594, "step": 1032} {"info/global_step": 1033, "train_info/time_within_train_step": 2.522646903991699, "step": 1033} {"train_info/time_between_train_steps": 0.0035028457641601562, "step": 1033} {"info/global_step": 1034, "train_info/time_within_train_step": 2.523555278778076, "step": 1034} {"train_info/time_between_train_steps": 0.0035085678100585938, "step": 1034} {"info/global_step": 1035, "train_info/time_within_train_step": 2.5226330757141113, "step": 1035} {"train_info/time_between_train_steps": 0.0035305023193359375, "step": 1035} {"info/global_step": 1036, "train_info/time_within_train_step": 2.5220682621002197, "step": 1036} {"train_info/time_between_train_steps": 0.003551483154296875, "step": 1036} {"info/global_step": 1037, "train_info/time_within_train_step": 2.5224058628082275, "step": 1037} {"train_info/time_between_train_steps": 0.0035042762756347656, "step": 1037} {"info/global_step": 1038, "train_info/time_within_train_step": 2.5233404636383057, "step": 1038} {"train_info/time_between_train_steps": 0.0034983158111572266, "step": 1038} {"info/global_step": 1039, "train_info/time_within_train_step": 2.52280330657959, "step": 1039} {"train_info/time_between_train_steps": 0.0034613609313964844, "step": 1039} {"info/global_step": 1040, "train_info/time_within_train_step": 2.5220582485198975, "step": 1040} {"train_info/time_between_train_steps": 0.0035283565521240234, "step": 1040} {"info/global_step": 1041, "train_info/time_within_train_step": 2.5225205421447754, "step": 1041} {"train_info/time_between_train_steps": 0.0035278797149658203, "step": 1041} {"info/global_step": 1042, "train_info/time_within_train_step": 2.523200273513794, "step": 1042} {"train_info/time_between_train_steps": 0.0035321712493896484, "step": 1042} {"info/global_step": 1043, "train_info/time_within_train_step": 2.522343873977661, "step": 1043} {"train_info/time_between_train_steps": 0.003467082977294922, "step": 1043} {"info/global_step": 1044, "train_info/time_within_train_step": 2.523725748062134, "step": 1044} {"train_info/time_between_train_steps": 0.0036704540252685547, "step": 1044} {"info/global_step": 1045, "train_info/time_within_train_step": 2.5229995250701904, "step": 1045} {"train_info/time_between_train_steps": 0.0036897659301757812, "step": 1045} {"info/global_step": 1046, "train_info/time_within_train_step": 2.5236477851867676, "step": 1046} {"train_info/time_between_train_steps": 0.0034608840942382812, "step": 1046} {"info/global_step": 1047, "train_info/time_within_train_step": 2.523916244506836, "step": 1047} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 1047} {"info/global_step": 1048, "train_info/time_within_train_step": 2.5229432582855225, "step": 1048} {"train_info/time_between_train_steps": 0.003466367721557617, "step": 1048} {"info/global_step": 1049, "train_info/time_within_train_step": 2.5234057903289795, "step": 1049} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 1049} {"info/global_step": 1050, "train_info/time_within_train_step": 2.8096461296081543, "step": 1050} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746325812, "_runtime": 2860}, "step": 1050} {"logs": {"train/loss": 4.6467, "train/learning_rate": 0.0004333333333333333, "train/epoch": 1.05, "_timestamp": 1746325812, "_runtime": 2860}, "step": 1050} {"train_info/time_between_train_steps": 0.024903297424316406, "step": 1050} {"info/global_step": 1051, "train_info/time_within_train_step": 2.522941827774048, "step": 1051} {"train_info/time_between_train_steps": 0.003360271453857422, "step": 1051} {"info/global_step": 1052, "train_info/time_within_train_step": 2.522402763366699, "step": 1052} {"train_info/time_between_train_steps": 0.003355741500854492, "step": 1052} {"info/global_step": 1053, "train_info/time_within_train_step": 2.522686004638672, "step": 1053} {"train_info/time_between_train_steps": 0.0033714771270751953, "step": 1053} {"info/global_step": 1054, "train_info/time_within_train_step": 2.5212175846099854, "step": 1054} {"train_info/time_between_train_steps": 0.003559112548828125, "step": 1054} {"info/global_step": 1055, "train_info/time_within_train_step": 2.521929979324341, "step": 1055} {"train_info/time_between_train_steps": 0.003536224365234375, "step": 1055} {"info/global_step": 1056, "train_info/time_within_train_step": 2.5218377113342285, "step": 1056} {"train_info/time_between_train_steps": 0.003539562225341797, "step": 1056} {"info/global_step": 1057, "train_info/time_within_train_step": 2.521243095397949, "step": 1057} {"train_info/time_between_train_steps": 0.00359344482421875, "step": 1057} {"info/global_step": 1058, "train_info/time_within_train_step": 2.5219132900238037, "step": 1058} {"train_info/time_between_train_steps": 0.003583669662475586, "step": 1058} {"info/global_step": 1059, "train_info/time_within_train_step": 2.5223395824432373, "step": 1059} {"train_info/time_between_train_steps": 0.0033309459686279297, "step": 1059} {"info/global_step": 1060, "train_info/time_within_train_step": 2.521969795227051, "step": 1060} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 1060} {"info/global_step": 1061, "train_info/time_within_train_step": 2.5222630500793457, "step": 1061} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 1061} {"info/global_step": 1062, "train_info/time_within_train_step": 2.5228428840637207, "step": 1062} {"train_info/time_between_train_steps": 0.0035855770111083984, "step": 1062} {"info/global_step": 1063, "train_info/time_within_train_step": 2.52350115776062, "step": 1063} {"train_info/time_between_train_steps": 0.003453493118286133, "step": 1063} {"info/global_step": 1064, "train_info/time_within_train_step": 2.5235352516174316, "step": 1064} {"train_info/time_between_train_steps": 0.00335693359375, "step": 1064} {"info/global_step": 1065, "train_info/time_within_train_step": 2.5223188400268555, "step": 1065} {"train_info/time_between_train_steps": 0.0035467147827148438, "step": 1065} {"info/global_step": 1066, "train_info/time_within_train_step": 2.521944284439087, "step": 1066} {"train_info/time_between_train_steps": 0.0035104751586914062, "step": 1066} {"info/global_step": 1067, "train_info/time_within_train_step": 2.5217831134796143, "step": 1067} {"train_info/time_between_train_steps": 0.0033712387084960938, "step": 1067} {"info/global_step": 1068, "train_info/time_within_train_step": 2.522306203842163, "step": 1068} {"train_info/time_between_train_steps": 0.003476381301879883, "step": 1068} {"info/global_step": 1069, "train_info/time_within_train_step": 2.522142171859741, "step": 1069} {"train_info/time_between_train_steps": 0.003387451171875, "step": 1069} {"info/global_step": 1070, "train_info/time_within_train_step": 2.5216856002807617, "step": 1070} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 1070} {"info/global_step": 1071, "train_info/time_within_train_step": 2.5210940837860107, "step": 1071} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 1071} {"info/global_step": 1072, "train_info/time_within_train_step": 2.521324396133423, "step": 1072} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 1072} {"info/global_step": 1073, "train_info/time_within_train_step": 2.5214502811431885, "step": 1073} {"train_info/time_between_train_steps": 0.0033953189849853516, "step": 1073} {"info/global_step": 1074, "train_info/time_within_train_step": 2.521987199783325, "step": 1074} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 1074} {"info/global_step": 1075, "train_info/time_within_train_step": 2.5216996669769287, "step": 1075} {"train_info/time_between_train_steps": 0.0033693313598632812, "step": 1075} {"info/global_step": 1076, "train_info/time_within_train_step": 2.522127389907837, "step": 1076} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 1076} {"info/global_step": 1077, "train_info/time_within_train_step": 2.5217936038970947, "step": 1077} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 1077} {"info/global_step": 1078, "train_info/time_within_train_step": 2.5217955112457275, "step": 1078} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 1078} {"info/global_step": 1079, "train_info/time_within_train_step": 2.5216946601867676, "step": 1079} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 1079} {"info/global_step": 1080, "train_info/time_within_train_step": 2.6392300128936768, "step": 1080} {"train_info/time_between_train_steps": 0.003431558609008789, "step": 1080} {"info/global_step": 1081, "train_info/time_within_train_step": 2.5217881202697754, "step": 1081} {"train_info/time_between_train_steps": 0.0033826828002929688, "step": 1081} {"info/global_step": 1082, "train_info/time_within_train_step": 2.521289825439453, "step": 1082} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 1082} {"info/global_step": 1083, "train_info/time_within_train_step": 2.521810293197632, "step": 1083} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 1083} {"info/global_step": 1084, "train_info/time_within_train_step": 2.5218117237091064, "step": 1084} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 1084} {"info/global_step": 1085, "train_info/time_within_train_step": 2.5218052864074707, "step": 1085} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 1085} {"info/global_step": 1086, "train_info/time_within_train_step": 2.521336793899536, "step": 1086} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 1086} {"info/global_step": 1087, "train_info/time_within_train_step": 2.522218942642212, "step": 1087} {"train_info/time_between_train_steps": 0.0033609867095947266, "step": 1087} {"info/global_step": 1088, "train_info/time_within_train_step": 2.521761417388916, "step": 1088} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 1088} {"info/global_step": 1089, "train_info/time_within_train_step": 2.521451950073242, "step": 1089} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 1089} {"info/global_step": 1090, "train_info/time_within_train_step": 2.5218300819396973, "step": 1090} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 1090} {"info/global_step": 1091, "train_info/time_within_train_step": 2.5216293334960938, "step": 1091} {"train_info/time_between_train_steps": 0.003428220748901367, "step": 1091} {"info/global_step": 1092, "train_info/time_within_train_step": 2.5225303173065186, "step": 1092} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 1092} {"info/global_step": 1093, "train_info/time_within_train_step": 2.5222418308258057, "step": 1093} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 1093} {"info/global_step": 1094, "train_info/time_within_train_step": 2.5221760272979736, "step": 1094} {"train_info/time_between_train_steps": 0.0034079551696777344, "step": 1094} {"info/global_step": 1095, "train_info/time_within_train_step": 2.52209734916687, "step": 1095} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 1095} {"info/global_step": 1096, "train_info/time_within_train_step": 2.5210609436035156, "step": 1096} {"train_info/time_between_train_steps": 0.0034055709838867188, "step": 1096} {"info/global_step": 1097, "train_info/time_within_train_step": 2.5211031436920166, "step": 1097} {"train_info/time_between_train_steps": 0.003406524658203125, "step": 1097} {"info/global_step": 1098, "train_info/time_within_train_step": 2.5212666988372803, "step": 1098} {"train_info/time_between_train_steps": 0.0034074783325195312, "step": 1098} {"info/global_step": 1099, "train_info/time_within_train_step": 2.5221714973449707, "step": 1099} {"train_info/time_between_train_steps": 0.003411531448364258, "step": 1099} {"info/global_step": 1100, "train_info/time_within_train_step": 2.5209381580352783, "step": 1100} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746325940, "_runtime": 2988}, "step": 1100} {"logs": {"train/loss": 4.6066, "train/learning_rate": 0.0004222222222222222, "train/epoch": 1.07, "_timestamp": 1746325940, "_runtime": 2988}, "step": 1100} {"train_info/time_between_train_steps": 12.559264183044434, "step": 1100} {"info/global_step": 1101, "train_info/time_within_train_step": 2.3333520889282227, "step": 1101} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 1101} {"info/global_step": 1102, "train_info/time_within_train_step": 2.5431621074676514, "step": 1102} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 1102} {"info/global_step": 1103, "train_info/time_within_train_step": 2.496441125869751, "step": 1103} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 1103} {"info/global_step": 1104, "train_info/time_within_train_step": 2.5187137126922607, "step": 1104} {"train_info/time_between_train_steps": 0.0034363269805908203, "step": 1104} {"info/global_step": 1105, "train_info/time_within_train_step": 2.51986026763916, "step": 1105} {"train_info/time_between_train_steps": 0.0033740997314453125, "step": 1105} {"info/global_step": 1106, "train_info/time_within_train_step": 2.520256519317627, "step": 1106} {"train_info/time_between_train_steps": 0.0033903121948242188, "step": 1106} {"info/global_step": 1107, "train_info/time_within_train_step": 2.520371198654175, "step": 1107} {"train_info/time_between_train_steps": 0.0033845901489257812, "step": 1107} {"info/global_step": 1108, "train_info/time_within_train_step": 2.520432233810425, "step": 1108} {"train_info/time_between_train_steps": 0.0034132003784179688, "step": 1108} {"info/global_step": 1109, "train_info/time_within_train_step": 2.5202956199645996, "step": 1109} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 1109} {"info/global_step": 1110, "train_info/time_within_train_step": 2.5203633308410645, "step": 1110} {"train_info/time_between_train_steps": 0.003416776657104492, "step": 1110} {"info/global_step": 1111, "train_info/time_within_train_step": 2.520777702331543, "step": 1111} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 1111} {"info/global_step": 1112, "train_info/time_within_train_step": 2.5211195945739746, "step": 1112} {"train_info/time_between_train_steps": 0.0033957958221435547, "step": 1112} {"info/global_step": 1113, "train_info/time_within_train_step": 2.5214314460754395, "step": 1113} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 1113} {"info/global_step": 1114, "train_info/time_within_train_step": 2.5219929218292236, "step": 1114} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 1114} {"info/global_step": 1115, "train_info/time_within_train_step": 2.520697593688965, "step": 1115} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 1115} {"info/global_step": 1116, "train_info/time_within_train_step": 2.5218186378479004, "step": 1116} {"train_info/time_between_train_steps": 0.003409862518310547, "step": 1116} {"info/global_step": 1117, "train_info/time_within_train_step": 2.521596670150757, "step": 1117} {"train_info/time_between_train_steps": 0.0034332275390625, "step": 1117} {"info/global_step": 1118, "train_info/time_within_train_step": 2.521886110305786, "step": 1118} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 1118} {"info/global_step": 1119, "train_info/time_within_train_step": 2.5221002101898193, "step": 1119} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 1119} {"info/global_step": 1120, "train_info/time_within_train_step": 2.5220463275909424, "step": 1120} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 1120} {"info/global_step": 1121, "train_info/time_within_train_step": 2.5218563079833984, "step": 1121} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 1121} {"info/global_step": 1122, "train_info/time_within_train_step": 2.5218892097473145, "step": 1122} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 1122} {"info/global_step": 1123, "train_info/time_within_train_step": 2.5258629322052, "step": 1123} {"train_info/time_between_train_steps": 0.003407716751098633, "step": 1123} {"info/global_step": 1124, "train_info/time_within_train_step": 2.5214855670928955, "step": 1124} {"train_info/time_between_train_steps": 0.0033752918243408203, "step": 1124} {"info/global_step": 1125, "train_info/time_within_train_step": 2.5215871334075928, "step": 1125} {"train_info/time_between_train_steps": 0.0033884048461914062, "step": 1125} {"info/global_step": 1126, "train_info/time_within_train_step": 2.5495193004608154, "step": 1126} {"train_info/time_between_train_steps": 0.003429412841796875, "step": 1126} {"info/global_step": 1127, "train_info/time_within_train_step": 2.5211353302001953, "step": 1127} {"train_info/time_between_train_steps": 0.0034132003784179688, "step": 1127} {"info/global_step": 1128, "train_info/time_within_train_step": 2.5219945907592773, "step": 1128} {"train_info/time_between_train_steps": 0.003408670425415039, "step": 1128} {"info/global_step": 1129, "train_info/time_within_train_step": 2.522639513015747, "step": 1129} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 1129} {"info/global_step": 1130, "train_info/time_within_train_step": 2.5222933292388916, "step": 1130} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 1130} {"info/global_step": 1131, "train_info/time_within_train_step": 2.521832227706909, "step": 1131} {"train_info/time_between_train_steps": 0.003405332565307617, "step": 1131} {"info/global_step": 1132, "train_info/time_within_train_step": 2.521825075149536, "step": 1132} {"train_info/time_between_train_steps": 0.003421306610107422, "step": 1132} {"info/global_step": 1133, "train_info/time_within_train_step": 2.5216617584228516, "step": 1133} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 1133} {"info/global_step": 1134, "train_info/time_within_train_step": 2.5228981971740723, "step": 1134} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 1134} {"info/global_step": 1135, "train_info/time_within_train_step": 2.5236504077911377, "step": 1135} {"train_info/time_between_train_steps": 0.003729104995727539, "step": 1135} {"info/global_step": 1136, "train_info/time_within_train_step": 2.5232534408569336, "step": 1136} {"train_info/time_between_train_steps": 0.003438234329223633, "step": 1136} {"info/global_step": 1137, "train_info/time_within_train_step": 2.523134469985962, "step": 1137} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 1137} {"info/global_step": 1138, "train_info/time_within_train_step": 2.523080825805664, "step": 1138} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 1138} {"info/global_step": 1139, "train_info/time_within_train_step": 2.522916316986084, "step": 1139} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 1139} {"info/global_step": 1140, "train_info/time_within_train_step": 2.747544288635254, "step": 1140} {"train_info/time_between_train_steps": 0.0034341812133789062, "step": 1140} {"info/global_step": 1141, "train_info/time_within_train_step": 2.5225210189819336, "step": 1141} {"train_info/time_between_train_steps": 0.003407001495361328, "step": 1141} {"info/global_step": 1142, "train_info/time_within_train_step": 2.521686315536499, "step": 1142} {"train_info/time_between_train_steps": 0.12191915512084961, "step": 1142} {"info/global_step": 1143, "train_info/time_within_train_step": 2.522242784500122, "step": 1143} {"train_info/time_between_train_steps": 0.003443479537963867, "step": 1143} {"info/global_step": 1144, "train_info/time_within_train_step": 2.5224292278289795, "step": 1144} {"train_info/time_between_train_steps": 0.003439188003540039, "step": 1144} {"info/global_step": 1145, "train_info/time_within_train_step": 2.5228359699249268, "step": 1145} {"train_info/time_between_train_steps": 0.003419160842895508, "step": 1145} {"info/global_step": 1146, "train_info/time_within_train_step": 2.522258758544922, "step": 1146} {"train_info/time_between_train_steps": 0.003468036651611328, "step": 1146} {"info/global_step": 1147, "train_info/time_within_train_step": 2.522310256958008, "step": 1147} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 1147} {"info/global_step": 1148, "train_info/time_within_train_step": 2.522975206375122, "step": 1148} {"train_info/time_between_train_steps": 0.0037314891815185547, "step": 1148} {"info/global_step": 1149, "train_info/time_within_train_step": 2.5224337577819824, "step": 1149} {"train_info/time_between_train_steps": 0.003981351852416992, "step": 1149} {"info/global_step": 1150, "train_info/time_within_train_step": 2.522897720336914, "step": 1150} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746326080, "_runtime": 3128}, "step": 1150} {"logs": {"train/loss": 4.567, "train/learning_rate": 0.0004111111111111111, "train/epoch": 1.09, "_timestamp": 1746326080, "_runtime": 3128}, "step": 1150} {"train_info/time_between_train_steps": 0.025204181671142578, "step": 1150} {"info/global_step": 1151, "train_info/time_within_train_step": 2.5220794677734375, "step": 1151} {"train_info/time_between_train_steps": 0.003481626510620117, "step": 1151} {"info/global_step": 1152, "train_info/time_within_train_step": 2.522498846054077, "step": 1152} {"train_info/time_between_train_steps": 0.0034542083740234375, "step": 1152} {"info/global_step": 1153, "train_info/time_within_train_step": 2.522846221923828, "step": 1153} {"train_info/time_between_train_steps": 0.0034601688385009766, "step": 1153} {"info/global_step": 1154, "train_info/time_within_train_step": 2.523022174835205, "step": 1154} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 1154} {"info/global_step": 1155, "train_info/time_within_train_step": 2.522214412689209, "step": 1155} {"train_info/time_between_train_steps": 0.003498554229736328, "step": 1155} {"info/global_step": 1156, "train_info/time_within_train_step": 2.5228652954101562, "step": 1156} {"train_info/time_between_train_steps": 0.0034537315368652344, "step": 1156} {"info/global_step": 1157, "train_info/time_within_train_step": 2.5224568843841553, "step": 1157} {"train_info/time_between_train_steps": 0.0037026405334472656, "step": 1157} {"info/global_step": 1158, "train_info/time_within_train_step": 2.5221123695373535, "step": 1158} {"train_info/time_between_train_steps": 0.003388643264770508, "step": 1158} {"info/global_step": 1159, "train_info/time_within_train_step": 2.521979808807373, "step": 1159} {"train_info/time_between_train_steps": 0.0033850669860839844, "step": 1159} {"info/global_step": 1160, "train_info/time_within_train_step": 2.520909309387207, "step": 1160} {"train_info/time_between_train_steps": 0.003371000289916992, "step": 1160} {"info/global_step": 1161, "train_info/time_within_train_step": 2.5217673778533936, "step": 1161} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 1161} {"info/global_step": 1162, "train_info/time_within_train_step": 2.5219972133636475, "step": 1162} {"train_info/time_between_train_steps": 0.003459453582763672, "step": 1162} {"info/global_step": 1163, "train_info/time_within_train_step": 2.5209460258483887, "step": 1163} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 1163} {"info/global_step": 1164, "train_info/time_within_train_step": 2.5218842029571533, "step": 1164} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 1164} {"info/global_step": 1165, "train_info/time_within_train_step": 2.521260976791382, "step": 1165} {"train_info/time_between_train_steps": 0.003391265869140625, "step": 1165} {"info/global_step": 1166, "train_info/time_within_train_step": 2.5220634937286377, "step": 1166} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 1166} {"info/global_step": 1167, "train_info/time_within_train_step": 2.5208241939544678, "step": 1167} {"train_info/time_between_train_steps": 0.0034608840942382812, "step": 1167} {"info/global_step": 1168, "train_info/time_within_train_step": 2.5213613510131836, "step": 1168} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 1168} {"info/global_step": 1169, "train_info/time_within_train_step": 2.521397113800049, "step": 1169} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 1169} {"info/global_step": 1170, "train_info/time_within_train_step": 2.5215179920196533, "step": 1170} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 1170} {"info/global_step": 1171, "train_info/time_within_train_step": 2.5257155895233154, "step": 1171} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 1171} {"info/global_step": 1172, "train_info/time_within_train_step": 2.520888328552246, "step": 1172} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 1172} {"info/global_step": 1173, "train_info/time_within_train_step": 2.52130126953125, "step": 1173} {"train_info/time_between_train_steps": 0.0034172534942626953, "step": 1173} {"info/global_step": 1174, "train_info/time_within_train_step": 2.5210323333740234, "step": 1174} {"train_info/time_between_train_steps": 0.0033833980560302734, "step": 1174} {"info/global_step": 1175, "train_info/time_within_train_step": 2.5213072299957275, "step": 1175} {"train_info/time_between_train_steps": 0.003367900848388672, "step": 1175} {"info/global_step": 1176, "train_info/time_within_train_step": 2.5218262672424316, "step": 1176} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 1176} {"info/global_step": 1177, "train_info/time_within_train_step": 2.5217130184173584, "step": 1177} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 1177} {"info/global_step": 1178, "train_info/time_within_train_step": 2.52290678024292, "step": 1178} {"train_info/time_between_train_steps": 0.0033721923828125, "step": 1178} {"info/global_step": 1179, "train_info/time_within_train_step": 2.521996259689331, "step": 1179} {"train_info/time_between_train_steps": 0.003383636474609375, "step": 1179} {"info/global_step": 1180, "train_info/time_within_train_step": 2.521775722503662, "step": 1180} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 1180} {"info/global_step": 1181, "train_info/time_within_train_step": 2.5230531692504883, "step": 1181} {"train_info/time_between_train_steps": 0.0034093856811523438, "step": 1181} {"info/global_step": 1182, "train_info/time_within_train_step": 2.5217864513397217, "step": 1182} {"train_info/time_between_train_steps": 0.0033864974975585938, "step": 1182} {"info/global_step": 1183, "train_info/time_within_train_step": 2.5218605995178223, "step": 1183} {"train_info/time_between_train_steps": 0.0033724308013916016, "step": 1183} {"info/global_step": 1184, "train_info/time_within_train_step": 2.521393060684204, "step": 1184} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 1184} {"info/global_step": 1185, "train_info/time_within_train_step": 2.5210092067718506, "step": 1185} {"train_info/time_between_train_steps": 0.003368377685546875, "step": 1185} {"info/global_step": 1186, "train_info/time_within_train_step": 2.521719217300415, "step": 1186} {"train_info/time_between_train_steps": 0.003386259078979492, "step": 1186} {"info/global_step": 1187, "train_info/time_within_train_step": 2.5269365310668945, "step": 1187} {"train_info/time_between_train_steps": 0.003451824188232422, "step": 1187} {"info/global_step": 1188, "train_info/time_within_train_step": 2.5210983753204346, "step": 1188} {"train_info/time_between_train_steps": 0.003373384475708008, "step": 1188} {"info/global_step": 1189, "train_info/time_within_train_step": 2.5217654705047607, "step": 1189} {"train_info/time_between_train_steps": 0.003406524658203125, "step": 1189} {"info/global_step": 1190, "train_info/time_within_train_step": 2.521726608276367, "step": 1190} {"train_info/time_between_train_steps": 0.0033719539642333984, "step": 1190} {"info/global_step": 1191, "train_info/time_within_train_step": 2.521744966506958, "step": 1191} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 1191} {"info/global_step": 1192, "train_info/time_within_train_step": 2.5211682319641113, "step": 1192} {"train_info/time_between_train_steps": 0.003432750701904297, "step": 1192} {"info/global_step": 1193, "train_info/time_within_train_step": 2.5215423107147217, "step": 1193} {"train_info/time_between_train_steps": 0.003525257110595703, "step": 1193} {"info/global_step": 1194, "train_info/time_within_train_step": 2.5222365856170654, "step": 1194} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 1194} {"info/global_step": 1195, "train_info/time_within_train_step": 2.521366596221924, "step": 1195} {"train_info/time_between_train_steps": 0.003362894058227539, "step": 1195} {"info/global_step": 1196, "train_info/time_within_train_step": 2.52181077003479, "step": 1196} {"train_info/time_between_train_steps": 0.003578662872314453, "step": 1196} {"info/global_step": 1197, "train_info/time_within_train_step": 2.5493381023406982, "step": 1197} {"train_info/time_between_train_steps": 0.0035333633422851562, "step": 1197} {"info/global_step": 1198, "train_info/time_within_train_step": 2.5207366943359375, "step": 1198} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 1198} {"info/global_step": 1199, "train_info/time_within_train_step": 2.5212900638580322, "step": 1199} {"train_info/time_between_train_steps": 0.0035963058471679688, "step": 1199} {"info/global_step": 1200, "train_info/time_within_train_step": 2.520441770553589, "step": 1200} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746326207, "_runtime": 3255}, "step": 1200} {"logs": {"train/loss": 4.5236, "train/learning_rate": 0.00039999999999999996, "train/epoch": 1.1, "_timestamp": 1746326207, "_runtime": 3255}, "step": 1200} {"train_info/time_between_train_steps": 18.286272048950195, "step": 1200} {"info/global_step": 1201, "train_info/time_within_train_step": 2.331033229827881, "step": 1201} {"train_info/time_between_train_steps": 0.003412485122680664, "step": 1201} {"info/global_step": 1202, "train_info/time_within_train_step": 2.317446231842041, "step": 1202} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 1202} {"info/global_step": 1203, "train_info/time_within_train_step": 2.4788711071014404, "step": 1203} {"train_info/time_between_train_steps": 0.003407001495361328, "step": 1203} {"info/global_step": 1204, "train_info/time_within_train_step": 2.517021417617798, "step": 1204} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 1204} {"info/global_step": 1205, "train_info/time_within_train_step": 2.638723850250244, "step": 1205} {"train_info/time_between_train_steps": 0.003556966781616211, "step": 1205} {"info/global_step": 1206, "train_info/time_within_train_step": 2.520256996154785, "step": 1206} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 1206} {"info/global_step": 1207, "train_info/time_within_train_step": 2.5201101303100586, "step": 1207} {"train_info/time_between_train_steps": 0.0033812522888183594, "step": 1207} {"info/global_step": 1208, "train_info/time_within_train_step": 2.520625114440918, "step": 1208} {"train_info/time_between_train_steps": 0.0033783912658691406, "step": 1208} {"info/global_step": 1209, "train_info/time_within_train_step": 2.5211892127990723, "step": 1209} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 1209} {"info/global_step": 1210, "train_info/time_within_train_step": 2.521653413772583, "step": 1210} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 1210} {"info/global_step": 1211, "train_info/time_within_train_step": 2.5217597484588623, "step": 1211} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 1211} {"info/global_step": 1212, "train_info/time_within_train_step": 2.5231752395629883, "step": 1212} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 1212} {"info/global_step": 1213, "train_info/time_within_train_step": 2.5220658779144287, "step": 1213} {"train_info/time_between_train_steps": 0.00342559814453125, "step": 1213} {"info/global_step": 1214, "train_info/time_within_train_step": 2.5223448276519775, "step": 1214} {"train_info/time_between_train_steps": 0.003442525863647461, "step": 1214} {"info/global_step": 1215, "train_info/time_within_train_step": 2.753965139389038, "step": 1215} {"train_info/time_between_train_steps": 0.003377676010131836, "step": 1215} {"info/global_step": 1216, "train_info/time_within_train_step": 2.522914409637451, "step": 1216} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 1216} {"info/global_step": 1217, "train_info/time_within_train_step": 2.5220227241516113, "step": 1217} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 1217} {"info/global_step": 1218, "train_info/time_within_train_step": 2.5228283405303955, "step": 1218} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 1218} {"info/global_step": 1219, "train_info/time_within_train_step": 2.5223300457000732, "step": 1219} {"train_info/time_between_train_steps": 0.003362417221069336, "step": 1219} {"info/global_step": 1220, "train_info/time_within_train_step": 2.5228500366210938, "step": 1220} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 1220} {"info/global_step": 1221, "train_info/time_within_train_step": 2.521883487701416, "step": 1221} {"train_info/time_between_train_steps": 0.0033888816833496094, "step": 1221} {"info/global_step": 1222, "train_info/time_within_train_step": 2.5218286514282227, "step": 1222} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 1222} {"info/global_step": 1223, "train_info/time_within_train_step": 2.521899461746216, "step": 1223} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 1223} {"info/global_step": 1224, "train_info/time_within_train_step": 2.522099494934082, "step": 1224} {"train_info/time_between_train_steps": 0.003390789031982422, "step": 1224} {"info/global_step": 1225, "train_info/time_within_train_step": 2.5217955112457275, "step": 1225} {"train_info/time_between_train_steps": 0.003378629684448242, "step": 1225} {"info/global_step": 1226, "train_info/time_within_train_step": 2.522646427154541, "step": 1226} {"train_info/time_between_train_steps": 0.0034151077270507812, "step": 1226} {"info/global_step": 1227, "train_info/time_within_train_step": 2.522127151489258, "step": 1227} {"train_info/time_between_train_steps": 0.003633260726928711, "step": 1227} {"info/global_step": 1228, "train_info/time_within_train_step": 2.522104501724243, "step": 1228} {"train_info/time_between_train_steps": 0.0034325122833251953, "step": 1228} {"info/global_step": 1229, "train_info/time_within_train_step": 2.522491455078125, "step": 1229} {"train_info/time_between_train_steps": 0.0033812522888183594, "step": 1229} {"info/global_step": 1230, "train_info/time_within_train_step": 2.5233492851257324, "step": 1230} {"train_info/time_between_train_steps": 0.0034224987030029297, "step": 1230} {"info/global_step": 1231, "train_info/time_within_train_step": 2.522581100463867, "step": 1231} {"train_info/time_between_train_steps": 0.003432750701904297, "step": 1231} {"info/global_step": 1232, "train_info/time_within_train_step": 2.5225424766540527, "step": 1232} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 1232} {"info/global_step": 1233, "train_info/time_within_train_step": 2.5227949619293213, "step": 1233} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 1233} {"info/global_step": 1234, "train_info/time_within_train_step": 2.5225377082824707, "step": 1234} {"train_info/time_between_train_steps": 0.0033919811248779297, "step": 1234} {"info/global_step": 1235, "train_info/time_within_train_step": 2.523200273513794, "step": 1235} {"train_info/time_between_train_steps": 0.0033795833587646484, "step": 1235} {"info/global_step": 1236, "train_info/time_within_train_step": 2.5221242904663086, "step": 1236} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 1236} {"info/global_step": 1237, "train_info/time_within_train_step": 2.521505355834961, "step": 1237} {"train_info/time_between_train_steps": 0.0034003257751464844, "step": 1237} {"info/global_step": 1238, "train_info/time_within_train_step": 2.521444320678711, "step": 1238} {"train_info/time_between_train_steps": 0.0033898353576660156, "step": 1238} {"info/global_step": 1239, "train_info/time_within_train_step": 2.5218474864959717, "step": 1239} {"train_info/time_between_train_steps": 0.0033998489379882812, "step": 1239} {"info/global_step": 1240, "train_info/time_within_train_step": 2.525757074356079, "step": 1240} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 1240} {"info/global_step": 1241, "train_info/time_within_train_step": 2.52177357673645, "step": 1241} {"train_info/time_between_train_steps": 0.0033898353576660156, "step": 1241} {"info/global_step": 1242, "train_info/time_within_train_step": 2.521864175796509, "step": 1242} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 1242} {"info/global_step": 1243, "train_info/time_within_train_step": 2.52178692817688, "step": 1243} {"train_info/time_between_train_steps": 0.0033905506134033203, "step": 1243} {"info/global_step": 1244, "train_info/time_within_train_step": 2.5222716331481934, "step": 1244} {"train_info/time_between_train_steps": 0.0033791065216064453, "step": 1244} {"info/global_step": 1245, "train_info/time_within_train_step": 2.5226142406463623, "step": 1245} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 1245} {"info/global_step": 1246, "train_info/time_within_train_step": 2.5229594707489014, "step": 1246} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 1246} {"info/global_step": 1247, "train_info/time_within_train_step": 2.52252459526062, "step": 1247} {"train_info/time_between_train_steps": 0.0033957958221435547, "step": 1247} {"info/global_step": 1248, "train_info/time_within_train_step": 2.522155284881592, "step": 1248} {"train_info/time_between_train_steps": 0.003393888473510742, "step": 1248} {"info/global_step": 1249, "train_info/time_within_train_step": 2.5230917930603027, "step": 1249} {"train_info/time_between_train_steps": 0.0034017562866210938, "step": 1249} {"info/global_step": 1250, "train_info/time_within_train_step": 3.043947458267212, "step": 1250} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746326353, "_runtime": 3401}, "step": 1250} {"logs": {"train/loss": 4.4979, "train/learning_rate": 0.00038888888888888887, "train/epoch": 1.12, "_timestamp": 1746326353, "_runtime": 3401}, "step": 1250} {"train_info/time_between_train_steps": 0.024283647537231445, "step": 1250} {"info/global_step": 1251, "train_info/time_within_train_step": 2.5225744247436523, "step": 1251} {"train_info/time_between_train_steps": 0.0034339427947998047, "step": 1251} {"info/global_step": 1252, "train_info/time_within_train_step": 2.522348642349243, "step": 1252} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 1252} {"info/global_step": 1253, "train_info/time_within_train_step": 2.7590904235839844, "step": 1253} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 1253} {"info/global_step": 1254, "train_info/time_within_train_step": 2.522047281265259, "step": 1254} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 1254} {"info/global_step": 1255, "train_info/time_within_train_step": 2.5219435691833496, "step": 1255} {"train_info/time_between_train_steps": 0.003459453582763672, "step": 1255} {"info/global_step": 1256, "train_info/time_within_train_step": 2.522456169128418, "step": 1256} {"train_info/time_between_train_steps": 0.0034019947052001953, "step": 1256} {"info/global_step": 1257, "train_info/time_within_train_step": 2.5216033458709717, "step": 1257} {"train_info/time_between_train_steps": 0.003426790237426758, "step": 1257} {"info/global_step": 1258, "train_info/time_within_train_step": 2.5264086723327637, "step": 1258} {"train_info/time_between_train_steps": 0.0033991336822509766, "step": 1258} {"info/global_step": 1259, "train_info/time_within_train_step": 2.521254539489746, "step": 1259} {"train_info/time_between_train_steps": 0.0034232139587402344, "step": 1259} {"info/global_step": 1260, "train_info/time_within_train_step": 2.522247314453125, "step": 1260} {"train_info/time_between_train_steps": 0.00341796875, "step": 1260} {"info/global_step": 1261, "train_info/time_within_train_step": 2.5215604305267334, "step": 1261} {"train_info/time_between_train_steps": 0.003421783447265625, "step": 1261} {"info/global_step": 1262, "train_info/time_within_train_step": 2.521798849105835, "step": 1262} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 1262} {"info/global_step": 1263, "train_info/time_within_train_step": 2.521815538406372, "step": 1263} {"train_info/time_between_train_steps": 0.0034270286560058594, "step": 1263} {"info/global_step": 1264, "train_info/time_within_train_step": 2.520812511444092, "step": 1264} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 1264} {"info/global_step": 1265, "train_info/time_within_train_step": 2.520958423614502, "step": 1265} {"train_info/time_between_train_steps": 0.0034351348876953125, "step": 1265} {"info/global_step": 1266, "train_info/time_within_train_step": 2.5221028327941895, "step": 1266} {"train_info/time_between_train_steps": 0.0033774375915527344, "step": 1266} {"info/global_step": 1267, "train_info/time_within_train_step": 2.521965742111206, "step": 1267} {"train_info/time_between_train_steps": 0.1232142448425293, "step": 1267} {"info/global_step": 1268, "train_info/time_within_train_step": 2.522775173187256, "step": 1268} {"train_info/time_between_train_steps": 0.003443479537963867, "step": 1268} {"info/global_step": 1269, "train_info/time_within_train_step": 2.522897243499756, "step": 1269} {"train_info/time_between_train_steps": 0.0034983158111572266, "step": 1269} {"info/global_step": 1270, "train_info/time_within_train_step": 2.522583246231079, "step": 1270} {"train_info/time_between_train_steps": 0.003470897674560547, "step": 1270} {"info/global_step": 1271, "train_info/time_within_train_step": 2.5223772525787354, "step": 1271} {"train_info/time_between_train_steps": 0.003461599349975586, "step": 1271} {"info/global_step": 1272, "train_info/time_within_train_step": 2.521984338760376, "step": 1272} {"train_info/time_between_train_steps": 0.003377199172973633, "step": 1272} {"info/global_step": 1273, "train_info/time_within_train_step": 2.5212576389312744, "step": 1273} {"train_info/time_between_train_steps": 0.0034384727478027344, "step": 1273} {"info/global_step": 1274, "train_info/time_within_train_step": 2.5214884281158447, "step": 1274} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 1274} {"info/global_step": 1275, "train_info/time_within_train_step": 2.5211658477783203, "step": 1275} {"train_info/time_between_train_steps": 0.003394603729248047, "step": 1275} {"info/global_step": 1276, "train_info/time_within_train_step": 2.5203022956848145, "step": 1276} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 1276} {"info/global_step": 1277, "train_info/time_within_train_step": 2.521395683288574, "step": 1277} {"train_info/time_between_train_steps": 0.0034224987030029297, "step": 1277} {"info/global_step": 1278, "train_info/time_within_train_step": 2.5213658809661865, "step": 1278} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 1278} {"info/global_step": 1279, "train_info/time_within_train_step": 2.5220069885253906, "step": 1279} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 1279} {"info/global_step": 1280, "train_info/time_within_train_step": 2.521235227584839, "step": 1280} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 1280} {"info/global_step": 1281, "train_info/time_within_train_step": 2.52185320854187, "step": 1281} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 1281} {"info/global_step": 1282, "train_info/time_within_train_step": 2.5209059715270996, "step": 1282} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 1282} {"info/global_step": 1283, "train_info/time_within_train_step": 2.5214831829071045, "step": 1283} {"train_info/time_between_train_steps": 0.003419637680053711, "step": 1283} {"info/global_step": 1284, "train_info/time_within_train_step": 2.5213873386383057, "step": 1284} {"train_info/time_between_train_steps": 0.003388643264770508, "step": 1284} {"info/global_step": 1285, "train_info/time_within_train_step": 2.521545171737671, "step": 1285} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 1285} {"info/global_step": 1286, "train_info/time_within_train_step": 2.5214037895202637, "step": 1286} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 1286} {"info/global_step": 1287, "train_info/time_within_train_step": 2.525747060775757, "step": 1287} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 1287} {"info/global_step": 1288, "train_info/time_within_train_step": 2.5210912227630615, "step": 1288} {"train_info/time_between_train_steps": 0.0033655166625976562, "step": 1288} {"info/global_step": 1289, "train_info/time_within_train_step": 2.5210273265838623, "step": 1289} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 1289} {"info/global_step": 1290, "train_info/time_within_train_step": 2.521056890487671, "step": 1290} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 1290} {"info/global_step": 1291, "train_info/time_within_train_step": 2.5215916633605957, "step": 1291} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 1291} {"info/global_step": 1292, "train_info/time_within_train_step": 2.52069091796875, "step": 1292} {"train_info/time_between_train_steps": 0.003378152847290039, "step": 1292} {"info/global_step": 1293, "train_info/time_within_train_step": 2.5213701725006104, "step": 1293} {"train_info/time_between_train_steps": 0.003401517868041992, "step": 1293} {"info/global_step": 1294, "train_info/time_within_train_step": 2.521299123764038, "step": 1294} {"train_info/time_between_train_steps": 0.003426074981689453, "step": 1294} {"info/global_step": 1295, "train_info/time_within_train_step": 2.5218005180358887, "step": 1295} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 1295} {"info/global_step": 1296, "train_info/time_within_train_step": 2.5218303203582764, "step": 1296} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 1296} {"info/global_step": 1297, "train_info/time_within_train_step": 2.521160125732422, "step": 1297} {"train_info/time_between_train_steps": 0.0033588409423828125, "step": 1297} {"info/global_step": 1298, "train_info/time_within_train_step": 2.520277976989746, "step": 1298} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 1298} {"info/global_step": 1299, "train_info/time_within_train_step": 2.521296739578247, "step": 1299} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 1299} {"info/global_step": 1300, "train_info/time_within_train_step": 2.5216825008392334, "step": 1300} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746326481, "_runtime": 3529}, "step": 1300} {"logs": {"train/loss": 4.4661, "train/learning_rate": 0.00037777777777777777, "train/epoch": 1.14, "_timestamp": 1746326481, "_runtime": 3529}, "step": 1300} {"train_info/time_between_train_steps": 19.07573652267456, "step": 1300} {"info/global_step": 1301, "train_info/time_within_train_step": 2.339510917663574, "step": 1301} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 1301} {"info/global_step": 1302, "train_info/time_within_train_step": 2.315824031829834, "step": 1302} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 1302} {"info/global_step": 1303, "train_info/time_within_train_step": 2.4639828205108643, "step": 1303} {"train_info/time_between_train_steps": 0.003403902053833008, "step": 1303} {"info/global_step": 1304, "train_info/time_within_train_step": 2.5185863971710205, "step": 1304} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 1304} {"info/global_step": 1305, "train_info/time_within_train_step": 2.518601894378662, "step": 1305} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 1305} {"info/global_step": 1306, "train_info/time_within_train_step": 2.520296096801758, "step": 1306} {"train_info/time_between_train_steps": 0.0033948421478271484, "step": 1306} {"info/global_step": 1307, "train_info/time_within_train_step": 2.5215470790863037, "step": 1307} {"train_info/time_between_train_steps": 0.0034503936767578125, "step": 1307} {"info/global_step": 1308, "train_info/time_within_train_step": 2.5212719440460205, "step": 1308} {"train_info/time_between_train_steps": 0.0033524036407470703, "step": 1308} {"info/global_step": 1309, "train_info/time_within_train_step": 2.521841049194336, "step": 1309} {"train_info/time_between_train_steps": 0.00335693359375, "step": 1309} {"info/global_step": 1310, "train_info/time_within_train_step": 2.521653413772583, "step": 1310} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 1310} {"info/global_step": 1311, "train_info/time_within_train_step": 2.523472547531128, "step": 1311} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 1311} {"info/global_step": 1312, "train_info/time_within_train_step": 2.5499088764190674, "step": 1312} {"train_info/time_between_train_steps": 0.0033783912658691406, "step": 1312} {"info/global_step": 1313, "train_info/time_within_train_step": 2.5225391387939453, "step": 1313} {"train_info/time_between_train_steps": 0.0039441585540771484, "step": 1313} {"info/global_step": 1314, "train_info/time_within_train_step": 2.5230765342712402, "step": 1314} {"train_info/time_between_train_steps": 0.003362417221069336, "step": 1314} {"info/global_step": 1315, "train_info/time_within_train_step": 2.5224785804748535, "step": 1315} {"train_info/time_between_train_steps": 0.0033636093139648438, "step": 1315} {"info/global_step": 1316, "train_info/time_within_train_step": 2.522465467453003, "step": 1316} {"train_info/time_between_train_steps": 0.003335237503051758, "step": 1316} {"info/global_step": 1317, "train_info/time_within_train_step": 2.522310733795166, "step": 1317} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 1317} {"info/global_step": 1318, "train_info/time_within_train_step": 2.763218402862549, "step": 1318} {"train_info/time_between_train_steps": 0.003366708755493164, "step": 1318} {"info/global_step": 1319, "train_info/time_within_train_step": 2.5224568843841553, "step": 1319} {"train_info/time_between_train_steps": 0.0033431053161621094, "step": 1319} {"info/global_step": 1320, "train_info/time_within_train_step": 2.522789478302002, "step": 1320} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 1320} {"info/global_step": 1321, "train_info/time_within_train_step": 2.523458242416382, "step": 1321} {"train_info/time_between_train_steps": 0.003918647766113281, "step": 1321} {"info/global_step": 1322, "train_info/time_within_train_step": 2.5226731300354004, "step": 1322} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 1322} {"info/global_step": 1323, "train_info/time_within_train_step": 2.5233137607574463, "step": 1323} {"train_info/time_between_train_steps": 0.003365755081176758, "step": 1323} {"info/global_step": 1324, "train_info/time_within_train_step": 2.522120714187622, "step": 1324} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 1324} {"info/global_step": 1325, "train_info/time_within_train_step": 2.5224716663360596, "step": 1325} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 1325} {"info/global_step": 1326, "train_info/time_within_train_step": 2.5222246646881104, "step": 1326} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 1326} {"info/global_step": 1327, "train_info/time_within_train_step": 2.5227649211883545, "step": 1327} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 1327} {"info/global_step": 1328, "train_info/time_within_train_step": 2.523357629776001, "step": 1328} {"train_info/time_between_train_steps": 0.0033631324768066406, "step": 1328} {"info/global_step": 1329, "train_info/time_within_train_step": 2.5227410793304443, "step": 1329} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 1329} {"info/global_step": 1330, "train_info/time_within_train_step": 2.648998737335205, "step": 1330} {"train_info/time_between_train_steps": 0.0033888816833496094, "step": 1330} {"info/global_step": 1331, "train_info/time_within_train_step": 2.5226893424987793, "step": 1331} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 1331} {"info/global_step": 1332, "train_info/time_within_train_step": 2.522881507873535, "step": 1332} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 1332} {"info/global_step": 1333, "train_info/time_within_train_step": 2.522582530975342, "step": 1333} {"train_info/time_between_train_steps": 0.0034008026123046875, "step": 1333} {"info/global_step": 1334, "train_info/time_within_train_step": 2.5232815742492676, "step": 1334} {"train_info/time_between_train_steps": 0.003552675247192383, "step": 1334} {"info/global_step": 1335, "train_info/time_within_train_step": 2.5220248699188232, "step": 1335} {"train_info/time_between_train_steps": 0.0035212039947509766, "step": 1335} {"info/global_step": 1336, "train_info/time_within_train_step": 2.5230281352996826, "step": 1336} {"train_info/time_between_train_steps": 0.003365039825439453, "step": 1336} {"info/global_step": 1337, "train_info/time_within_train_step": 2.5230886936187744, "step": 1337} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 1337} {"info/global_step": 1338, "train_info/time_within_train_step": 2.522244691848755, "step": 1338} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 1338} {"info/global_step": 1339, "train_info/time_within_train_step": 2.522634983062744, "step": 1339} {"train_info/time_between_train_steps": 0.0035152435302734375, "step": 1339} {"info/global_step": 1340, "train_info/time_within_train_step": 2.522066593170166, "step": 1340} {"train_info/time_between_train_steps": 0.0036094188690185547, "step": 1340} {"info/global_step": 1341, "train_info/time_within_train_step": 2.5223047733306885, "step": 1341} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 1341} {"info/global_step": 1342, "train_info/time_within_train_step": 2.52236270904541, "step": 1342} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 1342} {"info/global_step": 1343, "train_info/time_within_train_step": 2.52217960357666, "step": 1343} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 1343} {"info/global_step": 1344, "train_info/time_within_train_step": 2.5214667320251465, "step": 1344} {"train_info/time_between_train_steps": 0.0033833980560302734, "step": 1344} {"info/global_step": 1345, "train_info/time_within_train_step": 2.522066593170166, "step": 1345} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 1345} {"info/global_step": 1346, "train_info/time_within_train_step": 2.521613836288452, "step": 1346} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 1346} {"info/global_step": 1347, "train_info/time_within_train_step": 2.521766424179077, "step": 1347} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 1347} {"info/global_step": 1348, "train_info/time_within_train_step": 2.5502443313598633, "step": 1348} {"train_info/time_between_train_steps": 0.0034761428833007812, "step": 1348} {"info/global_step": 1349, "train_info/time_within_train_step": 2.521563768386841, "step": 1349} {"train_info/time_between_train_steps": 0.003615856170654297, "step": 1349} {"info/global_step": 1350, "train_info/time_within_train_step": 2.5220398902893066, "step": 1350} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746326627, "_runtime": 3675}, "step": 1350} {"logs": {"train/loss": 4.4409, "train/learning_rate": 0.00036666666666666667, "train/epoch": 1.15, "_timestamp": 1746326627, "_runtime": 3675}, "step": 1350} {"train_info/time_between_train_steps": 0.025150537490844727, "step": 1350} {"info/global_step": 1351, "train_info/time_within_train_step": 2.5221283435821533, "step": 1351} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 1351} {"info/global_step": 1352, "train_info/time_within_train_step": 2.5216853618621826, "step": 1352} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 1352} {"info/global_step": 1353, "train_info/time_within_train_step": 2.521676778793335, "step": 1353} {"train_info/time_between_train_steps": 0.0036232471466064453, "step": 1353} {"info/global_step": 1354, "train_info/time_within_train_step": 2.5226731300354004, "step": 1354} {"train_info/time_between_train_steps": 0.003596067428588867, "step": 1354} {"info/global_step": 1355, "train_info/time_within_train_step": 2.521810531616211, "step": 1355} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 1355} {"info/global_step": 1356, "train_info/time_within_train_step": 2.5217413902282715, "step": 1356} {"train_info/time_between_train_steps": 0.003355264663696289, "step": 1356} {"info/global_step": 1357, "train_info/time_within_train_step": 2.522019863128662, "step": 1357} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 1357} {"info/global_step": 1358, "train_info/time_within_train_step": 2.5227811336517334, "step": 1358} {"train_info/time_between_train_steps": 0.0034601688385009766, "step": 1358} {"info/global_step": 1359, "train_info/time_within_train_step": 2.5229952335357666, "step": 1359} {"train_info/time_between_train_steps": 0.0034787654876708984, "step": 1359} {"info/global_step": 1360, "train_info/time_within_train_step": 2.523486614227295, "step": 1360} {"train_info/time_between_train_steps": 0.0035779476165771484, "step": 1360} {"info/global_step": 1361, "train_info/time_within_train_step": 2.5236892700195312, "step": 1361} {"train_info/time_between_train_steps": 0.003477811813354492, "step": 1361} {"info/global_step": 1362, "train_info/time_within_train_step": 2.523390293121338, "step": 1362} {"train_info/time_between_train_steps": 0.0034961700439453125, "step": 1362} {"info/global_step": 1363, "train_info/time_within_train_step": 2.5230836868286133, "step": 1363} {"train_info/time_between_train_steps": 0.003473043441772461, "step": 1363} {"info/global_step": 1364, "train_info/time_within_train_step": 2.5232150554656982, "step": 1364} {"train_info/time_between_train_steps": 0.003448009490966797, "step": 1364} {"info/global_step": 1365, "train_info/time_within_train_step": 2.5234246253967285, "step": 1365} {"train_info/time_between_train_steps": 0.0035085678100585938, "step": 1365} {"info/global_step": 1366, "train_info/time_within_train_step": 2.523057699203491, "step": 1366} {"train_info/time_between_train_steps": 0.003444194793701172, "step": 1366} {"info/global_step": 1367, "train_info/time_within_train_step": 2.5227816104888916, "step": 1367} {"train_info/time_between_train_steps": 0.003458738327026367, "step": 1367} {"info/global_step": 1368, "train_info/time_within_train_step": 2.523405075073242, "step": 1368} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 1368} {"info/global_step": 1369, "train_info/time_within_train_step": 2.52396559715271, "step": 1369} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1369} {"info/global_step": 1370, "train_info/time_within_train_step": 2.5228006839752197, "step": 1370} {"train_info/time_between_train_steps": 0.003448009490966797, "step": 1370} {"info/global_step": 1371, "train_info/time_within_train_step": 2.5228500366210938, "step": 1371} {"train_info/time_between_train_steps": 0.0034720897674560547, "step": 1371} {"info/global_step": 1372, "train_info/time_within_train_step": 2.5220987796783447, "step": 1372} {"train_info/time_between_train_steps": 0.0034797191619873047, "step": 1372} {"info/global_step": 1373, "train_info/time_within_train_step": 2.5221688747406006, "step": 1373} {"train_info/time_between_train_steps": 0.003461122512817383, "step": 1373} {"info/global_step": 1374, "train_info/time_within_train_step": 2.527620315551758, "step": 1374} {"train_info/time_between_train_steps": 0.00347900390625, "step": 1374} {"info/global_step": 1375, "train_info/time_within_train_step": 2.523470640182495, "step": 1375} {"train_info/time_between_train_steps": 0.004026174545288086, "step": 1375} {"info/global_step": 1376, "train_info/time_within_train_step": 2.523453712463379, "step": 1376} {"train_info/time_between_train_steps": 0.0035042762756347656, "step": 1376} {"info/global_step": 1377, "train_info/time_within_train_step": 2.5506224632263184, "step": 1377} {"train_info/time_between_train_steps": 0.0034782886505126953, "step": 1377} {"info/global_step": 1378, "train_info/time_within_train_step": 2.523641347885132, "step": 1378} {"train_info/time_between_train_steps": 0.0034685134887695312, "step": 1378} {"info/global_step": 1379, "train_info/time_within_train_step": 2.52286958694458, "step": 1379} {"train_info/time_between_train_steps": 0.0034880638122558594, "step": 1379} {"info/global_step": 1380, "train_info/time_within_train_step": 2.5230214595794678, "step": 1380} {"train_info/time_between_train_steps": 0.0034728050231933594, "step": 1380} {"info/global_step": 1381, "train_info/time_within_train_step": 2.523190975189209, "step": 1381} {"train_info/time_between_train_steps": 0.003469705581665039, "step": 1381} {"info/global_step": 1382, "train_info/time_within_train_step": 2.522803783416748, "step": 1382} {"train_info/time_between_train_steps": 0.003485441207885742, "step": 1382} {"info/global_step": 1383, "train_info/time_within_train_step": 2.5489234924316406, "step": 1383} {"train_info/time_between_train_steps": 0.003458738327026367, "step": 1383} {"info/global_step": 1384, "train_info/time_within_train_step": 2.521909713745117, "step": 1384} {"train_info/time_between_train_steps": 0.003475666046142578, "step": 1384} {"info/global_step": 1385, "train_info/time_within_train_step": 2.5263876914978027, "step": 1385} {"train_info/time_between_train_steps": 0.003432035446166992, "step": 1385} {"info/global_step": 1386, "train_info/time_within_train_step": 2.521223545074463, "step": 1386} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 1386} {"info/global_step": 1387, "train_info/time_within_train_step": 2.521287679672241, "step": 1387} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 1387} {"info/global_step": 1388, "train_info/time_within_train_step": 2.520442485809326, "step": 1388} {"train_info/time_between_train_steps": 0.0034220218658447266, "step": 1388} {"info/global_step": 1389, "train_info/time_within_train_step": 2.5216314792633057, "step": 1389} {"train_info/time_between_train_steps": 0.0034027099609375, "step": 1389} {"info/global_step": 1390, "train_info/time_within_train_step": 2.5208916664123535, "step": 1390} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 1390} {"info/global_step": 1391, "train_info/time_within_train_step": 2.521883010864258, "step": 1391} {"train_info/time_between_train_steps": 0.003426790237426758, "step": 1391} {"info/global_step": 1392, "train_info/time_within_train_step": 2.5268945693969727, "step": 1392} {"train_info/time_between_train_steps": 0.12947487831115723, "step": 1392} {"info/global_step": 1393, "train_info/time_within_train_step": 2.5215563774108887, "step": 1393} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 1393} {"info/global_step": 1394, "train_info/time_within_train_step": 2.5224711894989014, "step": 1394} {"train_info/time_between_train_steps": 0.0040280818939208984, "step": 1394} {"info/global_step": 1395, "train_info/time_within_train_step": 2.526320219039917, "step": 1395} {"train_info/time_between_train_steps": 0.0033881664276123047, "step": 1395} {"info/global_step": 1396, "train_info/time_within_train_step": 2.522585391998291, "step": 1396} {"train_info/time_between_train_steps": 0.003418445587158203, "step": 1396} {"info/global_step": 1397, "train_info/time_within_train_step": 2.521979808807373, "step": 1397} {"train_info/time_between_train_steps": 0.0034513473510742188, "step": 1397} {"info/global_step": 1398, "train_info/time_within_train_step": 2.52209210395813, "step": 1398} {"train_info/time_between_train_steps": 0.0034351348876953125, "step": 1398} {"info/global_step": 1399, "train_info/time_within_train_step": 2.521787643432617, "step": 1399} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 1399} {"info/global_step": 1400, "train_info/time_within_train_step": 2.5216500759124756, "step": 1400} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746326755, "_runtime": 3803}, "step": 1400} {"logs": {"train/loss": 4.4042, "train/learning_rate": 0.0003555555555555555, "train/epoch": 1.17, "_timestamp": 1746326755, "_runtime": 3803}, "step": 1400} {"train_info/time_between_train_steps": 16.589205503463745, "step": 1400} {"info/global_step": 1401, "train_info/time_within_train_step": 2.589526891708374, "step": 1401} {"train_info/time_between_train_steps": 0.0034742355346679688, "step": 1401} {"info/global_step": 1402, "train_info/time_within_train_step": 2.3185882568359375, "step": 1402} {"train_info/time_between_train_steps": 0.003366708755493164, "step": 1402} {"info/global_step": 1403, "train_info/time_within_train_step": 2.4586129188537598, "step": 1403} {"train_info/time_between_train_steps": 0.0034868717193603516, "step": 1403} {"info/global_step": 1404, "train_info/time_within_train_step": 2.5194272994995117, "step": 1404} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 1404} {"info/global_step": 1405, "train_info/time_within_train_step": 2.5194075107574463, "step": 1405} {"train_info/time_between_train_steps": 0.003533601760864258, "step": 1405} {"info/global_step": 1406, "train_info/time_within_train_step": 2.520419120788574, "step": 1406} {"train_info/time_between_train_steps": 0.003366708755493164, "step": 1406} {"info/global_step": 1407, "train_info/time_within_train_step": 2.5201566219329834, "step": 1407} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 1407} {"info/global_step": 1408, "train_info/time_within_train_step": 2.521946907043457, "step": 1408} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 1408} {"info/global_step": 1409, "train_info/time_within_train_step": 2.520892858505249, "step": 1409} {"train_info/time_between_train_steps": 0.0034101009368896484, "step": 1409} {"info/global_step": 1410, "train_info/time_within_train_step": 2.5220565795898438, "step": 1410} {"train_info/time_between_train_steps": 0.0035047531127929688, "step": 1410} {"info/global_step": 1411, "train_info/time_within_train_step": 2.521360158920288, "step": 1411} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 1411} {"info/global_step": 1412, "train_info/time_within_train_step": 2.5215539932250977, "step": 1412} {"train_info/time_between_train_steps": 0.003345012664794922, "step": 1412} {"info/global_step": 1413, "train_info/time_within_train_step": 2.5214767456054688, "step": 1413} {"train_info/time_between_train_steps": 0.003348827362060547, "step": 1413} {"info/global_step": 1414, "train_info/time_within_train_step": 2.5235753059387207, "step": 1414} {"train_info/time_between_train_steps": 0.0034122467041015625, "step": 1414} {"info/global_step": 1415, "train_info/time_within_train_step": 2.5223772525787354, "step": 1415} {"train_info/time_between_train_steps": 0.0034279823303222656, "step": 1415} {"info/global_step": 1416, "train_info/time_within_train_step": 2.5220096111297607, "step": 1416} {"train_info/time_between_train_steps": 0.0035245418548583984, "step": 1416} {"info/global_step": 1417, "train_info/time_within_train_step": 2.522596597671509, "step": 1417} {"train_info/time_between_train_steps": 0.003630399703979492, "step": 1417} {"info/global_step": 1418, "train_info/time_within_train_step": 2.522651433944702, "step": 1418} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 1418} {"info/global_step": 1419, "train_info/time_within_train_step": 2.522096633911133, "step": 1419} {"train_info/time_between_train_steps": 0.0034046173095703125, "step": 1419} {"info/global_step": 1420, "train_info/time_within_train_step": 2.5231213569641113, "step": 1420} {"train_info/time_between_train_steps": 0.003533601760864258, "step": 1420} {"info/global_step": 1421, "train_info/time_within_train_step": 2.5233278274536133, "step": 1421} {"train_info/time_between_train_steps": 0.003625631332397461, "step": 1421} {"info/global_step": 1422, "train_info/time_within_train_step": 2.5226495265960693, "step": 1422} {"train_info/time_between_train_steps": 0.0035572052001953125, "step": 1422} {"info/global_step": 1423, "train_info/time_within_train_step": 2.5219614505767822, "step": 1423} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 1423} {"info/global_step": 1424, "train_info/time_within_train_step": 2.5221033096313477, "step": 1424} {"train_info/time_between_train_steps": 0.003424406051635742, "step": 1424} {"info/global_step": 1425, "train_info/time_within_train_step": 2.5217678546905518, "step": 1425} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 1425} {"info/global_step": 1426, "train_info/time_within_train_step": 2.522449254989624, "step": 1426} {"train_info/time_between_train_steps": 0.0036275386810302734, "step": 1426} {"info/global_step": 1427, "train_info/time_within_train_step": 2.5222108364105225, "step": 1427} {"train_info/time_between_train_steps": 0.00335693359375, "step": 1427} {"info/global_step": 1428, "train_info/time_within_train_step": 2.5218496322631836, "step": 1428} {"train_info/time_between_train_steps": 0.003362894058227539, "step": 1428} {"info/global_step": 1429, "train_info/time_within_train_step": 2.5217978954315186, "step": 1429} {"train_info/time_between_train_steps": 0.003641843795776367, "step": 1429} {"info/global_step": 1430, "train_info/time_within_train_step": 2.521958351135254, "step": 1430} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 1430} {"info/global_step": 1431, "train_info/time_within_train_step": 2.5226480960845947, "step": 1431} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 1431} {"info/global_step": 1432, "train_info/time_within_train_step": 2.522575855255127, "step": 1432} {"train_info/time_between_train_steps": 0.003345489501953125, "step": 1432} {"info/global_step": 1433, "train_info/time_within_train_step": 2.523648738861084, "step": 1433} {"train_info/time_between_train_steps": 0.003627300262451172, "step": 1433} {"info/global_step": 1434, "train_info/time_within_train_step": 2.5231587886810303, "step": 1434} {"train_info/time_between_train_steps": 0.0035696029663085938, "step": 1434} {"info/global_step": 1435, "train_info/time_within_train_step": 2.5228095054626465, "step": 1435} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 1435} {"info/global_step": 1436, "train_info/time_within_train_step": 2.5559308528900146, "step": 1436} {"train_info/time_between_train_steps": 0.0035135746002197266, "step": 1436} {"info/global_step": 1437, "train_info/time_within_train_step": 2.5233967304229736, "step": 1437} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 1437} {"info/global_step": 1438, "train_info/time_within_train_step": 2.5224123001098633, "step": 1438} {"train_info/time_between_train_steps": 0.0035109519958496094, "step": 1438} {"info/global_step": 1439, "train_info/time_within_train_step": 2.521686315536499, "step": 1439} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 1439} {"info/global_step": 1440, "train_info/time_within_train_step": 2.522352457046509, "step": 1440} {"train_info/time_between_train_steps": 0.003365755081176758, "step": 1440} {"info/global_step": 1441, "train_info/time_within_train_step": 2.7689058780670166, "step": 1441} {"train_info/time_between_train_steps": 0.0035963058471679688, "step": 1441} {"info/global_step": 1442, "train_info/time_within_train_step": 2.521693229675293, "step": 1442} {"train_info/time_between_train_steps": 0.003635883331298828, "step": 1442} {"info/global_step": 1443, "train_info/time_within_train_step": 2.5218429565429688, "step": 1443} {"train_info/time_between_train_steps": 0.003407001495361328, "step": 1443} {"info/global_step": 1444, "train_info/time_within_train_step": 2.5212817192077637, "step": 1444} {"train_info/time_between_train_steps": 0.0034003257751464844, "step": 1444} {"info/global_step": 1445, "train_info/time_within_train_step": 2.5218634605407715, "step": 1445} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 1445} {"info/global_step": 1446, "train_info/time_within_train_step": 2.521450996398926, "step": 1446} {"train_info/time_between_train_steps": 0.0033636093139648438, "step": 1446} {"info/global_step": 1447, "train_info/time_within_train_step": 2.5224428176879883, "step": 1447} {"train_info/time_between_train_steps": 0.0034279823303222656, "step": 1447} {"info/global_step": 1448, "train_info/time_within_train_step": 2.5232911109924316, "step": 1448} {"train_info/time_between_train_steps": 0.003409147262573242, "step": 1448} {"info/global_step": 1449, "train_info/time_within_train_step": 2.523059129714966, "step": 1449} {"train_info/time_between_train_steps": 0.003406524658203125, "step": 1449} {"info/global_step": 1450, "train_info/time_within_train_step": 2.5222175121307373, "step": 1450} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746326899, "_runtime": 3947}, "step": 1450} {"logs": {"train/loss": 4.3785, "train/learning_rate": 0.0003444444444444444, "train/epoch": 1.19, "_timestamp": 1746326899, "_runtime": 3947}, "step": 1450} {"train_info/time_between_train_steps": 0.02778148651123047, "step": 1450} {"info/global_step": 1451, "train_info/time_within_train_step": 2.521929979324341, "step": 1451} {"train_info/time_between_train_steps": 0.004004001617431641, "step": 1451} {"info/global_step": 1452, "train_info/time_within_train_step": 2.522533655166626, "step": 1452} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 1452} {"info/global_step": 1453, "train_info/time_within_train_step": 2.52235746383667, "step": 1453} {"train_info/time_between_train_steps": 0.003427267074584961, "step": 1453} {"info/global_step": 1454, "train_info/time_within_train_step": 2.521510601043701, "step": 1454} {"train_info/time_between_train_steps": 0.003415822982788086, "step": 1454} {"info/global_step": 1455, "train_info/time_within_train_step": 2.5714612007141113, "step": 1455} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 1455} {"info/global_step": 1456, "train_info/time_within_train_step": 2.521397113800049, "step": 1456} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 1456} {"info/global_step": 1457, "train_info/time_within_train_step": 2.5213563442230225, "step": 1457} {"train_info/time_between_train_steps": 0.0034601688385009766, "step": 1457} {"info/global_step": 1458, "train_info/time_within_train_step": 2.520965576171875, "step": 1458} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1458} {"info/global_step": 1459, "train_info/time_within_train_step": 2.521416425704956, "step": 1459} {"train_info/time_between_train_steps": 0.0034258365631103516, "step": 1459} {"info/global_step": 1460, "train_info/time_within_train_step": 2.5209922790527344, "step": 1460} {"train_info/time_between_train_steps": 0.0033981800079345703, "step": 1460} {"info/global_step": 1461, "train_info/time_within_train_step": 2.520862579345703, "step": 1461} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1461} {"info/global_step": 1462, "train_info/time_within_train_step": 2.5216681957244873, "step": 1462} {"train_info/time_between_train_steps": 0.0034666061401367188, "step": 1462} {"info/global_step": 1463, "train_info/time_within_train_step": 2.522434711456299, "step": 1463} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 1463} {"info/global_step": 1464, "train_info/time_within_train_step": 2.522071361541748, "step": 1464} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 1464} {"info/global_step": 1465, "train_info/time_within_train_step": 2.5227246284484863, "step": 1465} {"train_info/time_between_train_steps": 0.0034530162811279297, "step": 1465} {"info/global_step": 1466, "train_info/time_within_train_step": 2.5221214294433594, "step": 1466} {"train_info/time_between_train_steps": 0.0034170150756835938, "step": 1466} {"info/global_step": 1467, "train_info/time_within_train_step": 2.5217950344085693, "step": 1467} {"train_info/time_between_train_steps": 0.0034215450286865234, "step": 1467} {"info/global_step": 1468, "train_info/time_within_train_step": 2.5218989849090576, "step": 1468} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 1468} {"info/global_step": 1469, "train_info/time_within_train_step": 2.522455930709839, "step": 1469} {"train_info/time_between_train_steps": 0.0034470558166503906, "step": 1469} {"info/global_step": 1470, "train_info/time_within_train_step": 2.522705078125, "step": 1470} {"train_info/time_between_train_steps": 0.0034792423248291016, "step": 1470} {"info/global_step": 1471, "train_info/time_within_train_step": 2.549405813217163, "step": 1471} {"train_info/time_between_train_steps": 0.0035021305084228516, "step": 1471} {"info/global_step": 1472, "train_info/time_within_train_step": 2.5335986614227295, "step": 1472} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 1472} {"info/global_step": 1473, "train_info/time_within_train_step": 2.5244951248168945, "step": 1473} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 1473} {"info/global_step": 1474, "train_info/time_within_train_step": 2.520498752593994, "step": 1474} {"train_info/time_between_train_steps": 0.003093719482421875, "step": 1474} {"info/global_step": 1475, "train_info/time_within_train_step": 2.520630359649658, "step": 1475} {"train_info/time_between_train_steps": 0.003085613250732422, "step": 1475} {"info/global_step": 1476, "train_info/time_within_train_step": 2.520670175552368, "step": 1476} {"train_info/time_between_train_steps": 0.0030698776245117188, "step": 1476} {"info/global_step": 1477, "train_info/time_within_train_step": 2.5198304653167725, "step": 1477} {"train_info/time_between_train_steps": 0.003068208694458008, "step": 1477} {"info/global_step": 1478, "train_info/time_within_train_step": 2.520892858505249, "step": 1478} {"train_info/time_between_train_steps": 0.0030858516693115234, "step": 1478} {"info/global_step": 1479, "train_info/time_within_train_step": 2.5204825401306152, "step": 1479} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 1479} {"info/global_step": 1480, "train_info/time_within_train_step": 2.746760129928589, "step": 1480} {"train_info/time_between_train_steps": 0.0030829906463623047, "step": 1480} {"info/global_step": 1481, "train_info/time_within_train_step": 2.5224452018737793, "step": 1481} {"train_info/time_between_train_steps": 0.003076791763305664, "step": 1481} {"info/global_step": 1482, "train_info/time_within_train_step": 2.5207557678222656, "step": 1482} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 1482} {"info/global_step": 1483, "train_info/time_within_train_step": 2.5217041969299316, "step": 1483} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 1483} {"info/global_step": 1484, "train_info/time_within_train_step": 2.5218141078948975, "step": 1484} {"train_info/time_between_train_steps": 0.003091096878051758, "step": 1484} {"info/global_step": 1485, "train_info/time_within_train_step": 2.521411895751953, "step": 1485} {"train_info/time_between_train_steps": 0.003077268600463867, "step": 1485} {"info/global_step": 1486, "train_info/time_within_train_step": 2.521512985229492, "step": 1486} {"train_info/time_between_train_steps": 0.003125429153442383, "step": 1486} {"info/global_step": 1487, "train_info/time_within_train_step": 2.5205352306365967, "step": 1487} {"train_info/time_between_train_steps": 0.0031015872955322266, "step": 1487} {"info/global_step": 1488, "train_info/time_within_train_step": 2.5216965675354004, "step": 1488} {"train_info/time_between_train_steps": 0.0031023025512695312, "step": 1488} {"info/global_step": 1489, "train_info/time_within_train_step": 2.5214428901672363, "step": 1489} {"train_info/time_between_train_steps": 0.0030927658081054688, "step": 1489} {"info/global_step": 1490, "train_info/time_within_train_step": 2.521254539489746, "step": 1490} {"train_info/time_between_train_steps": 0.0030851364135742188, "step": 1490} {"info/global_step": 1491, "train_info/time_within_train_step": 2.5211639404296875, "step": 1491} {"train_info/time_between_train_steps": 0.0030868053436279297, "step": 1491} {"info/global_step": 1492, "train_info/time_within_train_step": 2.52105450630188, "step": 1492} {"train_info/time_between_train_steps": 0.0030884742736816406, "step": 1492} {"info/global_step": 1493, "train_info/time_within_train_step": 2.5215275287628174, "step": 1493} {"train_info/time_between_train_steps": 0.0030868053436279297, "step": 1493} {"info/global_step": 1494, "train_info/time_within_train_step": 2.522207736968994, "step": 1494} {"train_info/time_between_train_steps": 0.0030868053436279297, "step": 1494} {"info/global_step": 1495, "train_info/time_within_train_step": 2.5212864875793457, "step": 1495} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 1495} {"info/global_step": 1496, "train_info/time_within_train_step": 2.521315097808838, "step": 1496} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 1496} {"info/global_step": 1497, "train_info/time_within_train_step": 2.5201776027679443, "step": 1497} {"train_info/time_between_train_steps": 0.003087759017944336, "step": 1497} {"info/global_step": 1498, "train_info/time_within_train_step": 2.5214223861694336, "step": 1498} {"train_info/time_between_train_steps": 0.00323486328125, "step": 1498} {"info/global_step": 1499, "train_info/time_within_train_step": 2.5212643146514893, "step": 1499} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 1499} {"info/global_step": 1500, "train_info/time_within_train_step": 3.0421111583709717, "step": 1500} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746327027, "_runtime": 4075}, "step": 1500} {"logs": {"train/loss": 4.3536, "train/learning_rate": 0.0003333333333333333, "train/epoch": 1.2, "_timestamp": 1746327027, "_runtime": 4075}, "step": 1500} {"train_info/time_between_train_steps": 17.153687000274658, "step": 1500} {"info/global_step": 1501, "train_info/time_within_train_step": 2.3356423377990723, "step": 1501} {"train_info/time_between_train_steps": 0.0030477046966552734, "step": 1501} {"info/global_step": 1502, "train_info/time_within_train_step": 2.3179547786712646, "step": 1502} {"train_info/time_between_train_steps": 0.003098726272583008, "step": 1502} {"info/global_step": 1503, "train_info/time_within_train_step": 2.4641542434692383, "step": 1503} {"train_info/time_between_train_steps": 0.0030393600463867188, "step": 1503} {"info/global_step": 1504, "train_info/time_within_train_step": 2.517974853515625, "step": 1504} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 1504} {"info/global_step": 1505, "train_info/time_within_train_step": 2.519186019897461, "step": 1505} {"train_info/time_between_train_steps": 0.0030367374420166016, "step": 1505} {"info/global_step": 1506, "train_info/time_within_train_step": 2.520778179168701, "step": 1506} {"train_info/time_between_train_steps": 0.0030858516693115234, "step": 1506} {"info/global_step": 1507, "train_info/time_within_train_step": 2.548656940460205, "step": 1507} {"train_info/time_between_train_steps": 0.0030450820922851562, "step": 1507} {"info/global_step": 1508, "train_info/time_within_train_step": 2.5215630531311035, "step": 1508} {"train_info/time_between_train_steps": 0.0030906200408935547, "step": 1508} {"info/global_step": 1509, "train_info/time_within_train_step": 2.5217349529266357, "step": 1509} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 1509} {"info/global_step": 1510, "train_info/time_within_train_step": 2.5214333534240723, "step": 1510} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 1510} {"info/global_step": 1511, "train_info/time_within_train_step": 2.5217111110687256, "step": 1511} {"train_info/time_between_train_steps": 0.003113269805908203, "step": 1511} {"info/global_step": 1512, "train_info/time_within_train_step": 2.5225703716278076, "step": 1512} {"train_info/time_between_train_steps": 0.0031087398529052734, "step": 1512} {"info/global_step": 1513, "train_info/time_within_train_step": 2.521953821182251, "step": 1513} {"train_info/time_between_train_steps": 0.0031080245971679688, "step": 1513} {"info/global_step": 1514, "train_info/time_within_train_step": 2.5214076042175293, "step": 1514} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 1514} {"info/global_step": 1515, "train_info/time_within_train_step": 2.5216426849365234, "step": 1515} {"train_info/time_between_train_steps": 0.0031006336212158203, "step": 1515} {"info/global_step": 1516, "train_info/time_within_train_step": 2.521965503692627, "step": 1516} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 1516} {"info/global_step": 1517, "train_info/time_within_train_step": 2.5221664905548096, "step": 1517} {"train_info/time_between_train_steps": 0.0030994415283203125, "step": 1517} {"info/global_step": 1518, "train_info/time_within_train_step": 2.522968292236328, "step": 1518} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 1518} {"info/global_step": 1519, "train_info/time_within_train_step": 2.521958112716675, "step": 1519} {"train_info/time_between_train_steps": 0.003110170364379883, "step": 1519} {"info/global_step": 1520, "train_info/time_within_train_step": 2.522655963897705, "step": 1520} {"train_info/time_between_train_steps": 0.0030841827392578125, "step": 1520} {"info/global_step": 1521, "train_info/time_within_train_step": 2.5227713584899902, "step": 1521} {"train_info/time_between_train_steps": 0.0031037330627441406, "step": 1521} {"info/global_step": 1522, "train_info/time_within_train_step": 2.5236761569976807, "step": 1522} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 1522} {"info/global_step": 1523, "train_info/time_within_train_step": 2.522606134414673, "step": 1523} {"train_info/time_between_train_steps": 0.003111600875854492, "step": 1523} {"info/global_step": 1524, "train_info/time_within_train_step": 2.5228617191314697, "step": 1524} {"train_info/time_between_train_steps": 0.003095388412475586, "step": 1524} {"info/global_step": 1525, "train_info/time_within_train_step": 2.5229039192199707, "step": 1525} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 1525} {"info/global_step": 1526, "train_info/time_within_train_step": 2.5224475860595703, "step": 1526} {"train_info/time_between_train_steps": 0.0031015872955322266, "step": 1526} {"info/global_step": 1527, "train_info/time_within_train_step": 2.5220322608947754, "step": 1527} {"train_info/time_between_train_steps": 0.0030939579010009766, "step": 1527} {"info/global_step": 1528, "train_info/time_within_train_step": 2.522103786468506, "step": 1528} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 1528} {"info/global_step": 1529, "train_info/time_within_train_step": 2.7201168537139893, "step": 1529} {"train_info/time_between_train_steps": 0.003094196319580078, "step": 1529} {"info/global_step": 1530, "train_info/time_within_train_step": 2.522749423980713, "step": 1530} {"train_info/time_between_train_steps": 0.0031082630157470703, "step": 1530} {"info/global_step": 1531, "train_info/time_within_train_step": 2.5222971439361572, "step": 1531} {"train_info/time_between_train_steps": 0.0031054019927978516, "step": 1531} {"info/global_step": 1532, "train_info/time_within_train_step": 2.523117780685425, "step": 1532} {"train_info/time_between_train_steps": 0.0031037330627441406, "step": 1532} {"info/global_step": 1533, "train_info/time_within_train_step": 2.522096633911133, "step": 1533} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 1533} {"info/global_step": 1534, "train_info/time_within_train_step": 2.5217175483703613, "step": 1534} {"train_info/time_between_train_steps": 0.0031363964080810547, "step": 1534} {"info/global_step": 1535, "train_info/time_within_train_step": 2.522522449493408, "step": 1535} {"train_info/time_between_train_steps": 0.0030889511108398438, "step": 1535} {"info/global_step": 1536, "train_info/time_within_train_step": 2.5218563079833984, "step": 1536} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 1536} {"info/global_step": 1537, "train_info/time_within_train_step": 2.523099184036255, "step": 1537} {"train_info/time_between_train_steps": 0.003084421157836914, "step": 1537} {"info/global_step": 1538, "train_info/time_within_train_step": 2.521752119064331, "step": 1538} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 1538} {"info/global_step": 1539, "train_info/time_within_train_step": 2.5218396186828613, "step": 1539} {"train_info/time_between_train_steps": 0.003093242645263672, "step": 1539} {"info/global_step": 1540, "train_info/time_within_train_step": 2.521677017211914, "step": 1540} {"train_info/time_between_train_steps": 0.0030896663665771484, "step": 1540} {"info/global_step": 1541, "train_info/time_within_train_step": 2.521090269088745, "step": 1541} {"train_info/time_between_train_steps": 0.0031104087829589844, "step": 1541} {"info/global_step": 1542, "train_info/time_within_train_step": 2.5216422080993652, "step": 1542} {"train_info/time_between_train_steps": 0.003094911575317383, "step": 1542} {"info/global_step": 1543, "train_info/time_within_train_step": 2.521740198135376, "step": 1543} {"train_info/time_between_train_steps": 0.003083467483520508, "step": 1543} {"info/global_step": 1544, "train_info/time_within_train_step": 2.5255815982818604, "step": 1544} {"train_info/time_between_train_steps": 0.0030968189239501953, "step": 1544} {"info/global_step": 1545, "train_info/time_within_train_step": 2.5211453437805176, "step": 1545} {"train_info/time_between_train_steps": 0.0030891895294189453, "step": 1545} {"info/global_step": 1546, "train_info/time_within_train_step": 2.5216121673583984, "step": 1546} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 1546} {"info/global_step": 1547, "train_info/time_within_train_step": 2.520876169204712, "step": 1547} {"train_info/time_between_train_steps": 0.0031044483184814453, "step": 1547} {"info/global_step": 1548, "train_info/time_within_train_step": 2.521568775177002, "step": 1548} {"train_info/time_between_train_steps": 0.0031075477600097656, "step": 1548} {"info/global_step": 1549, "train_info/time_within_train_step": 2.522087335586548, "step": 1549} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 1549} {"info/global_step": 1550, "train_info/time_within_train_step": 2.5271546840667725, "step": 1550} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746327171, "_runtime": 4219}, "step": 1550} {"logs": {"train/loss": 4.3292, "train/learning_rate": 0.0003222222222222222, "train/epoch": 1.22, "_timestamp": 1746327171, "_runtime": 4219}, "step": 1550} {"train_info/time_between_train_steps": 0.023892879486083984, "step": 1550} {"info/global_step": 1551, "train_info/time_within_train_step": 2.5213077068328857, "step": 1551} {"train_info/time_between_train_steps": 0.003078460693359375, "step": 1551} {"info/global_step": 1552, "train_info/time_within_train_step": 2.5217299461364746, "step": 1552} {"train_info/time_between_train_steps": 0.0030846595764160156, "step": 1552} {"info/global_step": 1553, "train_info/time_within_train_step": 2.5217156410217285, "step": 1553} {"train_info/time_between_train_steps": 0.003090381622314453, "step": 1553} {"info/global_step": 1554, "train_info/time_within_train_step": 2.521474599838257, "step": 1554} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 1554} {"info/global_step": 1555, "train_info/time_within_train_step": 2.5217254161834717, "step": 1555} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 1555} {"info/global_step": 1556, "train_info/time_within_train_step": 2.5216622352600098, "step": 1556} {"train_info/time_between_train_steps": 0.0030934810638427734, "step": 1556} {"info/global_step": 1557, "train_info/time_within_train_step": 2.521665334701538, "step": 1557} {"train_info/time_between_train_steps": 0.003123044967651367, "step": 1557} {"info/global_step": 1558, "train_info/time_within_train_step": 2.5223400592803955, "step": 1558} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 1558} {"info/global_step": 1559, "train_info/time_within_train_step": 2.5216147899627686, "step": 1559} {"train_info/time_between_train_steps": 0.003072023391723633, "step": 1559} {"info/global_step": 1560, "train_info/time_within_train_step": 2.521167516708374, "step": 1560} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 1560} {"info/global_step": 1561, "train_info/time_within_train_step": 2.521867513656616, "step": 1561} {"train_info/time_between_train_steps": 0.0030908584594726562, "step": 1561} {"info/global_step": 1562, "train_info/time_within_train_step": 2.521030902862549, "step": 1562} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 1562} {"info/global_step": 1563, "train_info/time_within_train_step": 2.520922899246216, "step": 1563} {"train_info/time_between_train_steps": 0.003126859664916992, "step": 1563} {"info/global_step": 1564, "train_info/time_within_train_step": 2.520815372467041, "step": 1564} {"train_info/time_between_train_steps": 0.003103494644165039, "step": 1564} {"info/global_step": 1565, "train_info/time_within_train_step": 2.521651268005371, "step": 1565} {"train_info/time_between_train_steps": 0.0033063888549804688, "step": 1565} {"info/global_step": 1566, "train_info/time_within_train_step": 2.5214385986328125, "step": 1566} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1566} {"info/global_step": 1567, "train_info/time_within_train_step": 2.5221824645996094, "step": 1567} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 1567} {"info/global_step": 1568, "train_info/time_within_train_step": 2.5222721099853516, "step": 1568} {"train_info/time_between_train_steps": 0.00354766845703125, "step": 1568} {"info/global_step": 1569, "train_info/time_within_train_step": 2.801023006439209, "step": 1569} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 1569} {"info/global_step": 1570, "train_info/time_within_train_step": 2.52211856842041, "step": 1570} {"train_info/time_between_train_steps": 0.0033533573150634766, "step": 1570} {"info/global_step": 1571, "train_info/time_within_train_step": 2.5214953422546387, "step": 1571} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 1571} {"info/global_step": 1572, "train_info/time_within_train_step": 2.5213093757629395, "step": 1572} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 1572} {"info/global_step": 1573, "train_info/time_within_train_step": 2.5219337940216064, "step": 1573} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 1573} {"info/global_step": 1574, "train_info/time_within_train_step": 2.5215632915496826, "step": 1574} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 1574} {"info/global_step": 1575, "train_info/time_within_train_step": 2.5211021900177, "step": 1575} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 1575} {"info/global_step": 1576, "train_info/time_within_train_step": 2.52083683013916, "step": 1576} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 1576} {"info/global_step": 1577, "train_info/time_within_train_step": 2.520897150039673, "step": 1577} {"train_info/time_between_train_steps": 0.003123044967651367, "step": 1577} {"info/global_step": 1578, "train_info/time_within_train_step": 2.5215182304382324, "step": 1578} {"train_info/time_between_train_steps": 0.003439664840698242, "step": 1578} {"info/global_step": 1579, "train_info/time_within_train_step": 2.5216104984283447, "step": 1579} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 1579} {"info/global_step": 1580, "train_info/time_within_train_step": 2.5213117599487305, "step": 1580} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 1580} {"info/global_step": 1581, "train_info/time_within_train_step": 2.521092176437378, "step": 1581} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 1581} {"info/global_step": 1582, "train_info/time_within_train_step": 2.5221381187438965, "step": 1582} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 1582} {"info/global_step": 1583, "train_info/time_within_train_step": 2.522489309310913, "step": 1583} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 1583} {"info/global_step": 1584, "train_info/time_within_train_step": 2.5211994647979736, "step": 1584} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 1584} {"info/global_step": 1585, "train_info/time_within_train_step": 2.522702693939209, "step": 1585} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 1585} {"info/global_step": 1586, "train_info/time_within_train_step": 2.521592855453491, "step": 1586} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 1586} {"info/global_step": 1587, "train_info/time_within_train_step": 2.5214645862579346, "step": 1587} {"train_info/time_between_train_steps": 0.00334930419921875, "step": 1587} {"info/global_step": 1588, "train_info/time_within_train_step": 2.521857261657715, "step": 1588} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 1588} {"info/global_step": 1589, "train_info/time_within_train_step": 2.521641969680786, "step": 1589} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 1589} {"info/global_step": 1590, "train_info/time_within_train_step": 2.5217864513397217, "step": 1590} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 1590} {"info/global_step": 1591, "train_info/time_within_train_step": 2.521624803543091, "step": 1591} {"train_info/time_between_train_steps": 0.0033609867095947266, "step": 1591} {"info/global_step": 1592, "train_info/time_within_train_step": 2.5213754177093506, "step": 1592} {"train_info/time_between_train_steps": 0.0035696029663085938, "step": 1592} {"info/global_step": 1593, "train_info/time_within_train_step": 2.5217268466949463, "step": 1593} {"train_info/time_between_train_steps": 0.0035142898559570312, "step": 1593} {"info/global_step": 1594, "train_info/time_within_train_step": 2.5215606689453125, "step": 1594} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 1594} {"info/global_step": 1595, "train_info/time_within_train_step": 2.521468162536621, "step": 1595} {"train_info/time_between_train_steps": 0.0034787654876708984, "step": 1595} {"info/global_step": 1596, "train_info/time_within_train_step": 2.5223007202148438, "step": 1596} {"train_info/time_between_train_steps": 0.0036249160766601562, "step": 1596} {"info/global_step": 1597, "train_info/time_within_train_step": 2.5217549800872803, "step": 1597} {"train_info/time_between_train_steps": 0.003446817398071289, "step": 1597} {"info/global_step": 1598, "train_info/time_within_train_step": 2.5217466354370117, "step": 1598} {"train_info/time_between_train_steps": 0.003448486328125, "step": 1598} {"info/global_step": 1599, "train_info/time_within_train_step": 2.5215156078338623, "step": 1599} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 1599} {"info/global_step": 1600, "train_info/time_within_train_step": 2.522177219390869, "step": 1600} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746327299, "_runtime": 4347}, "step": 1600} {"logs": {"train/loss": 4.3076, "train/learning_rate": 0.00031111111111111107, "train/epoch": 1.24, "_timestamp": 1746327299, "_runtime": 4347}, "step": 1600} {"train_info/time_between_train_steps": 18.60539984703064, "step": 1600} {"info/global_step": 1601, "train_info/time_within_train_step": 2.33748459815979, "step": 1601} {"train_info/time_between_train_steps": 0.003406524658203125, "step": 1601} {"info/global_step": 1602, "train_info/time_within_train_step": 2.3195385932922363, "step": 1602} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 1602} {"info/global_step": 1603, "train_info/time_within_train_step": 2.4502711296081543, "step": 1603} {"train_info/time_between_train_steps": 0.0034332275390625, "step": 1603} {"info/global_step": 1604, "train_info/time_within_train_step": 2.5168960094451904, "step": 1604} {"train_info/time_between_train_steps": 0.00351715087890625, "step": 1604} {"info/global_step": 1605, "train_info/time_within_train_step": 2.5167641639709473, "step": 1605} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 1605} {"info/global_step": 1606, "train_info/time_within_train_step": 2.520080327987671, "step": 1606} {"train_info/time_between_train_steps": 0.0033502578735351562, "step": 1606} {"info/global_step": 1607, "train_info/time_within_train_step": 2.5209758281707764, "step": 1607} {"train_info/time_between_train_steps": 0.0033600330352783203, "step": 1607} {"info/global_step": 1608, "train_info/time_within_train_step": 2.521066665649414, "step": 1608} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 1608} {"info/global_step": 1609, "train_info/time_within_train_step": 2.521131753921509, "step": 1609} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 1609} {"info/global_step": 1610, "train_info/time_within_train_step": 2.5205070972442627, "step": 1610} {"train_info/time_between_train_steps": 0.0033311843872070312, "step": 1610} {"info/global_step": 1611, "train_info/time_within_train_step": 2.521260976791382, "step": 1611} {"train_info/time_between_train_steps": 0.003294706344604492, "step": 1611} {"info/global_step": 1612, "train_info/time_within_train_step": 2.5211479663848877, "step": 1612} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 1612} {"info/global_step": 1613, "train_info/time_within_train_step": 2.521158218383789, "step": 1613} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 1613} {"info/global_step": 1614, "train_info/time_within_train_step": 2.520444393157959, "step": 1614} {"train_info/time_between_train_steps": 0.0033631324768066406, "step": 1614} {"info/global_step": 1615, "train_info/time_within_train_step": 2.5212206840515137, "step": 1615} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 1615} {"info/global_step": 1616, "train_info/time_within_train_step": 2.5211217403411865, "step": 1616} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 1616} {"info/global_step": 1617, "train_info/time_within_train_step": 2.5219473838806152, "step": 1617} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 1617} {"info/global_step": 1618, "train_info/time_within_train_step": 2.5216281414031982, "step": 1618} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 1618} {"info/global_step": 1619, "train_info/time_within_train_step": 2.5219886302948, "step": 1619} {"train_info/time_between_train_steps": 0.0033631324768066406, "step": 1619} {"info/global_step": 1620, "train_info/time_within_train_step": 2.5216224193573, "step": 1620} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 1620} {"info/global_step": 1621, "train_info/time_within_train_step": 2.521775007247925, "step": 1621} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 1621} {"info/global_step": 1622, "train_info/time_within_train_step": 2.522573709487915, "step": 1622} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 1622} {"info/global_step": 1623, "train_info/time_within_train_step": 2.5226192474365234, "step": 1623} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 1623} {"info/global_step": 1624, "train_info/time_within_train_step": 2.5230093002319336, "step": 1624} {"train_info/time_between_train_steps": 0.0033190250396728516, "step": 1624} {"info/global_step": 1625, "train_info/time_within_train_step": 2.52294659614563, "step": 1625} {"train_info/time_between_train_steps": 0.003543853759765625, "step": 1625} {"info/global_step": 1626, "train_info/time_within_train_step": 2.522533655166626, "step": 1626} {"train_info/time_between_train_steps": 0.003454446792602539, "step": 1626} {"info/global_step": 1627, "train_info/time_within_train_step": 2.7371490001678467, "step": 1627} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 1627} {"info/global_step": 1628, "train_info/time_within_train_step": 2.521073579788208, "step": 1628} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 1628} {"info/global_step": 1629, "train_info/time_within_train_step": 2.5210206508636475, "step": 1629} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 1629} {"info/global_step": 1630, "train_info/time_within_train_step": 2.521573305130005, "step": 1630} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 1630} {"info/global_step": 1631, "train_info/time_within_train_step": 2.5223448276519775, "step": 1631} {"train_info/time_between_train_steps": 0.003437042236328125, "step": 1631} {"info/global_step": 1632, "train_info/time_within_train_step": 2.5227584838867188, "step": 1632} {"train_info/time_between_train_steps": 0.003397226333618164, "step": 1632} {"info/global_step": 1633, "train_info/time_within_train_step": 2.5232670307159424, "step": 1633} {"train_info/time_between_train_steps": 0.004040241241455078, "step": 1633} {"info/global_step": 1634, "train_info/time_within_train_step": 2.52321195602417, "step": 1634} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 1634} {"info/global_step": 1635, "train_info/time_within_train_step": 2.5233662128448486, "step": 1635} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 1635} {"info/global_step": 1636, "train_info/time_within_train_step": 2.522440195083618, "step": 1636} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 1636} {"info/global_step": 1637, "train_info/time_within_train_step": 2.522782802581787, "step": 1637} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 1637} {"info/global_step": 1638, "train_info/time_within_train_step": 2.522209644317627, "step": 1638} {"train_info/time_between_train_steps": 0.003341197967529297, "step": 1638} {"info/global_step": 1639, "train_info/time_within_train_step": 2.521979570388794, "step": 1639} {"train_info/time_between_train_steps": 0.0033707618713378906, "step": 1639} {"info/global_step": 1640, "train_info/time_within_train_step": 2.5213139057159424, "step": 1640} {"train_info/time_between_train_steps": 0.003427743911743164, "step": 1640} {"info/global_step": 1641, "train_info/time_within_train_step": 2.521374225616455, "step": 1641} {"train_info/time_between_train_steps": 0.0033462047576904297, "step": 1641} {"info/global_step": 1642, "train_info/time_within_train_step": 2.5218231678009033, "step": 1642} {"train_info/time_between_train_steps": 0.003393411636352539, "step": 1642} {"info/global_step": 1643, "train_info/time_within_train_step": 2.5204482078552246, "step": 1643} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 1643} {"info/global_step": 1644, "train_info/time_within_train_step": 2.5212502479553223, "step": 1644} {"train_info/time_between_train_steps": 0.003411531448364258, "step": 1644} {"info/global_step": 1645, "train_info/time_within_train_step": 2.5218348503112793, "step": 1645} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 1645} {"info/global_step": 1646, "train_info/time_within_train_step": 2.521817207336426, "step": 1646} {"train_info/time_between_train_steps": 0.0035638809204101562, "step": 1646} {"info/global_step": 1647, "train_info/time_within_train_step": 2.522514581680298, "step": 1647} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 1647} {"info/global_step": 1648, "train_info/time_within_train_step": 2.521958827972412, "step": 1648} {"train_info/time_between_train_steps": 0.0034716129302978516, "step": 1648} {"info/global_step": 1649, "train_info/time_within_train_step": 2.5216307640075684, "step": 1649} {"train_info/time_between_train_steps": 0.0034101009368896484, "step": 1649} {"info/global_step": 1650, "train_info/time_within_train_step": 2.522878646850586, "step": 1650} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746327444, "_runtime": 4492}, "step": 1650} {"logs": {"train/loss": 4.2697, "train/learning_rate": 0.0003, "train/epoch": 1.25, "_timestamp": 1746327444, "_runtime": 4492}, "step": 1650} {"train_info/time_between_train_steps": 0.02429676055908203, "step": 1650} {"info/global_step": 1651, "train_info/time_within_train_step": 2.5223870277404785, "step": 1651} {"train_info/time_between_train_steps": 0.003437042236328125, "step": 1651} {"info/global_step": 1652, "train_info/time_within_train_step": 2.5220606327056885, "step": 1652} {"train_info/time_between_train_steps": 0.0033321380615234375, "step": 1652} {"info/global_step": 1653, "train_info/time_within_train_step": 2.5229644775390625, "step": 1653} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 1653} {"info/global_step": 1654, "train_info/time_within_train_step": 2.522562265396118, "step": 1654} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 1654} {"info/global_step": 1655, "train_info/time_within_train_step": 2.5220847129821777, "step": 1655} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 1655} {"info/global_step": 1656, "train_info/time_within_train_step": 2.522016763687134, "step": 1656} {"train_info/time_between_train_steps": 0.0034182071685791016, "step": 1656} {"info/global_step": 1657, "train_info/time_within_train_step": 2.5210680961608887, "step": 1657} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 1657} {"info/global_step": 1658, "train_info/time_within_train_step": 2.521921157836914, "step": 1658} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 1658} {"info/global_step": 1659, "train_info/time_within_train_step": 2.5224690437316895, "step": 1659} {"train_info/time_between_train_steps": 0.0034339427947998047, "step": 1659} {"info/global_step": 1660, "train_info/time_within_train_step": 2.522313117980957, "step": 1660} {"train_info/time_between_train_steps": 0.0034317970275878906, "step": 1660} {"info/global_step": 1661, "train_info/time_within_train_step": 2.5218353271484375, "step": 1661} {"train_info/time_between_train_steps": 0.003467559814453125, "step": 1661} {"info/global_step": 1662, "train_info/time_within_train_step": 2.5223164558410645, "step": 1662} {"train_info/time_between_train_steps": 0.003479480743408203, "step": 1662} {"info/global_step": 1663, "train_info/time_within_train_step": 2.5222928524017334, "step": 1663} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1663} {"info/global_step": 1664, "train_info/time_within_train_step": 2.5221972465515137, "step": 1664} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 1664} {"info/global_step": 1665, "train_info/time_within_train_step": 2.522568702697754, "step": 1665} {"train_info/time_between_train_steps": 0.0034482479095458984, "step": 1665} {"info/global_step": 1666, "train_info/time_within_train_step": 2.5227432250976562, "step": 1666} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 1666} {"info/global_step": 1667, "train_info/time_within_train_step": 2.5234124660491943, "step": 1667} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 1667} {"info/global_step": 1668, "train_info/time_within_train_step": 2.522393226623535, "step": 1668} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1668} {"info/global_step": 1669, "train_info/time_within_train_step": 2.5221424102783203, "step": 1669} {"train_info/time_between_train_steps": 0.0034356117248535156, "step": 1669} {"info/global_step": 1670, "train_info/time_within_train_step": 2.522273302078247, "step": 1670} {"train_info/time_between_train_steps": 0.003553152084350586, "step": 1670} {"info/global_step": 1671, "train_info/time_within_train_step": 2.5502049922943115, "step": 1671} {"train_info/time_between_train_steps": 0.003339052200317383, "step": 1671} {"info/global_step": 1672, "train_info/time_within_train_step": 2.5210535526275635, "step": 1672} {"train_info/time_between_train_steps": 0.003372669219970703, "step": 1672} {"info/global_step": 1673, "train_info/time_within_train_step": 2.520451545715332, "step": 1673} {"train_info/time_between_train_steps": 0.0034275054931640625, "step": 1673} {"info/global_step": 1674, "train_info/time_within_train_step": 2.520477294921875, "step": 1674} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 1674} {"info/global_step": 1675, "train_info/time_within_train_step": 2.520578145980835, "step": 1675} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 1675} {"info/global_step": 1676, "train_info/time_within_train_step": 2.520348310470581, "step": 1676} {"train_info/time_between_train_steps": 0.003393411636352539, "step": 1676} {"info/global_step": 1677, "train_info/time_within_train_step": 2.5209758281707764, "step": 1677} {"train_info/time_between_train_steps": 0.003345012664794922, "step": 1677} {"info/global_step": 1678, "train_info/time_within_train_step": 2.5202932357788086, "step": 1678} {"train_info/time_between_train_steps": 0.003341197967529297, "step": 1678} {"info/global_step": 1679, "train_info/time_within_train_step": 2.52099609375, "step": 1679} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 1679} {"info/global_step": 1680, "train_info/time_within_train_step": 2.5203773975372314, "step": 1680} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 1680} {"info/global_step": 1681, "train_info/time_within_train_step": 2.5207462310791016, "step": 1681} {"train_info/time_between_train_steps": 0.003304004669189453, "step": 1681} {"info/global_step": 1682, "train_info/time_within_train_step": 2.553262233734131, "step": 1682} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 1682} {"info/global_step": 1683, "train_info/time_within_train_step": 2.5216257572174072, "step": 1683} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 1683} {"info/global_step": 1684, "train_info/time_within_train_step": 2.521317720413208, "step": 1684} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 1684} {"info/global_step": 1685, "train_info/time_within_train_step": 2.5215139389038086, "step": 1685} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 1685} {"info/global_step": 1686, "train_info/time_within_train_step": 2.52067494392395, "step": 1686} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 1686} {"info/global_step": 1687, "train_info/time_within_train_step": 2.521658420562744, "step": 1687} {"train_info/time_between_train_steps": 0.003298044204711914, "step": 1687} {"info/global_step": 1688, "train_info/time_within_train_step": 2.5214414596557617, "step": 1688} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 1688} {"info/global_step": 1689, "train_info/time_within_train_step": 2.5204310417175293, "step": 1689} {"train_info/time_between_train_steps": 0.0033872127532958984, "step": 1689} {"info/global_step": 1690, "train_info/time_within_train_step": 2.5202536582946777, "step": 1690} {"train_info/time_between_train_steps": 0.003298044204711914, "step": 1690} {"info/global_step": 1691, "train_info/time_within_train_step": 2.5203771591186523, "step": 1691} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 1691} {"info/global_step": 1692, "train_info/time_within_train_step": 2.519113063812256, "step": 1692} {"train_info/time_between_train_steps": 0.0033066272735595703, "step": 1692} {"info/global_step": 1693, "train_info/time_within_train_step": 2.520723342895508, "step": 1693} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 1693} {"info/global_step": 1694, "train_info/time_within_train_step": 2.5209906101226807, "step": 1694} {"train_info/time_between_train_steps": 0.0033524036407470703, "step": 1694} {"info/global_step": 1695, "train_info/time_within_train_step": 2.521235942840576, "step": 1695} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 1695} {"info/global_step": 1696, "train_info/time_within_train_step": 2.5218148231506348, "step": 1696} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 1696} {"info/global_step": 1697, "train_info/time_within_train_step": 2.5215792655944824, "step": 1697} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 1697} {"info/global_step": 1698, "train_info/time_within_train_step": 2.5217134952545166, "step": 1698} {"train_info/time_between_train_steps": 0.003359079360961914, "step": 1698} {"info/global_step": 1699, "train_info/time_within_train_step": 2.521695137023926, "step": 1699} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 1699} {"info/global_step": 1700, "train_info/time_within_train_step": 2.5221428871154785, "step": 1700} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746327572, "_runtime": 4620}, "step": 1700} {"logs": {"train/loss": 4.2584, "train/learning_rate": 0.0002888888888888888, "train/epoch": 1.27, "_timestamp": 1746327572, "_runtime": 4620}, "step": 1700} {"train_info/time_between_train_steps": 17.45184016227722, "step": 1700} {"info/global_step": 1701, "train_info/time_within_train_step": 2.3353397846221924, "step": 1701} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 1701} {"info/global_step": 1702, "train_info/time_within_train_step": 2.3205184936523438, "step": 1702} {"train_info/time_between_train_steps": 0.0035593509674072266, "step": 1702} {"info/global_step": 1703, "train_info/time_within_train_step": 2.477945327758789, "step": 1703} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 1703} {"info/global_step": 1704, "train_info/time_within_train_step": 2.5197956562042236, "step": 1704} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 1704} {"info/global_step": 1705, "train_info/time_within_train_step": 2.5186550617218018, "step": 1705} {"train_info/time_between_train_steps": 0.003304719924926758, "step": 1705} {"info/global_step": 1706, "train_info/time_within_train_step": 2.5201268196105957, "step": 1706} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 1706} {"info/global_step": 1707, "train_info/time_within_train_step": 2.5203540325164795, "step": 1707} {"train_info/time_between_train_steps": 0.0033190250396728516, "step": 1707} {"info/global_step": 1708, "train_info/time_within_train_step": 2.520988941192627, "step": 1708} {"train_info/time_between_train_steps": 0.003400087356567383, "step": 1708} {"info/global_step": 1709, "train_info/time_within_train_step": 2.5212466716766357, "step": 1709} {"train_info/time_between_train_steps": 0.003341197967529297, "step": 1709} {"info/global_step": 1710, "train_info/time_within_train_step": 2.6365513801574707, "step": 1710} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 1710} {"info/global_step": 1711, "train_info/time_within_train_step": 2.5221564769744873, "step": 1711} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 1711} {"info/global_step": 1712, "train_info/time_within_train_step": 2.5219082832336426, "step": 1712} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 1712} {"info/global_step": 1713, "train_info/time_within_train_step": 2.5204100608825684, "step": 1713} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 1713} {"info/global_step": 1714, "train_info/time_within_train_step": 2.5206682682037354, "step": 1714} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 1714} {"info/global_step": 1715, "train_info/time_within_train_step": 2.5219926834106445, "step": 1715} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 1715} {"info/global_step": 1716, "train_info/time_within_train_step": 2.5210742950439453, "step": 1716} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 1716} {"info/global_step": 1717, "train_info/time_within_train_step": 2.521578550338745, "step": 1717} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1717} {"info/global_step": 1718, "train_info/time_within_train_step": 2.521909475326538, "step": 1718} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 1718} {"info/global_step": 1719, "train_info/time_within_train_step": 2.523205041885376, "step": 1719} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 1719} {"info/global_step": 1720, "train_info/time_within_train_step": 2.521843194961548, "step": 1720} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 1720} {"info/global_step": 1721, "train_info/time_within_train_step": 2.5222976207733154, "step": 1721} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 1721} {"info/global_step": 1722, "train_info/time_within_train_step": 2.521782159805298, "step": 1722} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 1722} {"info/global_step": 1723, "train_info/time_within_train_step": 2.521639108657837, "step": 1723} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 1723} {"info/global_step": 1724, "train_info/time_within_train_step": 2.522030830383301, "step": 1724} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 1724} {"info/global_step": 1725, "train_info/time_within_train_step": 2.521909475326538, "step": 1725} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 1725} {"info/global_step": 1726, "train_info/time_within_train_step": 2.522472858428955, "step": 1726} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 1726} {"info/global_step": 1727, "train_info/time_within_train_step": 2.5217859745025635, "step": 1727} {"train_info/time_between_train_steps": 0.0032501220703125, "step": 1727} {"info/global_step": 1728, "train_info/time_within_train_step": 2.52186918258667, "step": 1728} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 1728} {"info/global_step": 1729, "train_info/time_within_train_step": 2.522387981414795, "step": 1729} {"train_info/time_between_train_steps": 0.0033545494079589844, "step": 1729} {"info/global_step": 1730, "train_info/time_within_train_step": 2.5230276584625244, "step": 1730} {"train_info/time_between_train_steps": 0.003386259078979492, "step": 1730} {"info/global_step": 1731, "train_info/time_within_train_step": 2.5518605709075928, "step": 1731} {"train_info/time_between_train_steps": 0.0037202835083007812, "step": 1731} {"info/global_step": 1732, "train_info/time_within_train_step": 2.5228936672210693, "step": 1732} {"train_info/time_between_train_steps": 0.0034945011138916016, "step": 1732} {"info/global_step": 1733, "train_info/time_within_train_step": 2.5227839946746826, "step": 1733} {"train_info/time_between_train_steps": 0.003588438034057617, "step": 1733} {"info/global_step": 1734, "train_info/time_within_train_step": 2.5223612785339355, "step": 1734} {"train_info/time_between_train_steps": 0.003538370132446289, "step": 1734} {"info/global_step": 1735, "train_info/time_within_train_step": 2.523231029510498, "step": 1735} {"train_info/time_between_train_steps": 0.003599405288696289, "step": 1735} {"info/global_step": 1736, "train_info/time_within_train_step": 2.523029088973999, "step": 1736} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 1736} {"info/global_step": 1737, "train_info/time_within_train_step": 2.5221545696258545, "step": 1737} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 1737} {"info/global_step": 1738, "train_info/time_within_train_step": 2.522336721420288, "step": 1738} {"train_info/time_between_train_steps": 0.0034270286560058594, "step": 1738} {"info/global_step": 1739, "train_info/time_within_train_step": 2.5212905406951904, "step": 1739} {"train_info/time_between_train_steps": 0.003464221954345703, "step": 1739} {"info/global_step": 1740, "train_info/time_within_train_step": 2.522507429122925, "step": 1740} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 1740} {"info/global_step": 1741, "train_info/time_within_train_step": 2.521552801132202, "step": 1741} {"train_info/time_between_train_steps": 0.003399372100830078, "step": 1741} {"info/global_step": 1742, "train_info/time_within_train_step": 2.521209239959717, "step": 1742} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 1742} {"info/global_step": 1743, "train_info/time_within_train_step": 2.5260326862335205, "step": 1743} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 1743} {"info/global_step": 1744, "train_info/time_within_train_step": 2.5207467079162598, "step": 1744} {"train_info/time_between_train_steps": 0.00336456298828125, "step": 1744} {"info/global_step": 1745, "train_info/time_within_train_step": 2.5207982063293457, "step": 1745} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 1745} {"info/global_step": 1746, "train_info/time_within_train_step": 2.5216503143310547, "step": 1746} {"train_info/time_between_train_steps": 0.0033156871795654297, "step": 1746} {"info/global_step": 1747, "train_info/time_within_train_step": 2.5206844806671143, "step": 1747} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 1747} {"info/global_step": 1748, "train_info/time_within_train_step": 2.521202802658081, "step": 1748} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 1748} {"info/global_step": 1749, "train_info/time_within_train_step": 2.521261215209961, "step": 1749} {"train_info/time_between_train_steps": 0.003431081771850586, "step": 1749} {"info/global_step": 1750, "train_info/time_within_train_step": 3.050091505050659, "step": 1750} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746327717, "_runtime": 4765}, "step": 1750} {"logs": {"train/loss": 4.2387, "train/learning_rate": 0.0002777777777777778, "train/epoch": 1.29, "_timestamp": 1746327717, "_runtime": 4765}, "step": 1750} {"train_info/time_between_train_steps": 0.02437901496887207, "step": 1750} {"info/global_step": 1751, "train_info/time_within_train_step": 2.521461248397827, "step": 1751} {"train_info/time_between_train_steps": 0.0034563541412353516, "step": 1751} {"info/global_step": 1752, "train_info/time_within_train_step": 2.5224850177764893, "step": 1752} {"train_info/time_between_train_steps": 0.003525257110595703, "step": 1752} {"info/global_step": 1753, "train_info/time_within_train_step": 2.5219082832336426, "step": 1753} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 1753} {"info/global_step": 1754, "train_info/time_within_train_step": 2.522662401199341, "step": 1754} {"train_info/time_between_train_steps": 0.003354310989379883, "step": 1754} {"info/global_step": 1755, "train_info/time_within_train_step": 2.521639347076416, "step": 1755} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 1755} {"info/global_step": 1756, "train_info/time_within_train_step": 2.521796464920044, "step": 1756} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1756} {"info/global_step": 1757, "train_info/time_within_train_step": 2.5219297409057617, "step": 1757} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 1757} {"info/global_step": 1758, "train_info/time_within_train_step": 2.5217270851135254, "step": 1758} {"train_info/time_between_train_steps": 0.0037033557891845703, "step": 1758} {"info/global_step": 1759, "train_info/time_within_train_step": 2.5217106342315674, "step": 1759} {"train_info/time_between_train_steps": 0.003614187240600586, "step": 1759} {"info/global_step": 1760, "train_info/time_within_train_step": 2.521519184112549, "step": 1760} {"train_info/time_between_train_steps": 0.0033533573150634766, "step": 1760} {"info/global_step": 1761, "train_info/time_within_train_step": 2.52120304107666, "step": 1761} {"train_info/time_between_train_steps": 0.003522634506225586, "step": 1761} {"info/global_step": 1762, "train_info/time_within_train_step": 2.5216987133026123, "step": 1762} {"train_info/time_between_train_steps": 0.003667593002319336, "step": 1762} {"info/global_step": 1763, "train_info/time_within_train_step": 2.520556688308716, "step": 1763} {"train_info/time_between_train_steps": 0.0035881996154785156, "step": 1763} {"info/global_step": 1764, "train_info/time_within_train_step": 2.5213534832000732, "step": 1764} {"train_info/time_between_train_steps": 0.0035529136657714844, "step": 1764} {"info/global_step": 1765, "train_info/time_within_train_step": 2.520944833755493, "step": 1765} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 1765} {"info/global_step": 1766, "train_info/time_within_train_step": 2.5213632583618164, "step": 1766} {"train_info/time_between_train_steps": 0.0038194656372070312, "step": 1766} {"info/global_step": 1767, "train_info/time_within_train_step": 2.521087646484375, "step": 1767} {"train_info/time_between_train_steps": 0.003678560256958008, "step": 1767} {"info/global_step": 1768, "train_info/time_within_train_step": 2.5209195613861084, "step": 1768} {"train_info/time_between_train_steps": 0.003468751907348633, "step": 1768} {"info/global_step": 1769, "train_info/time_within_train_step": 2.5214149951934814, "step": 1769} {"train_info/time_between_train_steps": 0.003664731979370117, "step": 1769} {"info/global_step": 1770, "train_info/time_within_train_step": 2.5215611457824707, "step": 1770} {"train_info/time_between_train_steps": 0.0035920143127441406, "step": 1770} {"info/global_step": 1771, "train_info/time_within_train_step": 2.555290937423706, "step": 1771} {"train_info/time_between_train_steps": 0.003796100616455078, "step": 1771} {"info/global_step": 1772, "train_info/time_within_train_step": 2.520604372024536, "step": 1772} {"train_info/time_between_train_steps": 0.003610372543334961, "step": 1772} {"info/global_step": 1773, "train_info/time_within_train_step": 2.5218775272369385, "step": 1773} {"train_info/time_between_train_steps": 0.0038299560546875, "step": 1773} {"info/global_step": 1774, "train_info/time_within_train_step": 2.521998643875122, "step": 1774} {"train_info/time_between_train_steps": 0.003772258758544922, "step": 1774} {"info/global_step": 1775, "train_info/time_within_train_step": 2.5218801498413086, "step": 1775} {"train_info/time_between_train_steps": 0.0036194324493408203, "step": 1775} {"info/global_step": 1776, "train_info/time_within_train_step": 2.5216176509857178, "step": 1776} {"train_info/time_between_train_steps": 0.0037267208099365234, "step": 1776} {"info/global_step": 1777, "train_info/time_within_train_step": 2.5209171772003174, "step": 1777} {"train_info/time_between_train_steps": 0.0037682056427001953, "step": 1777} {"info/global_step": 1778, "train_info/time_within_train_step": 2.5495357513427734, "step": 1778} {"train_info/time_between_train_steps": 0.004039287567138672, "step": 1778} {"info/global_step": 1779, "train_info/time_within_train_step": 2.5211570262908936, "step": 1779} {"train_info/time_between_train_steps": 0.0036907196044921875, "step": 1779} {"info/global_step": 1780, "train_info/time_within_train_step": 2.5224363803863525, "step": 1780} {"train_info/time_between_train_steps": 0.0038650035858154297, "step": 1780} {"info/global_step": 1781, "train_info/time_within_train_step": 2.5224790573120117, "step": 1781} {"train_info/time_between_train_steps": 0.003767728805541992, "step": 1781} {"info/global_step": 1782, "train_info/time_within_train_step": 2.5242178440093994, "step": 1782} {"train_info/time_between_train_steps": 0.004052400588989258, "step": 1782} {"info/global_step": 1783, "train_info/time_within_train_step": 2.522517442703247, "step": 1783} {"train_info/time_between_train_steps": 0.0044634342193603516, "step": 1783} {"info/global_step": 1784, "train_info/time_within_train_step": 2.523613691329956, "step": 1784} {"train_info/time_between_train_steps": 0.004565000534057617, "step": 1784} {"train_info/time_between_train_steps": 2.947753667831421, "step": 1784} {"info/global_step": 1785, "train_info/time_within_train_step": 2.520176649093628, "step": 1785} {"train_info/time_between_train_steps": 0.003367185592651367, "step": 1785} {"info/global_step": 1786, "train_info/time_within_train_step": 2.5194661617279053, "step": 1786} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 1786} {"info/global_step": 1787, "train_info/time_within_train_step": 2.5194973945617676, "step": 1787} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 1787} {"info/global_step": 1788, "train_info/time_within_train_step": 2.520181179046631, "step": 1788} {"train_info/time_between_train_steps": 0.0033524036407470703, "step": 1788} {"info/global_step": 1789, "train_info/time_within_train_step": 2.520092487335205, "step": 1789} {"train_info/time_between_train_steps": 0.0033223628997802734, "step": 1789} {"info/global_step": 1790, "train_info/time_within_train_step": 2.5204989910125732, "step": 1790} {"train_info/time_between_train_steps": 0.0035181045532226562, "step": 1790} {"info/global_step": 1791, "train_info/time_within_train_step": 2.5201010704040527, "step": 1791} {"train_info/time_between_train_steps": 0.0033571720123291016, "step": 1791} {"info/global_step": 1792, "train_info/time_within_train_step": 2.520298719406128, "step": 1792} {"train_info/time_between_train_steps": 0.003326892852783203, "step": 1792} {"info/global_step": 1793, "train_info/time_within_train_step": 2.5205748081207275, "step": 1793} {"train_info/time_between_train_steps": 0.0033490657806396484, "step": 1793} {"info/global_step": 1794, "train_info/time_within_train_step": 2.5208935737609863, "step": 1794} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 1794} {"info/global_step": 1795, "train_info/time_within_train_step": 2.5214459896087646, "step": 1795} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 1795} {"info/global_step": 1796, "train_info/time_within_train_step": 2.5209405422210693, "step": 1796} {"train_info/time_between_train_steps": 0.004002571105957031, "step": 1796} {"info/global_step": 1797, "train_info/time_within_train_step": 2.521764039993286, "step": 1797} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 1797} {"info/global_step": 1798, "train_info/time_within_train_step": 2.5216822624206543, "step": 1798} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 1798} {"info/global_step": 1799, "train_info/time_within_train_step": 2.5214126110076904, "step": 1799} {"train_info/time_between_train_steps": 0.003465414047241211, "step": 1799} {"info/global_step": 1800, "train_info/time_within_train_step": 2.522599697113037, "step": 1800} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746327847, "_runtime": 4895}, "step": 1800} {"logs": {"train/loss": 4.2601, "train/learning_rate": 0.0002666666666666666, "train/epoch": 2.01, "_timestamp": 1746327847, "_runtime": 4895}, "step": 1800} {"train_info/time_between_train_steps": 15.17902135848999, "step": 1800} {"info/global_step": 1801, "train_info/time_within_train_step": 2.553881883621216, "step": 1801} {"train_info/time_between_train_steps": 0.0033833980560302734, "step": 1801} {"info/global_step": 1802, "train_info/time_within_train_step": 2.3168787956237793, "step": 1802} {"train_info/time_between_train_steps": 0.003383636474609375, "step": 1802} {"info/global_step": 1803, "train_info/time_within_train_step": 2.4772021770477295, "step": 1803} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 1803} {"info/global_step": 1804, "train_info/time_within_train_step": 2.5210018157958984, "step": 1804} {"train_info/time_between_train_steps": 0.003452301025390625, "step": 1804} {"info/global_step": 1805, "train_info/time_within_train_step": 2.5218605995178223, "step": 1805} {"train_info/time_between_train_steps": 0.0033960342407226562, "step": 1805} {"info/global_step": 1806, "train_info/time_within_train_step": 2.521467685699463, "step": 1806} {"train_info/time_between_train_steps": 0.0034532546997070312, "step": 1806} {"info/global_step": 1807, "train_info/time_within_train_step": 2.521092176437378, "step": 1807} {"train_info/time_between_train_steps": 0.003377199172973633, "step": 1807} {"info/global_step": 1808, "train_info/time_within_train_step": 2.521522283554077, "step": 1808} {"train_info/time_between_train_steps": 0.0033795833587646484, "step": 1808} {"info/global_step": 1809, "train_info/time_within_train_step": 2.521634340286255, "step": 1809} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 1809} {"info/global_step": 1810, "train_info/time_within_train_step": 2.521483898162842, "step": 1810} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 1810} {"info/global_step": 1811, "train_info/time_within_train_step": 2.522958993911743, "step": 1811} {"train_info/time_between_train_steps": 0.003456592559814453, "step": 1811} {"info/global_step": 1812, "train_info/time_within_train_step": 2.523042678833008, "step": 1812} {"train_info/time_between_train_steps": 0.0034830570220947266, "step": 1812} {"info/global_step": 1813, "train_info/time_within_train_step": 2.522869110107422, "step": 1813} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 1813} {"info/global_step": 1814, "train_info/time_within_train_step": 2.5226926803588867, "step": 1814} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 1814} {"info/global_step": 1815, "train_info/time_within_train_step": 2.523759365081787, "step": 1815} {"train_info/time_between_train_steps": 0.0034303665161132812, "step": 1815} {"info/global_step": 1816, "train_info/time_within_train_step": 2.523338794708252, "step": 1816} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 1816} {"info/global_step": 1817, "train_info/time_within_train_step": 2.5223848819732666, "step": 1817} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 1817} {"info/global_step": 1818, "train_info/time_within_train_step": 2.522974967956543, "step": 1818} {"train_info/time_between_train_steps": 0.0038149356842041016, "step": 1818} {"info/global_step": 1819, "train_info/time_within_train_step": 2.5226364135742188, "step": 1819} {"train_info/time_between_train_steps": 0.0034215450286865234, "step": 1819} {"info/global_step": 1820, "train_info/time_within_train_step": 2.552147150039673, "step": 1820} {"train_info/time_between_train_steps": 0.003412961959838867, "step": 1820} {"info/global_step": 1821, "train_info/time_within_train_step": 2.5230154991149902, "step": 1821} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 1821} {"info/global_step": 1822, "train_info/time_within_train_step": 2.522834539413452, "step": 1822} {"train_info/time_between_train_steps": 0.0034134387969970703, "step": 1822} {"info/global_step": 1823, "train_info/time_within_train_step": 2.523186445236206, "step": 1823} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 1823} {"info/global_step": 1824, "train_info/time_within_train_step": 2.522209882736206, "step": 1824} {"train_info/time_between_train_steps": 0.003986358642578125, "step": 1824} {"info/global_step": 1825, "train_info/time_within_train_step": 2.522815465927124, "step": 1825} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 1825} {"info/global_step": 1826, "train_info/time_within_train_step": 2.5235860347747803, "step": 1826} {"train_info/time_between_train_steps": 0.0036606788635253906, "step": 1826} {"info/global_step": 1827, "train_info/time_within_train_step": 2.5231471061706543, "step": 1827} {"train_info/time_between_train_steps": 0.003507852554321289, "step": 1827} {"info/global_step": 1828, "train_info/time_within_train_step": 2.523735523223877, "step": 1828} {"train_info/time_between_train_steps": 0.003449678421020508, "step": 1828} {"info/global_step": 1829, "train_info/time_within_train_step": 2.523388385772705, "step": 1829} {"train_info/time_between_train_steps": 0.0035066604614257812, "step": 1829} {"info/global_step": 1830, "train_info/time_within_train_step": 2.5238749980926514, "step": 1830} {"train_info/time_between_train_steps": 0.003515005111694336, "step": 1830} {"info/global_step": 1831, "train_info/time_within_train_step": 2.5231778621673584, "step": 1831} {"train_info/time_between_train_steps": 0.0034551620483398438, "step": 1831} {"info/global_step": 1832, "train_info/time_within_train_step": 2.5227487087249756, "step": 1832} {"train_info/time_between_train_steps": 0.0034542083740234375, "step": 1832} {"info/global_step": 1833, "train_info/time_within_train_step": 2.522899866104126, "step": 1833} {"train_info/time_between_train_steps": 0.003502368927001953, "step": 1833} {"info/global_step": 1834, "train_info/time_within_train_step": 2.523001194000244, "step": 1834} {"train_info/time_between_train_steps": 0.0034530162811279297, "step": 1834} {"info/global_step": 1835, "train_info/time_within_train_step": 2.5503556728363037, "step": 1835} {"train_info/time_between_train_steps": 0.0034782886505126953, "step": 1835} {"info/global_step": 1836, "train_info/time_within_train_step": 2.5223865509033203, "step": 1836} {"train_info/time_between_train_steps": 0.0034961700439453125, "step": 1836} {"info/global_step": 1837, "train_info/time_within_train_step": 2.522353410720825, "step": 1837} {"train_info/time_between_train_steps": 0.0034775733947753906, "step": 1837} {"info/global_step": 1838, "train_info/time_within_train_step": 2.5224647521972656, "step": 1838} {"train_info/time_between_train_steps": 0.003532886505126953, "step": 1838} {"info/global_step": 1839, "train_info/time_within_train_step": 2.5221991539001465, "step": 1839} {"train_info/time_between_train_steps": 0.003457784652709961, "step": 1839} {"info/global_step": 1840, "train_info/time_within_train_step": 2.5222482681274414, "step": 1840} {"train_info/time_between_train_steps": 0.003490924835205078, "step": 1840} {"info/global_step": 1841, "train_info/time_within_train_step": 2.523704767227173, "step": 1841} {"train_info/time_between_train_steps": 0.0035004615783691406, "step": 1841} {"info/global_step": 1842, "train_info/time_within_train_step": 2.522745370864868, "step": 1842} {"train_info/time_between_train_steps": 0.0034933090209960938, "step": 1842} {"info/global_step": 1843, "train_info/time_within_train_step": 2.522991180419922, "step": 1843} {"train_info/time_between_train_steps": 0.0034935474395751953, "step": 1843} {"info/global_step": 1844, "train_info/time_within_train_step": 2.523167371749878, "step": 1844} {"train_info/time_between_train_steps": 0.0034606456756591797, "step": 1844} {"info/global_step": 1845, "train_info/time_within_train_step": 2.5225343704223633, "step": 1845} {"train_info/time_between_train_steps": 0.003442049026489258, "step": 1845} {"info/global_step": 1846, "train_info/time_within_train_step": 2.5221304893493652, "step": 1846} {"train_info/time_between_train_steps": 0.0034863948822021484, "step": 1846} {"info/global_step": 1847, "train_info/time_within_train_step": 2.6450307369232178, "step": 1847} {"train_info/time_between_train_steps": 0.003487825393676758, "step": 1847} {"info/global_step": 1848, "train_info/time_within_train_step": 2.523023843765259, "step": 1848} {"train_info/time_between_train_steps": 0.0034332275390625, "step": 1848} {"info/global_step": 1849, "train_info/time_within_train_step": 2.5232162475585938, "step": 1849} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 1849} {"info/global_step": 1850, "train_info/time_within_train_step": 2.5233030319213867, "step": 1850} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746327989, "_runtime": 5037}, "step": 1850} {"logs": {"train/loss": 4.2027, "train/learning_rate": 0.00025555555555555553, "train/epoch": 2.02, "_timestamp": 1746327989, "_runtime": 5037}, "step": 1850} {"train_info/time_between_train_steps": 0.024527311325073242, "step": 1850} {"info/global_step": 1851, "train_info/time_within_train_step": 2.521955966949463, "step": 1851} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 1851} {"info/global_step": 1852, "train_info/time_within_train_step": 2.522799253463745, "step": 1852} {"train_info/time_between_train_steps": 0.0034379959106445312, "step": 1852} {"info/global_step": 1853, "train_info/time_within_train_step": 2.522629499435425, "step": 1853} {"train_info/time_between_train_steps": 0.003438711166381836, "step": 1853} {"info/global_step": 1854, "train_info/time_within_train_step": 2.5229334831237793, "step": 1854} {"train_info/time_between_train_steps": 0.003401517868041992, "step": 1854} {"info/global_step": 1855, "train_info/time_within_train_step": 2.5232093334198, "step": 1855} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 1855} {"info/global_step": 1856, "train_info/time_within_train_step": 2.522217273712158, "step": 1856} {"train_info/time_between_train_steps": 0.0034074783325195312, "step": 1856} {"info/global_step": 1857, "train_info/time_within_train_step": 2.5224573612213135, "step": 1857} {"train_info/time_between_train_steps": 0.0034132003784179688, "step": 1857} {"info/global_step": 1858, "train_info/time_within_train_step": 2.5224881172180176, "step": 1858} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 1858} {"info/global_step": 1859, "train_info/time_within_train_step": 2.5222373008728027, "step": 1859} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 1859} {"info/global_step": 1860, "train_info/time_within_train_step": 2.521677017211914, "step": 1860} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 1860} {"info/global_step": 1861, "train_info/time_within_train_step": 2.5214710235595703, "step": 1861} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 1861} {"info/global_step": 1862, "train_info/time_within_train_step": 2.522247076034546, "step": 1862} {"train_info/time_between_train_steps": 0.003416299819946289, "step": 1862} {"info/global_step": 1863, "train_info/time_within_train_step": 2.522317886352539, "step": 1863} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 1863} {"info/global_step": 1864, "train_info/time_within_train_step": 2.522714614868164, "step": 1864} {"train_info/time_between_train_steps": 0.0034694671630859375, "step": 1864} {"info/global_step": 1865, "train_info/time_within_train_step": 2.5226783752441406, "step": 1865} {"train_info/time_between_train_steps": 0.004011631011962891, "step": 1865} {"info/global_step": 1866, "train_info/time_within_train_step": 2.5224695205688477, "step": 1866} {"train_info/time_between_train_steps": 0.0034494400024414062, "step": 1866} {"info/global_step": 1867, "train_info/time_within_train_step": 2.5226492881774902, "step": 1867} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 1867} {"info/global_step": 1868, "train_info/time_within_train_step": 2.5234122276306152, "step": 1868} {"train_info/time_between_train_steps": 0.0034880638122558594, "step": 1868} {"info/global_step": 1869, "train_info/time_within_train_step": 2.5227766036987305, "step": 1869} {"train_info/time_between_train_steps": 0.0034093856811523438, "step": 1869} {"info/global_step": 1870, "train_info/time_within_train_step": 2.5228400230407715, "step": 1870} {"train_info/time_between_train_steps": 0.0034427642822265625, "step": 1870} {"info/global_step": 1871, "train_info/time_within_train_step": 2.557645320892334, "step": 1871} {"train_info/time_between_train_steps": 0.003438234329223633, "step": 1871} {"info/global_step": 1872, "train_info/time_within_train_step": 2.522930145263672, "step": 1872} {"train_info/time_between_train_steps": 0.003431081771850586, "step": 1872} {"info/global_step": 1873, "train_info/time_within_train_step": 2.5229969024658203, "step": 1873} {"train_info/time_between_train_steps": 0.0034949779510498047, "step": 1873} {"info/global_step": 1874, "train_info/time_within_train_step": 2.522817611694336, "step": 1874} {"train_info/time_between_train_steps": 0.0034515857696533203, "step": 1874} {"info/global_step": 1875, "train_info/time_within_train_step": 2.522120475769043, "step": 1875} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 1875} {"info/global_step": 1876, "train_info/time_within_train_step": 2.5212242603302, "step": 1876} {"train_info/time_between_train_steps": 0.003415346145629883, "step": 1876} {"info/global_step": 1877, "train_info/time_within_train_step": 2.521475076675415, "step": 1877} {"train_info/time_between_train_steps": 0.0034101009368896484, "step": 1877} {"info/global_step": 1878, "train_info/time_within_train_step": 2.5216617584228516, "step": 1878} {"train_info/time_between_train_steps": 0.003434896469116211, "step": 1878} {"info/global_step": 1879, "train_info/time_within_train_step": 2.5222349166870117, "step": 1879} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 1879} {"info/global_step": 1880, "train_info/time_within_train_step": 2.5221948623657227, "step": 1880} {"train_info/time_between_train_steps": 0.0034172534942626953, "step": 1880} {"info/global_step": 1881, "train_info/time_within_train_step": 2.522749423980713, "step": 1881} {"train_info/time_between_train_steps": 0.0034532546997070312, "step": 1881} {"info/global_step": 1882, "train_info/time_within_train_step": 2.52702260017395, "step": 1882} {"train_info/time_between_train_steps": 0.0035865306854248047, "step": 1882} {"info/global_step": 1883, "train_info/time_within_train_step": 2.522738456726074, "step": 1883} {"train_info/time_between_train_steps": 0.003390789031982422, "step": 1883} {"info/global_step": 1884, "train_info/time_within_train_step": 2.523249864578247, "step": 1884} {"train_info/time_between_train_steps": 0.0034110546112060547, "step": 1884} {"info/global_step": 1885, "train_info/time_within_train_step": 2.5227391719818115, "step": 1885} {"train_info/time_between_train_steps": 0.00341033935546875, "step": 1885} {"info/global_step": 1886, "train_info/time_within_train_step": 2.5222396850585938, "step": 1886} {"train_info/time_between_train_steps": 0.0034706592559814453, "step": 1886} {"info/global_step": 1887, "train_info/time_within_train_step": 2.7791812419891357, "step": 1887} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 1887} {"info/global_step": 1888, "train_info/time_within_train_step": 2.5230352878570557, "step": 1888} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 1888} {"info/global_step": 1889, "train_info/time_within_train_step": 2.5231950283050537, "step": 1889} {"train_info/time_between_train_steps": 0.003426074981689453, "step": 1889} {"info/global_step": 1890, "train_info/time_within_train_step": 2.5240001678466797, "step": 1890} {"train_info/time_between_train_steps": 0.0034303665161132812, "step": 1890} {"info/global_step": 1891, "train_info/time_within_train_step": 2.5229101181030273, "step": 1891} {"train_info/time_between_train_steps": 0.0033919811248779297, "step": 1891} {"info/global_step": 1892, "train_info/time_within_train_step": 2.521916627883911, "step": 1892} {"train_info/time_between_train_steps": 0.00394749641418457, "step": 1892} {"info/global_step": 1893, "train_info/time_within_train_step": 2.521275043487549, "step": 1893} {"train_info/time_between_train_steps": 0.003411531448364258, "step": 1893} {"info/global_step": 1894, "train_info/time_within_train_step": 2.5222856998443604, "step": 1894} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 1894} {"info/global_step": 1895, "train_info/time_within_train_step": 2.5224058628082275, "step": 1895} {"train_info/time_between_train_steps": 0.0033855438232421875, "step": 1895} {"info/global_step": 1896, "train_info/time_within_train_step": 2.5218358039855957, "step": 1896} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 1896} {"info/global_step": 1897, "train_info/time_within_train_step": 2.5223309993743896, "step": 1897} {"train_info/time_between_train_steps": 0.0035593509674072266, "step": 1897} {"info/global_step": 1898, "train_info/time_within_train_step": 2.522904396057129, "step": 1898} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 1898} {"info/global_step": 1899, "train_info/time_within_train_step": 2.522651433944702, "step": 1899} {"train_info/time_between_train_steps": 0.0034074783325195312, "step": 1899} {"info/global_step": 1900, "train_info/time_within_train_step": 2.522864580154419, "step": 1900} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328117, "_runtime": 5165}, "step": 1900} {"logs": {"train/loss": 4.1752, "train/learning_rate": 0.00024444444444444443, "train/epoch": 2.04, "_timestamp": 1746328117, "_runtime": 5165}, "step": 1900} {"train_info/time_between_train_steps": 15.410084247589111, "step": 1900} {"info/global_step": 1901, "train_info/time_within_train_step": 2.330777883529663, "step": 1901} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1901} {"info/global_step": 1902, "train_info/time_within_train_step": 2.3182623386383057, "step": 1902} {"train_info/time_between_train_steps": 0.0034513473510742188, "step": 1902} {"info/global_step": 1903, "train_info/time_within_train_step": 2.4806253910064697, "step": 1903} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 1903} {"info/global_step": 1904, "train_info/time_within_train_step": 2.5172431468963623, "step": 1904} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 1904} {"info/global_step": 1905, "train_info/time_within_train_step": 2.5187151432037354, "step": 1905} {"train_info/time_between_train_steps": 0.0034027099609375, "step": 1905} {"info/global_step": 1906, "train_info/time_within_train_step": 2.519563913345337, "step": 1906} {"train_info/time_between_train_steps": 0.0036084651947021484, "step": 1906} {"info/global_step": 1907, "train_info/time_within_train_step": 2.5204241275787354, "step": 1907} {"train_info/time_between_train_steps": 0.003574371337890625, "step": 1907} {"info/global_step": 1908, "train_info/time_within_train_step": 2.519850492477417, "step": 1908} {"train_info/time_between_train_steps": 0.0033948421478271484, "step": 1908} {"info/global_step": 1909, "train_info/time_within_train_step": 2.5206782817840576, "step": 1909} {"train_info/time_between_train_steps": 0.12136220932006836, "step": 1909} {"info/global_step": 1910, "train_info/time_within_train_step": 2.5212182998657227, "step": 1910} {"train_info/time_between_train_steps": 0.0037031173706054688, "step": 1910} {"info/global_step": 1911, "train_info/time_within_train_step": 2.5217294692993164, "step": 1911} {"train_info/time_between_train_steps": 0.003487825393676758, "step": 1911} {"info/global_step": 1912, "train_info/time_within_train_step": 2.5205078125, "step": 1912} {"train_info/time_between_train_steps": 0.0033719539642333984, "step": 1912} {"info/global_step": 1913, "train_info/time_within_train_step": 2.521980047225952, "step": 1913} {"train_info/time_between_train_steps": 0.003562450408935547, "step": 1913} {"info/global_step": 1914, "train_info/time_within_train_step": 2.521296739578247, "step": 1914} {"train_info/time_between_train_steps": 0.003587484359741211, "step": 1914} {"info/global_step": 1915, "train_info/time_within_train_step": 2.522343158721924, "step": 1915} {"train_info/time_between_train_steps": 0.0034253597259521484, "step": 1915} {"info/global_step": 1916, "train_info/time_within_train_step": 2.522813320159912, "step": 1916} {"train_info/time_between_train_steps": 0.0037102699279785156, "step": 1916} {"info/global_step": 1917, "train_info/time_within_train_step": 2.5216879844665527, "step": 1917} {"train_info/time_between_train_steps": 0.0036263465881347656, "step": 1917} {"info/global_step": 1918, "train_info/time_within_train_step": 2.5219054222106934, "step": 1918} {"train_info/time_between_train_steps": 0.0038886070251464844, "step": 1918} {"info/global_step": 1919, "train_info/time_within_train_step": 2.5219616889953613, "step": 1919} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 1919} {"info/global_step": 1920, "train_info/time_within_train_step": 2.5219063758850098, "step": 1920} {"train_info/time_between_train_steps": 0.0034508705139160156, "step": 1920} {"info/global_step": 1921, "train_info/time_within_train_step": 2.5219500064849854, "step": 1921} {"train_info/time_between_train_steps": 0.003574848175048828, "step": 1921} {"info/global_step": 1922, "train_info/time_within_train_step": 2.5217254161834717, "step": 1922} {"train_info/time_between_train_steps": 0.0035314559936523438, "step": 1922} {"info/global_step": 1923, "train_info/time_within_train_step": 2.521941900253296, "step": 1923} {"train_info/time_between_train_steps": 0.0034933090209960938, "step": 1923} {"info/global_step": 1924, "train_info/time_within_train_step": 2.5225391387939453, "step": 1924} {"train_info/time_between_train_steps": 0.0035066604614257812, "step": 1924} {"info/global_step": 1925, "train_info/time_within_train_step": 2.5222480297088623, "step": 1925} {"train_info/time_between_train_steps": 0.0034894943237304688, "step": 1925} {"info/global_step": 1926, "train_info/time_within_train_step": 2.5223000049591064, "step": 1926} {"train_info/time_between_train_steps": 0.0034258365631103516, "step": 1926} {"info/global_step": 1927, "train_info/time_within_train_step": 2.521900177001953, "step": 1927} {"train_info/time_between_train_steps": 0.003455638885498047, "step": 1927} {"info/global_step": 1928, "train_info/time_within_train_step": 2.522989273071289, "step": 1928} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 1928} {"info/global_step": 1929, "train_info/time_within_train_step": 2.5220344066619873, "step": 1929} {"train_info/time_between_train_steps": 0.0034470558166503906, "step": 1929} {"info/global_step": 1930, "train_info/time_within_train_step": 2.7764387130737305, "step": 1930} {"train_info/time_between_train_steps": 0.0033981800079345703, "step": 1930} {"info/global_step": 1931, "train_info/time_within_train_step": 2.522428035736084, "step": 1931} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 1931} {"info/global_step": 1932, "train_info/time_within_train_step": 2.5219967365264893, "step": 1932} {"train_info/time_between_train_steps": 0.0033702850341796875, "step": 1932} {"info/global_step": 1933, "train_info/time_within_train_step": 2.523059606552124, "step": 1933} {"train_info/time_between_train_steps": 0.0033571720123291016, "step": 1933} {"info/global_step": 1934, "train_info/time_within_train_step": 2.5234811305999756, "step": 1934} {"train_info/time_between_train_steps": 0.0033655166625976562, "step": 1934} {"info/global_step": 1935, "train_info/time_within_train_step": 2.5216376781463623, "step": 1935} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 1935} {"info/global_step": 1936, "train_info/time_within_train_step": 2.5217580795288086, "step": 1936} {"train_info/time_between_train_steps": 0.0033469200134277344, "step": 1936} {"info/global_step": 1937, "train_info/time_within_train_step": 2.5221545696258545, "step": 1937} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 1937} {"info/global_step": 1938, "train_info/time_within_train_step": 2.521106004714966, "step": 1938} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 1938} {"info/global_step": 1939, "train_info/time_within_train_step": 2.5211455821990967, "step": 1939} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 1939} {"info/global_step": 1940, "train_info/time_within_train_step": 2.52152419090271, "step": 1940} {"train_info/time_between_train_steps": 0.003394603729248047, "step": 1940} {"info/global_step": 1941, "train_info/time_within_train_step": 2.52146053314209, "step": 1941} {"train_info/time_between_train_steps": 0.0033385753631591797, "step": 1941} {"info/global_step": 1942, "train_info/time_within_train_step": 2.521064043045044, "step": 1942} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 1942} {"info/global_step": 1943, "train_info/time_within_train_step": 2.521561861038208, "step": 1943} {"train_info/time_between_train_steps": 0.0033507347106933594, "step": 1943} {"info/global_step": 1944, "train_info/time_within_train_step": 2.521862745285034, "step": 1944} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 1944} {"info/global_step": 1945, "train_info/time_within_train_step": 2.5218262672424316, "step": 1945} {"train_info/time_between_train_steps": 0.0033409595489501953, "step": 1945} {"info/global_step": 1946, "train_info/time_within_train_step": 2.52226185798645, "step": 1946} {"train_info/time_between_train_steps": 0.0033550262451171875, "step": 1946} {"info/global_step": 1947, "train_info/time_within_train_step": 2.521486520767212, "step": 1947} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 1947} {"info/global_step": 1948, "train_info/time_within_train_step": 2.5219171047210693, "step": 1948} {"train_info/time_between_train_steps": 0.0033538341522216797, "step": 1948} {"info/global_step": 1949, "train_info/time_within_train_step": 2.5212464332580566, "step": 1949} {"train_info/time_between_train_steps": 0.0033538341522216797, "step": 1949} {"info/global_step": 1950, "train_info/time_within_train_step": 2.521801710128784, "step": 1950} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328260, "_runtime": 5308}, "step": 1950} {"logs": {"train/loss": 4.1609, "train/learning_rate": 0.0002333333333333333, "train/epoch": 2.06, "_timestamp": 1746328260, "_runtime": 5308}, "step": 1950} {"train_info/time_between_train_steps": 0.028806686401367188, "step": 1950} {"info/global_step": 1951, "train_info/time_within_train_step": 2.521578311920166, "step": 1951} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 1951} {"info/global_step": 1952, "train_info/time_within_train_step": 2.520885705947876, "step": 1952} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 1952} {"info/global_step": 1953, "train_info/time_within_train_step": 2.521789789199829, "step": 1953} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 1953} {"info/global_step": 1954, "train_info/time_within_train_step": 2.521475076675415, "step": 1954} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 1954} {"info/global_step": 1955, "train_info/time_within_train_step": 2.521648406982422, "step": 1955} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 1955} {"info/global_step": 1956, "train_info/time_within_train_step": 2.522007703781128, "step": 1956} {"train_info/time_between_train_steps": 0.0033864974975585938, "step": 1956} {"info/global_step": 1957, "train_info/time_within_train_step": 2.5219743251800537, "step": 1957} {"train_info/time_between_train_steps": 0.003366231918334961, "step": 1957} {"info/global_step": 1958, "train_info/time_within_train_step": 2.5212488174438477, "step": 1958} {"train_info/time_between_train_steps": 0.003371000289916992, "step": 1958} {"info/global_step": 1959, "train_info/time_within_train_step": 2.521345376968384, "step": 1959} {"train_info/time_between_train_steps": 0.0034143924713134766, "step": 1959} {"info/global_step": 1960, "train_info/time_within_train_step": 2.5206472873687744, "step": 1960} {"train_info/time_between_train_steps": 0.0034170150756835938, "step": 1960} {"info/global_step": 1961, "train_info/time_within_train_step": 2.522252321243286, "step": 1961} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 1961} {"info/global_step": 1962, "train_info/time_within_train_step": 2.5207252502441406, "step": 1962} {"train_info/time_between_train_steps": 0.003420114517211914, "step": 1962} {"info/global_step": 1963, "train_info/time_within_train_step": 2.521416664123535, "step": 1963} {"train_info/time_between_train_steps": 0.0034003257751464844, "step": 1963} {"info/global_step": 1964, "train_info/time_within_train_step": 2.5215210914611816, "step": 1964} {"train_info/time_between_train_steps": 0.003541707992553711, "step": 1964} {"info/global_step": 1965, "train_info/time_within_train_step": 2.522042989730835, "step": 1965} {"train_info/time_between_train_steps": 0.0034401416778564453, "step": 1965} {"info/global_step": 1966, "train_info/time_within_train_step": 2.521662712097168, "step": 1966} {"train_info/time_between_train_steps": 0.003465414047241211, "step": 1966} {"info/global_step": 1967, "train_info/time_within_train_step": 2.5216925144195557, "step": 1967} {"train_info/time_between_train_steps": 0.0034453868865966797, "step": 1967} {"info/global_step": 1968, "train_info/time_within_train_step": 2.521672487258911, "step": 1968} {"train_info/time_between_train_steps": 0.003447294235229492, "step": 1968} {"info/global_step": 1969, "train_info/time_within_train_step": 2.5224623680114746, "step": 1969} {"train_info/time_between_train_steps": 0.0034742355346679688, "step": 1969} {"info/global_step": 1970, "train_info/time_within_train_step": 2.5217833518981934, "step": 1970} {"train_info/time_between_train_steps": 0.0034558773040771484, "step": 1970} {"info/global_step": 1971, "train_info/time_within_train_step": 2.553516149520874, "step": 1971} {"train_info/time_between_train_steps": 0.0034134387969970703, "step": 1971} {"info/global_step": 1972, "train_info/time_within_train_step": 2.6403164863586426, "step": 1972} {"train_info/time_between_train_steps": 0.003530263900756836, "step": 1972} {"info/global_step": 1973, "train_info/time_within_train_step": 2.5222344398498535, "step": 1973} {"train_info/time_between_train_steps": 0.003455638885498047, "step": 1973} {"info/global_step": 1974, "train_info/time_within_train_step": 2.521278142929077, "step": 1974} {"train_info/time_between_train_steps": 0.003437042236328125, "step": 1974} {"info/global_step": 1975, "train_info/time_within_train_step": 2.521799087524414, "step": 1975} {"train_info/time_between_train_steps": 0.0034427642822265625, "step": 1975} {"info/global_step": 1976, "train_info/time_within_train_step": 2.521897315979004, "step": 1976} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1976} {"info/global_step": 1977, "train_info/time_within_train_step": 2.521181106567383, "step": 1977} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 1977} {"info/global_step": 1978, "train_info/time_within_train_step": 2.5221612453460693, "step": 1978} {"train_info/time_between_train_steps": 0.0035254955291748047, "step": 1978} {"info/global_step": 1979, "train_info/time_within_train_step": 2.5221898555755615, "step": 1979} {"train_info/time_between_train_steps": 0.0034542083740234375, "step": 1979} {"info/global_step": 1980, "train_info/time_within_train_step": 2.52131986618042, "step": 1980} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 1980} {"info/global_step": 1981, "train_info/time_within_train_step": 2.520454168319702, "step": 1981} {"train_info/time_between_train_steps": 0.003507852554321289, "step": 1981} {"info/global_step": 1982, "train_info/time_within_train_step": 2.521763324737549, "step": 1982} {"train_info/time_between_train_steps": 0.0036475658416748047, "step": 1982} {"info/global_step": 1983, "train_info/time_within_train_step": 2.521862030029297, "step": 1983} {"train_info/time_between_train_steps": 0.0035228729248046875, "step": 1983} {"info/global_step": 1984, "train_info/time_within_train_step": 2.522486925125122, "step": 1984} {"train_info/time_between_train_steps": 0.0035753250122070312, "step": 1984} {"info/global_step": 1985, "train_info/time_within_train_step": 2.5219345092773438, "step": 1985} {"train_info/time_between_train_steps": 0.004006385803222656, "step": 1985} {"info/global_step": 1986, "train_info/time_within_train_step": 2.5215041637420654, "step": 1986} {"train_info/time_between_train_steps": 0.003445148468017578, "step": 1986} {"info/global_step": 1987, "train_info/time_within_train_step": 2.521116018295288, "step": 1987} {"train_info/time_between_train_steps": 0.0036644935607910156, "step": 1987} {"info/global_step": 1988, "train_info/time_within_train_step": 2.5200626850128174, "step": 1988} {"train_info/time_between_train_steps": 0.0034661293029785156, "step": 1988} {"info/global_step": 1989, "train_info/time_within_train_step": 2.5206940174102783, "step": 1989} {"train_info/time_between_train_steps": 0.003433704376220703, "step": 1989} {"info/global_step": 1990, "train_info/time_within_train_step": 2.521573781967163, "step": 1990} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 1990} {"info/global_step": 1991, "train_info/time_within_train_step": 2.521244525909424, "step": 1991} {"train_info/time_between_train_steps": 0.003512144088745117, "step": 1991} {"info/global_step": 1992, "train_info/time_within_train_step": 2.5221853256225586, "step": 1992} {"train_info/time_between_train_steps": 0.003615856170654297, "step": 1992} {"info/global_step": 1993, "train_info/time_within_train_step": 2.5222208499908447, "step": 1993} {"train_info/time_between_train_steps": 0.003453493118286133, "step": 1993} {"info/global_step": 1994, "train_info/time_within_train_step": 2.5218400955200195, "step": 1994} {"train_info/time_between_train_steps": 0.0036203861236572266, "step": 1994} {"info/global_step": 1995, "train_info/time_within_train_step": 2.5220212936401367, "step": 1995} {"train_info/time_between_train_steps": 0.0036020278930664062, "step": 1995} {"info/global_step": 1996, "train_info/time_within_train_step": 2.521500825881958, "step": 1996} {"train_info/time_between_train_steps": 0.0034630298614501953, "step": 1996} {"info/global_step": 1997, "train_info/time_within_train_step": 2.5216617584228516, "step": 1997} {"train_info/time_between_train_steps": 0.0033996105194091797, "step": 1997} {"info/global_step": 1998, "train_info/time_within_train_step": 2.5223209857940674, "step": 1998} {"train_info/time_between_train_steps": 0.0035429000854492188, "step": 1998} {"info/global_step": 1999, "train_info/time_within_train_step": 3.052241802215576, "step": 1999} {"train_info/time_between_train_steps": 0.0034291744232177734, "step": 1999} {"info/global_step": 2000, "train_info/time_within_train_step": 2.521878480911255, "step": 2000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328388, "_runtime": 5436}, "step": 2000} {"logs": {"train/loss": 4.1393, "train/learning_rate": 0.00022222222222222218, "train/epoch": 2.07, "_timestamp": 1746328388, "_runtime": 5436}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328393, "_runtime": 5441}, "step": 2000} {"logs": {"eval/loss": 4.583547115325928, "eval/runtime": 5.1306, "eval/samples_per_second": 38.982, "eval/steps_per_second": 1.364, "train/epoch": 2.07, "_timestamp": 1746328393, "_runtime": 5441}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328393, "_runtime": 5441}, "step": 2000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.583547115325928, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 97.86090319960805, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1306, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 38.982, "train/epoch": 2.07, "_timestamp": 1746328393, "_runtime": 5441}, "step": 2000} {"train_info/time_between_train_steps": 21.942055225372314, "step": 2000} {"info/global_step": 2001, "train_info/time_within_train_step": 2.3399999141693115, "step": 2001} {"train_info/time_between_train_steps": 0.0035195350646972656, "step": 2001} {"info/global_step": 2002, "train_info/time_within_train_step": 2.3194665908813477, "step": 2002} {"train_info/time_between_train_steps": 0.0035419464111328125, "step": 2002} {"info/global_step": 2003, "train_info/time_within_train_step": 2.467721462249756, "step": 2003} {"train_info/time_between_train_steps": 0.0034570693969726562, "step": 2003} {"info/global_step": 2004, "train_info/time_within_train_step": 2.5186450481414795, "step": 2004} {"train_info/time_between_train_steps": 0.0034754276275634766, "step": 2004} {"info/global_step": 2005, "train_info/time_within_train_step": 2.5183959007263184, "step": 2005} {"train_info/time_between_train_steps": 0.003474712371826172, "step": 2005} {"info/global_step": 2006, "train_info/time_within_train_step": 2.5196988582611084, "step": 2006} {"train_info/time_between_train_steps": 0.0035161972045898438, "step": 2006} {"info/global_step": 2007, "train_info/time_within_train_step": 2.5207982063293457, "step": 2007} {"train_info/time_between_train_steps": 0.003467082977294922, "step": 2007} {"info/global_step": 2008, "train_info/time_within_train_step": 2.7833499908447266, "step": 2008} {"train_info/time_between_train_steps": 0.0034551620483398438, "step": 2008} {"info/global_step": 2009, "train_info/time_within_train_step": 2.5215327739715576, "step": 2009} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 2009} {"info/global_step": 2010, "train_info/time_within_train_step": 2.5213637351989746, "step": 2010} {"train_info/time_between_train_steps": 0.0034074783325195312, "step": 2010} {"info/global_step": 2011, "train_info/time_within_train_step": 2.5219218730926514, "step": 2011} {"train_info/time_between_train_steps": 0.003405332565307617, "step": 2011} {"info/global_step": 2012, "train_info/time_within_train_step": 2.522599935531616, "step": 2012} {"train_info/time_between_train_steps": 0.0034515857696533203, "step": 2012} {"info/global_step": 2013, "train_info/time_within_train_step": 2.5223379135131836, "step": 2013} {"train_info/time_between_train_steps": 0.003443002700805664, "step": 2013} {"info/global_step": 2014, "train_info/time_within_train_step": 2.5228326320648193, "step": 2014} {"train_info/time_between_train_steps": 0.003441333770751953, "step": 2014} {"info/global_step": 2015, "train_info/time_within_train_step": 2.5226891040802, "step": 2015} {"train_info/time_between_train_steps": 0.003492116928100586, "step": 2015} {"info/global_step": 2016, "train_info/time_within_train_step": 2.523024082183838, "step": 2016} {"train_info/time_between_train_steps": 0.0034558773040771484, "step": 2016} {"info/global_step": 2017, "train_info/time_within_train_step": 2.522892951965332, "step": 2017} {"train_info/time_between_train_steps": 0.003427267074584961, "step": 2017} {"info/global_step": 2018, "train_info/time_within_train_step": 2.5230767726898193, "step": 2018} {"train_info/time_between_train_steps": 0.0034329891204833984, "step": 2018} {"info/global_step": 2019, "train_info/time_within_train_step": 2.5228450298309326, "step": 2019} {"train_info/time_between_train_steps": 0.0034780502319335938, "step": 2019} {"info/global_step": 2020, "train_info/time_within_train_step": 2.5233638286590576, "step": 2020} {"train_info/time_between_train_steps": 0.003448486328125, "step": 2020} {"info/global_step": 2021, "train_info/time_within_train_step": 2.522932291030884, "step": 2021} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 2021} {"info/global_step": 2022, "train_info/time_within_train_step": 2.5228941440582275, "step": 2022} {"train_info/time_between_train_steps": 0.003486156463623047, "step": 2022} {"info/global_step": 2023, "train_info/time_within_train_step": 2.5231988430023193, "step": 2023} {"train_info/time_between_train_steps": 0.0034313201904296875, "step": 2023} {"info/global_step": 2024, "train_info/time_within_train_step": 2.5221645832061768, "step": 2024} {"train_info/time_between_train_steps": 0.004099607467651367, "step": 2024} {"info/global_step": 2025, "train_info/time_within_train_step": 2.522587537765503, "step": 2025} {"train_info/time_between_train_steps": 0.0034742355346679688, "step": 2025} {"info/global_step": 2026, "train_info/time_within_train_step": 2.522573471069336, "step": 2026} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 2026} {"info/global_step": 2027, "train_info/time_within_train_step": 2.5223238468170166, "step": 2027} {"train_info/time_between_train_steps": 0.0034341812133789062, "step": 2027} {"info/global_step": 2028, "train_info/time_within_train_step": 2.522233247756958, "step": 2028} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 2028} {"info/global_step": 2029, "train_info/time_within_train_step": 2.52217698097229, "step": 2029} {"train_info/time_between_train_steps": 0.0034677982330322266, "step": 2029} {"info/global_step": 2030, "train_info/time_within_train_step": 2.5218276977539062, "step": 2030} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 2030} {"info/global_step": 2031, "train_info/time_within_train_step": 2.5217628479003906, "step": 2031} {"train_info/time_between_train_steps": 0.0034704208374023438, "step": 2031} {"info/global_step": 2032, "train_info/time_within_train_step": 2.522766590118408, "step": 2032} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 2032} {"info/global_step": 2033, "train_info/time_within_train_step": 2.5226542949676514, "step": 2033} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 2033} {"info/global_step": 2034, "train_info/time_within_train_step": 2.5270981788635254, "step": 2034} {"train_info/time_between_train_steps": 0.12293171882629395, "step": 2034} {"info/global_step": 2035, "train_info/time_within_train_step": 2.522594451904297, "step": 2035} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 2035} {"info/global_step": 2036, "train_info/time_within_train_step": 2.521866798400879, "step": 2036} {"train_info/time_between_train_steps": 0.003485441207885742, "step": 2036} {"info/global_step": 2037, "train_info/time_within_train_step": 2.5229063034057617, "step": 2037} {"train_info/time_between_train_steps": 0.0040645599365234375, "step": 2037} {"info/global_step": 2038, "train_info/time_within_train_step": 2.521768093109131, "step": 2038} {"train_info/time_between_train_steps": 0.0034637451171875, "step": 2038} {"info/global_step": 2039, "train_info/time_within_train_step": 2.5229978561401367, "step": 2039} {"train_info/time_between_train_steps": 0.003511667251586914, "step": 2039} {"info/global_step": 2040, "train_info/time_within_train_step": 2.523447036743164, "step": 2040} {"train_info/time_between_train_steps": 0.0034618377685546875, "step": 2040} {"info/global_step": 2041, "train_info/time_within_train_step": 2.52244234085083, "step": 2041} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 2041} {"info/global_step": 2042, "train_info/time_within_train_step": 2.5219125747680664, "step": 2042} {"train_info/time_between_train_steps": 0.003498554229736328, "step": 2042} {"info/global_step": 2043, "train_info/time_within_train_step": 2.5221290588378906, "step": 2043} {"train_info/time_between_train_steps": 0.0034570693969726562, "step": 2043} {"info/global_step": 2044, "train_info/time_within_train_step": 2.5220682621002197, "step": 2044} {"train_info/time_between_train_steps": 0.003459453582763672, "step": 2044} {"info/global_step": 2045, "train_info/time_within_train_step": 2.5221216678619385, "step": 2045} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 2045} {"info/global_step": 2046, "train_info/time_within_train_step": 2.5221447944641113, "step": 2046} {"train_info/time_between_train_steps": 0.0034723281860351562, "step": 2046} {"info/global_step": 2047, "train_info/time_within_train_step": 2.5223231315612793, "step": 2047} {"train_info/time_between_train_steps": 0.003445148468017578, "step": 2047} {"info/global_step": 2048, "train_info/time_within_train_step": 2.7796709537506104, "step": 2048} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 2048} {"info/global_step": 2049, "train_info/time_within_train_step": 2.522235631942749, "step": 2049} {"train_info/time_between_train_steps": 0.0033996105194091797, "step": 2049} {"info/global_step": 2050, "train_info/time_within_train_step": 2.5208041667938232, "step": 2050} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328537, "_runtime": 5585}, "step": 2050} {"logs": {"train/loss": 4.1142, "train/learning_rate": 0.0002111111111111111, "train/epoch": 2.09, "_timestamp": 1746328537, "_runtime": 5585}, "step": 2050} {"train_info/time_between_train_steps": 0.028029203414916992, "step": 2050} {"info/global_step": 2051, "train_info/time_within_train_step": 2.521327495574951, "step": 2051} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 2051} {"info/global_step": 2052, "train_info/time_within_train_step": 2.5223283767700195, "step": 2052} {"train_info/time_between_train_steps": 0.003391265869140625, "step": 2052} {"info/global_step": 2053, "train_info/time_within_train_step": 2.5211338996887207, "step": 2053} {"train_info/time_between_train_steps": 0.0034270286560058594, "step": 2053} {"info/global_step": 2054, "train_info/time_within_train_step": 2.5216357707977295, "step": 2054} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 2054} {"info/global_step": 2055, "train_info/time_within_train_step": 2.5217745304107666, "step": 2055} {"train_info/time_between_train_steps": 0.0033948421478271484, "step": 2055} {"info/global_step": 2056, "train_info/time_within_train_step": 2.5215907096862793, "step": 2056} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 2056} {"info/global_step": 2057, "train_info/time_within_train_step": 2.5215017795562744, "step": 2057} {"train_info/time_between_train_steps": 0.0034470558166503906, "step": 2057} {"info/global_step": 2058, "train_info/time_within_train_step": 2.5213913917541504, "step": 2058} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 2058} {"info/global_step": 2059, "train_info/time_within_train_step": 2.521282196044922, "step": 2059} {"train_info/time_between_train_steps": 0.0034072399139404297, "step": 2059} {"info/global_step": 2060, "train_info/time_within_train_step": 2.5205743312835693, "step": 2060} {"train_info/time_between_train_steps": 0.003426074981689453, "step": 2060} {"info/global_step": 2061, "train_info/time_within_train_step": 2.521519422531128, "step": 2061} {"train_info/time_between_train_steps": 0.003399372100830078, "step": 2061} {"info/global_step": 2062, "train_info/time_within_train_step": 2.521686553955078, "step": 2062} {"train_info/time_between_train_steps": 0.003429889678955078, "step": 2062} {"info/global_step": 2063, "train_info/time_within_train_step": 2.5220329761505127, "step": 2063} {"train_info/time_between_train_steps": 0.003397226333618164, "step": 2063} {"info/global_step": 2064, "train_info/time_within_train_step": 2.5221593379974365, "step": 2064} {"train_info/time_between_train_steps": 0.0034322738647460938, "step": 2064} {"info/global_step": 2065, "train_info/time_within_train_step": 2.5220112800598145, "step": 2065} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 2065} {"info/global_step": 2066, "train_info/time_within_train_step": 2.5222015380859375, "step": 2066} {"train_info/time_between_train_steps": 0.0034089088439941406, "step": 2066} {"info/global_step": 2067, "train_info/time_within_train_step": 2.5214171409606934, "step": 2067} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 2067} {"info/global_step": 2068, "train_info/time_within_train_step": 2.521946668624878, "step": 2068} {"train_info/time_between_train_steps": 0.003416299819946289, "step": 2068} {"info/global_step": 2069, "train_info/time_within_train_step": 2.52187180519104, "step": 2069} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 2069} {"info/global_step": 2070, "train_info/time_within_train_step": 2.5214381217956543, "step": 2070} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 2070} {"info/global_step": 2071, "train_info/time_within_train_step": 2.55354905128479, "step": 2071} {"train_info/time_between_train_steps": 0.0034096240997314453, "step": 2071} {"info/global_step": 2072, "train_info/time_within_train_step": 2.5215651988983154, "step": 2072} {"train_info/time_between_train_steps": 0.0033996105194091797, "step": 2072} {"info/global_step": 2073, "train_info/time_within_train_step": 2.521116256713867, "step": 2073} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 2073} {"info/global_step": 2074, "train_info/time_within_train_step": 2.5216753482818604, "step": 2074} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 2074} {"info/global_step": 2075, "train_info/time_within_train_step": 2.5212035179138184, "step": 2075} {"train_info/time_between_train_steps": 0.003398895263671875, "step": 2075} {"info/global_step": 2076, "train_info/time_within_train_step": 2.5221052169799805, "step": 2076} {"train_info/time_between_train_steps": 0.003443002700805664, "step": 2076} {"info/global_step": 2077, "train_info/time_within_train_step": 2.5220179557800293, "step": 2077} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 2077} {"info/global_step": 2078, "train_info/time_within_train_step": 2.522365093231201, "step": 2078} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 2078} {"info/global_step": 2079, "train_info/time_within_train_step": 2.522352457046509, "step": 2079} {"train_info/time_between_train_steps": 0.0034046173095703125, "step": 2079} {"info/global_step": 2080, "train_info/time_within_train_step": 2.522266149520874, "step": 2080} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 2080} {"info/global_step": 2081, "train_info/time_within_train_step": 2.5220677852630615, "step": 2081} {"train_info/time_between_train_steps": 0.003409147262573242, "step": 2081} {"info/global_step": 2082, "train_info/time_within_train_step": 2.521308422088623, "step": 2082} {"train_info/time_between_train_steps": 0.003400087356567383, "step": 2082} {"info/global_step": 2083, "train_info/time_within_train_step": 2.5216004848480225, "step": 2083} {"train_info/time_between_train_steps": 0.003403902053833008, "step": 2083} {"info/global_step": 2084, "train_info/time_within_train_step": 2.521442413330078, "step": 2084} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 2084} {"info/global_step": 2085, "train_info/time_within_train_step": 2.521899700164795, "step": 2085} {"train_info/time_between_train_steps": 0.00341796875, "step": 2085} {"info/global_step": 2086, "train_info/time_within_train_step": 2.5213842391967773, "step": 2086} {"train_info/time_between_train_steps": 0.0033953189849853516, "step": 2086} {"info/global_step": 2087, "train_info/time_within_train_step": 2.7565126419067383, "step": 2087} {"train_info/time_between_train_steps": 0.0034055709838867188, "step": 2087} {"info/global_step": 2088, "train_info/time_within_train_step": 2.5207040309906006, "step": 2088} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 2088} {"info/global_step": 2089, "train_info/time_within_train_step": 2.5214312076568604, "step": 2089} {"train_info/time_between_train_steps": 0.0033736228942871094, "step": 2089} {"info/global_step": 2090, "train_info/time_within_train_step": 2.520789623260498, "step": 2090} {"train_info/time_between_train_steps": 0.0034189224243164062, "step": 2090} {"info/global_step": 2091, "train_info/time_within_train_step": 2.521462917327881, "step": 2091} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 2091} {"info/global_step": 2092, "train_info/time_within_train_step": 2.521728992462158, "step": 2092} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 2092} {"info/global_step": 2093, "train_info/time_within_train_step": 2.5214650630950928, "step": 2093} {"train_info/time_between_train_steps": 0.0033752918243408203, "step": 2093} {"info/global_step": 2094, "train_info/time_within_train_step": 2.521660089492798, "step": 2094} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 2094} {"info/global_step": 2095, "train_info/time_within_train_step": 2.5206336975097656, "step": 2095} {"train_info/time_between_train_steps": 0.003384113311767578, "step": 2095} {"info/global_step": 2096, "train_info/time_within_train_step": 2.5223076343536377, "step": 2096} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 2096} {"info/global_step": 2097, "train_info/time_within_train_step": 2.642376184463501, "step": 2097} {"train_info/time_between_train_steps": 0.0034189224243164062, "step": 2097} {"info/global_step": 2098, "train_info/time_within_train_step": 2.522824764251709, "step": 2098} {"train_info/time_between_train_steps": 0.0033845901489257812, "step": 2098} {"info/global_step": 2099, "train_info/time_within_train_step": 2.5276505947113037, "step": 2099} {"train_info/time_between_train_steps": 0.0033826828002929688, "step": 2099} {"info/global_step": 2100, "train_info/time_within_train_step": 2.521315813064575, "step": 2100} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328665, "_runtime": 5713}, "step": 2100} {"logs": {"train/loss": 4.1033, "train/learning_rate": 0.00019999999999999998, "train/epoch": 2.11, "_timestamp": 1746328665, "_runtime": 5713}, "step": 2100} {"train_info/time_between_train_steps": 19.266000747680664, "step": 2100} {"info/global_step": 2101, "train_info/time_within_train_step": 2.3381848335266113, "step": 2101} {"train_info/time_between_train_steps": 0.0034341812133789062, "step": 2101} {"info/global_step": 2102, "train_info/time_within_train_step": 2.3149964809417725, "step": 2102} {"train_info/time_between_train_steps": 0.0035066604614257812, "step": 2102} {"info/global_step": 2103, "train_info/time_within_train_step": 2.4467201232910156, "step": 2103} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 2103} {"info/global_step": 2104, "train_info/time_within_train_step": 2.519399881362915, "step": 2104} {"train_info/time_between_train_steps": 0.00363922119140625, "step": 2104} {"info/global_step": 2105, "train_info/time_within_train_step": 2.5193521976470947, "step": 2105} {"train_info/time_between_train_steps": 0.0035674571990966797, "step": 2105} {"info/global_step": 2106, "train_info/time_within_train_step": 2.5213189125061035, "step": 2106} {"train_info/time_between_train_steps": 0.0033898353576660156, "step": 2106} {"info/global_step": 2107, "train_info/time_within_train_step": 2.5225765705108643, "step": 2107} {"train_info/time_between_train_steps": 0.0033431053161621094, "step": 2107} {"info/global_step": 2108, "train_info/time_within_train_step": 2.5229218006134033, "step": 2108} {"train_info/time_between_train_steps": 0.00337982177734375, "step": 2108} {"info/global_step": 2109, "train_info/time_within_train_step": 2.5233418941497803, "step": 2109} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 2109} {"info/global_step": 2110, "train_info/time_within_train_step": 2.523141384124756, "step": 2110} {"train_info/time_between_train_steps": 0.00334930419921875, "step": 2110} {"info/global_step": 2111, "train_info/time_within_train_step": 2.5223422050476074, "step": 2111} {"train_info/time_between_train_steps": 0.0033299922943115234, "step": 2111} {"info/global_step": 2112, "train_info/time_within_train_step": 2.5235681533813477, "step": 2112} {"train_info/time_between_train_steps": 0.003372669219970703, "step": 2112} {"info/global_step": 2113, "train_info/time_within_train_step": 2.5232410430908203, "step": 2113} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 2113} {"info/global_step": 2114, "train_info/time_within_train_step": 2.5242457389831543, "step": 2114} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 2114} {"info/global_step": 2115, "train_info/time_within_train_step": 2.5238983631134033, "step": 2115} {"train_info/time_between_train_steps": 0.00365447998046875, "step": 2115} {"info/global_step": 2116, "train_info/time_within_train_step": 2.52340030670166, "step": 2116} {"train_info/time_between_train_steps": 0.0034341812133789062, "step": 2116} {"info/global_step": 2117, "train_info/time_within_train_step": 2.5238699913024902, "step": 2117} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 2117} {"info/global_step": 2118, "train_info/time_within_train_step": 2.5240089893341064, "step": 2118} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 2118} {"info/global_step": 2119, "train_info/time_within_train_step": 2.5229809284210205, "step": 2119} {"train_info/time_between_train_steps": 0.0033714771270751953, "step": 2119} {"info/global_step": 2120, "train_info/time_within_train_step": 2.5232784748077393, "step": 2120} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 2120} {"info/global_step": 2121, "train_info/time_within_train_step": 2.5241143703460693, "step": 2121} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 2121} {"info/global_step": 2122, "train_info/time_within_train_step": 2.5241289138793945, "step": 2122} {"train_info/time_between_train_steps": 0.003503084182739258, "step": 2122} {"info/global_step": 2123, "train_info/time_within_train_step": 2.5244522094726562, "step": 2123} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 2123} {"info/global_step": 2124, "train_info/time_within_train_step": 2.524176597595215, "step": 2124} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 2124} {"info/global_step": 2125, "train_info/time_within_train_step": 2.5236284732818604, "step": 2125} {"train_info/time_between_train_steps": 0.003348112106323242, "step": 2125} {"info/global_step": 2126, "train_info/time_within_train_step": 2.523658037185669, "step": 2126} {"train_info/time_between_train_steps": 0.0034170150756835938, "step": 2126} {"info/global_step": 2127, "train_info/time_within_train_step": 2.523857593536377, "step": 2127} {"train_info/time_between_train_steps": 0.003576517105102539, "step": 2127} {"info/global_step": 2128, "train_info/time_within_train_step": 2.5241074562072754, "step": 2128} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 2128} {"info/global_step": 2129, "train_info/time_within_train_step": 2.5239062309265137, "step": 2129} {"train_info/time_between_train_steps": 0.003357410430908203, "step": 2129} {"info/global_step": 2130, "train_info/time_within_train_step": 2.550999402999878, "step": 2130} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 2130} {"info/global_step": 2131, "train_info/time_within_train_step": 2.5232417583465576, "step": 2131} {"train_info/time_between_train_steps": 0.003383636474609375, "step": 2131} {"info/global_step": 2132, "train_info/time_within_train_step": 2.5235490798950195, "step": 2132} {"train_info/time_between_train_steps": 0.0035021305084228516, "step": 2132} {"info/global_step": 2133, "train_info/time_within_train_step": 2.763845920562744, "step": 2133} {"train_info/time_between_train_steps": 0.0034542083740234375, "step": 2133} {"info/global_step": 2134, "train_info/time_within_train_step": 2.5231692790985107, "step": 2134} {"train_info/time_between_train_steps": 0.0033354759216308594, "step": 2134} {"info/global_step": 2135, "train_info/time_within_train_step": 2.5235469341278076, "step": 2135} {"train_info/time_between_train_steps": 0.0033533573150634766, "step": 2135} {"info/global_step": 2136, "train_info/time_within_train_step": 2.5235514640808105, "step": 2136} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 2136} {"info/global_step": 2137, "train_info/time_within_train_step": 2.523815155029297, "step": 2137} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 2137} {"info/global_step": 2138, "train_info/time_within_train_step": 2.5234546661376953, "step": 2138} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 2138} {"info/global_step": 2139, "train_info/time_within_train_step": 2.5243113040924072, "step": 2139} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 2139} {"info/global_step": 2140, "train_info/time_within_train_step": 2.522742748260498, "step": 2140} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 2140} {"info/global_step": 2141, "train_info/time_within_train_step": 2.5231354236602783, "step": 2141} {"train_info/time_between_train_steps": 0.0033445358276367188, "step": 2141} {"info/global_step": 2142, "train_info/time_within_train_step": 2.5238144397735596, "step": 2142} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 2142} {"info/global_step": 2143, "train_info/time_within_train_step": 2.522996664047241, "step": 2143} {"train_info/time_between_train_steps": 0.003347635269165039, "step": 2143} {"info/global_step": 2144, "train_info/time_within_train_step": 2.522735834121704, "step": 2144} {"train_info/time_between_train_steps": 0.0033550262451171875, "step": 2144} {"info/global_step": 2145, "train_info/time_within_train_step": 2.523205518722534, "step": 2145} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 2145} {"info/global_step": 2146, "train_info/time_within_train_step": 2.5234086513519287, "step": 2146} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 2146} {"info/global_step": 2147, "train_info/time_within_train_step": 2.523939609527588, "step": 2147} {"train_info/time_between_train_steps": 0.0036232471466064453, "step": 2147} {"info/global_step": 2148, "train_info/time_within_train_step": 2.5242412090301514, "step": 2148} {"train_info/time_between_train_steps": 0.003525257110595703, "step": 2148} {"info/global_step": 2149, "train_info/time_within_train_step": 2.523268461227417, "step": 2149} {"train_info/time_between_train_steps": 0.0034122467041015625, "step": 2149} {"info/global_step": 2150, "train_info/time_within_train_step": 2.523338556289673, "step": 2150} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328812, "_runtime": 5860}, "step": 2150} {"logs": {"train/loss": 4.0839, "train/learning_rate": 0.00018888888888888888, "train/epoch": 2.12, "_timestamp": 1746328812, "_runtime": 5860}, "step": 2150} {"train_info/time_between_train_steps": 0.024108409881591797, "step": 2150} {"info/global_step": 2151, "train_info/time_within_train_step": 2.523754835128784, "step": 2151} {"train_info/time_between_train_steps": 0.003426074981689453, "step": 2151} {"info/global_step": 2152, "train_info/time_within_train_step": 2.522974967956543, "step": 2152} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 2152} {"info/global_step": 2153, "train_info/time_within_train_step": 2.5237860679626465, "step": 2153} {"train_info/time_between_train_steps": 0.003363370895385742, "step": 2153} {"info/global_step": 2154, "train_info/time_within_train_step": 2.5234830379486084, "step": 2154} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 2154} {"info/global_step": 2155, "train_info/time_within_train_step": 2.522967576980591, "step": 2155} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 2155} {"info/global_step": 2156, "train_info/time_within_train_step": 2.5224850177764893, "step": 2156} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 2156} {"info/global_step": 2157, "train_info/time_within_train_step": 2.522806167602539, "step": 2157} {"train_info/time_between_train_steps": 0.0033953189849853516, "step": 2157} {"info/global_step": 2158, "train_info/time_within_train_step": 2.554072141647339, "step": 2158} {"train_info/time_between_train_steps": 0.003377676010131836, "step": 2158} {"info/global_step": 2159, "train_info/time_within_train_step": 2.5230941772460938, "step": 2159} {"train_info/time_between_train_steps": 0.1230621337890625, "step": 2159} {"info/global_step": 2160, "train_info/time_within_train_step": 2.5231800079345703, "step": 2160} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 2160} {"info/global_step": 2161, "train_info/time_within_train_step": 2.5239205360412598, "step": 2161} {"train_info/time_between_train_steps": 0.003407716751098633, "step": 2161} {"info/global_step": 2162, "train_info/time_within_train_step": 2.5230886936187744, "step": 2162} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 2162} {"info/global_step": 2163, "train_info/time_within_train_step": 2.522686719894409, "step": 2163} {"train_info/time_between_train_steps": 0.003457784652709961, "step": 2163} {"info/global_step": 2164, "train_info/time_within_train_step": 2.5228188037872314, "step": 2164} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 2164} {"info/global_step": 2165, "train_info/time_within_train_step": 2.5226573944091797, "step": 2165} {"train_info/time_between_train_steps": 0.0034074783325195312, "step": 2165} {"info/global_step": 2166, "train_info/time_within_train_step": 2.5228476524353027, "step": 2166} {"train_info/time_between_train_steps": 0.003418445587158203, "step": 2166} {"info/global_step": 2167, "train_info/time_within_train_step": 2.522800922393799, "step": 2167} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 2167} {"info/global_step": 2168, "train_info/time_within_train_step": 2.5227744579315186, "step": 2168} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 2168} {"info/global_step": 2169, "train_info/time_within_train_step": 2.5230181217193604, "step": 2169} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 2169} {"info/global_step": 2170, "train_info/time_within_train_step": 2.5216007232666016, "step": 2170} {"train_info/time_between_train_steps": 0.0033953189849853516, "step": 2170} {"info/global_step": 2171, "train_info/time_within_train_step": 2.523493528366089, "step": 2171} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 2171} {"info/global_step": 2172, "train_info/time_within_train_step": 2.523118734359741, "step": 2172} {"train_info/time_between_train_steps": 0.0034198760986328125, "step": 2172} {"info/global_step": 2173, "train_info/time_within_train_step": 2.523216724395752, "step": 2173} {"train_info/time_between_train_steps": 0.0034356117248535156, "step": 2173} {"info/global_step": 2174, "train_info/time_within_train_step": 2.5224342346191406, "step": 2174} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 2174} {"info/global_step": 2175, "train_info/time_within_train_step": 2.5229527950286865, "step": 2175} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 2175} {"info/global_step": 2176, "train_info/time_within_train_step": 2.5230329036712646, "step": 2176} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 2176} {"info/global_step": 2177, "train_info/time_within_train_step": 2.523148536682129, "step": 2177} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 2177} {"info/global_step": 2178, "train_info/time_within_train_step": 2.5231287479400635, "step": 2178} {"train_info/time_between_train_steps": 0.003410816192626953, "step": 2178} {"info/global_step": 2179, "train_info/time_within_train_step": 2.522188901901245, "step": 2179} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 2179} {"info/global_step": 2180, "train_info/time_within_train_step": 2.5229508876800537, "step": 2180} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 2180} {"info/global_step": 2181, "train_info/time_within_train_step": 2.5221924781799316, "step": 2181} {"train_info/time_between_train_steps": 0.0034003257751464844, "step": 2181} {"info/global_step": 2182, "train_info/time_within_train_step": 2.5228030681610107, "step": 2182} {"train_info/time_between_train_steps": 0.003409147262573242, "step": 2182} {"info/global_step": 2183, "train_info/time_within_train_step": 2.522899866104126, "step": 2183} {"train_info/time_between_train_steps": 0.0033996105194091797, "step": 2183} {"info/global_step": 2184, "train_info/time_within_train_step": 2.522857427597046, "step": 2184} {"train_info/time_between_train_steps": 0.003462553024291992, "step": 2184} {"info/global_step": 2185, "train_info/time_within_train_step": 2.52229905128479, "step": 2185} {"train_info/time_between_train_steps": 0.0034017562866210938, "step": 2185} {"info/global_step": 2186, "train_info/time_within_train_step": 2.527627944946289, "step": 2186} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 2186} {"info/global_step": 2187, "train_info/time_within_train_step": 2.5226523876190186, "step": 2187} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 2187} {"info/global_step": 2188, "train_info/time_within_train_step": 2.5224218368530273, "step": 2188} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 2188} {"info/global_step": 2189, "train_info/time_within_train_step": 2.522780418395996, "step": 2189} {"train_info/time_between_train_steps": 0.0034110546112060547, "step": 2189} {"info/global_step": 2190, "train_info/time_within_train_step": 2.521818161010742, "step": 2190} {"train_info/time_between_train_steps": 0.003588438034057617, "step": 2190} {"info/global_step": 2191, "train_info/time_within_train_step": 2.522534132003784, "step": 2191} {"train_info/time_between_train_steps": 0.0035741329193115234, "step": 2191} {"info/global_step": 2192, "train_info/time_within_train_step": 2.523003578186035, "step": 2192} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 2192} {"info/global_step": 2193, "train_info/time_within_train_step": 2.52262282371521, "step": 2193} {"train_info/time_between_train_steps": 0.0036077499389648438, "step": 2193} {"info/global_step": 2194, "train_info/time_within_train_step": 2.5227930545806885, "step": 2194} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 2194} {"info/global_step": 2195, "train_info/time_within_train_step": 2.522871732711792, "step": 2195} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 2195} {"info/global_step": 2196, "train_info/time_within_train_step": 2.5220367908477783, "step": 2196} {"train_info/time_between_train_steps": 0.003408670425415039, "step": 2196} {"info/global_step": 2197, "train_info/time_within_train_step": 2.522542953491211, "step": 2197} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 2197} {"info/global_step": 2198, "train_info/time_within_train_step": 2.522639274597168, "step": 2198} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 2198} {"info/global_step": 2199, "train_info/time_within_train_step": 2.5221641063690186, "step": 2199} {"train_info/time_between_train_steps": 0.003350973129272461, "step": 2199} {"info/global_step": 2200, "train_info/time_within_train_step": 2.522730588912964, "step": 2200} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746328939, "_runtime": 5987}, "step": 2200} {"logs": {"train/loss": 4.0686, "train/learning_rate": 0.00017777777777777776, "train/epoch": 2.14, "_timestamp": 1746328939, "_runtime": 5987}, "step": 2200} {"train_info/time_between_train_steps": 15.48814606666565, "step": 2200} {"info/global_step": 2201, "train_info/time_within_train_step": 2.3247759342193604, "step": 2201} {"train_info/time_between_train_steps": 0.003378629684448242, "step": 2201} {"info/global_step": 2202, "train_info/time_within_train_step": 2.3177380561828613, "step": 2202} {"train_info/time_between_train_steps": 0.003389596939086914, "step": 2202} {"info/global_step": 2203, "train_info/time_within_train_step": 2.464639902114868, "step": 2203} {"train_info/time_between_train_steps": 0.003446340560913086, "step": 2203} {"info/global_step": 2204, "train_info/time_within_train_step": 2.518275260925293, "step": 2204} {"train_info/time_between_train_steps": 0.003367900848388672, "step": 2204} {"info/global_step": 2205, "train_info/time_within_train_step": 2.5176944732666016, "step": 2205} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 2205} {"info/global_step": 2206, "train_info/time_within_train_step": 2.520293951034546, "step": 2206} {"train_info/time_between_train_steps": 0.003976345062255859, "step": 2206} {"info/global_step": 2207, "train_info/time_within_train_step": 2.5203371047973633, "step": 2207} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 2207} {"info/global_step": 2208, "train_info/time_within_train_step": 2.5198144912719727, "step": 2208} {"train_info/time_between_train_steps": 0.003410816192626953, "step": 2208} {"info/global_step": 2209, "train_info/time_within_train_step": 2.7668027877807617, "step": 2209} {"train_info/time_between_train_steps": 0.003421306610107422, "step": 2209} {"info/global_step": 2210, "train_info/time_within_train_step": 2.5209031105041504, "step": 2210} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 2210} {"info/global_step": 2211, "train_info/time_within_train_step": 2.5208523273468018, "step": 2211} {"train_info/time_between_train_steps": 0.0033881664276123047, "step": 2211} {"info/global_step": 2212, "train_info/time_within_train_step": 2.520972967147827, "step": 2212} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 2212} {"info/global_step": 2213, "train_info/time_within_train_step": 2.521427631378174, "step": 2213} {"train_info/time_between_train_steps": 0.0033752918243408203, "step": 2213} {"info/global_step": 2214, "train_info/time_within_train_step": 2.5218515396118164, "step": 2214} {"train_info/time_between_train_steps": 0.0035512447357177734, "step": 2214} {"info/global_step": 2215, "train_info/time_within_train_step": 2.5211539268493652, "step": 2215} {"train_info/time_between_train_steps": 0.0035495758056640625, "step": 2215} {"info/global_step": 2216, "train_info/time_within_train_step": 2.521432876586914, "step": 2216} {"train_info/time_between_train_steps": 0.0033991336822509766, "step": 2216} {"info/global_step": 2217, "train_info/time_within_train_step": 2.5216658115386963, "step": 2217} {"train_info/time_between_train_steps": 0.0035364627838134766, "step": 2217} {"info/global_step": 2218, "train_info/time_within_train_step": 2.521829843521118, "step": 2218} {"train_info/time_between_train_steps": 0.0033483505249023438, "step": 2218} {"info/global_step": 2219, "train_info/time_within_train_step": 2.521987199783325, "step": 2219} {"train_info/time_between_train_steps": 0.003532886505126953, "step": 2219} {"info/global_step": 2220, "train_info/time_within_train_step": 2.5495734214782715, "step": 2220} {"train_info/time_between_train_steps": 0.003598451614379883, "step": 2220} {"info/global_step": 2221, "train_info/time_within_train_step": 2.521070718765259, "step": 2221} {"train_info/time_between_train_steps": 0.003450632095336914, "step": 2221} {"info/global_step": 2222, "train_info/time_within_train_step": 2.643528699874878, "step": 2222} {"train_info/time_between_train_steps": 0.003410816192626953, "step": 2222} {"info/global_step": 2223, "train_info/time_within_train_step": 2.520615339279175, "step": 2223} {"train_info/time_between_train_steps": 0.0035767555236816406, "step": 2223} {"info/global_step": 2224, "train_info/time_within_train_step": 2.52189040184021, "step": 2224} {"train_info/time_between_train_steps": 0.003499269485473633, "step": 2224} {"info/global_step": 2225, "train_info/time_within_train_step": 2.522559642791748, "step": 2225} {"train_info/time_between_train_steps": 0.0034754276275634766, "step": 2225} {"info/global_step": 2226, "train_info/time_within_train_step": 2.5215649604797363, "step": 2226} {"train_info/time_between_train_steps": 0.0034906864166259766, "step": 2226} {"info/global_step": 2227, "train_info/time_within_train_step": 2.5216622352600098, "step": 2227} {"train_info/time_between_train_steps": 0.0036017894744873047, "step": 2227} {"info/global_step": 2228, "train_info/time_within_train_step": 2.5215258598327637, "step": 2228} {"train_info/time_between_train_steps": 0.0036268234252929688, "step": 2228} {"info/global_step": 2229, "train_info/time_within_train_step": 2.521125078201294, "step": 2229} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 2229} {"info/global_step": 2230, "train_info/time_within_train_step": 2.521528959274292, "step": 2230} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 2230} {"info/global_step": 2231, "train_info/time_within_train_step": 2.522019863128662, "step": 2231} {"train_info/time_between_train_steps": 0.0035173892974853516, "step": 2231} {"info/global_step": 2232, "train_info/time_within_train_step": 2.5217344760894775, "step": 2232} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 2232} {"info/global_step": 2233, "train_info/time_within_train_step": 2.526761054992676, "step": 2233} {"train_info/time_between_train_steps": 0.0035867691040039062, "step": 2233} {"info/global_step": 2234, "train_info/time_within_train_step": 2.522163152694702, "step": 2234} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 2234} {"info/global_step": 2235, "train_info/time_within_train_step": 2.522397518157959, "step": 2235} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 2235} {"info/global_step": 2236, "train_info/time_within_train_step": 2.5543227195739746, "step": 2236} {"train_info/time_between_train_steps": 0.003367900848388672, "step": 2236} {"info/global_step": 2237, "train_info/time_within_train_step": 2.5222721099853516, "step": 2237} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 2237} {"info/global_step": 2238, "train_info/time_within_train_step": 2.522097110748291, "step": 2238} {"train_info/time_between_train_steps": 0.0034279823303222656, "step": 2238} {"info/global_step": 2239, "train_info/time_within_train_step": 2.522448778152466, "step": 2239} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 2239} {"info/global_step": 2240, "train_info/time_within_train_step": 2.5222489833831787, "step": 2240} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 2240} {"info/global_step": 2241, "train_info/time_within_train_step": 2.5228657722473145, "step": 2241} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 2241} {"info/global_step": 2242, "train_info/time_within_train_step": 2.5213987827301025, "step": 2242} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 2242} {"info/global_step": 2243, "train_info/time_within_train_step": 2.5208356380462646, "step": 2243} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 2243} {"info/global_step": 2244, "train_info/time_within_train_step": 2.5219335556030273, "step": 2244} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 2244} {"info/global_step": 2245, "train_info/time_within_train_step": 2.5217854976654053, "step": 2245} {"train_info/time_between_train_steps": 0.0033922195434570312, "step": 2245} {"info/global_step": 2246, "train_info/time_within_train_step": 2.520925998687744, "step": 2246} {"train_info/time_between_train_steps": 0.003409147262573242, "step": 2246} {"info/global_step": 2247, "train_info/time_within_train_step": 2.520785331726074, "step": 2247} {"train_info/time_between_train_steps": 0.0033783912658691406, "step": 2247} {"info/global_step": 2248, "train_info/time_within_train_step": 2.5206596851348877, "step": 2248} {"train_info/time_between_train_steps": 0.0033872127532958984, "step": 2248} {"info/global_step": 2249, "train_info/time_within_train_step": 3.0255753993988037, "step": 2249} {"train_info/time_between_train_steps": 0.0034258365631103516, "step": 2249} {"info/global_step": 2250, "train_info/time_within_train_step": 2.5212881565093994, "step": 2250} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746329082, "_runtime": 6130}, "step": 2250} {"logs": {"train/loss": 4.0567, "train/learning_rate": 0.00016666666666666666, "train/epoch": 2.16, "_timestamp": 1746329082, "_runtime": 6130}, "step": 2250} {"train_info/time_between_train_steps": 0.024756669998168945, "step": 2250} {"info/global_step": 2251, "train_info/time_within_train_step": 2.520569324493408, "step": 2251} {"train_info/time_between_train_steps": 0.0033826828002929688, "step": 2251} {"info/global_step": 2252, "train_info/time_within_train_step": 2.520742893218994, "step": 2252} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 2252} {"info/global_step": 2253, "train_info/time_within_train_step": 2.522204875946045, "step": 2253} {"train_info/time_between_train_steps": 0.003418445587158203, "step": 2253} {"info/global_step": 2254, "train_info/time_within_train_step": 2.521282196044922, "step": 2254} {"train_info/time_between_train_steps": 0.003412961959838867, "step": 2254} {"info/global_step": 2255, "train_info/time_within_train_step": 2.521826982498169, "step": 2255} {"train_info/time_between_train_steps": 0.0034172534942626953, "step": 2255} {"info/global_step": 2256, "train_info/time_within_train_step": 2.5212302207946777, "step": 2256} {"train_info/time_between_train_steps": 0.0033426284790039062, "step": 2256} {"info/global_step": 2257, "train_info/time_within_train_step": 2.5218935012817383, "step": 2257} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 2257} {"info/global_step": 2258, "train_info/time_within_train_step": 2.5205554962158203, "step": 2258} {"train_info/time_between_train_steps": 0.0037755966186523438, "step": 2258} {"info/global_step": 2259, "train_info/time_within_train_step": 2.520569086074829, "step": 2259} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 2259} {"info/global_step": 2260, "train_info/time_within_train_step": 2.520322799682617, "step": 2260} {"train_info/time_between_train_steps": 0.003362894058227539, "step": 2260} {"info/global_step": 2261, "train_info/time_within_train_step": 2.520280361175537, "step": 2261} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 2261} {"info/global_step": 2262, "train_info/time_within_train_step": 2.520566701889038, "step": 2262} {"train_info/time_between_train_steps": 0.003427267074584961, "step": 2262} {"info/global_step": 2263, "train_info/time_within_train_step": 2.5200133323669434, "step": 2263} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 2263} {"info/global_step": 2264, "train_info/time_within_train_step": 2.5199990272521973, "step": 2264} {"train_info/time_between_train_steps": 0.0034706592559814453, "step": 2264} {"info/global_step": 2265, "train_info/time_within_train_step": 2.5202107429504395, "step": 2265} {"train_info/time_between_train_steps": 0.0036084651947021484, "step": 2265} {"info/global_step": 2266, "train_info/time_within_train_step": 2.5199155807495117, "step": 2266} {"train_info/time_between_train_steps": 0.0033218860626220703, "step": 2266} {"info/global_step": 2267, "train_info/time_within_train_step": 2.5474870204925537, "step": 2267} {"train_info/time_between_train_steps": 0.003560781478881836, "step": 2267} {"info/global_step": 2268, "train_info/time_within_train_step": 2.5207831859588623, "step": 2268} {"train_info/time_between_train_steps": 0.0034139156341552734, "step": 2268} {"info/global_step": 2269, "train_info/time_within_train_step": 2.521409511566162, "step": 2269} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 2269} {"info/global_step": 2270, "train_info/time_within_train_step": 2.5213606357574463, "step": 2270} {"train_info/time_between_train_steps": 0.0034263134002685547, "step": 2270} {"info/global_step": 2271, "train_info/time_within_train_step": 2.5220556259155273, "step": 2271} {"train_info/time_between_train_steps": 0.003579854965209961, "step": 2271} {"info/global_step": 2272, "train_info/time_within_train_step": 2.5226635932922363, "step": 2272} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 2272} {"info/global_step": 2273, "train_info/time_within_train_step": 2.521393060684204, "step": 2273} {"train_info/time_between_train_steps": 0.0033876895904541016, "step": 2273} {"info/global_step": 2274, "train_info/time_within_train_step": 2.522167205810547, "step": 2274} {"train_info/time_between_train_steps": 0.003416299819946289, "step": 2274} {"info/global_step": 2275, "train_info/time_within_train_step": 2.5207619667053223, "step": 2275} {"train_info/time_between_train_steps": 0.0033473968505859375, "step": 2275} {"info/global_step": 2276, "train_info/time_within_train_step": 2.5212981700897217, "step": 2276} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 2276} {"info/global_step": 2277, "train_info/time_within_train_step": 2.5205132961273193, "step": 2277} {"train_info/time_between_train_steps": 0.0035140514373779297, "step": 2277} {"info/global_step": 2278, "train_info/time_within_train_step": 2.520195960998535, "step": 2278} {"train_info/time_between_train_steps": 0.003612041473388672, "step": 2278} {"info/global_step": 2279, "train_info/time_within_train_step": 2.51969575881958, "step": 2279} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 2279} {"info/global_step": 2280, "train_info/time_within_train_step": 2.525257110595703, "step": 2280} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 2280} {"info/global_step": 2281, "train_info/time_within_train_step": 2.5198068618774414, "step": 2281} {"train_info/time_between_train_steps": 0.00356292724609375, "step": 2281} {"info/global_step": 2282, "train_info/time_within_train_step": 2.520042657852173, "step": 2282} {"train_info/time_between_train_steps": 0.0034754276275634766, "step": 2282} {"info/global_step": 2283, "train_info/time_within_train_step": 2.5517354011535645, "step": 2283} {"train_info/time_between_train_steps": 0.003450155258178711, "step": 2283} {"info/global_step": 2284, "train_info/time_within_train_step": 2.520026922225952, "step": 2284} {"train_info/time_between_train_steps": 0.12473559379577637, "step": 2284} {"info/global_step": 2285, "train_info/time_within_train_step": 2.520951747894287, "step": 2285} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 2285} {"info/global_step": 2286, "train_info/time_within_train_step": 2.5219178199768066, "step": 2286} {"train_info/time_between_train_steps": 0.0034134387969970703, "step": 2286} {"info/global_step": 2287, "train_info/time_within_train_step": 2.522156000137329, "step": 2287} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 2287} {"info/global_step": 2288, "train_info/time_within_train_step": 2.5214855670928955, "step": 2288} {"train_info/time_between_train_steps": 0.003391265869140625, "step": 2288} {"info/global_step": 2289, "train_info/time_within_train_step": 2.5221660137176514, "step": 2289} {"train_info/time_between_train_steps": 0.0034029483795166016, "step": 2289} {"info/global_step": 2290, "train_info/time_within_train_step": 2.5220508575439453, "step": 2290} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 2290} {"info/global_step": 2291, "train_info/time_within_train_step": 2.5224013328552246, "step": 2291} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 2291} {"info/global_step": 2292, "train_info/time_within_train_step": 2.521599054336548, "step": 2292} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 2292} {"info/global_step": 2293, "train_info/time_within_train_step": 2.521677255630493, "step": 2293} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 2293} {"info/global_step": 2294, "train_info/time_within_train_step": 2.5214433670043945, "step": 2294} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 2294} {"info/global_step": 2295, "train_info/time_within_train_step": 2.520918130874634, "step": 2295} {"train_info/time_between_train_steps": 0.003410816192626953, "step": 2295} {"info/global_step": 2296, "train_info/time_within_train_step": 2.773726463317871, "step": 2296} {"train_info/time_between_train_steps": 0.0034596920013427734, "step": 2296} {"info/global_step": 2297, "train_info/time_within_train_step": 2.5201644897460938, "step": 2297} {"train_info/time_between_train_steps": 0.0034236907958984375, "step": 2297} {"info/global_step": 2298, "train_info/time_within_train_step": 2.5206360816955566, "step": 2298} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 2298} {"info/global_step": 2299, "train_info/time_within_train_step": 2.5212361812591553, "step": 2299} {"train_info/time_between_train_steps": 0.0034286975860595703, "step": 2299} {"info/global_step": 2300, "train_info/time_within_train_step": 2.5213425159454346, "step": 2300} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746329210, "_runtime": 6258}, "step": 2300} {"logs": {"train/loss": 4.0346, "train/learning_rate": 0.00015555555555555554, "train/epoch": 2.17, "_timestamp": 1746329210, "_runtime": 6258}, "step": 2300} {"train_info/time_between_train_steps": 13.392890214920044, "step": 2300} {"info/global_step": 2301, "train_info/time_within_train_step": 2.337298631668091, "step": 2301} {"train_info/time_between_train_steps": 0.003400087356567383, "step": 2301} {"info/global_step": 2302, "train_info/time_within_train_step": 2.3238368034362793, "step": 2302} {"train_info/time_between_train_steps": 0.003441333770751953, "step": 2302} {"info/global_step": 2303, "train_info/time_within_train_step": 2.4901716709136963, "step": 2303} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 2303} {"info/global_step": 2304, "train_info/time_within_train_step": 2.521181583404541, "step": 2304} {"train_info/time_between_train_steps": 0.0034170150756835938, "step": 2304} {"info/global_step": 2305, "train_info/time_within_train_step": 2.520317316055298, "step": 2305} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 2305} {"info/global_step": 2306, "train_info/time_within_train_step": 2.521381139755249, "step": 2306} {"train_info/time_between_train_steps": 0.0034601688385009766, "step": 2306} {"info/global_step": 2307, "train_info/time_within_train_step": 2.5224061012268066, "step": 2307} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 2307} {"info/global_step": 2308, "train_info/time_within_train_step": 2.521744728088379, "step": 2308} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 2308} {"info/global_step": 2309, "train_info/time_within_train_step": 2.5494751930236816, "step": 2309} {"train_info/time_between_train_steps": 0.0034008026123046875, "step": 2309} {"info/global_step": 2310, "train_info/time_within_train_step": 2.521845579147339, "step": 2310} {"train_info/time_between_train_steps": 0.003415822982788086, "step": 2310} {"info/global_step": 2311, "train_info/time_within_train_step": 2.521770477294922, "step": 2311} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 2311} {"info/global_step": 2312, "train_info/time_within_train_step": 2.5221915245056152, "step": 2312} {"train_info/time_between_train_steps": 0.003465890884399414, "step": 2312} {"info/global_step": 2313, "train_info/time_within_train_step": 2.5222716331481934, "step": 2313} {"train_info/time_between_train_steps": 0.003399372100830078, "step": 2313} {"info/global_step": 2314, "train_info/time_within_train_step": 2.5226190090179443, "step": 2314} {"train_info/time_between_train_steps": 0.0034279823303222656, "step": 2314} {"info/global_step": 2315, "train_info/time_within_train_step": 2.522322416305542, "step": 2315} {"train_info/time_between_train_steps": 0.003407001495361328, "step": 2315} {"info/global_step": 2316, "train_info/time_within_train_step": 2.5226995944976807, "step": 2316} {"train_info/time_between_train_steps": 0.003396272659301758, "step": 2316} {"info/global_step": 2317, "train_info/time_within_train_step": 2.522993803024292, "step": 2317} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 2317} {"info/global_step": 2318, "train_info/time_within_train_step": 2.521996021270752, "step": 2318} {"train_info/time_between_train_steps": 0.003460407257080078, "step": 2318} {"info/global_step": 2319, "train_info/time_within_train_step": 2.522662401199341, "step": 2319} {"train_info/time_between_train_steps": 0.0035071372985839844, "step": 2319} {"info/global_step": 2320, "train_info/time_within_train_step": 2.52311372756958, "step": 2320} {"train_info/time_between_train_steps": 0.0033876895904541016, "step": 2320} {"info/global_step": 2321, "train_info/time_within_train_step": 2.523094892501831, "step": 2321} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 2321} {"info/global_step": 2322, "train_info/time_within_train_step": 2.527592658996582, "step": 2322} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 2322} {"info/global_step": 2323, "train_info/time_within_train_step": 2.5230157375335693, "step": 2323} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 2323} {"info/global_step": 2324, "train_info/time_within_train_step": 2.52327823638916, "step": 2324} {"train_info/time_between_train_steps": 0.0035219192504882812, "step": 2324} {"info/global_step": 2325, "train_info/time_within_train_step": 2.5553317070007324, "step": 2325} {"train_info/time_between_train_steps": 0.003419637680053711, "step": 2325} {"info/global_step": 2326, "train_info/time_within_train_step": 2.5226898193359375, "step": 2326} {"train_info/time_between_train_steps": 0.003477334976196289, "step": 2326} {"info/global_step": 2327, "train_info/time_within_train_step": 2.522630453109741, "step": 2327} {"train_info/time_between_train_steps": 0.003426790237426758, "step": 2327} {"info/global_step": 2328, "train_info/time_within_train_step": 2.5222697257995605, "step": 2328} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 2328} {"info/global_step": 2329, "train_info/time_within_train_step": 2.522728204727173, "step": 2329} {"train_info/time_between_train_steps": 0.003459930419921875, "step": 2329} {"info/global_step": 2330, "train_info/time_within_train_step": 2.523176908493042, "step": 2330} {"train_info/time_between_train_steps": 0.003468036651611328, "step": 2330} {"info/global_step": 2331, "train_info/time_within_train_step": 2.5231924057006836, "step": 2331} {"train_info/time_between_train_steps": 0.003434419631958008, "step": 2331} {"info/global_step": 2332, "train_info/time_within_train_step": 2.522517442703247, "step": 2332} {"train_info/time_between_train_steps": 0.0034737586975097656, "step": 2332} {"info/global_step": 2333, "train_info/time_within_train_step": 2.522603750228882, "step": 2333} {"train_info/time_between_train_steps": 0.0034766197204589844, "step": 2333} {"info/global_step": 2334, "train_info/time_within_train_step": 2.5232386589050293, "step": 2334} {"train_info/time_between_train_steps": 0.003453969955444336, "step": 2334} {"info/global_step": 2335, "train_info/time_within_train_step": 2.523401975631714, "step": 2335} {"train_info/time_between_train_steps": 0.0034399032592773438, "step": 2335} {"info/global_step": 2336, "train_info/time_within_train_step": 2.523313045501709, "step": 2336} {"train_info/time_between_train_steps": 0.003468751907348633, "step": 2336} {"info/global_step": 2337, "train_info/time_within_train_step": 2.7811691761016846, "step": 2337} {"train_info/time_between_train_steps": 0.003453493118286133, "step": 2337} {"info/global_step": 2338, "train_info/time_within_train_step": 2.5237836837768555, "step": 2338} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 2338} {"info/global_step": 2339, "train_info/time_within_train_step": 2.5233359336853027, "step": 2339} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 2339} {"info/global_step": 2340, "train_info/time_within_train_step": 2.523007869720459, "step": 2340} {"train_info/time_between_train_steps": 0.003485441207885742, "step": 2340} {"info/global_step": 2341, "train_info/time_within_train_step": 2.5226759910583496, "step": 2341} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 2341} {"info/global_step": 2342, "train_info/time_within_train_step": 2.5229172706604004, "step": 2342} {"train_info/time_between_train_steps": 0.003448009490966797, "step": 2342} {"info/global_step": 2343, "train_info/time_within_train_step": 2.522078514099121, "step": 2343} {"train_info/time_between_train_steps": 0.0034608840942382812, "step": 2343} {"info/global_step": 2344, "train_info/time_within_train_step": 2.522611141204834, "step": 2344} {"train_info/time_between_train_steps": 0.003434896469116211, "step": 2344} {"info/global_step": 2345, "train_info/time_within_train_step": 2.5227468013763428, "step": 2345} {"train_info/time_between_train_steps": 0.003452301025390625, "step": 2345} {"info/global_step": 2346, "train_info/time_within_train_step": 2.5235159397125244, "step": 2346} {"train_info/time_between_train_steps": 0.0034601688385009766, "step": 2346} {"info/global_step": 2347, "train_info/time_within_train_step": 2.5707435607910156, "step": 2347} {"train_info/time_between_train_steps": 0.0034792423248291016, "step": 2347} {"info/global_step": 2348, "train_info/time_within_train_step": 2.523298978805542, "step": 2348} {"train_info/time_between_train_steps": 0.003472566604614258, "step": 2348} {"info/global_step": 2349, "train_info/time_within_train_step": 2.523265838623047, "step": 2349} {"train_info/time_between_train_steps": 0.0034732818603515625, "step": 2349} {"info/global_step": 2350, "train_info/time_within_train_step": 2.5225391387939453, "step": 2350} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746329351, "_runtime": 6399}, "step": 2350} {"logs": {"train/loss": 4.018, "train/learning_rate": 0.0001444444444444444, "train/epoch": 2.19, "_timestamp": 1746329351, "_runtime": 6399}, "step": 2350} {"train_info/time_between_train_steps": 0.025074005126953125, "step": 2350} {"info/global_step": 2351, "train_info/time_within_train_step": 2.5235393047332764, "step": 2351} {"train_info/time_between_train_steps": 0.003438234329223633, "step": 2351} {"info/global_step": 2352, "train_info/time_within_train_step": 2.522855520248413, "step": 2352} {"train_info/time_between_train_steps": 0.0034346580505371094, "step": 2352} {"info/global_step": 2353, "train_info/time_within_train_step": 2.5236048698425293, "step": 2353} {"train_info/time_between_train_steps": 0.0034966468811035156, "step": 2353} {"info/global_step": 2354, "train_info/time_within_train_step": 2.5236124992370605, "step": 2354} {"train_info/time_between_train_steps": 0.003519773483276367, "step": 2354} {"info/global_step": 2355, "train_info/time_within_train_step": 2.5232648849487305, "step": 2355} {"train_info/time_between_train_steps": 0.0034797191619873047, "step": 2355} {"info/global_step": 2356, "train_info/time_within_train_step": 2.5231642723083496, "step": 2356} {"train_info/time_between_train_steps": 0.0034308433532714844, "step": 2356} {"info/global_step": 2357, "train_info/time_within_train_step": 2.5240325927734375, "step": 2357} {"train_info/time_between_train_steps": 0.0036516189575195312, "step": 2357} {"info/global_step": 2358, "train_info/time_within_train_step": 2.523104667663574, "step": 2358} {"train_info/time_between_train_steps": 0.0035343170166015625, "step": 2358} {"info/global_step": 2359, "train_info/time_within_train_step": 2.524303436279297, "step": 2359} {"train_info/time_between_train_steps": 0.003759145736694336, "step": 2359} {"info/global_step": 2360, "train_info/time_within_train_step": 2.5571908950805664, "step": 2360} {"train_info/time_between_train_steps": 0.003503561019897461, "step": 2360} {"info/global_step": 2361, "train_info/time_within_train_step": 2.5231001377105713, "step": 2361} {"train_info/time_between_train_steps": 0.0034918785095214844, "step": 2361} {"info/global_step": 2362, "train_info/time_within_train_step": 2.5235867500305176, "step": 2362} {"train_info/time_between_train_steps": 0.003498554229736328, "step": 2362} {"info/global_step": 2363, "train_info/time_within_train_step": 2.523364305496216, "step": 2363} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 2363} {"info/global_step": 2364, "train_info/time_within_train_step": 2.532747268676758, "step": 2364} {"train_info/time_between_train_steps": 0.0031108856201171875, "step": 2364} {"info/global_step": 2365, "train_info/time_within_train_step": 2.521045684814453, "step": 2365} {"train_info/time_between_train_steps": 0.0031011104583740234, "step": 2365} {"info/global_step": 2366, "train_info/time_within_train_step": 2.5217642784118652, "step": 2366} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 2366} {"info/global_step": 2367, "train_info/time_within_train_step": 2.521627902984619, "step": 2367} {"train_info/time_between_train_steps": 0.0032465457916259766, "step": 2367} {"info/global_step": 2368, "train_info/time_within_train_step": 2.521366834640503, "step": 2368} {"train_info/time_between_train_steps": 0.0032958984375, "step": 2368} {"info/global_step": 2369, "train_info/time_within_train_step": 2.5202877521514893, "step": 2369} {"train_info/time_between_train_steps": 0.0032720565795898438, "step": 2369} {"info/global_step": 2370, "train_info/time_within_train_step": 2.5213775634765625, "step": 2370} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 2370} {"info/global_step": 2371, "train_info/time_within_train_step": 2.5206551551818848, "step": 2371} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 2371} {"info/global_step": 2372, "train_info/time_within_train_step": 2.521313428878784, "step": 2372} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 2372} {"info/global_step": 2373, "train_info/time_within_train_step": 2.5214364528656006, "step": 2373} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 2373} {"info/global_step": 2374, "train_info/time_within_train_step": 2.5217926502227783, "step": 2374} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 2374} {"info/global_step": 2375, "train_info/time_within_train_step": 2.522287368774414, "step": 2375} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 2375} {"info/global_step": 2376, "train_info/time_within_train_step": 2.520453929901123, "step": 2376} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 2376} {"info/global_step": 2377, "train_info/time_within_train_step": 2.5210447311401367, "step": 2377} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 2377} {"info/global_step": 2378, "train_info/time_within_train_step": 2.521256446838379, "step": 2378} {"train_info/time_between_train_steps": 0.003073453903198242, "step": 2378} {"info/global_step": 2379, "train_info/time_within_train_step": 2.520899772644043, "step": 2379} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 2379} {"info/global_step": 2380, "train_info/time_within_train_step": 2.5209152698516846, "step": 2380} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 2380} {"info/global_step": 2381, "train_info/time_within_train_step": 2.5207364559173584, "step": 2381} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 2381} {"info/global_step": 2382, "train_info/time_within_train_step": 2.521003484725952, "step": 2382} {"train_info/time_between_train_steps": 0.003094911575317383, "step": 2382} {"info/global_step": 2383, "train_info/time_within_train_step": 2.5199406147003174, "step": 2383} {"train_info/time_between_train_steps": 0.0030651092529296875, "step": 2383} {"info/global_step": 2384, "train_info/time_within_train_step": 2.5206058025360107, "step": 2384} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 2384} {"info/global_step": 2385, "train_info/time_within_train_step": 2.5202829837799072, "step": 2385} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 2385} {"info/global_step": 2386, "train_info/time_within_train_step": 2.52121901512146, "step": 2386} {"train_info/time_between_train_steps": 0.0030820369720458984, "step": 2386} {"info/global_step": 2387, "train_info/time_within_train_step": 2.521329641342163, "step": 2387} {"train_info/time_between_train_steps": 0.0030672550201416016, "step": 2387} {"info/global_step": 2388, "train_info/time_within_train_step": 2.5212948322296143, "step": 2388} {"train_info/time_between_train_steps": 0.003072023391723633, "step": 2388} {"info/global_step": 2389, "train_info/time_within_train_step": 2.5204122066497803, "step": 2389} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 2389} {"info/global_step": 2390, "train_info/time_within_train_step": 2.5209696292877197, "step": 2390} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 2390} {"info/global_step": 2391, "train_info/time_within_train_step": 2.5207712650299072, "step": 2391} {"train_info/time_between_train_steps": 0.003078937530517578, "step": 2391} {"info/global_step": 2392, "train_info/time_within_train_step": 2.5211825370788574, "step": 2392} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 2392} {"info/global_step": 2393, "train_info/time_within_train_step": 2.5213112831115723, "step": 2393} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 2393} {"info/global_step": 2394, "train_info/time_within_train_step": 2.5207762718200684, "step": 2394} {"train_info/time_between_train_steps": 0.0030930042266845703, "step": 2394} {"info/global_step": 2395, "train_info/time_within_train_step": 2.5205588340759277, "step": 2395} {"train_info/time_between_train_steps": 0.003078937530517578, "step": 2395} {"info/global_step": 2396, "train_info/time_within_train_step": 2.549342155456543, "step": 2396} {"train_info/time_between_train_steps": 0.003327608108520508, "step": 2396} {"info/global_step": 2397, "train_info/time_within_train_step": 2.521399974822998, "step": 2397} {"train_info/time_between_train_steps": 0.003070354461669922, "step": 2397} {"info/global_step": 2398, "train_info/time_within_train_step": 2.52093243598938, "step": 2398} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 2398} {"info/global_step": 2399, "train_info/time_within_train_step": 2.5215184688568115, "step": 2399} {"train_info/time_between_train_steps": 0.003272533416748047, "step": 2399} {"info/global_step": 2400, "train_info/time_within_train_step": 2.521296501159668, "step": 2400} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746329478, "_runtime": 6526}, "step": 2400} {"logs": {"train/loss": 4.0038, "train/learning_rate": 0.0001333333333333333, "train/epoch": 2.21, "_timestamp": 1746329478, "_runtime": 6526}, "step": 2400} {"train_info/time_between_train_steps": 12.920542478561401, "step": 2400} {"info/global_step": 2401, "train_info/time_within_train_step": 2.335667610168457, "step": 2401} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 2401} {"info/global_step": 2402, "train_info/time_within_train_step": 2.3280999660491943, "step": 2402} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 2402} {"info/global_step": 2403, "train_info/time_within_train_step": 2.5020763874053955, "step": 2403} {"train_info/time_between_train_steps": 0.003074169158935547, "step": 2403} {"info/global_step": 2404, "train_info/time_within_train_step": 2.5195164680480957, "step": 2404} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 2404} {"info/global_step": 2405, "train_info/time_within_train_step": 2.5200047492980957, "step": 2405} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 2405} {"info/global_step": 2406, "train_info/time_within_train_step": 2.521226167678833, "step": 2406} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 2406} {"info/global_step": 2407, "train_info/time_within_train_step": 2.5210912227630615, "step": 2407} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 2407} {"info/global_step": 2408, "train_info/time_within_train_step": 2.5203139781951904, "step": 2408} {"train_info/time_between_train_steps": 0.0032749176025390625, "step": 2408} {"info/global_step": 2409, "train_info/time_within_train_step": 2.5215003490448, "step": 2409} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 2409} {"info/global_step": 2410, "train_info/time_within_train_step": 2.5209827423095703, "step": 2410} {"train_info/time_between_train_steps": 0.003047466278076172, "step": 2410} {"info/global_step": 2411, "train_info/time_within_train_step": 2.5209906101226807, "step": 2411} {"train_info/time_between_train_steps": 0.0030994415283203125, "step": 2411} {"info/global_step": 2412, "train_info/time_within_train_step": 2.5218660831451416, "step": 2412} {"train_info/time_between_train_steps": 0.003038167953491211, "step": 2412} {"info/global_step": 2413, "train_info/time_within_train_step": 2.5222175121307373, "step": 2413} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 2413} {"info/global_step": 2414, "train_info/time_within_train_step": 2.5218868255615234, "step": 2414} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 2414} {"info/global_step": 2415, "train_info/time_within_train_step": 2.7243449687957764, "step": 2415} {"train_info/time_between_train_steps": 0.003110170364379883, "step": 2415} {"info/global_step": 2416, "train_info/time_within_train_step": 2.521669864654541, "step": 2416} {"train_info/time_between_train_steps": 0.0030944347381591797, "step": 2416} {"info/global_step": 2417, "train_info/time_within_train_step": 2.5229763984680176, "step": 2417} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 2417} {"info/global_step": 2418, "train_info/time_within_train_step": 2.5217394828796387, "step": 2418} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 2418} {"info/global_step": 2419, "train_info/time_within_train_step": 2.5218868255615234, "step": 2419} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 2419} {"info/global_step": 2420, "train_info/time_within_train_step": 2.5230553150177, "step": 2420} {"train_info/time_between_train_steps": 0.0030906200408935547, "step": 2420} {"info/global_step": 2421, "train_info/time_within_train_step": 2.5231587886810303, "step": 2421} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 2421} {"info/global_step": 2422, "train_info/time_within_train_step": 2.522742986679077, "step": 2422} {"train_info/time_between_train_steps": 0.0031118392944335938, "step": 2422} {"info/global_step": 2423, "train_info/time_within_train_step": 2.522024631500244, "step": 2423} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 2423} {"info/global_step": 2424, "train_info/time_within_train_step": 2.522272825241089, "step": 2424} {"train_info/time_between_train_steps": 0.0030541419982910156, "step": 2424} {"info/global_step": 2425, "train_info/time_within_train_step": 2.522094488143921, "step": 2425} {"train_info/time_between_train_steps": 0.0032758712768554688, "step": 2425} {"info/global_step": 2426, "train_info/time_within_train_step": 2.5546696186065674, "step": 2426} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 2426} {"info/global_step": 2427, "train_info/time_within_train_step": 2.5231094360351562, "step": 2427} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 2427} {"info/global_step": 2428, "train_info/time_within_train_step": 2.5217549800872803, "step": 2428} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 2428} {"info/global_step": 2429, "train_info/time_within_train_step": 2.521625280380249, "step": 2429} {"train_info/time_between_train_steps": 0.003052234649658203, "step": 2429} {"info/global_step": 2430, "train_info/time_within_train_step": 2.5219204425811768, "step": 2430} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 2430} {"info/global_step": 2431, "train_info/time_within_train_step": 2.522003650665283, "step": 2431} {"train_info/time_between_train_steps": 0.003092050552368164, "step": 2431} {"info/global_step": 2432, "train_info/time_within_train_step": 2.523042678833008, "step": 2432} {"train_info/time_between_train_steps": 0.0030965805053710938, "step": 2432} {"info/global_step": 2433, "train_info/time_within_train_step": 2.523041009902954, "step": 2433} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 2433} {"info/global_step": 2434, "train_info/time_within_train_step": 2.5221049785614014, "step": 2434} {"train_info/time_between_train_steps": 0.00304412841796875, "step": 2434} {"info/global_step": 2435, "train_info/time_within_train_step": 2.5223448276519775, "step": 2435} {"train_info/time_between_train_steps": 0.00311279296875, "step": 2435} {"info/global_step": 2436, "train_info/time_within_train_step": 2.5223960876464844, "step": 2436} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 2436} {"info/global_step": 2437, "train_info/time_within_train_step": 2.522752046585083, "step": 2437} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 2437} {"info/global_step": 2438, "train_info/time_within_train_step": 2.5227878093719482, "step": 2438} {"train_info/time_between_train_steps": 0.0030808448791503906, "step": 2438} {"info/global_step": 2439, "train_info/time_within_train_step": 2.52274489402771, "step": 2439} {"train_info/time_between_train_steps": 0.0030722618103027344, "step": 2439} {"info/global_step": 2440, "train_info/time_within_train_step": 2.5231826305389404, "step": 2440} {"train_info/time_between_train_steps": 0.003316640853881836, "step": 2440} {"info/global_step": 2441, "train_info/time_within_train_step": 2.5223395824432373, "step": 2441} {"train_info/time_between_train_steps": 0.0030939579010009766, "step": 2441} {"info/global_step": 2442, "train_info/time_within_train_step": 2.521535873413086, "step": 2442} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 2442} {"info/global_step": 2443, "train_info/time_within_train_step": 2.522279739379883, "step": 2443} {"train_info/time_between_train_steps": 0.0030553340911865234, "step": 2443} {"info/global_step": 2444, "train_info/time_within_train_step": 2.5224108695983887, "step": 2444} {"train_info/time_between_train_steps": 0.0030739307403564453, "step": 2444} {"info/global_step": 2445, "train_info/time_within_train_step": 2.5216739177703857, "step": 2445} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 2445} {"info/global_step": 2446, "train_info/time_within_train_step": 2.5221872329711914, "step": 2446} {"train_info/time_between_train_steps": 0.0030775070190429688, "step": 2446} {"info/global_step": 2447, "train_info/time_within_train_step": 2.5215580463409424, "step": 2447} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 2447} {"info/global_step": 2448, "train_info/time_within_train_step": 2.522705078125, "step": 2448} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 2448} {"info/global_step": 2449, "train_info/time_within_train_step": 2.522108554840088, "step": 2449} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 2449} {"info/global_step": 2450, "train_info/time_within_train_step": 2.52272891998291, "step": 2450} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746329618, "_runtime": 6666}, "step": 2450} {"logs": {"train/loss": 3.9859, "train/learning_rate": 0.00012222222222222221, "train/epoch": 2.22, "_timestamp": 1746329618, "_runtime": 6666}, "step": 2450} {"train_info/time_between_train_steps": 0.02484869956970215, "step": 2450} {"info/global_step": 2451, "train_info/time_within_train_step": 2.5230393409729004, "step": 2451} {"train_info/time_between_train_steps": 0.0032639503479003906, "step": 2451} {"info/global_step": 2452, "train_info/time_within_train_step": 2.5225894451141357, "step": 2452} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 2452} {"info/global_step": 2453, "train_info/time_within_train_step": 2.522552490234375, "step": 2453} {"train_info/time_between_train_steps": 0.003116607666015625, "step": 2453} {"info/global_step": 2454, "train_info/time_within_train_step": 2.5226423740386963, "step": 2454} {"train_info/time_between_train_steps": 0.003080129623413086, "step": 2454} {"info/global_step": 2455, "train_info/time_within_train_step": 2.522688627243042, "step": 2455} {"train_info/time_between_train_steps": 0.0030617713928222656, "step": 2455} {"info/global_step": 2456, "train_info/time_within_train_step": 2.697152853012085, "step": 2456} {"train_info/time_between_train_steps": 0.00308990478515625, "step": 2456} {"info/global_step": 2457, "train_info/time_within_train_step": 2.521514892578125, "step": 2457} {"train_info/time_between_train_steps": 0.0030913352966308594, "step": 2457} {"info/global_step": 2458, "train_info/time_within_train_step": 2.522049903869629, "step": 2458} {"train_info/time_between_train_steps": 0.0032608509063720703, "step": 2458} {"info/global_step": 2459, "train_info/time_within_train_step": 2.5225374698638916, "step": 2459} {"train_info/time_between_train_steps": 0.0031211376190185547, "step": 2459} {"info/global_step": 2460, "train_info/time_within_train_step": 2.521277904510498, "step": 2460} {"train_info/time_between_train_steps": 0.0030727386474609375, "step": 2460} {"info/global_step": 2461, "train_info/time_within_train_step": 2.521507740020752, "step": 2461} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 2461} {"info/global_step": 2462, "train_info/time_within_train_step": 2.549513101577759, "step": 2462} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 2462} {"info/global_step": 2463, "train_info/time_within_train_step": 2.522446870803833, "step": 2463} {"train_info/time_between_train_steps": 0.0030782222747802734, "step": 2463} {"info/global_step": 2464, "train_info/time_within_train_step": 2.521764039993286, "step": 2464} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 2464} {"info/global_step": 2465, "train_info/time_within_train_step": 2.522082805633545, "step": 2465} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 2465} {"info/global_step": 2466, "train_info/time_within_train_step": 2.5221471786499023, "step": 2466} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 2466} {"info/global_step": 2467, "train_info/time_within_train_step": 2.5215606689453125, "step": 2467} {"train_info/time_between_train_steps": 0.0030705928802490234, "step": 2467} {"info/global_step": 2468, "train_info/time_within_train_step": 2.5216965675354004, "step": 2468} {"train_info/time_between_train_steps": 0.0031168460845947266, "step": 2468} {"info/global_step": 2469, "train_info/time_within_train_step": 2.522348642349243, "step": 2469} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 2469} {"info/global_step": 2470, "train_info/time_within_train_step": 2.5221195220947266, "step": 2470} {"train_info/time_between_train_steps": 0.003531217575073242, "step": 2470} {"info/global_step": 2471, "train_info/time_within_train_step": 2.52347993850708, "step": 2471} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 2471} {"info/global_step": 2472, "train_info/time_within_train_step": 2.5222291946411133, "step": 2472} {"train_info/time_between_train_steps": 0.0033769607543945312, "step": 2472} {"info/global_step": 2473, "train_info/time_within_train_step": 2.52193284034729, "step": 2473} {"train_info/time_between_train_steps": 0.0033037662506103516, "step": 2473} {"info/global_step": 2474, "train_info/time_within_train_step": 2.5222833156585693, "step": 2474} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 2474} {"info/global_step": 2475, "train_info/time_within_train_step": 2.522887706756592, "step": 2475} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 2475} {"info/global_step": 2476, "train_info/time_within_train_step": 2.5222160816192627, "step": 2476} {"train_info/time_between_train_steps": 0.003319263458251953, "step": 2476} {"info/global_step": 2477, "train_info/time_within_train_step": 2.5218257904052734, "step": 2477} {"train_info/time_between_train_steps": 0.0034313201904296875, "step": 2477} {"info/global_step": 2478, "train_info/time_within_train_step": 2.5224287509918213, "step": 2478} {"train_info/time_between_train_steps": 0.00345611572265625, "step": 2478} {"info/global_step": 2479, "train_info/time_within_train_step": 2.5213069915771484, "step": 2479} {"train_info/time_between_train_steps": 0.003419160842895508, "step": 2479} {"info/global_step": 2480, "train_info/time_within_train_step": 2.5217909812927246, "step": 2480} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 2480} {"info/global_step": 2481, "train_info/time_within_train_step": 2.5214152336120605, "step": 2481} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 2481} {"info/global_step": 2482, "train_info/time_within_train_step": 2.522120952606201, "step": 2482} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 2482} {"info/global_step": 2483, "train_info/time_within_train_step": 2.521306276321411, "step": 2483} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 2483} {"info/global_step": 2484, "train_info/time_within_train_step": 2.5232009887695312, "step": 2484} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 2484} {"info/global_step": 2485, "train_info/time_within_train_step": 2.5220348834991455, "step": 2485} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 2485} {"info/global_step": 2486, "train_info/time_within_train_step": 2.5220253467559814, "step": 2486} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 2486} {"info/global_step": 2487, "train_info/time_within_train_step": 2.5215466022491455, "step": 2487} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 2487} {"info/global_step": 2488, "train_info/time_within_train_step": 2.5227105617523193, "step": 2488} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 2488} {"info/global_step": 2489, "train_info/time_within_train_step": 2.523001194000244, "step": 2489} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 2489} {"info/global_step": 2490, "train_info/time_within_train_step": 2.522075891494751, "step": 2490} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 2490} {"info/global_step": 2491, "train_info/time_within_train_step": 2.5224125385284424, "step": 2491} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 2491} {"info/global_step": 2492, "train_info/time_within_train_step": 2.5221047401428223, "step": 2492} {"train_info/time_between_train_steps": 0.0034313201904296875, "step": 2492} {"info/global_step": 2493, "train_info/time_within_train_step": 2.521207809448242, "step": 2493} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 2493} {"info/global_step": 2494, "train_info/time_within_train_step": 2.5217223167419434, "step": 2494} {"train_info/time_between_train_steps": 0.0032868385314941406, "step": 2494} {"info/global_step": 2495, "train_info/time_within_train_step": 2.521692991256714, "step": 2495} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 2495} {"info/global_step": 2496, "train_info/time_within_train_step": 2.521096706390381, "step": 2496} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 2496} {"info/global_step": 2497, "train_info/time_within_train_step": 2.5213513374328613, "step": 2497} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 2497} {"info/global_step": 2498, "train_info/time_within_train_step": 2.5221145153045654, "step": 2498} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 2498} {"info/global_step": 2499, "train_info/time_within_train_step": 3.012606620788574, "step": 2499} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 2499} {"info/global_step": 2500, "train_info/time_within_train_step": 2.52189564704895, "step": 2500} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746329746, "_runtime": 6794}, "step": 2500} {"logs": {"train/loss": 3.9707, "train/learning_rate": 0.00011111111111111109, "train/epoch": 2.24, "_timestamp": 1746329746, "_runtime": 6794}, "step": 2500} {"train_info/time_between_train_steps": 12.578936100006104, "step": 2500} {"info/global_step": 2501, "train_info/time_within_train_step": 2.3323540687561035, "step": 2501} {"train_info/time_between_train_steps": 0.003309965133666992, "step": 2501} {"info/global_step": 2502, "train_info/time_within_train_step": 2.321894407272339, "step": 2502} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 2502} {"info/global_step": 2503, "train_info/time_within_train_step": 2.488507032394409, "step": 2503} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 2503} {"info/global_step": 2504, "train_info/time_within_train_step": 2.519998550415039, "step": 2504} {"train_info/time_between_train_steps": 0.0035059452056884766, "step": 2504} {"info/global_step": 2505, "train_info/time_within_train_step": 2.518958568572998, "step": 2505} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 2505} {"info/global_step": 2506, "train_info/time_within_train_step": 2.5211076736450195, "step": 2506} {"train_info/time_between_train_steps": 0.003269195556640625, "step": 2506} {"info/global_step": 2507, "train_info/time_within_train_step": 2.521439790725708, "step": 2507} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 2507} {"info/global_step": 2508, "train_info/time_within_train_step": 2.5205490589141846, "step": 2508} {"train_info/time_between_train_steps": 0.0033593177795410156, "step": 2508} {"info/global_step": 2509, "train_info/time_within_train_step": 2.5212607383728027, "step": 2509} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 2509} {"info/global_step": 2510, "train_info/time_within_train_step": 2.5210182666778564, "step": 2510} {"train_info/time_between_train_steps": 0.0033490657806396484, "step": 2510} {"info/global_step": 2511, "train_info/time_within_train_step": 2.520646572113037, "step": 2511} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 2511} {"info/global_step": 2512, "train_info/time_within_train_step": 2.5207903385162354, "step": 2512} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 2512} {"info/global_step": 2513, "train_info/time_within_train_step": 2.521627902984619, "step": 2513} {"train_info/time_between_train_steps": 0.003388643264770508, "step": 2513} {"info/global_step": 2514, "train_info/time_within_train_step": 2.5206756591796875, "step": 2514} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 2514} {"info/global_step": 2515, "train_info/time_within_train_step": 2.521240711212158, "step": 2515} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 2515} {"info/global_step": 2516, "train_info/time_within_train_step": 2.5211021900177, "step": 2516} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 2516} {"info/global_step": 2517, "train_info/time_within_train_step": 2.522169589996338, "step": 2517} {"train_info/time_between_train_steps": 0.0034515857696533203, "step": 2517} {"info/global_step": 2518, "train_info/time_within_train_step": 2.5218164920806885, "step": 2518} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 2518} {"info/global_step": 2519, "train_info/time_within_train_step": 2.521421432495117, "step": 2519} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 2519} {"info/global_step": 2520, "train_info/time_within_train_step": 2.5227713584899902, "step": 2520} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 2520} {"info/global_step": 2521, "train_info/time_within_train_step": 2.5221149921417236, "step": 2521} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2521} {"info/global_step": 2522, "train_info/time_within_train_step": 2.522798538208008, "step": 2522} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 2522} {"info/global_step": 2523, "train_info/time_within_train_step": 2.5216403007507324, "step": 2523} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 2523} {"info/global_step": 2524, "train_info/time_within_train_step": 2.521665334701538, "step": 2524} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 2524} {"info/global_step": 2525, "train_info/time_within_train_step": 2.5272750854492188, "step": 2525} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 2525} {"info/global_step": 2526, "train_info/time_within_train_step": 2.5219428539276123, "step": 2526} {"train_info/time_between_train_steps": 0.0033922195434570312, "step": 2526} {"info/global_step": 2527, "train_info/time_within_train_step": 2.521761655807495, "step": 2527} {"train_info/time_between_train_steps": 0.0033750534057617188, "step": 2527} {"info/global_step": 2528, "train_info/time_within_train_step": 2.5507326126098633, "step": 2528} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 2528} {"info/global_step": 2529, "train_info/time_within_train_step": 2.5227980613708496, "step": 2529} {"train_info/time_between_train_steps": 0.003450155258178711, "step": 2529} {"info/global_step": 2530, "train_info/time_within_train_step": 2.5228819847106934, "step": 2530} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 2530} {"info/global_step": 2531, "train_info/time_within_train_step": 2.5235278606414795, "step": 2531} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 2531} {"info/global_step": 2532, "train_info/time_within_train_step": 2.5217783451080322, "step": 2532} {"train_info/time_between_train_steps": 0.0033347606658935547, "step": 2532} {"info/global_step": 2533, "train_info/time_within_train_step": 2.522178888320923, "step": 2533} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 2533} {"info/global_step": 2534, "train_info/time_within_train_step": 2.5222959518432617, "step": 2534} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 2534} {"info/global_step": 2535, "train_info/time_within_train_step": 2.5226058959960938, "step": 2535} {"train_info/time_between_train_steps": 0.0031104087829589844, "step": 2535} {"info/global_step": 2536, "train_info/time_within_train_step": 2.521986246109009, "step": 2536} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 2536} {"info/global_step": 2537, "train_info/time_within_train_step": 2.5212860107421875, "step": 2537} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 2537} {"info/global_step": 2538, "train_info/time_within_train_step": 2.522716760635376, "step": 2538} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 2538} {"info/global_step": 2539, "train_info/time_within_train_step": 2.5223147869110107, "step": 2539} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 2539} {"info/global_step": 2540, "train_info/time_within_train_step": 2.5233256816864014, "step": 2540} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2540} {"info/global_step": 2541, "train_info/time_within_train_step": 2.522028923034668, "step": 2541} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 2541} {"info/global_step": 2542, "train_info/time_within_train_step": 2.521714210510254, "step": 2542} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 2542} {"info/global_step": 2543, "train_info/time_within_train_step": 2.5231916904449463, "step": 2543} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 2543} {"info/global_step": 2544, "train_info/time_within_train_step": 2.5225822925567627, "step": 2544} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 2544} {"info/global_step": 2545, "train_info/time_within_train_step": 2.523132562637329, "step": 2545} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 2545} {"info/global_step": 2546, "train_info/time_within_train_step": 2.521662950515747, "step": 2546} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 2546} {"info/global_step": 2547, "train_info/time_within_train_step": 2.521127462387085, "step": 2547} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 2547} {"info/global_step": 2548, "train_info/time_within_train_step": 2.521423101425171, "step": 2548} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 2548} {"info/global_step": 2549, "train_info/time_within_train_step": 2.5213747024536133, "step": 2549} {"train_info/time_between_train_steps": 0.0033905506134033203, "step": 2549} {"info/global_step": 2550, "train_info/time_within_train_step": 2.5219125747680664, "step": 2550} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746329886, "_runtime": 6934}, "step": 2550} {"logs": {"train/loss": 3.9512, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 2.26, "_timestamp": 1746329886, "_runtime": 6934}, "step": 2550} {"train_info/time_between_train_steps": 0.024204015731811523, "step": 2550} {"info/global_step": 2551, "train_info/time_within_train_step": 2.521740198135376, "step": 2551} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 2551} {"info/global_step": 2552, "train_info/time_within_train_step": 2.5223913192749023, "step": 2552} {"train_info/time_between_train_steps": 0.0034492015838623047, "step": 2552} {"info/global_step": 2553, "train_info/time_within_train_step": 2.5219528675079346, "step": 2553} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 2553} {"info/global_step": 2554, "train_info/time_within_train_step": 2.5209500789642334, "step": 2554} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 2554} {"info/global_step": 2555, "train_info/time_within_train_step": 2.666609287261963, "step": 2555} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 2555} {"info/global_step": 2556, "train_info/time_within_train_step": 2.5219082832336426, "step": 2556} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 2556} {"info/global_step": 2557, "train_info/time_within_train_step": 2.5214288234710693, "step": 2557} {"train_info/time_between_train_steps": 0.003255605697631836, "step": 2557} {"info/global_step": 2558, "train_info/time_within_train_step": 2.5211048126220703, "step": 2558} {"train_info/time_between_train_steps": 0.0030994415283203125, "step": 2558} {"info/global_step": 2559, "train_info/time_within_train_step": 2.521575927734375, "step": 2559} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 2559} {"info/global_step": 2560, "train_info/time_within_train_step": 2.5224554538726807, "step": 2560} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 2560} {"info/global_step": 2561, "train_info/time_within_train_step": 2.5488979816436768, "step": 2561} {"train_info/time_between_train_steps": 0.003348112106323242, "step": 2561} {"info/global_step": 2562, "train_info/time_within_train_step": 2.5227038860321045, "step": 2562} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 2562} {"info/global_step": 2563, "train_info/time_within_train_step": 2.5539515018463135, "step": 2563} {"train_info/time_between_train_steps": 0.0030639171600341797, "step": 2563} {"info/global_step": 2564, "train_info/time_within_train_step": 2.521015167236328, "step": 2564} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 2564} {"info/global_step": 2565, "train_info/time_within_train_step": 2.521145820617676, "step": 2565} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 2565} {"info/global_step": 2566, "train_info/time_within_train_step": 2.5222322940826416, "step": 2566} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 2566} {"info/global_step": 2567, "train_info/time_within_train_step": 2.5208919048309326, "step": 2567} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 2567} {"info/global_step": 2568, "train_info/time_within_train_step": 2.5206828117370605, "step": 2568} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 2568} {"info/global_step": 2569, "train_info/time_within_train_step": 2.5214385986328125, "step": 2569} {"train_info/time_between_train_steps": 0.0032444000244140625, "step": 2569} {"info/global_step": 2570, "train_info/time_within_train_step": 2.5219056606292725, "step": 2570} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 2570} {"info/global_step": 2571, "train_info/time_within_train_step": 2.521721601486206, "step": 2571} {"train_info/time_between_train_steps": 0.0033249855041503906, "step": 2571} {"info/global_step": 2572, "train_info/time_within_train_step": 2.521362781524658, "step": 2572} {"train_info/time_between_train_steps": 0.0032668113708496094, "step": 2572} {"info/global_step": 2573, "train_info/time_within_train_step": 2.5226504802703857, "step": 2573} {"train_info/time_between_train_steps": 0.0032868385314941406, "step": 2573} {"info/global_step": 2574, "train_info/time_within_train_step": 2.522249221801758, "step": 2574} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 2574} {"info/global_step": 2575, "train_info/time_within_train_step": 2.521923780441284, "step": 2575} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 2575} {"info/global_step": 2576, "train_info/time_within_train_step": 2.5224790573120117, "step": 2576} {"train_info/time_between_train_steps": 0.0034198760986328125, "step": 2576} {"info/global_step": 2577, "train_info/time_within_train_step": 2.5222856998443604, "step": 2577} {"train_info/time_between_train_steps": 0.0034890174865722656, "step": 2577} {"info/global_step": 2578, "train_info/time_within_train_step": 2.5212442874908447, "step": 2578} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 2578} {"info/global_step": 2579, "train_info/time_within_train_step": 2.521310806274414, "step": 2579} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 2579} {"info/global_step": 2580, "train_info/time_within_train_step": 2.5208804607391357, "step": 2580} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 2580} {"info/global_step": 2581, "train_info/time_within_train_step": 2.5209224224090576, "step": 2581} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 2581} {"info/global_step": 2582, "train_info/time_within_train_step": 2.5201056003570557, "step": 2582} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 2582} {"info/global_step": 2583, "train_info/time_within_train_step": 2.520622491836548, "step": 2583} {"train_info/time_between_train_steps": 0.0035071372985839844, "step": 2583} {"info/global_step": 2584, "train_info/time_within_train_step": 2.521726131439209, "step": 2584} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 2584} {"info/global_step": 2585, "train_info/time_within_train_step": 2.5208678245544434, "step": 2585} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 2585} {"info/global_step": 2586, "train_info/time_within_train_step": 2.520667791366577, "step": 2586} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 2586} {"info/global_step": 2587, "train_info/time_within_train_step": 2.5201077461242676, "step": 2587} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 2587} {"info/global_step": 2588, "train_info/time_within_train_step": 2.5203306674957275, "step": 2588} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 2588} {"info/global_step": 2589, "train_info/time_within_train_step": 2.5203967094421387, "step": 2589} {"train_info/time_between_train_steps": 0.003378152847290039, "step": 2589} {"info/global_step": 2590, "train_info/time_within_train_step": 2.521319627761841, "step": 2590} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2590} {"info/global_step": 2591, "train_info/time_within_train_step": 2.5212764739990234, "step": 2591} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 2591} {"info/global_step": 2592, "train_info/time_within_train_step": 2.5219554901123047, "step": 2592} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 2592} {"info/global_step": 2593, "train_info/time_within_train_step": 2.5219013690948486, "step": 2593} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 2593} {"info/global_step": 2594, "train_info/time_within_train_step": 2.5215606689453125, "step": 2594} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 2594} {"info/global_step": 2595, "train_info/time_within_train_step": 2.522895336151123, "step": 2595} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 2595} {"info/global_step": 2596, "train_info/time_within_train_step": 2.522162437438965, "step": 2596} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 2596} {"info/global_step": 2597, "train_info/time_within_train_step": 2.5222792625427246, "step": 2597} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 2597} {"info/global_step": 2598, "train_info/time_within_train_step": 2.5230236053466797, "step": 2598} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 2598} {"info/global_step": 2599, "train_info/time_within_train_step": 2.5219883918762207, "step": 2599} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 2599} {"info/global_step": 2600, "train_info/time_within_train_step": 2.522472381591797, "step": 2600} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746330013, "_runtime": 7061}, "step": 2600} {"logs": {"train/loss": 3.9411, "train/learning_rate": 8.888888888888888e-05, "train/epoch": 2.27, "_timestamp": 1746330013, "_runtime": 7061}, "step": 2600} {"train_info/time_between_train_steps": 12.361456871032715, "step": 2600} {"info/global_step": 2601, "train_info/time_within_train_step": 2.335391044616699, "step": 2601} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 2601} {"info/global_step": 2602, "train_info/time_within_train_step": 2.3236684799194336, "step": 2602} {"train_info/time_between_train_steps": 0.0033550262451171875, "step": 2602} {"info/global_step": 2603, "train_info/time_within_train_step": 2.4929261207580566, "step": 2603} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 2603} {"info/global_step": 2604, "train_info/time_within_train_step": 2.5190062522888184, "step": 2604} {"train_info/time_between_train_steps": 0.0033142566680908203, "step": 2604} {"info/global_step": 2605, "train_info/time_within_train_step": 2.518714666366577, "step": 2605} {"train_info/time_between_train_steps": 0.00341796875, "step": 2605} {"info/global_step": 2606, "train_info/time_within_train_step": 2.519804000854492, "step": 2606} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 2606} {"info/global_step": 2607, "train_info/time_within_train_step": 2.519753932952881, "step": 2607} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 2607} {"info/global_step": 2608, "train_info/time_within_train_step": 2.5207483768463135, "step": 2608} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 2608} {"info/global_step": 2609, "train_info/time_within_train_step": 2.620798110961914, "step": 2609} {"train_info/time_between_train_steps": 0.003416776657104492, "step": 2609} {"info/global_step": 2610, "train_info/time_within_train_step": 2.521470546722412, "step": 2610} {"train_info/time_between_train_steps": 0.003094196319580078, "step": 2610} {"info/global_step": 2611, "train_info/time_within_train_step": 2.520692825317383, "step": 2611} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 2611} {"info/global_step": 2612, "train_info/time_within_train_step": 2.5218634605407715, "step": 2612} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 2612} {"info/global_step": 2613, "train_info/time_within_train_step": 2.520768404006958, "step": 2613} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 2613} {"info/global_step": 2614, "train_info/time_within_train_step": 2.521449327468872, "step": 2614} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 2614} {"info/global_step": 2615, "train_info/time_within_train_step": 2.5224406719207764, "step": 2615} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 2615} {"info/global_step": 2616, "train_info/time_within_train_step": 2.521716833114624, "step": 2616} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 2616} {"info/global_step": 2617, "train_info/time_within_train_step": 2.5229721069335938, "step": 2617} {"train_info/time_between_train_steps": 0.003457784652709961, "step": 2617} {"info/global_step": 2618, "train_info/time_within_train_step": 2.5215046405792236, "step": 2618} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 2618} {"info/global_step": 2619, "train_info/time_within_train_step": 2.521306037902832, "step": 2619} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 2619} {"info/global_step": 2620, "train_info/time_within_train_step": 2.5211470127105713, "step": 2620} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 2620} {"info/global_step": 2621, "train_info/time_within_train_step": 2.5213119983673096, "step": 2621} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 2621} {"info/global_step": 2622, "train_info/time_within_train_step": 2.5211398601531982, "step": 2622} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 2622} {"info/global_step": 2623, "train_info/time_within_train_step": 2.520798683166504, "step": 2623} {"train_info/time_between_train_steps": 0.0033354759216308594, "step": 2623} {"info/global_step": 2624, "train_info/time_within_train_step": 2.521981716156006, "step": 2624} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 2624} {"info/global_step": 2625, "train_info/time_within_train_step": 2.5212790966033936, "step": 2625} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 2625} {"info/global_step": 2626, "train_info/time_within_train_step": 2.5204222202301025, "step": 2626} {"train_info/time_between_train_steps": 0.003383636474609375, "step": 2626} {"info/global_step": 2627, "train_info/time_within_train_step": 2.5206706523895264, "step": 2627} {"train_info/time_between_train_steps": 0.0035860538482666016, "step": 2627} {"info/global_step": 2628, "train_info/time_within_train_step": 2.520977258682251, "step": 2628} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 2628} {"info/global_step": 2629, "train_info/time_within_train_step": 2.52173113822937, "step": 2629} {"train_info/time_between_train_steps": 0.003343343734741211, "step": 2629} {"info/global_step": 2630, "train_info/time_within_train_step": 2.5223817825317383, "step": 2630} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 2630} {"info/global_step": 2631, "train_info/time_within_train_step": 2.520570755004883, "step": 2631} {"train_info/time_between_train_steps": 0.003270864486694336, "step": 2631} {"info/global_step": 2632, "train_info/time_within_train_step": 2.5202088356018066, "step": 2632} {"train_info/time_between_train_steps": 0.003367900848388672, "step": 2632} {"info/global_step": 2633, "train_info/time_within_train_step": 2.52077054977417, "step": 2633} {"train_info/time_between_train_steps": 0.0032606124877929688, "step": 2633} {"info/global_step": 2634, "train_info/time_within_train_step": 2.521653413772583, "step": 2634} {"train_info/time_between_train_steps": 0.0033216476440429688, "step": 2634} {"info/global_step": 2635, "train_info/time_within_train_step": 2.520318031311035, "step": 2635} {"train_info/time_between_train_steps": 0.0035393238067626953, "step": 2635} {"info/global_step": 2636, "train_info/time_within_train_step": 2.5204107761383057, "step": 2636} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 2636} {"info/global_step": 2637, "train_info/time_within_train_step": 2.5206634998321533, "step": 2637} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 2637} {"info/global_step": 2638, "train_info/time_within_train_step": 2.5213558673858643, "step": 2638} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 2638} {"info/global_step": 2639, "train_info/time_within_train_step": 2.520650863647461, "step": 2639} {"train_info/time_between_train_steps": 0.003496885299682617, "step": 2639} {"info/global_step": 2640, "train_info/time_within_train_step": 2.5205001831054688, "step": 2640} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 2640} {"info/global_step": 2641, "train_info/time_within_train_step": 2.5217950344085693, "step": 2641} {"train_info/time_between_train_steps": 0.0032935142517089844, "step": 2641} {"info/global_step": 2642, "train_info/time_within_train_step": 2.5203781127929688, "step": 2642} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 2642} {"info/global_step": 2643, "train_info/time_within_train_step": 2.520705461502075, "step": 2643} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 2643} {"info/global_step": 2644, "train_info/time_within_train_step": 2.5211939811706543, "step": 2644} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 2644} {"info/global_step": 2645, "train_info/time_within_train_step": 2.5217857360839844, "step": 2645} {"train_info/time_between_train_steps": 0.0032863616943359375, "step": 2645} {"info/global_step": 2646, "train_info/time_within_train_step": 2.6060595512390137, "step": 2646} {"train_info/time_between_train_steps": 0.003231048583984375, "step": 2646} {"info/global_step": 2647, "train_info/time_within_train_step": 2.5217137336730957, "step": 2647} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 2647} {"info/global_step": 2648, "train_info/time_within_train_step": 2.520967960357666, "step": 2648} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2648} {"info/global_step": 2649, "train_info/time_within_train_step": 2.5212249755859375, "step": 2649} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 2649} {"info/global_step": 2650, "train_info/time_within_train_step": 2.5206756591796875, "step": 2650} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746330152, "_runtime": 7200}, "step": 2650} {"logs": {"train/loss": 3.9293, "train/learning_rate": 7.777777777777777e-05, "train/epoch": 2.29, "_timestamp": 1746330152, "_runtime": 7200}, "step": 2650} {"train_info/time_between_train_steps": 0.02539682388305664, "step": 2650} {"info/global_step": 2651, "train_info/time_within_train_step": 2.547969102859497, "step": 2651} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 2651} {"info/global_step": 2652, "train_info/time_within_train_step": 2.5206003189086914, "step": 2652} {"train_info/time_between_train_steps": 0.0030715465545654297, "step": 2652} {"info/global_step": 2653, "train_info/time_within_train_step": 2.554901599884033, "step": 2653} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 2653} {"info/global_step": 2654, "train_info/time_within_train_step": 2.520970582962036, "step": 2654} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2654} {"info/global_step": 2655, "train_info/time_within_train_step": 2.5219290256500244, "step": 2655} {"train_info/time_between_train_steps": 0.0036389827728271484, "step": 2655} {"info/global_step": 2656, "train_info/time_within_train_step": 2.5215232372283936, "step": 2656} {"train_info/time_between_train_steps": 0.0034961700439453125, "step": 2656} {"info/global_step": 2657, "train_info/time_within_train_step": 2.52160906791687, "step": 2657} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 2657} {"info/global_step": 2658, "train_info/time_within_train_step": 2.5230228900909424, "step": 2658} {"train_info/time_between_train_steps": 0.0036554336547851562, "step": 2658} {"info/global_step": 2659, "train_info/time_within_train_step": 2.5222744941711426, "step": 2659} {"train_info/time_between_train_steps": 0.0038111209869384766, "step": 2659} {"info/global_step": 2660, "train_info/time_within_train_step": 2.521472930908203, "step": 2660} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 2660} {"info/global_step": 2661, "train_info/time_within_train_step": 2.5219056606292725, "step": 2661} {"train_info/time_between_train_steps": 0.003775358200073242, "step": 2661} {"info/global_step": 2662, "train_info/time_within_train_step": 2.523049831390381, "step": 2662} {"train_info/time_between_train_steps": 0.003713846206665039, "step": 2662} {"info/global_step": 2663, "train_info/time_within_train_step": 2.5213637351989746, "step": 2663} {"train_info/time_between_train_steps": 0.0036449432373046875, "step": 2663} {"info/global_step": 2664, "train_info/time_within_train_step": 2.5221993923187256, "step": 2664} {"train_info/time_between_train_steps": 0.003764629364013672, "step": 2664} {"info/global_step": 2665, "train_info/time_within_train_step": 2.521730899810791, "step": 2665} {"train_info/time_between_train_steps": 0.003416776657104492, "step": 2665} {"info/global_step": 2666, "train_info/time_within_train_step": 2.52164363861084, "step": 2666} {"train_info/time_between_train_steps": 0.003681659698486328, "step": 2666} {"info/global_step": 2667, "train_info/time_within_train_step": 2.521498203277588, "step": 2667} {"train_info/time_between_train_steps": 0.0037360191345214844, "step": 2667} {"info/global_step": 2668, "train_info/time_within_train_step": 2.5220136642456055, "step": 2668} {"train_info/time_between_train_steps": 0.0034499168395996094, "step": 2668} {"info/global_step": 2669, "train_info/time_within_train_step": 2.5213844776153564, "step": 2669} {"train_info/time_between_train_steps": 0.003862142562866211, "step": 2669} {"info/global_step": 2670, "train_info/time_within_train_step": 2.5228068828582764, "step": 2670} {"train_info/time_between_train_steps": 0.004141807556152344, "step": 2670} {"info/global_step": 2671, "train_info/time_within_train_step": 2.5231411457061768, "step": 2671} {"train_info/time_between_train_steps": 0.0038437843322753906, "step": 2671} {"info/global_step": 2672, "train_info/time_within_train_step": 2.5220539569854736, "step": 2672} {"train_info/time_between_train_steps": 0.0038483142852783203, "step": 2672} {"info/global_step": 2673, "train_info/time_within_train_step": 2.5229690074920654, "step": 2673} {"train_info/time_between_train_steps": 0.00406646728515625, "step": 2673} {"info/global_step": 2674, "train_info/time_within_train_step": 2.5229222774505615, "step": 2674} {"train_info/time_between_train_steps": 0.0038471221923828125, "step": 2674} {"info/global_step": 2675, "train_info/time_within_train_step": 2.52289080619812, "step": 2675} {"train_info/time_between_train_steps": 0.004388332366943359, "step": 2675} {"info/global_step": 2676, "train_info/time_within_train_step": 2.52376389503479, "step": 2676} {"train_info/time_between_train_steps": 0.004240989685058594, "step": 2676} {"train_info/time_between_train_steps": 2.8488080501556396, "step": 2676} {"info/global_step": 2677, "train_info/time_within_train_step": 2.8257977962493896, "step": 2677} {"train_info/time_between_train_steps": 0.003465414047241211, "step": 2677} {"info/global_step": 2678, "train_info/time_within_train_step": 2.5195791721343994, "step": 2678} {"train_info/time_between_train_steps": 0.0034971237182617188, "step": 2678} {"info/global_step": 2679, "train_info/time_within_train_step": 2.5196585655212402, "step": 2679} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 2679} {"info/global_step": 2680, "train_info/time_within_train_step": 2.520334005355835, "step": 2680} {"train_info/time_between_train_steps": 0.0035276412963867188, "step": 2680} {"info/global_step": 2681, "train_info/time_within_train_step": 2.5211524963378906, "step": 2681} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 2681} {"info/global_step": 2682, "train_info/time_within_train_step": 2.520352840423584, "step": 2682} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 2682} {"info/global_step": 2683, "train_info/time_within_train_step": 2.5208659172058105, "step": 2683} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 2683} {"info/global_step": 2684, "train_info/time_within_train_step": 2.5211715698242188, "step": 2684} {"train_info/time_between_train_steps": 0.003447294235229492, "step": 2684} {"info/global_step": 2685, "train_info/time_within_train_step": 2.520841121673584, "step": 2685} {"train_info/time_between_train_steps": 0.0035240650177001953, "step": 2685} {"info/global_step": 2686, "train_info/time_within_train_step": 2.5203006267547607, "step": 2686} {"train_info/time_between_train_steps": 0.003549337387084961, "step": 2686} {"info/global_step": 2687, "train_info/time_within_train_step": 2.5214102268218994, "step": 2687} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 2687} {"info/global_step": 2688, "train_info/time_within_train_step": 2.5207929611206055, "step": 2688} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 2688} {"info/global_step": 2689, "train_info/time_within_train_step": 2.5212934017181396, "step": 2689} {"train_info/time_between_train_steps": 0.0035164356231689453, "step": 2689} {"info/global_step": 2690, "train_info/time_within_train_step": 2.5212697982788086, "step": 2690} {"train_info/time_between_train_steps": 0.003627777099609375, "step": 2690} {"info/global_step": 2691, "train_info/time_within_train_step": 2.520984172821045, "step": 2691} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 2691} {"info/global_step": 2692, "train_info/time_within_train_step": 2.520287275314331, "step": 2692} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 2692} {"info/global_step": 2693, "train_info/time_within_train_step": 2.5200235843658447, "step": 2693} {"train_info/time_between_train_steps": 0.003573894500732422, "step": 2693} {"info/global_step": 2694, "train_info/time_within_train_step": 2.5218770503997803, "step": 2694} {"train_info/time_between_train_steps": 0.003622770309448242, "step": 2694} {"info/global_step": 2695, "train_info/time_within_train_step": 2.5203959941864014, "step": 2695} {"train_info/time_between_train_steps": 0.0035555362701416016, "step": 2695} {"info/global_step": 2696, "train_info/time_within_train_step": 2.521522283554077, "step": 2696} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 2696} {"info/global_step": 2697, "train_info/time_within_train_step": 2.544260025024414, "step": 2697} {"train_info/time_between_train_steps": 0.0036973953247070312, "step": 2697} {"info/global_step": 2698, "train_info/time_within_train_step": 2.5207877159118652, "step": 2698} {"train_info/time_between_train_steps": 0.003685474395751953, "step": 2698} {"info/global_step": 2699, "train_info/time_within_train_step": 2.5212175846099854, "step": 2699} {"train_info/time_between_train_steps": 0.003668069839477539, "step": 2699} {"info/global_step": 2700, "train_info/time_within_train_step": 2.5220627784729004, "step": 2700} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746330283, "_runtime": 7331}, "step": 2700} {"logs": {"train/loss": 3.958, "train/learning_rate": 6.666666666666666e-05, "train/epoch": 3.01, "_timestamp": 1746330283, "_runtime": 7331}, "step": 2700} {"train_info/time_between_train_steps": 13.01904296875, "step": 2700} {"info/global_step": 2701, "train_info/time_within_train_step": 2.3271844387054443, "step": 2701} {"train_info/time_between_train_steps": 0.004014015197753906, "step": 2701} {"info/global_step": 2702, "train_info/time_within_train_step": 2.318838596343994, "step": 2702} {"train_info/time_between_train_steps": 0.003636598587036133, "step": 2702} {"info/global_step": 2703, "train_info/time_within_train_step": 2.4877078533172607, "step": 2703} {"train_info/time_between_train_steps": 0.003612041473388672, "step": 2703} {"info/global_step": 2704, "train_info/time_within_train_step": 2.5179808139801025, "step": 2704} {"train_info/time_between_train_steps": 0.0035495758056640625, "step": 2704} {"info/global_step": 2705, "train_info/time_within_train_step": 2.5199995040893555, "step": 2705} {"train_info/time_between_train_steps": 0.0037720203399658203, "step": 2705} {"info/global_step": 2706, "train_info/time_within_train_step": 2.5210933685302734, "step": 2706} {"train_info/time_between_train_steps": 0.003810882568359375, "step": 2706} {"info/global_step": 2707, "train_info/time_within_train_step": 2.5216293334960938, "step": 2707} {"train_info/time_between_train_steps": 0.003461122512817383, "step": 2707} {"info/global_step": 2708, "train_info/time_within_train_step": 2.521092176437378, "step": 2708} {"train_info/time_between_train_steps": 0.003482818603515625, "step": 2708} {"info/global_step": 2709, "train_info/time_within_train_step": 2.5220437049865723, "step": 2709} {"train_info/time_between_train_steps": 0.003537893295288086, "step": 2709} {"info/global_step": 2710, "train_info/time_within_train_step": 2.5222346782684326, "step": 2710} {"train_info/time_between_train_steps": 0.0035619735717773438, "step": 2710} {"info/global_step": 2711, "train_info/time_within_train_step": 2.5213561058044434, "step": 2711} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 2711} {"info/global_step": 2712, "train_info/time_within_train_step": 2.5208065509796143, "step": 2712} {"train_info/time_between_train_steps": 0.0036704540252685547, "step": 2712} {"info/global_step": 2713, "train_info/time_within_train_step": 2.5217318534851074, "step": 2713} {"train_info/time_between_train_steps": 0.003575563430786133, "step": 2713} {"info/global_step": 2714, "train_info/time_within_train_step": 2.5227575302124023, "step": 2714} {"train_info/time_between_train_steps": 0.003551006317138672, "step": 2714} {"info/global_step": 2715, "train_info/time_within_train_step": 2.5226175785064697, "step": 2715} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 2715} {"info/global_step": 2716, "train_info/time_within_train_step": 2.5227136611938477, "step": 2716} {"train_info/time_between_train_steps": 0.003719329833984375, "step": 2716} {"info/global_step": 2717, "train_info/time_within_train_step": 2.521713972091675, "step": 2717} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 2717} {"info/global_step": 2718, "train_info/time_within_train_step": 2.5221850872039795, "step": 2718} {"train_info/time_between_train_steps": 0.0038330554962158203, "step": 2718} {"info/global_step": 2719, "train_info/time_within_train_step": 2.5237298011779785, "step": 2719} {"train_info/time_between_train_steps": 0.003608226776123047, "step": 2719} {"info/global_step": 2720, "train_info/time_within_train_step": 2.524491548538208, "step": 2720} {"train_info/time_between_train_steps": 0.003563404083251953, "step": 2720} {"info/global_step": 2721, "train_info/time_within_train_step": 2.809866428375244, "step": 2721} {"train_info/time_between_train_steps": 0.0036635398864746094, "step": 2721} {"info/global_step": 2722, "train_info/time_within_train_step": 2.5217084884643555, "step": 2722} {"train_info/time_between_train_steps": 0.0035827159881591797, "step": 2722} {"info/global_step": 2723, "train_info/time_within_train_step": 2.52243709564209, "step": 2723} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 2723} {"info/global_step": 2724, "train_info/time_within_train_step": 2.5226500034332275, "step": 2724} {"train_info/time_between_train_steps": 0.003415346145629883, "step": 2724} {"info/global_step": 2725, "train_info/time_within_train_step": 2.522547721862793, "step": 2725} {"train_info/time_between_train_steps": 0.0035750865936279297, "step": 2725} {"info/global_step": 2726, "train_info/time_within_train_step": 2.522397994995117, "step": 2726} {"train_info/time_between_train_steps": 0.0034978389739990234, "step": 2726} {"info/global_step": 2727, "train_info/time_within_train_step": 2.522237539291382, "step": 2727} {"train_info/time_between_train_steps": 0.003461599349975586, "step": 2727} {"info/global_step": 2728, "train_info/time_within_train_step": 2.522953748703003, "step": 2728} {"train_info/time_between_train_steps": 0.003739595413208008, "step": 2728} {"info/global_step": 2729, "train_info/time_within_train_step": 2.52260684967041, "step": 2729} {"train_info/time_between_train_steps": 0.0036749839782714844, "step": 2729} {"info/global_step": 2730, "train_info/time_within_train_step": 2.5221750736236572, "step": 2730} {"train_info/time_between_train_steps": 0.003564596176147461, "step": 2730} {"info/global_step": 2731, "train_info/time_within_train_step": 2.523219347000122, "step": 2731} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 2731} {"info/global_step": 2732, "train_info/time_within_train_step": 2.5227303504943848, "step": 2732} {"train_info/time_between_train_steps": 0.003518819808959961, "step": 2732} {"info/global_step": 2733, "train_info/time_within_train_step": 2.5223639011383057, "step": 2733} {"train_info/time_between_train_steps": 0.003724813461303711, "step": 2733} {"info/global_step": 2734, "train_info/time_within_train_step": 2.5227606296539307, "step": 2734} {"train_info/time_between_train_steps": 0.0035881996154785156, "step": 2734} {"info/global_step": 2735, "train_info/time_within_train_step": 2.521970272064209, "step": 2735} {"train_info/time_between_train_steps": 0.003459930419921875, "step": 2735} {"info/global_step": 2736, "train_info/time_within_train_step": 2.5236546993255615, "step": 2736} {"train_info/time_between_train_steps": 0.003506183624267578, "step": 2736} {"info/global_step": 2737, "train_info/time_within_train_step": 2.5226328372955322, "step": 2737} {"train_info/time_between_train_steps": 0.0035982131958007812, "step": 2737} {"info/global_step": 2738, "train_info/time_within_train_step": 2.5241305828094482, "step": 2738} {"train_info/time_between_train_steps": 0.0034079551696777344, "step": 2738} {"info/global_step": 2739, "train_info/time_within_train_step": 2.6492559909820557, "step": 2739} {"train_info/time_between_train_steps": 0.003580808639526367, "step": 2739} {"info/global_step": 2740, "train_info/time_within_train_step": 2.5225021839141846, "step": 2740} {"train_info/time_between_train_steps": 0.0036470890045166016, "step": 2740} {"info/global_step": 2741, "train_info/time_within_train_step": 2.5231473445892334, "step": 2741} {"train_info/time_between_train_steps": 0.003628969192504883, "step": 2741} {"info/global_step": 2742, "train_info/time_within_train_step": 2.522825002670288, "step": 2742} {"train_info/time_between_train_steps": 0.0033845901489257812, "step": 2742} {"info/global_step": 2743, "train_info/time_within_train_step": 2.522097110748291, "step": 2743} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 2743} {"info/global_step": 2744, "train_info/time_within_train_step": 2.522733211517334, "step": 2744} {"train_info/time_between_train_steps": 0.003599405288696289, "step": 2744} {"info/global_step": 2745, "train_info/time_within_train_step": 2.5225648880004883, "step": 2745} {"train_info/time_between_train_steps": 0.0036263465881347656, "step": 2745} {"info/global_step": 2746, "train_info/time_within_train_step": 2.5225274562835693, "step": 2746} {"train_info/time_between_train_steps": 0.0034780502319335938, "step": 2746} {"info/global_step": 2747, "train_info/time_within_train_step": 2.521775960922241, "step": 2747} {"train_info/time_between_train_steps": 0.0033626556396484375, "step": 2747} {"info/global_step": 2748, "train_info/time_within_train_step": 2.522082567214966, "step": 2748} {"train_info/time_between_train_steps": 0.0035789012908935547, "step": 2748} {"info/global_step": 2749, "train_info/time_within_train_step": 3.0065107345581055, "step": 2749} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 2749} {"info/global_step": 2750, "train_info/time_within_train_step": 2.5219838619232178, "step": 2750} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746330424, "_runtime": 7472}, "step": 2750} {"logs": {"train/loss": 3.9048, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 3.02, "_timestamp": 1746330424, "_runtime": 7472}, "step": 2750} {"train_info/time_between_train_steps": 0.02948927879333496, "step": 2750} {"info/global_step": 2751, "train_info/time_within_train_step": 2.5222034454345703, "step": 2751} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 2751} {"info/global_step": 2752, "train_info/time_within_train_step": 2.5217478275299072, "step": 2752} {"train_info/time_between_train_steps": 0.0034894943237304688, "step": 2752} {"info/global_step": 2753, "train_info/time_within_train_step": 2.5229132175445557, "step": 2753} {"train_info/time_between_train_steps": 0.003378152847290039, "step": 2753} {"info/global_step": 2754, "train_info/time_within_train_step": 2.52321720123291, "step": 2754} {"train_info/time_between_train_steps": 0.0034093856811523438, "step": 2754} {"info/global_step": 2755, "train_info/time_within_train_step": 2.5232815742492676, "step": 2755} {"train_info/time_between_train_steps": 0.0035080909729003906, "step": 2755} {"info/global_step": 2756, "train_info/time_within_train_step": 2.5219576358795166, "step": 2756} {"train_info/time_between_train_steps": 0.0035996437072753906, "step": 2756} {"info/global_step": 2757, "train_info/time_within_train_step": 2.521972179412842, "step": 2757} {"train_info/time_between_train_steps": 0.0034017562866210938, "step": 2757} {"info/global_step": 2758, "train_info/time_within_train_step": 2.5215554237365723, "step": 2758} {"train_info/time_between_train_steps": 0.003615140914916992, "step": 2758} {"info/global_step": 2759, "train_info/time_within_train_step": 2.5213463306427, "step": 2759} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 2759} {"info/global_step": 2760, "train_info/time_within_train_step": 2.52219557762146, "step": 2760} {"train_info/time_between_train_steps": 0.003484964370727539, "step": 2760} {"info/global_step": 2761, "train_info/time_within_train_step": 2.770873785018921, "step": 2761} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 2761} {"info/global_step": 2762, "train_info/time_within_train_step": 2.5222933292388916, "step": 2762} {"train_info/time_between_train_steps": 0.003377676010131836, "step": 2762} {"info/global_step": 2763, "train_info/time_within_train_step": 2.5211048126220703, "step": 2763} {"train_info/time_between_train_steps": 0.0034253597259521484, "step": 2763} {"info/global_step": 2764, "train_info/time_within_train_step": 2.521629810333252, "step": 2764} {"train_info/time_between_train_steps": 0.00347900390625, "step": 2764} {"info/global_step": 2765, "train_info/time_within_train_step": 2.5279455184936523, "step": 2765} {"train_info/time_between_train_steps": 0.0035049915313720703, "step": 2765} {"info/global_step": 2766, "train_info/time_within_train_step": 2.5230846405029297, "step": 2766} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 2766} {"info/global_step": 2767, "train_info/time_within_train_step": 2.5228209495544434, "step": 2767} {"train_info/time_between_train_steps": 0.0035600662231445312, "step": 2767} {"info/global_step": 2768, "train_info/time_within_train_step": 2.5230507850646973, "step": 2768} {"train_info/time_between_train_steps": 0.0033521652221679688, "step": 2768} {"info/global_step": 2769, "train_info/time_within_train_step": 2.522165298461914, "step": 2769} {"train_info/time_between_train_steps": 0.0033576488494873047, "step": 2769} {"info/global_step": 2770, "train_info/time_within_train_step": 2.5228378772735596, "step": 2770} {"train_info/time_between_train_steps": 0.0035512447357177734, "step": 2770} {"info/global_step": 2771, "train_info/time_within_train_step": 2.5232930183410645, "step": 2771} {"train_info/time_between_train_steps": 0.0035676956176757812, "step": 2771} {"info/global_step": 2772, "train_info/time_within_train_step": 2.5225319862365723, "step": 2772} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 2772} {"info/global_step": 2773, "train_info/time_within_train_step": 2.522818088531494, "step": 2773} {"train_info/time_between_train_steps": 0.003450155258178711, "step": 2773} {"info/global_step": 2774, "train_info/time_within_train_step": 2.5223724842071533, "step": 2774} {"train_info/time_between_train_steps": 0.003539562225341797, "step": 2774} {"info/global_step": 2775, "train_info/time_within_train_step": 2.5223774909973145, "step": 2775} {"train_info/time_between_train_steps": 0.0033903121948242188, "step": 2775} {"info/global_step": 2776, "train_info/time_within_train_step": 2.521864175796509, "step": 2776} {"train_info/time_between_train_steps": 0.003727436065673828, "step": 2776} {"info/global_step": 2777, "train_info/time_within_train_step": 2.5207598209381104, "step": 2777} {"train_info/time_between_train_steps": 0.0034799575805664062, "step": 2777} {"info/global_step": 2778, "train_info/time_within_train_step": 2.5212185382843018, "step": 2778} {"train_info/time_between_train_steps": 0.003586292266845703, "step": 2778} {"info/global_step": 2779, "train_info/time_within_train_step": 2.5212278366088867, "step": 2779} {"train_info/time_between_train_steps": 0.0036606788635253906, "step": 2779} {"info/global_step": 2780, "train_info/time_within_train_step": 2.5216660499572754, "step": 2780} {"train_info/time_between_train_steps": 0.0034584999084472656, "step": 2780} {"info/global_step": 2781, "train_info/time_within_train_step": 2.521245002746582, "step": 2781} {"train_info/time_between_train_steps": 0.003452301025390625, "step": 2781} {"info/global_step": 2782, "train_info/time_within_train_step": 2.5209171772003174, "step": 2782} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 2782} {"info/global_step": 2783, "train_info/time_within_train_step": 2.5219221115112305, "step": 2783} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 2783} {"info/global_step": 2784, "train_info/time_within_train_step": 2.522613286972046, "step": 2784} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 2784} {"info/global_step": 2785, "train_info/time_within_train_step": 2.5223376750946045, "step": 2785} {"train_info/time_between_train_steps": 0.0033533573150634766, "step": 2785} {"info/global_step": 2786, "train_info/time_within_train_step": 2.5225648880004883, "step": 2786} {"train_info/time_between_train_steps": 0.0034704208374023438, "step": 2786} {"info/global_step": 2787, "train_info/time_within_train_step": 2.522014617919922, "step": 2787} {"train_info/time_between_train_steps": 0.0035562515258789062, "step": 2787} {"info/global_step": 2788, "train_info/time_within_train_step": 2.5229427814483643, "step": 2788} {"train_info/time_between_train_steps": 0.003584623336791992, "step": 2788} {"info/global_step": 2789, "train_info/time_within_train_step": 2.523101568222046, "step": 2789} {"train_info/time_between_train_steps": 0.0034046173095703125, "step": 2789} {"info/global_step": 2790, "train_info/time_within_train_step": 2.5224368572235107, "step": 2790} {"train_info/time_between_train_steps": 0.0036211013793945312, "step": 2790} {"info/global_step": 2791, "train_info/time_within_train_step": 2.521890640258789, "step": 2791} {"train_info/time_between_train_steps": 0.003403902053833008, "step": 2791} {"info/global_step": 2792, "train_info/time_within_train_step": 2.5219314098358154, "step": 2792} {"train_info/time_between_train_steps": 0.0033714771270751953, "step": 2792} {"info/global_step": 2793, "train_info/time_within_train_step": 2.5217976570129395, "step": 2793} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 2793} {"info/global_step": 2794, "train_info/time_within_train_step": 2.521456241607666, "step": 2794} {"train_info/time_between_train_steps": 0.003352642059326172, "step": 2794} {"info/global_step": 2795, "train_info/time_within_train_step": 2.5217909812927246, "step": 2795} {"train_info/time_between_train_steps": 0.003656148910522461, "step": 2795} {"info/global_step": 2796, "train_info/time_within_train_step": 2.5220749378204346, "step": 2796} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 2796} {"info/global_step": 2797, "train_info/time_within_train_step": 2.521934986114502, "step": 2797} {"train_info/time_between_train_steps": 0.0034275054931640625, "step": 2797} {"info/global_step": 2798, "train_info/time_within_train_step": 2.5215635299682617, "step": 2798} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 2798} {"info/global_step": 2799, "train_info/time_within_train_step": 2.521165609359741, "step": 2799} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 2799} {"info/global_step": 2800, "train_info/time_within_train_step": 2.767631769180298, "step": 2800} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746330552, "_runtime": 7600}, "step": 2800} {"logs": {"train/loss": 3.8889, "train/learning_rate": 4.444444444444444e-05, "train/epoch": 3.04, "_timestamp": 1746330552, "_runtime": 7600}, "step": 2800} {"train_info/time_between_train_steps": 21.479042768478394, "step": 2800} {"info/global_step": 2801, "train_info/time_within_train_step": 2.3309926986694336, "step": 2801} {"train_info/time_between_train_steps": 0.12539124488830566, "step": 2801} {"info/global_step": 2802, "train_info/time_within_train_step": 2.314328670501709, "step": 2802} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 2802} {"info/global_step": 2803, "train_info/time_within_train_step": 2.4492270946502686, "step": 2803} {"train_info/time_between_train_steps": 0.003409147262573242, "step": 2803} {"info/global_step": 2804, "train_info/time_within_train_step": 2.519078016281128, "step": 2804} {"train_info/time_between_train_steps": 0.003560781478881836, "step": 2804} {"info/global_step": 2805, "train_info/time_within_train_step": 2.5194520950317383, "step": 2805} {"train_info/time_between_train_steps": 0.003404855728149414, "step": 2805} {"info/global_step": 2806, "train_info/time_within_train_step": 2.5215747356414795, "step": 2806} {"train_info/time_between_train_steps": 0.0034508705139160156, "step": 2806} {"info/global_step": 2807, "train_info/time_within_train_step": 2.521944284439087, "step": 2807} {"train_info/time_between_train_steps": 0.003624439239501953, "step": 2807} {"info/global_step": 2808, "train_info/time_within_train_step": 2.522213935852051, "step": 2808} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 2808} {"info/global_step": 2809, "train_info/time_within_train_step": 2.521800994873047, "step": 2809} {"train_info/time_between_train_steps": 0.0036017894744873047, "step": 2809} {"info/global_step": 2810, "train_info/time_within_train_step": 2.5216877460479736, "step": 2810} {"train_info/time_between_train_steps": 0.0033981800079345703, "step": 2810} {"info/global_step": 2811, "train_info/time_within_train_step": 2.522014856338501, "step": 2811} {"train_info/time_between_train_steps": 0.0036568641662597656, "step": 2811} {"info/global_step": 2812, "train_info/time_within_train_step": 2.521941900253296, "step": 2812} {"train_info/time_between_train_steps": 0.0035457611083984375, "step": 2812} {"info/global_step": 2813, "train_info/time_within_train_step": 2.5220658779144287, "step": 2813} {"train_info/time_between_train_steps": 0.0036270618438720703, "step": 2813} {"info/global_step": 2814, "train_info/time_within_train_step": 2.522040367126465, "step": 2814} {"train_info/time_between_train_steps": 0.0033681392669677734, "step": 2814} {"info/global_step": 2815, "train_info/time_within_train_step": 2.52215838432312, "step": 2815} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 2815} {"info/global_step": 2816, "train_info/time_within_train_step": 2.5230658054351807, "step": 2816} {"train_info/time_between_train_steps": 0.003335237503051758, "step": 2816} {"info/global_step": 2817, "train_info/time_within_train_step": 2.52237868309021, "step": 2817} {"train_info/time_between_train_steps": 0.0036439895629882812, "step": 2817} {"info/global_step": 2818, "train_info/time_within_train_step": 2.5227067470550537, "step": 2818} {"train_info/time_between_train_steps": 0.003356456756591797, "step": 2818} {"info/global_step": 2819, "train_info/time_within_train_step": 2.5226802825927734, "step": 2819} {"train_info/time_between_train_steps": 0.0036139488220214844, "step": 2819} {"info/global_step": 2820, "train_info/time_within_train_step": 2.523042917251587, "step": 2820} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 2820} {"info/global_step": 2821, "train_info/time_within_train_step": 2.5227487087249756, "step": 2821} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 2821} {"info/global_step": 2822, "train_info/time_within_train_step": 2.5236213207244873, "step": 2822} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 2822} {"info/global_step": 2823, "train_info/time_within_train_step": 2.522324800491333, "step": 2823} {"train_info/time_between_train_steps": 0.003373384475708008, "step": 2823} {"info/global_step": 2824, "train_info/time_within_train_step": 2.5221493244171143, "step": 2824} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 2824} {"info/global_step": 2825, "train_info/time_within_train_step": 2.5229239463806152, "step": 2825} {"train_info/time_between_train_steps": 0.0033431053161621094, "step": 2825} {"info/global_step": 2826, "train_info/time_within_train_step": 2.522394895553589, "step": 2826} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 2826} {"info/global_step": 2827, "train_info/time_within_train_step": 2.5221810340881348, "step": 2827} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 2827} {"info/global_step": 2828, "train_info/time_within_train_step": 2.522456645965576, "step": 2828} {"train_info/time_between_train_steps": 0.0033614635467529297, "step": 2828} {"info/global_step": 2829, "train_info/time_within_train_step": 2.521864891052246, "step": 2829} {"train_info/time_between_train_steps": 0.0036237239837646484, "step": 2829} {"info/global_step": 2830, "train_info/time_within_train_step": 2.5217716693878174, "step": 2830} {"train_info/time_between_train_steps": 0.003597259521484375, "step": 2830} {"info/global_step": 2831, "train_info/time_within_train_step": 2.5224215984344482, "step": 2831} {"train_info/time_between_train_steps": 0.0036559104919433594, "step": 2831} {"info/global_step": 2832, "train_info/time_within_train_step": 2.522268772125244, "step": 2832} {"train_info/time_between_train_steps": 0.003453493118286133, "step": 2832} {"info/global_step": 2833, "train_info/time_within_train_step": 2.5221285820007324, "step": 2833} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 2833} {"info/global_step": 2834, "train_info/time_within_train_step": 2.522639751434326, "step": 2834} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 2834} {"info/global_step": 2835, "train_info/time_within_train_step": 2.522671937942505, "step": 2835} {"train_info/time_between_train_steps": 0.0035178661346435547, "step": 2835} {"info/global_step": 2836, "train_info/time_within_train_step": 2.5229547023773193, "step": 2836} {"train_info/time_between_train_steps": 0.003445148468017578, "step": 2836} {"info/global_step": 2837, "train_info/time_within_train_step": 2.522423505783081, "step": 2837} {"train_info/time_between_train_steps": 0.0033693313598632812, "step": 2837} {"info/global_step": 2838, "train_info/time_within_train_step": 2.5234627723693848, "step": 2838} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 2838} {"info/global_step": 2839, "train_info/time_within_train_step": 2.5228662490844727, "step": 2839} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 2839} {"info/global_step": 2840, "train_info/time_within_train_step": 2.5221638679504395, "step": 2840} {"train_info/time_between_train_steps": 0.0033812522888183594, "step": 2840} {"info/global_step": 2841, "train_info/time_within_train_step": 2.5216689109802246, "step": 2841} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 2841} {"info/global_step": 2842, "train_info/time_within_train_step": 2.5454347133636475, "step": 2842} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 2842} {"info/global_step": 2843, "train_info/time_within_train_step": 2.522540330886841, "step": 2843} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 2843} {"info/global_step": 2844, "train_info/time_within_train_step": 2.5221619606018066, "step": 2844} {"train_info/time_between_train_steps": 0.0033593177795410156, "step": 2844} {"info/global_step": 2845, "train_info/time_within_train_step": 2.521949529647827, "step": 2845} {"train_info/time_between_train_steps": 0.003935813903808594, "step": 2845} {"info/global_step": 2846, "train_info/time_within_train_step": 2.5217909812927246, "step": 2846} {"train_info/time_between_train_steps": 0.0033719539642333984, "step": 2846} {"info/global_step": 2847, "train_info/time_within_train_step": 2.522557020187378, "step": 2847} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 2847} {"info/global_step": 2848, "train_info/time_within_train_step": 2.5223724842071533, "step": 2848} {"train_info/time_between_train_steps": 0.0037178993225097656, "step": 2848} {"info/global_step": 2849, "train_info/time_within_train_step": 2.522552490234375, "step": 2849} {"train_info/time_between_train_steps": 0.0036096572875976562, "step": 2849} {"info/global_step": 2850, "train_info/time_within_train_step": 2.5212619304656982, "step": 2850} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746330700, "_runtime": 7748}, "step": 2850} {"logs": {"train/loss": 3.8836, "train/learning_rate": 3.333333333333333e-05, "train/epoch": 3.06, "_timestamp": 1746330700, "_runtime": 7748}, "step": 2850} {"train_info/time_between_train_steps": 0.05077314376831055, "step": 2850} {"info/global_step": 2851, "train_info/time_within_train_step": 2.5227043628692627, "step": 2851} {"train_info/time_between_train_steps": 0.0035877227783203125, "step": 2851} {"info/global_step": 2852, "train_info/time_within_train_step": 2.5513999462127686, "step": 2852} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 2852} {"info/global_step": 2853, "train_info/time_within_train_step": 2.5228142738342285, "step": 2853} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 2853} {"info/global_step": 2854, "train_info/time_within_train_step": 2.52280855178833, "step": 2854} {"train_info/time_between_train_steps": 0.003481626510620117, "step": 2854} {"info/global_step": 2855, "train_info/time_within_train_step": 2.5227982997894287, "step": 2855} {"train_info/time_between_train_steps": 0.0034513473510742188, "step": 2855} {"info/global_step": 2856, "train_info/time_within_train_step": 2.5229008197784424, "step": 2856} {"train_info/time_between_train_steps": 0.00365447998046875, "step": 2856} {"info/global_step": 2857, "train_info/time_within_train_step": 2.523097276687622, "step": 2857} {"train_info/time_between_train_steps": 0.0037584304809570312, "step": 2857} {"info/global_step": 2858, "train_info/time_within_train_step": 2.5223116874694824, "step": 2858} {"train_info/time_between_train_steps": 0.003675699234008789, "step": 2858} {"info/global_step": 2859, "train_info/time_within_train_step": 2.522411584854126, "step": 2859} {"train_info/time_between_train_steps": 0.0034623146057128906, "step": 2859} {"info/global_step": 2860, "train_info/time_within_train_step": 2.5232250690460205, "step": 2860} {"train_info/time_between_train_steps": 0.003540515899658203, "step": 2860} {"info/global_step": 2861, "train_info/time_within_train_step": 2.522799491882324, "step": 2861} {"train_info/time_between_train_steps": 0.003480195999145508, "step": 2861} {"info/global_step": 2862, "train_info/time_within_train_step": 2.521764039993286, "step": 2862} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 2862} {"info/global_step": 2863, "train_info/time_within_train_step": 2.5216281414031982, "step": 2863} {"train_info/time_between_train_steps": 0.0035953521728515625, "step": 2863} {"info/global_step": 2864, "train_info/time_within_train_step": 2.6558761596679688, "step": 2864} {"train_info/time_between_train_steps": 0.0034673213958740234, "step": 2864} {"info/global_step": 2865, "train_info/time_within_train_step": 2.522747278213501, "step": 2865} {"train_info/time_between_train_steps": 0.0035200119018554688, "step": 2865} {"info/global_step": 2866, "train_info/time_within_train_step": 2.521678924560547, "step": 2866} {"train_info/time_between_train_steps": 0.0036919116973876953, "step": 2866} {"info/global_step": 2867, "train_info/time_within_train_step": 2.5231404304504395, "step": 2867} {"train_info/time_between_train_steps": 0.0035867691040039062, "step": 2867} {"info/global_step": 2868, "train_info/time_within_train_step": 2.52250075340271, "step": 2868} {"train_info/time_between_train_steps": 0.0034682750701904297, "step": 2868} {"info/global_step": 2869, "train_info/time_within_train_step": 2.521613121032715, "step": 2869} {"train_info/time_between_train_steps": 0.0035631656646728516, "step": 2869} {"info/global_step": 2870, "train_info/time_within_train_step": 2.522216796875, "step": 2870} {"train_info/time_between_train_steps": 0.0035054683685302734, "step": 2870} {"info/global_step": 2871, "train_info/time_within_train_step": 2.522129535675049, "step": 2871} {"train_info/time_between_train_steps": 0.003580331802368164, "step": 2871} {"info/global_step": 2872, "train_info/time_within_train_step": 2.521588087081909, "step": 2872} {"train_info/time_between_train_steps": 0.003599882125854492, "step": 2872} {"info/global_step": 2873, "train_info/time_within_train_step": 2.5226423740386963, "step": 2873} {"train_info/time_between_train_steps": 0.003419637680053711, "step": 2873} {"info/global_step": 2874, "train_info/time_within_train_step": 2.5232431888580322, "step": 2874} {"train_info/time_between_train_steps": 0.003595113754272461, "step": 2874} {"info/global_step": 2875, "train_info/time_within_train_step": 2.5216662883758545, "step": 2875} {"train_info/time_between_train_steps": 0.003510713577270508, "step": 2875} {"info/global_step": 2876, "train_info/time_within_train_step": 2.5225894451141357, "step": 2876} {"train_info/time_between_train_steps": 0.003609180450439453, "step": 2876} {"info/global_step": 2877, "train_info/time_within_train_step": 2.5215299129486084, "step": 2877} {"train_info/time_between_train_steps": 0.0036077499389648438, "step": 2877} {"info/global_step": 2878, "train_info/time_within_train_step": 2.522775888442993, "step": 2878} {"train_info/time_between_train_steps": 0.0035352706909179688, "step": 2878} {"info/global_step": 2879, "train_info/time_within_train_step": 2.5227866172790527, "step": 2879} {"train_info/time_between_train_steps": 0.003652334213256836, "step": 2879} {"info/global_step": 2880, "train_info/time_within_train_step": 2.5223207473754883, "step": 2880} {"train_info/time_between_train_steps": 0.003589153289794922, "step": 2880} {"info/global_step": 2881, "train_info/time_within_train_step": 2.522197961807251, "step": 2881} {"train_info/time_between_train_steps": 0.0036880970001220703, "step": 2881} {"info/global_step": 2882, "train_info/time_within_train_step": 2.5227270126342773, "step": 2882} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 2882} {"info/global_step": 2883, "train_info/time_within_train_step": 2.5234599113464355, "step": 2883} {"train_info/time_between_train_steps": 0.003532886505126953, "step": 2883} {"info/global_step": 2884, "train_info/time_within_train_step": 2.5230600833892822, "step": 2884} {"train_info/time_between_train_steps": 0.003458738327026367, "step": 2884} {"info/global_step": 2885, "train_info/time_within_train_step": 2.5232129096984863, "step": 2885} {"train_info/time_between_train_steps": 0.003721475601196289, "step": 2885} {"info/global_step": 2886, "train_info/time_within_train_step": 2.5224075317382812, "step": 2886} {"train_info/time_between_train_steps": 0.0037384033203125, "step": 2886} {"info/global_step": 2887, "train_info/time_within_train_step": 2.8299293518066406, "step": 2887} {"train_info/time_between_train_steps": 0.0034151077270507812, "step": 2887} {"info/global_step": 2888, "train_info/time_within_train_step": 2.5218377113342285, "step": 2888} {"train_info/time_between_train_steps": 0.003642559051513672, "step": 2888} {"info/global_step": 2889, "train_info/time_within_train_step": 2.5209383964538574, "step": 2889} {"train_info/time_between_train_steps": 0.003694295883178711, "step": 2889} {"info/global_step": 2890, "train_info/time_within_train_step": 2.5235893726348877, "step": 2890} {"train_info/time_between_train_steps": 0.0036094188690185547, "step": 2890} {"info/global_step": 2891, "train_info/time_within_train_step": 2.521022319793701, "step": 2891} {"train_info/time_between_train_steps": 0.0034132003784179688, "step": 2891} {"info/global_step": 2892, "train_info/time_within_train_step": 2.5217669010162354, "step": 2892} {"train_info/time_between_train_steps": 0.0035314559936523438, "step": 2892} {"info/global_step": 2893, "train_info/time_within_train_step": 2.521369218826294, "step": 2893} {"train_info/time_between_train_steps": 0.0033707618713378906, "step": 2893} {"info/global_step": 2894, "train_info/time_within_train_step": 2.5224616527557373, "step": 2894} {"train_info/time_between_train_steps": 0.00337982177734375, "step": 2894} {"info/global_step": 2895, "train_info/time_within_train_step": 2.521557331085205, "step": 2895} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 2895} {"info/global_step": 2896, "train_info/time_within_train_step": 2.5230138301849365, "step": 2896} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 2896} {"info/global_step": 2897, "train_info/time_within_train_step": 2.522630453109741, "step": 2897} {"train_info/time_between_train_steps": 0.003460407257080078, "step": 2897} {"info/global_step": 2898, "train_info/time_within_train_step": 2.521667003631592, "step": 2898} {"train_info/time_between_train_steps": 0.0036132335662841797, "step": 2898} {"info/global_step": 2899, "train_info/time_within_train_step": 2.5226528644561768, "step": 2899} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 2899} {"info/global_step": 2900, "train_info/time_within_train_step": 2.522434711456299, "step": 2900} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746330828, "_runtime": 7876}, "step": 2900} {"logs": {"train/loss": 3.8646, "train/learning_rate": 2.222222222222222e-05, "train/epoch": 3.07, "_timestamp": 1746330828, "_runtime": 7876}, "step": 2900} {"train_info/time_between_train_steps": 17.876408100128174, "step": 2900} {"info/global_step": 2901, "train_info/time_within_train_step": 2.332646369934082, "step": 2901} {"train_info/time_between_train_steps": 0.003643512725830078, "step": 2901} {"info/global_step": 2902, "train_info/time_within_train_step": 2.316782236099243, "step": 2902} {"train_info/time_between_train_steps": 0.003443002700805664, "step": 2902} {"info/global_step": 2903, "train_info/time_within_train_step": 2.4511725902557373, "step": 2903} {"train_info/time_between_train_steps": 0.0036153793334960938, "step": 2903} {"info/global_step": 2904, "train_info/time_within_train_step": 2.5183162689208984, "step": 2904} {"train_info/time_between_train_steps": 0.0033724308013916016, "step": 2904} {"info/global_step": 2905, "train_info/time_within_train_step": 2.5197081565856934, "step": 2905} {"train_info/time_between_train_steps": 0.003444194793701172, "step": 2905} {"info/global_step": 2906, "train_info/time_within_train_step": 2.5206031799316406, "step": 2906} {"train_info/time_between_train_steps": 0.0034492015838623047, "step": 2906} {"info/global_step": 2907, "train_info/time_within_train_step": 2.521287441253662, "step": 2907} {"train_info/time_between_train_steps": 0.0033740997314453125, "step": 2907} {"info/global_step": 2908, "train_info/time_within_train_step": 2.5210683345794678, "step": 2908} {"train_info/time_between_train_steps": 0.003542184829711914, "step": 2908} {"info/global_step": 2909, "train_info/time_within_train_step": 2.521695852279663, "step": 2909} {"train_info/time_between_train_steps": 0.0036096572875976562, "step": 2909} {"info/global_step": 2910, "train_info/time_within_train_step": 2.5218987464904785, "step": 2910} {"train_info/time_between_train_steps": 0.003559589385986328, "step": 2910} {"info/global_step": 2911, "train_info/time_within_train_step": 2.5223772525787354, "step": 2911} {"train_info/time_between_train_steps": 0.0034134387969970703, "step": 2911} {"info/global_step": 2912, "train_info/time_within_train_step": 2.522843599319458, "step": 2912} {"train_info/time_between_train_steps": 0.0034818649291992188, "step": 2912} {"info/global_step": 2913, "train_info/time_within_train_step": 2.5229642391204834, "step": 2913} {"train_info/time_between_train_steps": 0.0036194324493408203, "step": 2913} {"info/global_step": 2914, "train_info/time_within_train_step": 2.5229880809783936, "step": 2914} {"train_info/time_between_train_steps": 0.003521442413330078, "step": 2914} {"info/global_step": 2915, "train_info/time_within_train_step": 2.522313117980957, "step": 2915} {"train_info/time_between_train_steps": 0.003468036651611328, "step": 2915} {"info/global_step": 2916, "train_info/time_within_train_step": 2.5233683586120605, "step": 2916} {"train_info/time_between_train_steps": 0.0036640167236328125, "step": 2916} {"info/global_step": 2917, "train_info/time_within_train_step": 2.5227415561676025, "step": 2917} {"train_info/time_between_train_steps": 0.003399372100830078, "step": 2917} {"info/global_step": 2918, "train_info/time_within_train_step": 2.522217035293579, "step": 2918} {"train_info/time_between_train_steps": 0.0036110877990722656, "step": 2918} {"info/global_step": 2919, "train_info/time_within_train_step": 2.522669553756714, "step": 2919} {"train_info/time_between_train_steps": 0.003560304641723633, "step": 2919} {"info/global_step": 2920, "train_info/time_within_train_step": 2.522611379623413, "step": 2920} {"train_info/time_between_train_steps": 0.0035119056701660156, "step": 2920} {"info/global_step": 2921, "train_info/time_within_train_step": 2.522428512573242, "step": 2921} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 2921} {"info/global_step": 2922, "train_info/time_within_train_step": 2.5239553451538086, "step": 2922} {"train_info/time_between_train_steps": 0.0036590099334716797, "step": 2922} {"info/global_step": 2923, "train_info/time_within_train_step": 2.5228521823883057, "step": 2923} {"train_info/time_between_train_steps": 0.003654003143310547, "step": 2923} {"info/global_step": 2924, "train_info/time_within_train_step": 2.5237088203430176, "step": 2924} {"train_info/time_between_train_steps": 0.0035316944122314453, "step": 2924} {"info/global_step": 2925, "train_info/time_within_train_step": 2.522710084915161, "step": 2925} {"train_info/time_between_train_steps": 0.00347900390625, "step": 2925} {"info/global_step": 2926, "train_info/time_within_train_step": 2.523265838623047, "step": 2926} {"train_info/time_between_train_steps": 0.13180971145629883, "step": 2926} {"info/global_step": 2927, "train_info/time_within_train_step": 2.55145263671875, "step": 2927} {"train_info/time_between_train_steps": 0.003737926483154297, "step": 2927} {"info/global_step": 2928, "train_info/time_within_train_step": 2.5234177112579346, "step": 2928} {"train_info/time_between_train_steps": 0.0035452842712402344, "step": 2928} {"info/global_step": 2929, "train_info/time_within_train_step": 2.523594856262207, "step": 2929} {"train_info/time_between_train_steps": 0.003484964370727539, "step": 2929} {"info/global_step": 2930, "train_info/time_within_train_step": 2.523001194000244, "step": 2930} {"train_info/time_between_train_steps": 0.003526926040649414, "step": 2930} {"info/global_step": 2931, "train_info/time_within_train_step": 2.839935302734375, "step": 2931} {"train_info/time_between_train_steps": 0.003522634506225586, "step": 2931} {"info/global_step": 2932, "train_info/time_within_train_step": 2.5223641395568848, "step": 2932} {"train_info/time_between_train_steps": 0.003428936004638672, "step": 2932} {"info/global_step": 2933, "train_info/time_within_train_step": 2.5219130516052246, "step": 2933} {"train_info/time_between_train_steps": 0.0034470558166503906, "step": 2933} {"info/global_step": 2934, "train_info/time_within_train_step": 2.5217878818511963, "step": 2934} {"train_info/time_between_train_steps": 0.0035212039947509766, "step": 2934} {"info/global_step": 2935, "train_info/time_within_train_step": 2.522486686706543, "step": 2935} {"train_info/time_between_train_steps": 0.0035109519958496094, "step": 2935} {"info/global_step": 2936, "train_info/time_within_train_step": 2.528090715408325, "step": 2936} {"train_info/time_between_train_steps": 0.0034825801849365234, "step": 2936} {"info/global_step": 2937, "train_info/time_within_train_step": 2.5238513946533203, "step": 2937} {"train_info/time_between_train_steps": 0.003648996353149414, "step": 2937} {"info/global_step": 2938, "train_info/time_within_train_step": 2.5225026607513428, "step": 2938} {"train_info/time_between_train_steps": 0.003508329391479492, "step": 2938} {"info/global_step": 2939, "train_info/time_within_train_step": 2.52396821975708, "step": 2939} {"train_info/time_between_train_steps": 0.0035512447357177734, "step": 2939} {"info/global_step": 2940, "train_info/time_within_train_step": 2.535614013671875, "step": 2940} {"train_info/time_between_train_steps": 0.003456592559814453, "step": 2940} {"info/global_step": 2941, "train_info/time_within_train_step": 2.523390531539917, "step": 2941} {"train_info/time_between_train_steps": 0.0034384727478027344, "step": 2941} {"info/global_step": 2942, "train_info/time_within_train_step": 2.5224764347076416, "step": 2942} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 2942} {"info/global_step": 2943, "train_info/time_within_train_step": 2.5223097801208496, "step": 2943} {"train_info/time_between_train_steps": 0.0035181045532226562, "step": 2943} {"info/global_step": 2944, "train_info/time_within_train_step": 2.5228235721588135, "step": 2944} {"train_info/time_between_train_steps": 0.003544330596923828, "step": 2944} {"info/global_step": 2945, "train_info/time_within_train_step": 2.522531032562256, "step": 2945} {"train_info/time_between_train_steps": 0.004016876220703125, "step": 2945} {"info/global_step": 2946, "train_info/time_within_train_step": 2.5221118927001953, "step": 2946} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 2946} {"info/global_step": 2947, "train_info/time_within_train_step": 2.5233047008514404, "step": 2947} {"train_info/time_between_train_steps": 0.0035910606384277344, "step": 2947} {"info/global_step": 2948, "train_info/time_within_train_step": 2.5228688716888428, "step": 2948} {"train_info/time_between_train_steps": 0.0035076141357421875, "step": 2948} {"info/global_step": 2949, "train_info/time_within_train_step": 2.521610736846924, "step": 2949} {"train_info/time_between_train_steps": 0.003600597381591797, "step": 2949} {"info/global_step": 2950, "train_info/time_within_train_step": 2.5222434997558594, "step": 2950} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746330973, "_runtime": 8021}, "step": 2950} {"logs": {"train/loss": 3.8518, "train/learning_rate": 1.111111111111111e-05, "train/epoch": 3.09, "_timestamp": 1746330973, "_runtime": 8021}, "step": 2950} {"train_info/time_between_train_steps": 0.025353193283081055, "step": 2950} {"info/global_step": 2951, "train_info/time_within_train_step": 2.5226149559020996, "step": 2951} {"train_info/time_between_train_steps": 0.0035495758056640625, "step": 2951} {"info/global_step": 2952, "train_info/time_within_train_step": 2.522974967956543, "step": 2952} {"train_info/time_between_train_steps": 0.0035915374755859375, "step": 2952} {"info/global_step": 2953, "train_info/time_within_train_step": 2.522846221923828, "step": 2953} {"train_info/time_between_train_steps": 0.003751516342163086, "step": 2953} {"info/global_step": 2954, "train_info/time_within_train_step": 2.522270679473877, "step": 2954} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 2954} {"info/global_step": 2955, "train_info/time_within_train_step": 2.5224151611328125, "step": 2955} {"train_info/time_between_train_steps": 0.0034613609313964844, "step": 2955} {"info/global_step": 2956, "train_info/time_within_train_step": 2.522695302963257, "step": 2956} {"train_info/time_between_train_steps": 0.003532886505126953, "step": 2956} {"info/global_step": 2957, "train_info/time_within_train_step": 2.521592617034912, "step": 2957} {"train_info/time_between_train_steps": 0.0034482479095458984, "step": 2957} {"info/global_step": 2958, "train_info/time_within_train_step": 2.5220143795013428, "step": 2958} {"train_info/time_between_train_steps": 0.003510713577270508, "step": 2958} {"info/global_step": 2959, "train_info/time_within_train_step": 2.5227017402648926, "step": 2959} {"train_info/time_between_train_steps": 0.0035295486450195312, "step": 2959} {"info/global_step": 2960, "train_info/time_within_train_step": 2.5224928855895996, "step": 2960} {"train_info/time_between_train_steps": 0.003676176071166992, "step": 2960} {"info/global_step": 2961, "train_info/time_within_train_step": 2.5226662158966064, "step": 2961} {"train_info/time_between_train_steps": 0.003712892532348633, "step": 2961} {"info/global_step": 2962, "train_info/time_within_train_step": 2.5226731300354004, "step": 2962} {"train_info/time_between_train_steps": 0.003659963607788086, "step": 2962} {"info/global_step": 2963, "train_info/time_within_train_step": 2.551222801208496, "step": 2963} {"train_info/time_between_train_steps": 0.003772258758544922, "step": 2963} {"info/global_step": 2964, "train_info/time_within_train_step": 2.522725820541382, "step": 2964} {"train_info/time_between_train_steps": 0.0036423206329345703, "step": 2964} {"info/global_step": 2965, "train_info/time_within_train_step": 2.5223259925842285, "step": 2965} {"train_info/time_between_train_steps": 0.00357818603515625, "step": 2965} {"info/global_step": 2966, "train_info/time_within_train_step": 2.5229077339172363, "step": 2966} {"train_info/time_between_train_steps": 0.0036988258361816406, "step": 2966} {"info/global_step": 2967, "train_info/time_within_train_step": 2.5225815773010254, "step": 2967} {"train_info/time_between_train_steps": 0.003551483154296875, "step": 2967} {"info/global_step": 2968, "train_info/time_within_train_step": 2.5227255821228027, "step": 2968} {"train_info/time_between_train_steps": 0.003665924072265625, "step": 2968} {"info/global_step": 2969, "train_info/time_within_train_step": 2.5222842693328857, "step": 2969} {"train_info/time_between_train_steps": 0.0034019947052001953, "step": 2969} {"info/global_step": 2970, "train_info/time_within_train_step": 2.5224292278289795, "step": 2970} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 2970} {"info/global_step": 2971, "train_info/time_within_train_step": 2.5229475498199463, "step": 2971} {"train_info/time_between_train_steps": 0.0035970211029052734, "step": 2971} {"info/global_step": 2972, "train_info/time_within_train_step": 2.5229246616363525, "step": 2972} {"train_info/time_between_train_steps": 0.003490924835205078, "step": 2972} {"info/global_step": 2973, "train_info/time_within_train_step": 2.5230355262756348, "step": 2973} {"train_info/time_between_train_steps": 0.0036830902099609375, "step": 2973} {"info/global_step": 2974, "train_info/time_within_train_step": 2.5273637771606445, "step": 2974} {"train_info/time_between_train_steps": 0.003421783447265625, "step": 2974} {"info/global_step": 2975, "train_info/time_within_train_step": 2.522357702255249, "step": 2975} {"train_info/time_between_train_steps": 0.003582000732421875, "step": 2975} {"info/global_step": 2976, "train_info/time_within_train_step": 2.522268295288086, "step": 2976} {"train_info/time_between_train_steps": 0.0034818649291992188, "step": 2976} {"info/global_step": 2977, "train_info/time_within_train_step": 2.5216431617736816, "step": 2977} {"train_info/time_between_train_steps": 0.003692626953125, "step": 2977} {"info/global_step": 2978, "train_info/time_within_train_step": 2.521604537963867, "step": 2978} {"train_info/time_between_train_steps": 0.0036928653717041016, "step": 2978} {"info/global_step": 2979, "train_info/time_within_train_step": 2.5220885276794434, "step": 2979} {"train_info/time_between_train_steps": 0.0035126209259033203, "step": 2979} {"info/global_step": 2980, "train_info/time_within_train_step": 2.5222830772399902, "step": 2980} {"train_info/time_between_train_steps": 0.003602743148803711, "step": 2980} {"info/global_step": 2981, "train_info/time_within_train_step": 2.522575616836548, "step": 2981} {"train_info/time_between_train_steps": 0.0034966468811035156, "step": 2981} {"info/global_step": 2982, "train_info/time_within_train_step": 2.5216610431671143, "step": 2982} {"train_info/time_between_train_steps": 0.003457784652709961, "step": 2982} {"info/global_step": 2983, "train_info/time_within_train_step": 2.5229544639587402, "step": 2983} {"train_info/time_between_train_steps": 0.0037131309509277344, "step": 2983} {"info/global_step": 2984, "train_info/time_within_train_step": 2.5314548015594482, "step": 2984} {"train_info/time_between_train_steps": 0.0034477710723876953, "step": 2984} {"info/global_step": 2985, "train_info/time_within_train_step": 2.522303342819214, "step": 2985} {"train_info/time_between_train_steps": 0.003589153289794922, "step": 2985} {"info/global_step": 2986, "train_info/time_within_train_step": 2.527296304702759, "step": 2986} {"train_info/time_between_train_steps": 0.0036153793334960938, "step": 2986} {"info/global_step": 2987, "train_info/time_within_train_step": 2.523036241531372, "step": 2987} {"train_info/time_between_train_steps": 0.003638029098510742, "step": 2987} {"info/global_step": 2988, "train_info/time_within_train_step": 2.522475004196167, "step": 2988} {"train_info/time_between_train_steps": 0.003480672836303711, "step": 2988} {"info/global_step": 2989, "train_info/time_within_train_step": 2.651033401489258, "step": 2989} {"train_info/time_between_train_steps": 0.0034942626953125, "step": 2989} {"info/global_step": 2990, "train_info/time_within_train_step": 2.522745370864868, "step": 2990} {"train_info/time_between_train_steps": 0.0036208629608154297, "step": 2990} {"info/global_step": 2991, "train_info/time_within_train_step": 2.5212337970733643, "step": 2991} {"train_info/time_between_train_steps": 0.003576040267944336, "step": 2991} {"info/global_step": 2992, "train_info/time_within_train_step": 2.5217366218566895, "step": 2992} {"train_info/time_between_train_steps": 0.0034694671630859375, "step": 2992} {"info/global_step": 2993, "train_info/time_within_train_step": 2.521775245666504, "step": 2993} {"train_info/time_between_train_steps": 0.003599882125854492, "step": 2993} {"info/global_step": 2994, "train_info/time_within_train_step": 2.521665334701538, "step": 2994} {"train_info/time_between_train_steps": 0.003664731979370117, "step": 2994} {"info/global_step": 2995, "train_info/time_within_train_step": 2.5226690769195557, "step": 2995} {"train_info/time_between_train_steps": 0.0037267208099365234, "step": 2995} {"info/global_step": 2996, "train_info/time_within_train_step": 2.521374464035034, "step": 2996} {"train_info/time_between_train_steps": 0.0036771297454833984, "step": 2996} {"info/global_step": 2997, "train_info/time_within_train_step": 2.526205062866211, "step": 2997} {"train_info/time_between_train_steps": 0.0035774707794189453, "step": 2997} {"info/global_step": 2998, "train_info/time_within_train_step": 2.5221195220947266, "step": 2998} {"train_info/time_between_train_steps": 0.0035216808319091797, "step": 2998} {"info/global_step": 2999, "train_info/time_within_train_step": 3.031888246536255, "step": 2999} {"train_info/time_between_train_steps": 0.003485441207885742, "step": 2999} {"info/global_step": 3000, "train_info/time_within_train_step": 2.5449326038360596, "step": 3000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746331101, "_runtime": 8149}, "step": 3000} {"logs": {"train/loss": 3.8506, "train/learning_rate": 0.0, "train/epoch": 3.11, "_timestamp": 1746331101, "_runtime": 8149}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746331107, "_runtime": 8155}, "step": 3000} {"logs": {"eval/loss": 4.426107406616211, "eval/runtime": 5.1464, "eval/samples_per_second": 38.862, "eval/steps_per_second": 1.36, "train/epoch": 3.11, "_timestamp": 1746331107, "_runtime": 8155}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746331107, "_runtime": 8155}, "step": 3000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.426107406616211, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 83.60534108414623, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1464, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 38.862, "train/epoch": 3.11, "_timestamp": 1746331107, "_runtime": 8155}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1564.4814453125, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746331119, "_runtime": 8167}, "step": 3000} {"logs": {"train/train_runtime": 8173.0194, "train/train_samples_per_second": 23.492, "train/train_steps_per_second": 0.367, "train/total_flos": 2.5093441585152e+16, "train/train_loss": 4.6363153120676674, "train/epoch": 3.11, "_timestamp": 1746331119, "_runtime": 8167}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1564.48046875, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746331128, "_runtime": 8176}, "step": 3000} {"logs": {"eval/loss": 4.426107406616211, "eval/runtime": 4.6837, "eval/samples_per_second": 42.702, "eval/steps_per_second": 1.495, "train/epoch": 3.11, "_timestamp": 1746331128, "_runtime": 8176}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1564.48046875, "train_info/memory_max_allocated": 4880.08447265625, "train_info/memory_reserved": 7664.0, "train_info/memory_max_reserved": 7664.0, "_timestamp": 1746331128, "_runtime": 8176}, "step": 3000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.426107406616211, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 83.60534108414623, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.6837, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 42.702, "train/epoch": 3.11, "_timestamp": 1746331128, "_runtime": 8176}, "step": 3000}