{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0} {"train_info/time_between_train_steps": 3.7880611419677734, "step": 0} {"info/global_step": 1, "train_info/time_within_train_step": 28.245509386062622, "step": 1} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1740824103, "_runtime": 52}, "step": 1} {"logs": {"train/loss": 11.0218, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1740824103, "_runtime": 52}, "step": 1} {"train_info/time_between_train_steps": 0.026770353317260742, "step": 1} {"info/global_step": 2, "train_info/time_within_train_step": 27.87890863418579, "step": 2} {"train_info/time_between_train_steps": 0.005446434020996094, "step": 2} {"info/global_step": 3, "train_info/time_within_train_step": 27.714547395706177, "step": 3} {"train_info/time_between_train_steps": 0.005309581756591797, "step": 3} {"info/global_step": 4, "train_info/time_within_train_step": 27.873948097229004, "step": 4} {"train_info/time_between_train_steps": 0.0055294036865234375, "step": 4} {"info/global_step": 5, "train_info/time_within_train_step": 27.747509241104126, "step": 5} {"train_info/time_between_train_steps": 0.0058400630950927734, "step": 5} {"info/global_step": 6, "train_info/time_within_train_step": 27.868066549301147, "step": 6} {"train_info/time_between_train_steps": 0.005422353744506836, "step": 6} {"info/global_step": 7, "train_info/time_within_train_step": 27.72815752029419, "step": 7} {"train_info/time_between_train_steps": 0.006606101989746094, "step": 7} {"info/global_step": 8, "train_info/time_within_train_step": 27.752501487731934, "step": 8} {"train_info/time_between_train_steps": 0.005498409271240234, "step": 8} {"info/global_step": 9, "train_info/time_within_train_step": 27.771718978881836, "step": 9} {"train_info/time_between_train_steps": 0.005301237106323242, "step": 9} {"info/global_step": 10, "train_info/time_within_train_step": 27.69246006011963, "step": 10} {"train_info/time_between_train_steps": 0.005982875823974609, "step": 10} {"info/global_step": 11, "train_info/time_within_train_step": 27.705485820770264, "step": 11} {"train_info/time_between_train_steps": 0.006503582000732422, "step": 11} {"info/global_step": 12, "train_info/time_within_train_step": 27.706249952316284, "step": 12} {"train_info/time_between_train_steps": 0.005203962326049805, "step": 12} {"info/global_step": 13, "train_info/time_within_train_step": 27.734382390975952, "step": 13} {"train_info/time_between_train_steps": 0.006273031234741211, "step": 13} {"info/global_step": 14, "train_info/time_within_train_step": 27.726340532302856, "step": 14} {"train_info/time_between_train_steps": 0.005394935607910156, "step": 14} {"info/global_step": 15, "train_info/time_within_train_step": 27.75440740585327, "step": 15} {"train_info/time_between_train_steps": 0.005065202713012695, "step": 15} {"info/global_step": 16, "train_info/time_within_train_step": 27.809078216552734, "step": 16} {"train_info/time_between_train_steps": 0.0055561065673828125, "step": 16} {"info/global_step": 17, "train_info/time_within_train_step": 27.74449610710144, "step": 17} {"train_info/time_between_train_steps": 0.011729717254638672, "step": 17} {"info/global_step": 18, "train_info/time_within_train_step": 27.704740047454834, "step": 18} {"train_info/time_between_train_steps": 0.005122184753417969, "step": 18} {"info/global_step": 19, "train_info/time_within_train_step": 27.701870679855347, "step": 19} {"train_info/time_between_train_steps": 0.005314350128173828, "step": 19} {"info/global_step": 20, "train_info/time_within_train_step": 27.705451250076294, "step": 20} {"train_info/time_between_train_steps": 0.00513768196105957, "step": 20} {"info/global_step": 21, "train_info/time_within_train_step": 27.701735496520996, "step": 21} {"train_info/time_between_train_steps": 0.005435943603515625, "step": 21} {"info/global_step": 22, "train_info/time_within_train_step": 27.733572959899902, "step": 22} {"train_info/time_between_train_steps": 0.005304098129272461, "step": 22} {"info/global_step": 23, "train_info/time_within_train_step": 27.71440815925598, "step": 23} {"train_info/time_between_train_steps": 0.005193948745727539, "step": 23} {"info/global_step": 24, "train_info/time_within_train_step": 27.756873846054077, "step": 24} {"train_info/time_between_train_steps": 0.005127906799316406, "step": 24} {"info/global_step": 25, "train_info/time_within_train_step": 27.71349811553955, "step": 25} {"train_info/time_between_train_steps": 0.005140781402587891, "step": 25} {"info/global_step": 26, "train_info/time_within_train_step": 27.713382720947266, "step": 26} {"train_info/time_between_train_steps": 0.005600452423095703, "step": 26} {"info/global_step": 27, "train_info/time_within_train_step": 27.714730739593506, "step": 27} {"train_info/time_between_train_steps": 0.005333900451660156, "step": 27} {"train_info/time_between_train_steps": 29.786367416381836, "step": 27} {"info/global_step": 28, "train_info/time_within_train_step": 27.70686984062195, "step": 28} {"train_info/time_between_train_steps": 0.005510091781616211, "step": 28} {"info/global_step": 29, "train_info/time_within_train_step": 27.89784002304077, "step": 29} {"train_info/time_between_train_steps": 0.0059356689453125, "step": 29} {"info/global_step": 30, "train_info/time_within_train_step": 27.718737840652466, "step": 30} {"train_info/time_between_train_steps": 0.005293607711791992, "step": 30} {"info/global_step": 31, "train_info/time_within_train_step": 28.026788473129272, "step": 31} {"train_info/time_between_train_steps": 0.0055425167083740234, "step": 31} {"info/global_step": 32, "train_info/time_within_train_step": 27.74660015106201, "step": 32} {"train_info/time_between_train_steps": 0.005425453186035156, "step": 32} {"info/global_step": 33, "train_info/time_within_train_step": 27.89497995376587, "step": 33} {"train_info/time_between_train_steps": 0.0055332183837890625, "step": 33} {"info/global_step": 34, "train_info/time_within_train_step": 27.742093324661255, "step": 34} {"train_info/time_between_train_steps": 0.005185127258300781, "step": 34} {"info/global_step": 35, "train_info/time_within_train_step": 27.765562772750854, "step": 35} {"train_info/time_between_train_steps": 0.005435466766357422, "step": 35} {"info/global_step": 36, "train_info/time_within_train_step": 27.716415882110596, "step": 36} {"train_info/time_between_train_steps": 0.005165576934814453, "step": 36} {"info/global_step": 37, "train_info/time_within_train_step": 27.683839321136475, "step": 37} {"train_info/time_between_train_steps": 0.005215167999267578, "step": 37} {"info/global_step": 38, "train_info/time_within_train_step": 27.72301173210144, "step": 38} {"train_info/time_between_train_steps": 0.005124568939208984, "step": 38} {"info/global_step": 39, "train_info/time_within_train_step": 27.701402187347412, "step": 39} {"train_info/time_between_train_steps": 0.0050923824310302734, "step": 39} {"info/global_step": 40, "train_info/time_within_train_step": 27.74090552330017, "step": 40} {"train_info/time_between_train_steps": 0.0051996707916259766, "step": 40} {"info/global_step": 41, "train_info/time_within_train_step": 27.718098402023315, "step": 41} {"train_info/time_between_train_steps": 0.0051898956298828125, "step": 41} {"info/global_step": 42, "train_info/time_within_train_step": 27.69398307800293, "step": 42} {"train_info/time_between_train_steps": 0.005246400833129883, "step": 42} {"info/global_step": 43, "train_info/time_within_train_step": 27.724716663360596, "step": 43} {"train_info/time_between_train_steps": 0.005392551422119141, "step": 43} {"info/global_step": 44, "train_info/time_within_train_step": 27.723763704299927, "step": 44} {"train_info/time_between_train_steps": 0.0053653717041015625, "step": 44} {"info/global_step": 45, "train_info/time_within_train_step": 27.714212894439697, "step": 45} {"train_info/time_between_train_steps": 0.0053253173828125, "step": 45} {"info/global_step": 46, "train_info/time_within_train_step": 27.803465843200684, "step": 46} {"train_info/time_between_train_steps": 0.005133152008056641, "step": 46} {"info/global_step": 47, "train_info/time_within_train_step": 27.701971292495728, "step": 47} {"train_info/time_between_train_steps": 0.005021095275878906, "step": 47} {"info/global_step": 48, "train_info/time_within_train_step": 27.688178539276123, "step": 48} {"train_info/time_between_train_steps": 0.005251884460449219, "step": 48} {"info/global_step": 49, "train_info/time_within_train_step": 27.703673601150513, "step": 49} {"train_info/time_between_train_steps": 0.005212068557739258, "step": 49} {"info/global_step": 50, "train_info/time_within_train_step": 27.70495319366455, "step": 50} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740825493, "_runtime": 1442}, "step": 50} {"logs": {"train/loss": 7.9982, "train/learning_rate": 0.00025, "train/epoch": 1.02, "_timestamp": 1740825493, "_runtime": 1442}, "step": 50} {"train_info/time_between_train_steps": 0.026431560516357422, "step": 50} {"info/global_step": 51, "train_info/time_within_train_step": 27.7627694606781, "step": 51} {"train_info/time_between_train_steps": 0.005071401596069336, "step": 51} {"info/global_step": 52, "train_info/time_within_train_step": 27.727630138397217, "step": 52} {"train_info/time_between_train_steps": 0.005377054214477539, "step": 52} {"info/global_step": 53, "train_info/time_within_train_step": 27.698277950286865, "step": 53} {"train_info/time_between_train_steps": 0.005599021911621094, "step": 53} {"info/global_step": 54, "train_info/time_within_train_step": 27.729766845703125, "step": 54} {"train_info/time_between_train_steps": 0.005549907684326172, "step": 54} {"train_info/time_between_train_steps": 29.669888496398926, "step": 54} {"info/global_step": 55, "train_info/time_within_train_step": 27.71361541748047, "step": 55} {"train_info/time_between_train_steps": 0.005017518997192383, "step": 55} {"info/global_step": 56, "train_info/time_within_train_step": 27.823082208633423, "step": 56} {"train_info/time_between_train_steps": 0.005087375640869141, "step": 56} {"info/global_step": 57, "train_info/time_within_train_step": 27.702436685562134, "step": 57} {"train_info/time_between_train_steps": 0.005762815475463867, "step": 57} {"info/global_step": 58, "train_info/time_within_train_step": 27.824201822280884, "step": 58} {"train_info/time_between_train_steps": 0.005498170852661133, "step": 58} {"info/global_step": 59, "train_info/time_within_train_step": 27.705023527145386, "step": 59} {"train_info/time_between_train_steps": 0.005738973617553711, "step": 59} {"info/global_step": 60, "train_info/time_within_train_step": 27.87265110015869, "step": 60} {"train_info/time_between_train_steps": 0.00543522834777832, "step": 60} {"info/global_step": 61, "train_info/time_within_train_step": 27.939080476760864, "step": 61} {"train_info/time_between_train_steps": 0.005414009094238281, "step": 61} {"info/global_step": 62, "train_info/time_within_train_step": 27.787308931350708, "step": 62} {"train_info/time_between_train_steps": 0.005358695983886719, "step": 62} {"info/global_step": 63, "train_info/time_within_train_step": 27.905927658081055, "step": 63} {"train_info/time_between_train_steps": 0.005109548568725586, "step": 63} {"info/global_step": 64, "train_info/time_within_train_step": 27.74005699157715, "step": 64} {"train_info/time_between_train_steps": 0.005379438400268555, "step": 64} {"info/global_step": 65, "train_info/time_within_train_step": 27.714900493621826, "step": 65} {"train_info/time_between_train_steps": 0.0051991939544677734, "step": 65} {"info/global_step": 66, "train_info/time_within_train_step": 27.688419818878174, "step": 66} {"train_info/time_between_train_steps": 0.005120515823364258, "step": 66} {"info/global_step": 67, "train_info/time_within_train_step": 27.680577278137207, "step": 67} {"train_info/time_between_train_steps": 0.005227327346801758, "step": 67} {"info/global_step": 68, "train_info/time_within_train_step": 27.681684970855713, "step": 68} {"train_info/time_between_train_steps": 0.005062103271484375, "step": 68} {"info/global_step": 69, "train_info/time_within_train_step": 27.70560359954834, "step": 69} {"train_info/time_between_train_steps": 0.005250692367553711, "step": 69} {"info/global_step": 70, "train_info/time_within_train_step": 27.698724269866943, "step": 70} {"train_info/time_between_train_steps": 0.005117177963256836, "step": 70} {"info/global_step": 71, "train_info/time_within_train_step": 27.695756196975708, "step": 71} {"train_info/time_between_train_steps": 0.005283832550048828, "step": 71} {"info/global_step": 72, "train_info/time_within_train_step": 27.713040351867676, "step": 72} {"train_info/time_between_train_steps": 0.005185127258300781, "step": 72} {"info/global_step": 73, "train_info/time_within_train_step": 27.68972420692444, "step": 73} {"train_info/time_between_train_steps": 0.005155086517333984, "step": 73} {"info/global_step": 74, "train_info/time_within_train_step": 27.687261819839478, "step": 74} {"train_info/time_between_train_steps": 0.005108833312988281, "step": 74} {"info/global_step": 75, "train_info/time_within_train_step": 27.681994438171387, "step": 75} {"train_info/time_between_train_steps": 0.005167484283447266, "step": 75} {"info/global_step": 76, "train_info/time_within_train_step": 27.74064826965332, "step": 76} {"train_info/time_between_train_steps": 0.005753993988037109, "step": 76} {"info/global_step": 77, "train_info/time_within_train_step": 27.817914724349976, "step": 77} {"train_info/time_between_train_steps": 0.011017084121704102, "step": 77} {"info/global_step": 78, "train_info/time_within_train_step": 27.699766874313354, "step": 78} {"train_info/time_between_train_steps": 0.0052030086517333984, "step": 78} {"info/global_step": 79, "train_info/time_within_train_step": 27.697784662246704, "step": 79} {"train_info/time_between_train_steps": 0.0052759647369384766, "step": 79} {"info/global_step": 80, "train_info/time_within_train_step": 27.706557989120483, "step": 80} {"train_info/time_between_train_steps": 0.005483150482177734, "step": 80} {"info/global_step": 81, "train_info/time_within_train_step": 27.737077713012695, "step": 81} {"train_info/time_between_train_steps": 0.00672459602355957, "step": 81} {"train_info/time_between_train_steps": 29.999504566192627, "step": 81} {"info/global_step": 82, "train_info/time_within_train_step": 27.693124771118164, "step": 82} {"train_info/time_between_train_steps": 0.0054988861083984375, "step": 82} {"info/global_step": 83, "train_info/time_within_train_step": 27.870315313339233, "step": 83} {"train_info/time_between_train_steps": 0.0053081512451171875, "step": 83} {"info/global_step": 84, "train_info/time_within_train_step": 27.695530891418457, "step": 84} {"train_info/time_between_train_steps": 0.005259990692138672, "step": 84} {"info/global_step": 85, "train_info/time_within_train_step": 27.857964754104614, "step": 85} {"train_info/time_between_train_steps": 0.00534367561340332, "step": 85} {"info/global_step": 86, "train_info/time_within_train_step": 27.69622230529785, "step": 86} {"train_info/time_between_train_steps": 0.005288600921630859, "step": 86} {"info/global_step": 87, "train_info/time_within_train_step": 27.861531972885132, "step": 87} {"train_info/time_between_train_steps": 0.005279064178466797, "step": 87} {"info/global_step": 88, "train_info/time_within_train_step": 27.752924919128418, "step": 88} {"train_info/time_between_train_steps": 0.005209684371948242, "step": 88} {"info/global_step": 89, "train_info/time_within_train_step": 27.75864267349243, "step": 89} {"train_info/time_between_train_steps": 0.005182743072509766, "step": 89} {"info/global_step": 90, "train_info/time_within_train_step": 27.713009357452393, "step": 90} {"train_info/time_between_train_steps": 0.005054950714111328, "step": 90} {"info/global_step": 91, "train_info/time_within_train_step": 27.80310606956482, "step": 91} {"train_info/time_between_train_steps": 0.004907369613647461, "step": 91} {"info/global_step": 92, "train_info/time_within_train_step": 27.732232332229614, "step": 92} {"train_info/time_between_train_steps": 0.0051991939544677734, "step": 92} {"info/global_step": 93, "train_info/time_within_train_step": 27.69894313812256, "step": 93} {"train_info/time_between_train_steps": 0.005001068115234375, "step": 93} {"info/global_step": 94, "train_info/time_within_train_step": 27.740082502365112, "step": 94} {"train_info/time_between_train_steps": 0.005225181579589844, "step": 94} {"info/global_step": 95, "train_info/time_within_train_step": 27.71693444252014, "step": 95} {"train_info/time_between_train_steps": 0.005131244659423828, "step": 95} {"info/global_step": 96, "train_info/time_within_train_step": 27.743969440460205, "step": 96} {"train_info/time_between_train_steps": 0.005102396011352539, "step": 96} {"info/global_step": 97, "train_info/time_within_train_step": 27.715368032455444, "step": 97} {"train_info/time_between_train_steps": 0.005327701568603516, "step": 97} {"info/global_step": 98, "train_info/time_within_train_step": 27.717996835708618, "step": 98} {"train_info/time_between_train_steps": 0.005067586898803711, "step": 98} {"info/global_step": 99, "train_info/time_within_train_step": 27.728034734725952, "step": 99} {"train_info/time_between_train_steps": 0.005372285842895508, "step": 99} {"info/global_step": 100, "train_info/time_within_train_step": 27.704466819763184, "step": 100} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740826942, "_runtime": 2891}, "step": 100} {"logs": {"train/loss": 5.8003, "train/learning_rate": 0.0005, "train/epoch": 3.02, "_timestamp": 1740826942, "_runtime": 2891}, "step": 100} {"train_info/time_between_train_steps": 73.18370079994202, "step": 100} {"info/global_step": 101, "train_info/time_within_train_step": 27.70071578025818, "step": 101} {"train_info/time_between_train_steps": 0.0050547122955322266, "step": 101} {"info/global_step": 102, "train_info/time_within_train_step": 27.704102993011475, "step": 102} {"train_info/time_between_train_steps": 0.005181312561035156, "step": 102} {"info/global_step": 103, "train_info/time_within_train_step": 27.687839031219482, "step": 103} {"train_info/time_between_train_steps": 0.005050182342529297, "step": 103} {"info/global_step": 104, "train_info/time_within_train_step": 27.69083285331726, "step": 104} {"train_info/time_between_train_steps": 0.005153179168701172, "step": 104} {"info/global_step": 105, "train_info/time_within_train_step": 27.684593200683594, "step": 105} {"train_info/time_between_train_steps": 0.0050051212310791016, "step": 105} {"info/global_step": 106, "train_info/time_within_train_step": 27.701864004135132, "step": 106} {"train_info/time_between_train_steps": 0.005112648010253906, "step": 106} {"info/global_step": 107, "train_info/time_within_train_step": 27.822410583496094, "step": 107} {"train_info/time_between_train_steps": 0.005424022674560547, "step": 107} {"info/global_step": 108, "train_info/time_within_train_step": 27.744323015213013, "step": 108} {"train_info/time_between_train_steps": 0.005571126937866211, "step": 108} {"train_info/time_between_train_steps": 29.649384021759033, "step": 108} {"info/global_step": 109, "train_info/time_within_train_step": 27.70844078063965, "step": 109} {"train_info/time_between_train_steps": 0.0049898624420166016, "step": 109} {"info/global_step": 110, "train_info/time_within_train_step": 27.83847403526306, "step": 110} {"train_info/time_between_train_steps": 0.005169391632080078, "step": 110} {"info/global_step": 111, "train_info/time_within_train_step": 27.718424797058105, "step": 111} {"train_info/time_between_train_steps": 0.006288051605224609, "step": 111} {"info/global_step": 112, "train_info/time_within_train_step": 27.86815881729126, "step": 112} {"train_info/time_between_train_steps": 0.006147623062133789, "step": 112} {"info/global_step": 113, "train_info/time_within_train_step": 27.709745407104492, "step": 113} {"train_info/time_between_train_steps": 0.0065190792083740234, "step": 113} {"info/global_step": 114, "train_info/time_within_train_step": 27.847676277160645, "step": 114} {"train_info/time_between_train_steps": 0.005347490310668945, "step": 114} {"info/global_step": 115, "train_info/time_within_train_step": 27.72253918647766, "step": 115} {"train_info/time_between_train_steps": 0.0054378509521484375, "step": 115} {"info/global_step": 116, "train_info/time_within_train_step": 27.778765201568604, "step": 116} {"train_info/time_between_train_steps": 0.005368232727050781, "step": 116} {"info/global_step": 117, "train_info/time_within_train_step": 27.698750734329224, "step": 117} {"train_info/time_between_train_steps": 0.00494384765625, "step": 117} {"info/global_step": 118, "train_info/time_within_train_step": 27.740641355514526, "step": 118} {"train_info/time_between_train_steps": 0.009716272354125977, "step": 118} {"info/global_step": 119, "train_info/time_within_train_step": 27.79171395301819, "step": 119} {"train_info/time_between_train_steps": 0.010639429092407227, "step": 119} {"info/global_step": 120, "train_info/time_within_train_step": 27.720006227493286, "step": 120} {"train_info/time_between_train_steps": 0.00573277473449707, "step": 120} {"info/global_step": 121, "train_info/time_within_train_step": 27.75653839111328, "step": 121} {"train_info/time_between_train_steps": 0.006563425064086914, "step": 121} {"info/global_step": 122, "train_info/time_within_train_step": 27.860503673553467, "step": 122} {"train_info/time_between_train_steps": 0.006151676177978516, "step": 122} {"info/global_step": 123, "train_info/time_within_train_step": 27.915786504745483, "step": 123} {"train_info/time_between_train_steps": 0.006303548812866211, "step": 123} {"info/global_step": 124, "train_info/time_within_train_step": 27.774923086166382, "step": 124} {"train_info/time_between_train_steps": 0.006476879119873047, "step": 124} {"info/global_step": 125, "train_info/time_within_train_step": 27.770323276519775, "step": 125} {"train_info/time_between_train_steps": 0.006311178207397461, "step": 125} {"info/global_step": 126, "train_info/time_within_train_step": 27.759220123291016, "step": 126} {"train_info/time_between_train_steps": 0.011489152908325195, "step": 126} {"info/global_step": 127, "train_info/time_within_train_step": 27.742541313171387, "step": 127} {"train_info/time_between_train_steps": 0.006157875061035156, "step": 127} {"info/global_step": 128, "train_info/time_within_train_step": 27.749855041503906, "step": 128} {"train_info/time_between_train_steps": 0.011115312576293945, "step": 128} {"info/global_step": 129, "train_info/time_within_train_step": 27.781652688980103, "step": 129} {"train_info/time_between_train_steps": 0.006207704544067383, "step": 129} {"info/global_step": 130, "train_info/time_within_train_step": 27.744268655776978, "step": 130} {"train_info/time_between_train_steps": 0.011104583740234375, "step": 130} {"info/global_step": 131, "train_info/time_within_train_step": 27.742699146270752, "step": 131} {"train_info/time_between_train_steps": 0.006204843521118164, "step": 131} {"info/global_step": 132, "train_info/time_within_train_step": 27.73805809020996, "step": 132} {"train_info/time_between_train_steps": 0.005957365036010742, "step": 132} {"info/global_step": 133, "train_info/time_within_train_step": 27.74616503715515, "step": 133} {"train_info/time_between_train_steps": 0.006145000457763672, "step": 133} {"info/global_step": 134, "train_info/time_within_train_step": 27.747852087020874, "step": 134} {"train_info/time_between_train_steps": 0.006326198577880859, "step": 134} {"info/global_step": 135, "train_info/time_within_train_step": 27.76485538482666, "step": 135} {"train_info/time_between_train_steps": 0.011858463287353516, "step": 135} {"train_info/time_between_train_steps": 30.023730516433716, "step": 135} {"info/global_step": 136, "train_info/time_within_train_step": 27.80540156364441, "step": 136} {"train_info/time_between_train_steps": 0.005544424057006836, "step": 136} {"info/global_step": 137, "train_info/time_within_train_step": 27.887460470199585, "step": 137} {"train_info/time_between_train_steps": 0.010448694229125977, "step": 137} {"info/global_step": 138, "train_info/time_within_train_step": 27.706188678741455, "step": 138} {"train_info/time_between_train_steps": 0.008067607879638672, "step": 138} {"info/global_step": 139, "train_info/time_within_train_step": 27.814921617507935, "step": 139} {"train_info/time_between_train_steps": 0.005296945571899414, "step": 139} {"info/global_step": 140, "train_info/time_within_train_step": 27.697428464889526, "step": 140} {"train_info/time_between_train_steps": 0.010326385498046875, "step": 140} {"info/global_step": 141, "train_info/time_within_train_step": 27.820491790771484, "step": 141} {"train_info/time_between_train_steps": 0.010231256484985352, "step": 141} {"info/global_step": 142, "train_info/time_within_train_step": 27.685983419418335, "step": 142} {"train_info/time_between_train_steps": 0.0052149295806884766, "step": 142} {"info/global_step": 143, "train_info/time_within_train_step": 27.77022075653076, "step": 143} {"train_info/time_between_train_steps": 0.005195140838623047, "step": 143} {"info/global_step": 144, "train_info/time_within_train_step": 27.701437950134277, "step": 144} {"train_info/time_between_train_steps": 0.0050733089447021484, "step": 144} {"info/global_step": 145, "train_info/time_within_train_step": 27.675015449523926, "step": 145} {"train_info/time_between_train_steps": 0.0049974918365478516, "step": 145} {"info/global_step": 146, "train_info/time_within_train_step": 27.73888850212097, "step": 146} {"train_info/time_between_train_steps": 0.005048036575317383, "step": 146} {"info/global_step": 147, "train_info/time_within_train_step": 27.68892240524292, "step": 147} {"train_info/time_between_train_steps": 0.005126953125, "step": 147} {"info/global_step": 148, "train_info/time_within_train_step": 27.738964796066284, "step": 148} {"train_info/time_between_train_steps": 0.005072593688964844, "step": 148} {"info/global_step": 149, "train_info/time_within_train_step": 27.82083797454834, "step": 149} {"train_info/time_between_train_steps": 0.00516510009765625, "step": 149} {"info/global_step": 150, "train_info/time_within_train_step": 27.738208055496216, "step": 150} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740828465, "_runtime": 4414}, "step": 150} {"logs": {"train/loss": 5.17, "train/learning_rate": 0.0005833333333333333, "train/epoch": 5.01, "_timestamp": 1740828465, "_runtime": 4414}, "step": 150} {"train_info/time_between_train_steps": 0.02614760398864746, "step": 150} {"info/global_step": 151, "train_info/time_within_train_step": 27.68132209777832, "step": 151} {"train_info/time_between_train_steps": 0.005135536193847656, "step": 151} {"info/global_step": 152, "train_info/time_within_train_step": 27.818657398223877, "step": 152} {"train_info/time_between_train_steps": 0.010589122772216797, "step": 152} {"info/global_step": 153, "train_info/time_within_train_step": 27.722400188446045, "step": 153} {"train_info/time_between_train_steps": 0.0053479671478271484, "step": 153} {"info/global_step": 154, "train_info/time_within_train_step": 27.69991970062256, "step": 154} {"train_info/time_between_train_steps": 0.005299091339111328, "step": 154} {"info/global_step": 155, "train_info/time_within_train_step": 27.694236040115356, "step": 155} {"train_info/time_between_train_steps": 0.005053997039794922, "step": 155} {"info/global_step": 156, "train_info/time_within_train_step": 27.691053867340088, "step": 156} {"train_info/time_between_train_steps": 0.005323886871337891, "step": 156} {"info/global_step": 157, "train_info/time_within_train_step": 27.72681498527527, "step": 157} {"train_info/time_between_train_steps": 0.005190610885620117, "step": 157} {"info/global_step": 158, "train_info/time_within_train_step": 27.73736310005188, "step": 158} {"train_info/time_between_train_steps": 0.005418539047241211, "step": 158} {"info/global_step": 159, "train_info/time_within_train_step": 28.796908617019653, "step": 159} {"train_info/time_between_train_steps": 0.005344867706298828, "step": 159} {"info/global_step": 160, "train_info/time_within_train_step": 27.70088291168213, "step": 160} {"train_info/time_between_train_steps": 0.00513148307800293, "step": 160} {"info/global_step": 161, "train_info/time_within_train_step": 27.737423419952393, "step": 161} {"train_info/time_between_train_steps": 0.005547046661376953, "step": 161} {"info/global_step": 162, "train_info/time_within_train_step": 27.718035221099854, "step": 162} {"train_info/time_between_train_steps": 0.0066585540771484375, "step": 162} {"train_info/time_between_train_steps": 30.146008014678955, "step": 162} {"info/global_step": 163, "train_info/time_within_train_step": 27.691269636154175, "step": 163} {"train_info/time_between_train_steps": 0.009775161743164062, "step": 163} {"info/global_step": 164, "train_info/time_within_train_step": 27.79708456993103, "step": 164} {"train_info/time_between_train_steps": 0.00982809066772461, "step": 164} {"info/global_step": 165, "train_info/time_within_train_step": 27.7124981880188, "step": 165} {"train_info/time_between_train_steps": 0.010118961334228516, "step": 165} {"info/global_step": 166, "train_info/time_within_train_step": 27.86442995071411, "step": 166} {"train_info/time_between_train_steps": 0.005469083786010742, "step": 166} {"info/global_step": 167, "train_info/time_within_train_step": 27.796879529953003, "step": 167} {"train_info/time_between_train_steps": 0.005290031433105469, "step": 167} {"info/global_step": 168, "train_info/time_within_train_step": 27.87415337562561, "step": 168} {"train_info/time_between_train_steps": 0.005539417266845703, "step": 168} {"info/global_step": 169, "train_info/time_within_train_step": 27.772125720977783, "step": 169} {"train_info/time_between_train_steps": 0.005262613296508789, "step": 169} {"info/global_step": 170, "train_info/time_within_train_step": 27.792458534240723, "step": 170} {"train_info/time_between_train_steps": 0.0053174495697021484, "step": 170} {"info/global_step": 171, "train_info/time_within_train_step": 27.729955434799194, "step": 171} {"train_info/time_between_train_steps": 0.005135297775268555, "step": 171} {"info/global_step": 172, "train_info/time_within_train_step": 27.682992458343506, "step": 172} {"train_info/time_between_train_steps": 0.005150794982910156, "step": 172} {"info/global_step": 173, "train_info/time_within_train_step": 27.70274257659912, "step": 173} {"train_info/time_between_train_steps": 0.005312442779541016, "step": 173} {"info/global_step": 174, "train_info/time_within_train_step": 27.6839861869812, "step": 174} {"train_info/time_between_train_steps": 0.004984617233276367, "step": 174} {"info/global_step": 175, "train_info/time_within_train_step": 27.68492579460144, "step": 175} {"train_info/time_between_train_steps": 0.005352497100830078, "step": 175} {"info/global_step": 176, "train_info/time_within_train_step": 27.682879209518433, "step": 176} {"train_info/time_between_train_steps": 0.0051381587982177734, "step": 176} {"info/global_step": 177, "train_info/time_within_train_step": 27.690643072128296, "step": 177} {"train_info/time_between_train_steps": 0.005058765411376953, "step": 177} {"info/global_step": 178, "train_info/time_within_train_step": 27.70091676712036, "step": 178} {"train_info/time_between_train_steps": 0.005292654037475586, "step": 178} {"info/global_step": 179, "train_info/time_within_train_step": 27.700216054916382, "step": 179} {"train_info/time_between_train_steps": 0.005173444747924805, "step": 179} {"info/global_step": 180, "train_info/time_within_train_step": 27.686551332473755, "step": 180} {"train_info/time_between_train_steps": 0.005277156829833984, "step": 180} {"info/global_step": 181, "train_info/time_within_train_step": 27.723023414611816, "step": 181} {"train_info/time_between_train_steps": 0.0051898956298828125, "step": 181} {"info/global_step": 182, "train_info/time_within_train_step": 27.78919553756714, "step": 182} {"train_info/time_between_train_steps": 0.005093812942504883, "step": 182} {"info/global_step": 183, "train_info/time_within_train_step": 27.707981824874878, "step": 183} {"train_info/time_between_train_steps": 0.0053501129150390625, "step": 183} {"info/global_step": 184, "train_info/time_within_train_step": 27.712560176849365, "step": 184} {"train_info/time_between_train_steps": 0.009626150131225586, "step": 184} {"info/global_step": 185, "train_info/time_within_train_step": 27.69282865524292, "step": 185} {"train_info/time_between_train_steps": 0.010521888732910156, "step": 185} {"info/global_step": 186, "train_info/time_within_train_step": 27.744566679000854, "step": 186} {"train_info/time_between_train_steps": 0.010106325149536133, "step": 186} {"info/global_step": 187, "train_info/time_within_train_step": 27.683058977127075, "step": 187} {"train_info/time_between_train_steps": 0.010000467300415039, "step": 187} {"info/global_step": 188, "train_info/time_within_train_step": 27.705600023269653, "step": 188} {"train_info/time_between_train_steps": 0.010479211807250977, "step": 188} {"info/global_step": 189, "train_info/time_within_train_step": 27.70455288887024, "step": 189} {"train_info/time_between_train_steps": 0.005850791931152344, "step": 189} {"train_info/time_between_train_steps": 29.765056610107422, "step": 189} {"info/global_step": 190, "train_info/time_within_train_step": 27.69384789466858, "step": 190} {"train_info/time_between_train_steps": 0.005122661590576172, "step": 190} {"info/global_step": 191, "train_info/time_within_train_step": 27.852377891540527, "step": 191} {"train_info/time_between_train_steps": 0.006392002105712891, "step": 191} {"info/global_step": 192, "train_info/time_within_train_step": 27.702239274978638, "step": 192} {"train_info/time_between_train_steps": 0.0054666996002197266, "step": 192} {"info/global_step": 193, "train_info/time_within_train_step": 27.823495149612427, "step": 193} {"train_info/time_between_train_steps": 0.005356788635253906, "step": 193} {"info/global_step": 194, "train_info/time_within_train_step": 27.693451404571533, "step": 194} {"train_info/time_between_train_steps": 0.005388498306274414, "step": 194} {"info/global_step": 195, "train_info/time_within_train_step": 27.867023229599, "step": 195} {"train_info/time_between_train_steps": 0.005517721176147461, "step": 195} {"info/global_step": 196, "train_info/time_within_train_step": 27.70014214515686, "step": 196} {"train_info/time_between_train_steps": 0.005280971527099609, "step": 196} {"info/global_step": 197, "train_info/time_within_train_step": 27.886200666427612, "step": 197} {"train_info/time_between_train_steps": 0.006073951721191406, "step": 197} {"info/global_step": 198, "train_info/time_within_train_step": 27.691112518310547, "step": 198} {"train_info/time_between_train_steps": 0.004974365234375, "step": 198} {"info/global_step": 199, "train_info/time_within_train_step": 27.677524089813232, "step": 199} {"train_info/time_between_train_steps": 0.0051081180572509766, "step": 199} {"info/global_step": 200, "train_info/time_within_train_step": 27.685187816619873, "step": 200} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740829914, "_runtime": 5863}, "step": 200} {"logs": {"train/loss": 4.9158, "train/learning_rate": 0.0005555555555555556, "train/epoch": 7.01, "_timestamp": 1740829914, "_runtime": 5863}, "step": 200} {"train_info/time_between_train_steps": 68.65972971916199, "step": 200} {"info/global_step": 201, "train_info/time_within_train_step": 27.690451860427856, "step": 201} {"train_info/time_between_train_steps": 0.005060434341430664, "step": 201} {"info/global_step": 202, "train_info/time_within_train_step": 27.70335078239441, "step": 202} {"train_info/time_between_train_steps": 0.005304813385009766, "step": 202} {"info/global_step": 203, "train_info/time_within_train_step": 27.68970012664795, "step": 203} {"train_info/time_between_train_steps": 0.00506901741027832, "step": 203} {"info/global_step": 204, "train_info/time_within_train_step": 27.706671237945557, "step": 204} {"train_info/time_between_train_steps": 0.005129337310791016, "step": 204} {"info/global_step": 205, "train_info/time_within_train_step": 27.731332063674927, "step": 205} {"train_info/time_between_train_steps": 0.00535893440246582, "step": 205} {"info/global_step": 206, "train_info/time_within_train_step": 27.77019691467285, "step": 206} {"train_info/time_between_train_steps": 0.00987100601196289, "step": 206} {"info/global_step": 207, "train_info/time_within_train_step": 27.700847148895264, "step": 207} {"train_info/time_between_train_steps": 0.0052220821380615234, "step": 207} {"info/global_step": 208, "train_info/time_within_train_step": 27.733834266662598, "step": 208} {"train_info/time_between_train_steps": 0.0052220821380615234, "step": 208} {"info/global_step": 209, "train_info/time_within_train_step": 27.68312120437622, "step": 209} {"train_info/time_between_train_steps": 0.005187273025512695, "step": 209} {"info/global_step": 210, "train_info/time_within_train_step": 27.69752073287964, "step": 210} {"train_info/time_between_train_steps": 0.005288600921630859, "step": 210} {"info/global_step": 211, "train_info/time_within_train_step": 27.694874048233032, "step": 211} {"train_info/time_between_train_steps": 0.005369901657104492, "step": 211} {"info/global_step": 212, "train_info/time_within_train_step": 27.697333335876465, "step": 212} {"train_info/time_between_train_steps": 0.005258321762084961, "step": 212} {"info/global_step": 213, "train_info/time_within_train_step": 27.79727029800415, "step": 213} {"train_info/time_between_train_steps": 0.00532841682434082, "step": 213} {"info/global_step": 214, "train_info/time_within_train_step": 27.6985981464386, "step": 214} {"train_info/time_between_train_steps": 0.005286693572998047, "step": 214} {"info/global_step": 215, "train_info/time_within_train_step": 27.710121631622314, "step": 215} {"train_info/time_between_train_steps": 0.005738496780395508, "step": 215} {"info/global_step": 216, "train_info/time_within_train_step": 27.706376552581787, "step": 216} {"train_info/time_between_train_steps": 0.005585432052612305, "step": 216} {"train_info/time_between_train_steps": 29.84687614440918, "step": 216} {"info/global_step": 217, "train_info/time_within_train_step": 27.700008153915405, "step": 217} {"train_info/time_between_train_steps": 0.004994869232177734, "step": 217} {"info/global_step": 218, "train_info/time_within_train_step": 27.80018639564514, "step": 218} {"train_info/time_between_train_steps": 0.004944562911987305, "step": 218} {"info/global_step": 219, "train_info/time_within_train_step": 27.687668085098267, "step": 219} {"train_info/time_between_train_steps": 0.009992361068725586, "step": 219} {"info/global_step": 220, "train_info/time_within_train_step": 27.837613582611084, "step": 220} {"train_info/time_between_train_steps": 0.010288476943969727, "step": 220} {"info/global_step": 221, "train_info/time_within_train_step": 27.731398105621338, "step": 221} {"train_info/time_between_train_steps": 0.009811162948608398, "step": 221} {"info/global_step": 222, "train_info/time_within_train_step": 27.889615297317505, "step": 222} {"train_info/time_between_train_steps": 0.005448341369628906, "step": 222} {"info/global_step": 223, "train_info/time_within_train_step": 27.70195746421814, "step": 223} {"train_info/time_between_train_steps": 0.0052547454833984375, "step": 223} {"info/global_step": 224, "train_info/time_within_train_step": 27.830727338790894, "step": 224} {"train_info/time_between_train_steps": 0.005397319793701172, "step": 224} {"info/global_step": 225, "train_info/time_within_train_step": 27.706448078155518, "step": 225} {"train_info/time_between_train_steps": 0.0050852298736572266, "step": 225} {"info/global_step": 226, "train_info/time_within_train_step": 27.680111169815063, "step": 226} {"train_info/time_between_train_steps": 0.004983663558959961, "step": 226} {"info/global_step": 227, "train_info/time_within_train_step": 27.792027711868286, "step": 227} {"train_info/time_between_train_steps": 0.00510096549987793, "step": 227} {"info/global_step": 228, "train_info/time_within_train_step": 27.681824445724487, "step": 228} {"train_info/time_between_train_steps": 0.009984493255615234, "step": 228} {"info/global_step": 229, "train_info/time_within_train_step": 27.690601348876953, "step": 229} {"train_info/time_between_train_steps": 0.00533604621887207, "step": 229} {"info/global_step": 230, "train_info/time_within_train_step": 27.680262327194214, "step": 230} {"train_info/time_between_train_steps": 0.005041599273681641, "step": 230} {"info/global_step": 231, "train_info/time_within_train_step": 27.689854621887207, "step": 231} {"train_info/time_between_train_steps": 0.005084514617919922, "step": 231} {"info/global_step": 232, "train_info/time_within_train_step": 27.695849418640137, "step": 232} {"train_info/time_between_train_steps": 0.005303144454956055, "step": 232} {"info/global_step": 233, "train_info/time_within_train_step": 27.747002124786377, "step": 233} {"train_info/time_between_train_steps": 0.0051021575927734375, "step": 233} {"info/global_step": 234, "train_info/time_within_train_step": 27.70759344100952, "step": 234} {"train_info/time_between_train_steps": 0.005190372467041016, "step": 234} {"info/global_step": 235, "train_info/time_within_train_step": 27.739644050598145, "step": 235} {"train_info/time_between_train_steps": 0.00521397590637207, "step": 235} {"info/global_step": 236, "train_info/time_within_train_step": 27.684016704559326, "step": 236} {"train_info/time_between_train_steps": 0.005043506622314453, "step": 236} {"info/global_step": 237, "train_info/time_within_train_step": 27.690277099609375, "step": 237} {"train_info/time_between_train_steps": 0.01017141342163086, "step": 237} {"info/global_step": 238, "train_info/time_within_train_step": 27.69309973716736, "step": 238} {"train_info/time_between_train_steps": 0.005242347717285156, "step": 238} {"info/global_step": 239, "train_info/time_within_train_step": 27.695059299468994, "step": 239} {"train_info/time_between_train_steps": 0.00515294075012207, "step": 239} {"info/global_step": 240, "train_info/time_within_train_step": 27.707957983016968, "step": 240} {"train_info/time_between_train_steps": 0.005288839340209961, "step": 240} {"info/global_step": 241, "train_info/time_within_train_step": 27.69513201713562, "step": 241} {"train_info/time_between_train_steps": 0.005203723907470703, "step": 241} {"info/global_step": 242, "train_info/time_within_train_step": 27.752567291259766, "step": 242} {"train_info/time_between_train_steps": 0.0053021907806396484, "step": 242} {"info/global_step": 243, "train_info/time_within_train_step": 27.82372260093689, "step": 243} {"train_info/time_between_train_steps": 0.005800724029541016, "step": 243} {"train_info/time_between_train_steps": 30.004590272903442, "step": 243} {"info/global_step": 244, "train_info/time_within_train_step": 27.690030097961426, "step": 244} {"train_info/time_between_train_steps": 0.009923219680786133, "step": 244} {"info/global_step": 245, "train_info/time_within_train_step": 27.835737466812134, "step": 245} {"train_info/time_between_train_steps": 0.010064125061035156, "step": 245} {"info/global_step": 246, "train_info/time_within_train_step": 27.697606563568115, "step": 246} {"train_info/time_between_train_steps": 0.010331869125366211, "step": 246} {"info/global_step": 247, "train_info/time_within_train_step": 27.81367039680481, "step": 247} {"train_info/time_between_train_steps": 0.005342960357666016, "step": 247} {"info/global_step": 248, "train_info/time_within_train_step": 27.70019817352295, "step": 248} {"train_info/time_between_train_steps": 0.005235910415649414, "step": 248} {"info/global_step": 249, "train_info/time_within_train_step": 27.88652467727661, "step": 249} {"train_info/time_between_train_steps": 0.005324840545654297, "step": 249} {"info/global_step": 250, "train_info/time_within_train_step": 27.71311044692993, "step": 250} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740831430, "_runtime": 7379}, "step": 250} {"logs": {"train/loss": 4.7809, "train/learning_rate": 0.0005277777777777777, "train/epoch": 9.01, "_timestamp": 1740831430, "_runtime": 7379}, "step": 250} {"train_info/time_between_train_steps": 0.02584981918334961, "step": 250} {"info/global_step": 251, "train_info/time_within_train_step": 27.768550872802734, "step": 251} {"train_info/time_between_train_steps": 0.005216121673583984, "step": 251} {"info/global_step": 252, "train_info/time_within_train_step": 27.718239545822144, "step": 252} {"train_info/time_between_train_steps": 0.005140542984008789, "step": 252} {"info/global_step": 253, "train_info/time_within_train_step": 27.957794189453125, "step": 253} {"train_info/time_between_train_steps": 0.0055997371673583984, "step": 253} {"info/global_step": 254, "train_info/time_within_train_step": 29.324788808822632, "step": 254} {"train_info/time_between_train_steps": 0.009539365768432617, "step": 254} {"info/global_step": 255, "train_info/time_within_train_step": 27.686142444610596, "step": 255} {"train_info/time_between_train_steps": 0.009871959686279297, "step": 255} {"info/global_step": 256, "train_info/time_within_train_step": 27.707345724105835, "step": 256} {"train_info/time_between_train_steps": 0.0101318359375, "step": 256} {"info/global_step": 257, "train_info/time_within_train_step": 27.684229612350464, "step": 257} {"train_info/time_between_train_steps": 0.004990339279174805, "step": 257} {"info/global_step": 258, "train_info/time_within_train_step": 27.822718381881714, "step": 258} {"train_info/time_between_train_steps": 0.005110263824462891, "step": 258} {"info/global_step": 259, "train_info/time_within_train_step": 27.706258296966553, "step": 259} {"train_info/time_between_train_steps": 0.008712291717529297, "step": 259} {"info/global_step": 260, "train_info/time_within_train_step": 27.748253107070923, "step": 260} {"train_info/time_between_train_steps": 0.005133390426635742, "step": 260} {"info/global_step": 261, "train_info/time_within_train_step": 27.686441898345947, "step": 261} {"train_info/time_between_train_steps": 0.0050580501556396484, "step": 261} {"info/global_step": 262, "train_info/time_within_train_step": 27.73181176185608, "step": 262} {"train_info/time_between_train_steps": 0.005734920501708984, "step": 262} {"info/global_step": 263, "train_info/time_within_train_step": 27.6821072101593, "step": 263} {"train_info/time_between_train_steps": 0.005005359649658203, "step": 263} {"info/global_step": 264, "train_info/time_within_train_step": 27.725099325180054, "step": 264} {"train_info/time_between_train_steps": 0.005166292190551758, "step": 264} {"info/global_step": 265, "train_info/time_within_train_step": 27.691503286361694, "step": 265} {"train_info/time_between_train_steps": 0.0052411556243896484, "step": 265} {"info/global_step": 266, "train_info/time_within_train_step": 27.688347339630127, "step": 266} {"train_info/time_between_train_steps": 0.005199432373046875, "step": 266} {"info/global_step": 267, "train_info/time_within_train_step": 27.68877124786377, "step": 267} {"train_info/time_between_train_steps": 0.005328655242919922, "step": 267} {"info/global_step": 268, "train_info/time_within_train_step": 27.701383352279663, "step": 268} {"train_info/time_between_train_steps": 0.005228281021118164, "step": 268} {"info/global_step": 269, "train_info/time_within_train_step": 27.719315767288208, "step": 269} {"train_info/time_between_train_steps": 0.005315542221069336, "step": 269} {"info/global_step": 270, "train_info/time_within_train_step": 27.72285032272339, "step": 270} {"train_info/time_between_train_steps": 0.0058612823486328125, "step": 270} {"train_info/time_between_train_steps": 29.74225878715515, "step": 270} {"info/global_step": 271, "train_info/time_within_train_step": 27.699797868728638, "step": 271} {"train_info/time_between_train_steps": 0.004974842071533203, "step": 271} {"info/global_step": 272, "train_info/time_within_train_step": 27.974323987960815, "step": 272} {"train_info/time_between_train_steps": 0.005283832550048828, "step": 272} {"info/global_step": 273, "train_info/time_within_train_step": 27.71097707748413, "step": 273} {"train_info/time_between_train_steps": 0.005384206771850586, "step": 273} {"info/global_step": 274, "train_info/time_within_train_step": 27.852763891220093, "step": 274} {"train_info/time_between_train_steps": 0.005238056182861328, "step": 274} {"info/global_step": 275, "train_info/time_within_train_step": 27.69466280937195, "step": 275} {"train_info/time_between_train_steps": 0.005295515060424805, "step": 275} {"info/global_step": 276, "train_info/time_within_train_step": 27.86263680458069, "step": 276} {"train_info/time_between_train_steps": 0.0054552555084228516, "step": 276} {"info/global_step": 277, "train_info/time_within_train_step": 27.71383500099182, "step": 277} {"train_info/time_between_train_steps": 0.005296230316162109, "step": 277} {"info/global_step": 278, "train_info/time_within_train_step": 27.773378610610962, "step": 278} {"train_info/time_between_train_steps": 0.005466938018798828, "step": 278} {"info/global_step": 279, "train_info/time_within_train_step": 27.720260620117188, "step": 279} {"train_info/time_between_train_steps": 0.0051517486572265625, "step": 279} {"info/global_step": 280, "train_info/time_within_train_step": 27.68303108215332, "step": 280} {"train_info/time_between_train_steps": 0.005066633224487305, "step": 280} {"info/global_step": 281, "train_info/time_within_train_step": 27.699601650238037, "step": 281} {"train_info/time_between_train_steps": 0.005049228668212891, "step": 281} {"info/global_step": 282, "train_info/time_within_train_step": 27.687711477279663, "step": 282} {"train_info/time_between_train_steps": 0.005125999450683594, "step": 282} {"info/global_step": 283, "train_info/time_within_train_step": 27.739423513412476, "step": 283} {"train_info/time_between_train_steps": 0.005048274993896484, "step": 283} {"info/global_step": 284, "train_info/time_within_train_step": 27.696190118789673, "step": 284} {"train_info/time_between_train_steps": 0.005054473876953125, "step": 284} {"info/global_step": 285, "train_info/time_within_train_step": 27.7551748752594, "step": 285} {"train_info/time_between_train_steps": 0.004928112030029297, "step": 285} {"info/global_step": 286, "train_info/time_within_train_step": 27.709315061569214, "step": 286} {"train_info/time_between_train_steps": 0.0049762725830078125, "step": 286} {"info/global_step": 287, "train_info/time_within_train_step": 27.74649953842163, "step": 287} {"train_info/time_between_train_steps": 0.005185127258300781, "step": 287} {"info/global_step": 288, "train_info/time_within_train_step": 27.7759530544281, "step": 288} {"train_info/time_between_train_steps": 0.004976987838745117, "step": 288} {"info/global_step": 289, "train_info/time_within_train_step": 27.77699589729309, "step": 289} {"train_info/time_between_train_steps": 0.0052242279052734375, "step": 289} {"info/global_step": 290, "train_info/time_within_train_step": 27.66975450515747, "step": 290} {"train_info/time_between_train_steps": 0.004957675933837891, "step": 290} {"info/global_step": 291, "train_info/time_within_train_step": 27.696810007095337, "step": 291} {"train_info/time_between_train_steps": 0.0049936771392822266, "step": 291} {"info/global_step": 292, "train_info/time_within_train_step": 27.689391613006592, "step": 292} {"train_info/time_between_train_steps": 0.00511479377746582, "step": 292} {"info/global_step": 293, "train_info/time_within_train_step": 27.68093466758728, "step": 293} {"train_info/time_between_train_steps": 0.005021572113037109, "step": 293} {"info/global_step": 294, "train_info/time_within_train_step": 27.686478853225708, "step": 294} {"train_info/time_between_train_steps": 0.0057065486907958984, "step": 294} {"info/global_step": 295, "train_info/time_within_train_step": 27.676884412765503, "step": 295} {"train_info/time_between_train_steps": 0.004882335662841797, "step": 295} {"info/global_step": 296, "train_info/time_within_train_step": 27.744085550308228, "step": 296} {"train_info/time_between_train_steps": 0.005126953125, "step": 296} {"info/global_step": 297, "train_info/time_within_train_step": 27.702570915222168, "step": 297} {"train_info/time_between_train_steps": 0.00536036491394043, "step": 297} {"train_info/time_between_train_steps": 29.789317846298218, "step": 297} {"info/global_step": 298, "train_info/time_within_train_step": 27.684459924697876, "step": 298} {"train_info/time_between_train_steps": 0.0048944950103759766, "step": 298} {"info/global_step": 299, "train_info/time_within_train_step": 27.833518505096436, "step": 299} {"train_info/time_between_train_steps": 0.0049974918365478516, "step": 299} {"info/global_step": 300, "train_info/time_within_train_step": 27.6945378780365, "step": 300} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740832880, "_runtime": 8829}, "step": 300} {"logs": {"train/loss": 4.6208, "train/learning_rate": 0.0005, "train/epoch": 11.0, "_timestamp": 1740832880, "_runtime": 8829}, "step": 300} {"train_info/time_between_train_steps": 65.89691710472107, "step": 300} {"info/global_step": 301, "train_info/time_within_train_step": 28.31470823287964, "step": 301} {"train_info/time_between_train_steps": 0.010166645050048828, "step": 301} {"info/global_step": 302, "train_info/time_within_train_step": 27.703016757965088, "step": 302} {"train_info/time_between_train_steps": 0.005416393280029297, "step": 302} {"info/global_step": 303, "train_info/time_within_train_step": 27.96810746192932, "step": 303} {"train_info/time_between_train_steps": 0.005486488342285156, "step": 303} {"info/global_step": 304, "train_info/time_within_train_step": 27.700064182281494, "step": 304} {"train_info/time_between_train_steps": 0.0052280426025390625, "step": 304} {"info/global_step": 305, "train_info/time_within_train_step": 27.81597661972046, "step": 305} {"train_info/time_between_train_steps": 0.00540614128112793, "step": 305} {"info/global_step": 306, "train_info/time_within_train_step": 27.68986177444458, "step": 306} {"train_info/time_between_train_steps": 0.004990577697753906, "step": 306} {"info/global_step": 307, "train_info/time_within_train_step": 27.671053409576416, "step": 307} {"train_info/time_between_train_steps": 0.004998922348022461, "step": 307} {"info/global_step": 308, "train_info/time_within_train_step": 27.699034214019775, "step": 308} {"train_info/time_between_train_steps": 0.005150794982910156, "step": 308} {"info/global_step": 309, "train_info/time_within_train_step": 27.68761134147644, "step": 309} {"train_info/time_between_train_steps": 0.0050122737884521484, "step": 309} {"info/global_step": 310, "train_info/time_within_train_step": 27.728851318359375, "step": 310} {"train_info/time_between_train_steps": 0.005139827728271484, "step": 310} {"info/global_step": 311, "train_info/time_within_train_step": 27.689040422439575, "step": 311} {"train_info/time_between_train_steps": 0.005077838897705078, "step": 311} {"info/global_step": 312, "train_info/time_within_train_step": 27.74622416496277, "step": 312} {"train_info/time_between_train_steps": 0.004988908767700195, "step": 312} {"info/global_step": 313, "train_info/time_within_train_step": 27.69682765007019, "step": 313} {"train_info/time_between_train_steps": 0.005201101303100586, "step": 313} {"info/global_step": 314, "train_info/time_within_train_step": 27.77381134033203, "step": 314} {"train_info/time_between_train_steps": 0.0049626827239990234, "step": 314} {"info/global_step": 315, "train_info/time_within_train_step": 27.68382692337036, "step": 315} {"train_info/time_between_train_steps": 0.010013341903686523, "step": 315} {"info/global_step": 316, "train_info/time_within_train_step": 28.080734729766846, "step": 316} {"train_info/time_between_train_steps": 0.014333486557006836, "step": 316} {"info/global_step": 317, "train_info/time_within_train_step": 27.81632661819458, "step": 317} {"train_info/time_between_train_steps": 0.005003929138183594, "step": 317} {"info/global_step": 318, "train_info/time_within_train_step": 27.82829475402832, "step": 318} {"train_info/time_between_train_steps": 0.014801025390625, "step": 318} {"info/global_step": 319, "train_info/time_within_train_step": 27.73217535018921, "step": 319} {"train_info/time_between_train_steps": 0.009831905364990234, "step": 319} {"info/global_step": 320, "train_info/time_within_train_step": 27.795313596725464, "step": 320} {"train_info/time_between_train_steps": 0.010039806365966797, "step": 320} {"info/global_step": 321, "train_info/time_within_train_step": 27.756673097610474, "step": 321} {"train_info/time_between_train_steps": 0.005138874053955078, "step": 321} {"info/global_step": 322, "train_info/time_within_train_step": 27.68706202507019, "step": 322} {"train_info/time_between_train_steps": 0.005056142807006836, "step": 322} {"info/global_step": 323, "train_info/time_within_train_step": 27.746856212615967, "step": 323} {"train_info/time_between_train_steps": 0.005658626556396484, "step": 323} {"info/global_step": 324, "train_info/time_within_train_step": 27.71417546272278, "step": 324} {"train_info/time_between_train_steps": 0.005705356597900391, "step": 324} {"train_info/time_between_train_steps": 29.95971655845642, "step": 324} {"info/global_step": 325, "train_info/time_within_train_step": 27.683840036392212, "step": 325} {"train_info/time_between_train_steps": 0.004889249801635742, "step": 325} {"info/global_step": 326, "train_info/time_within_train_step": 27.82358717918396, "step": 326} {"train_info/time_between_train_steps": 0.005277156829833984, "step": 326} {"info/global_step": 327, "train_info/time_within_train_step": 27.729092359542847, "step": 327} {"train_info/time_between_train_steps": 0.0061452388763427734, "step": 327} {"info/global_step": 328, "train_info/time_within_train_step": 27.825883626937866, "step": 328} {"train_info/time_between_train_steps": 0.0052947998046875, "step": 328} {"info/global_step": 329, "train_info/time_within_train_step": 27.68842363357544, "step": 329} {"train_info/time_between_train_steps": 0.005503654479980469, "step": 329} {"info/global_step": 330, "train_info/time_within_train_step": 27.88675880432129, "step": 330} {"train_info/time_between_train_steps": 0.005421161651611328, "step": 330} {"info/global_step": 331, "train_info/time_within_train_step": 27.687194108963013, "step": 331} {"train_info/time_between_train_steps": 0.00525975227355957, "step": 331} {"info/global_step": 332, "train_info/time_within_train_step": 27.814470529556274, "step": 332} {"train_info/time_between_train_steps": 0.005290031433105469, "step": 332} {"info/global_step": 333, "train_info/time_within_train_step": 27.794780015945435, "step": 333} {"train_info/time_between_train_steps": 0.005058765411376953, "step": 333} {"info/global_step": 334, "train_info/time_within_train_step": 27.686293363571167, "step": 334} {"train_info/time_between_train_steps": 0.0050656795501708984, "step": 334} {"info/global_step": 335, "train_info/time_within_train_step": 27.739587783813477, "step": 335} {"train_info/time_between_train_steps": 0.005070686340332031, "step": 335} {"info/global_step": 336, "train_info/time_within_train_step": 27.68271493911743, "step": 336} {"train_info/time_between_train_steps": 0.005087137222290039, "step": 336} {"info/global_step": 337, "train_info/time_within_train_step": 27.72687554359436, "step": 337} {"train_info/time_between_train_steps": 0.005151987075805664, "step": 337} {"info/global_step": 338, "train_info/time_within_train_step": 27.696459531784058, "step": 338} {"train_info/time_between_train_steps": 0.005015850067138672, "step": 338} {"info/global_step": 339, "train_info/time_within_train_step": 27.739161491394043, "step": 339} {"train_info/time_between_train_steps": 0.005136966705322266, "step": 339} {"info/global_step": 340, "train_info/time_within_train_step": 27.698787450790405, "step": 340} {"train_info/time_between_train_steps": 0.005093097686767578, "step": 340} {"info/global_step": 341, "train_info/time_within_train_step": 27.721898317337036, "step": 341} {"train_info/time_between_train_steps": 0.0051343441009521484, "step": 341} {"info/global_step": 342, "train_info/time_within_train_step": 27.677818775177002, "step": 342} {"train_info/time_between_train_steps": 0.005182981491088867, "step": 342} {"info/global_step": 343, "train_info/time_within_train_step": 27.718980312347412, "step": 343} {"train_info/time_between_train_steps": 0.005194187164306641, "step": 343} {"info/global_step": 344, "train_info/time_within_train_step": 27.698964834213257, "step": 344} {"train_info/time_between_train_steps": 0.005169391632080078, "step": 344} {"info/global_step": 345, "train_info/time_within_train_step": 27.683090925216675, "step": 345} {"train_info/time_between_train_steps": 0.005137205123901367, "step": 345} {"info/global_step": 346, "train_info/time_within_train_step": 27.682157039642334, "step": 346} {"train_info/time_between_train_steps": 0.005159616470336914, "step": 346} {"info/global_step": 347, "train_info/time_within_train_step": 27.68567419052124, "step": 347} {"train_info/time_between_train_steps": 0.005208492279052734, "step": 347} {"info/global_step": 348, "train_info/time_within_train_step": 27.780143976211548, "step": 348} {"train_info/time_between_train_steps": 0.010355472564697266, "step": 348} {"info/global_step": 349, "train_info/time_within_train_step": 27.722211122512817, "step": 349} {"train_info/time_between_train_steps": 0.0056040287017822266, "step": 349} {"info/global_step": 350, "train_info/time_within_train_step": 29.383646726608276, "step": 350} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740834368, "_runtime": 10317}, "step": 350} {"logs": {"train/loss": 4.3481, "train/learning_rate": 0.00047222222222222224, "train/epoch": 12.02, "_timestamp": 1740834368, "_runtime": 10317}, "step": 350} {"train_info/time_between_train_steps": 0.7293825149536133, "step": 350} {"info/global_step": 351, "train_info/time_within_train_step": 27.71374201774597, "step": 351} {"train_info/time_between_train_steps": 0.005836963653564453, "step": 351} {"train_info/time_between_train_steps": 30.10848879814148, "step": 351} {"info/global_step": 352, "train_info/time_within_train_step": 27.692814111709595, "step": 352} {"train_info/time_between_train_steps": 0.0050792694091796875, "step": 352} {"info/global_step": 353, "train_info/time_within_train_step": 27.843517780303955, "step": 353} {"train_info/time_between_train_steps": 0.0052645206451416016, "step": 353} {"info/global_step": 354, "train_info/time_within_train_step": 27.688941717147827, "step": 354} {"train_info/time_between_train_steps": 0.00531458854675293, "step": 354} {"info/global_step": 355, "train_info/time_within_train_step": 27.858290672302246, "step": 355} {"train_info/time_between_train_steps": 0.0052776336669921875, "step": 355} {"info/global_step": 356, "train_info/time_within_train_step": 27.70293617248535, "step": 356} {"train_info/time_between_train_steps": 0.005409955978393555, "step": 356} {"info/global_step": 357, "train_info/time_within_train_step": 27.815258741378784, "step": 357} {"train_info/time_between_train_steps": 0.005219459533691406, "step": 357} {"info/global_step": 358, "train_info/time_within_train_step": 27.68798303604126, "step": 358} {"train_info/time_between_train_steps": 0.005445718765258789, "step": 358} {"info/global_step": 359, "train_info/time_within_train_step": 27.771528720855713, "step": 359} {"train_info/time_between_train_steps": 0.005360603332519531, "step": 359} {"info/global_step": 360, "train_info/time_within_train_step": 27.696993112564087, "step": 360} {"train_info/time_between_train_steps": 0.0050313472747802734, "step": 360} {"info/global_step": 361, "train_info/time_within_train_step": 27.67265224456787, "step": 361} {"train_info/time_between_train_steps": 0.0050811767578125, "step": 361} {"info/global_step": 362, "train_info/time_within_train_step": 27.71242332458496, "step": 362} {"train_info/time_between_train_steps": 0.004982948303222656, "step": 362} {"info/global_step": 363, "train_info/time_within_train_step": 27.78746271133423, "step": 363} {"train_info/time_between_train_steps": 0.005163431167602539, "step": 363} {"info/global_step": 364, "train_info/time_within_train_step": 27.685216426849365, "step": 364} {"train_info/time_between_train_steps": 0.0049974918365478516, "step": 364} {"info/global_step": 365, "train_info/time_within_train_step": 27.699547052383423, "step": 365} {"train_info/time_between_train_steps": 0.005105257034301758, "step": 365} {"info/global_step": 366, "train_info/time_within_train_step": 27.679184913635254, "step": 366} {"train_info/time_between_train_steps": 0.005199909210205078, "step": 366} {"info/global_step": 367, "train_info/time_within_train_step": 27.686453342437744, "step": 367} {"train_info/time_between_train_steps": 0.005114078521728516, "step": 367} {"info/global_step": 368, "train_info/time_within_train_step": 27.691442489624023, "step": 368} {"train_info/time_between_train_steps": 0.005526304244995117, "step": 368} {"info/global_step": 369, "train_info/time_within_train_step": 27.687214136123657, "step": 369} {"train_info/time_between_train_steps": 0.005266427993774414, "step": 369} {"info/global_step": 370, "train_info/time_within_train_step": 27.733667135238647, "step": 370} {"train_info/time_between_train_steps": 0.005341053009033203, "step": 370} {"info/global_step": 371, "train_info/time_within_train_step": 27.71192479133606, "step": 371} {"train_info/time_between_train_steps": 0.005162715911865234, "step": 371} {"info/global_step": 372, "train_info/time_within_train_step": 27.678988218307495, "step": 372} {"train_info/time_between_train_steps": 0.005349874496459961, "step": 372} {"info/global_step": 373, "train_info/time_within_train_step": 27.689069509506226, "step": 373} {"train_info/time_between_train_steps": 0.005288124084472656, "step": 373} {"info/global_step": 374, "train_info/time_within_train_step": 27.694862365722656, "step": 374} {"train_info/time_between_train_steps": 0.005211830139160156, "step": 374} {"info/global_step": 375, "train_info/time_within_train_step": 27.749579429626465, "step": 375} {"train_info/time_between_train_steps": 0.005239248275756836, "step": 375} {"info/global_step": 376, "train_info/time_within_train_step": 27.689353942871094, "step": 376} {"train_info/time_between_train_steps": 0.005298614501953125, "step": 376} {"info/global_step": 377, "train_info/time_within_train_step": 27.692123651504517, "step": 377} {"train_info/time_between_train_steps": 0.006635904312133789, "step": 377} {"info/global_step": 378, "train_info/time_within_train_step": 27.70120668411255, "step": 378} {"train_info/time_between_train_steps": 0.005726814270019531, "step": 378} {"train_info/time_between_train_steps": 29.77442169189453, "step": 378} {"info/global_step": 379, "train_info/time_within_train_step": 27.694073915481567, "step": 379} {"train_info/time_between_train_steps": 0.005371570587158203, "step": 379} {"info/global_step": 380, "train_info/time_within_train_step": 27.83268141746521, "step": 380} {"train_info/time_between_train_steps": 0.005142927169799805, "step": 380} {"info/global_step": 381, "train_info/time_within_train_step": 27.689643383026123, "step": 381} {"train_info/time_between_train_steps": 0.006165027618408203, "step": 381} {"info/global_step": 382, "train_info/time_within_train_step": 27.888978242874146, "step": 382} {"train_info/time_between_train_steps": 0.005408048629760742, "step": 382} {"info/global_step": 383, "train_info/time_within_train_step": 27.694881200790405, "step": 383} {"train_info/time_between_train_steps": 0.005347490310668945, "step": 383} {"info/global_step": 384, "train_info/time_within_train_step": 28.00465154647827, "step": 384} {"train_info/time_between_train_steps": 0.005627632141113281, "step": 384} {"info/global_step": 385, "train_info/time_within_train_step": 27.708280324935913, "step": 385} {"train_info/time_between_train_steps": 0.005397319793701172, "step": 385} {"info/global_step": 386, "train_info/time_within_train_step": 27.77204155921936, "step": 386} {"train_info/time_between_train_steps": 0.005115985870361328, "step": 386} {"info/global_step": 387, "train_info/time_within_train_step": 27.733999252319336, "step": 387} {"train_info/time_between_train_steps": 0.009888410568237305, "step": 387} {"info/global_step": 388, "train_info/time_within_train_step": 27.67678475379944, "step": 388} {"train_info/time_between_train_steps": 0.004895687103271484, "step": 388} {"info/global_step": 389, "train_info/time_within_train_step": 27.685023069381714, "step": 389} {"train_info/time_between_train_steps": 0.004931449890136719, "step": 389} {"info/global_step": 390, "train_info/time_within_train_step": 27.67155885696411, "step": 390} {"train_info/time_between_train_steps": 0.005100727081298828, "step": 390} {"info/global_step": 391, "train_info/time_within_train_step": 27.738587141036987, "step": 391} {"train_info/time_between_train_steps": 0.004996776580810547, "step": 391} {"info/global_step": 392, "train_info/time_within_train_step": 27.688738107681274, "step": 392} {"train_info/time_between_train_steps": 0.005154132843017578, "step": 392} {"info/global_step": 393, "train_info/time_within_train_step": 27.81110382080078, "step": 393} {"train_info/time_between_train_steps": 0.004900455474853516, "step": 393} {"info/global_step": 394, "train_info/time_within_train_step": 27.670275449752808, "step": 394} {"train_info/time_between_train_steps": 0.005010843276977539, "step": 394} {"info/global_step": 395, "train_info/time_within_train_step": 27.731797218322754, "step": 395} {"train_info/time_between_train_steps": 0.005105257034301758, "step": 395} {"info/global_step": 396, "train_info/time_within_train_step": 27.68563485145569, "step": 396} {"train_info/time_between_train_steps": 0.004901409149169922, "step": 396} {"info/global_step": 397, "train_info/time_within_train_step": 27.736372232437134, "step": 397} {"train_info/time_between_train_steps": 0.005099058151245117, "step": 397} {"info/global_step": 398, "train_info/time_within_train_step": 27.685951948165894, "step": 398} {"train_info/time_between_train_steps": 0.004903554916381836, "step": 398} {"info/global_step": 399, "train_info/time_within_train_step": 27.67534303665161, "step": 399} {"train_info/time_between_train_steps": 0.005183219909667969, "step": 399} {"info/global_step": 400, "train_info/time_within_train_step": 27.673490047454834, "step": 400} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740835816, "_runtime": 11765}, "step": 400} {"logs": {"train/loss": 4.2378, "train/learning_rate": 0.00044444444444444436, "train/epoch": 14.02, "_timestamp": 1740835816, "_runtime": 11765}, "step": 400} {"train_info/time_between_train_steps": 64.01022624969482, "step": 400} {"info/global_step": 401, "train_info/time_within_train_step": 27.715702295303345, "step": 401} {"train_info/time_between_train_steps": 0.005244731903076172, "step": 401} {"info/global_step": 402, "train_info/time_within_train_step": 27.691340923309326, "step": 402} {"train_info/time_between_train_steps": 0.004961967468261719, "step": 402} {"info/global_step": 403, "train_info/time_within_train_step": 27.705077409744263, "step": 403} {"train_info/time_between_train_steps": 0.005106210708618164, "step": 403} {"info/global_step": 404, "train_info/time_within_train_step": 27.694612741470337, "step": 404} {"train_info/time_between_train_steps": 0.005345344543457031, "step": 404} {"info/global_step": 405, "train_info/time_within_train_step": 27.696762561798096, "step": 405} {"train_info/time_between_train_steps": 0.005524158477783203, "step": 405} {"train_info/time_between_train_steps": 29.747445106506348, "step": 405} {"info/global_step": 406, "train_info/time_within_train_step": 27.695367097854614, "step": 406} {"train_info/time_between_train_steps": 0.004847288131713867, "step": 406} {"info/global_step": 407, "train_info/time_within_train_step": 27.857388734817505, "step": 407} {"train_info/time_between_train_steps": 0.005078315734863281, "step": 407} {"info/global_step": 408, "train_info/time_within_train_step": 27.793639659881592, "step": 408} {"train_info/time_between_train_steps": 0.005339622497558594, "step": 408} {"info/global_step": 409, "train_info/time_within_train_step": 27.83681297302246, "step": 409} {"train_info/time_between_train_steps": 0.005090951919555664, "step": 409} {"info/global_step": 410, "train_info/time_within_train_step": 27.721065998077393, "step": 410} {"train_info/time_between_train_steps": 0.005240917205810547, "step": 410} {"info/global_step": 411, "train_info/time_within_train_step": 27.846831560134888, "step": 411} {"train_info/time_between_train_steps": 0.005246400833129883, "step": 411} {"info/global_step": 412, "train_info/time_within_train_step": 27.68318271636963, "step": 412} {"train_info/time_between_train_steps": 0.004983186721801758, "step": 412} {"info/global_step": 413, "train_info/time_within_train_step": 27.79054307937622, "step": 413} {"train_info/time_between_train_steps": 0.010418891906738281, "step": 413} {"info/global_step": 414, "train_info/time_within_train_step": 27.710638523101807, "step": 414} {"train_info/time_between_train_steps": 0.004860877990722656, "step": 414} {"info/global_step": 415, "train_info/time_within_train_step": 27.735029935836792, "step": 415} {"train_info/time_between_train_steps": 0.009807348251342773, "step": 415} {"info/global_step": 416, "train_info/time_within_train_step": 27.702127933502197, "step": 416} {"train_info/time_between_train_steps": 0.004975080490112305, "step": 416} {"info/global_step": 417, "train_info/time_within_train_step": 27.669419288635254, "step": 417} {"train_info/time_between_train_steps": 0.004876852035522461, "step": 417} {"info/global_step": 418, "train_info/time_within_train_step": 27.723541498184204, "step": 418} {"train_info/time_between_train_steps": 0.009755611419677734, "step": 418} {"info/global_step": 419, "train_info/time_within_train_step": 27.684327602386475, "step": 419} {"train_info/time_between_train_steps": 0.004923105239868164, "step": 419} {"info/global_step": 420, "train_info/time_within_train_step": 27.727847576141357, "step": 420} {"train_info/time_between_train_steps": 0.004906654357910156, "step": 420} {"info/global_step": 421, "train_info/time_within_train_step": 27.688854217529297, "step": 421} {"train_info/time_between_train_steps": 0.00513911247253418, "step": 421} {"info/global_step": 422, "train_info/time_within_train_step": 27.6735999584198, "step": 422} {"train_info/time_between_train_steps": 0.009706497192382812, "step": 422} {"info/global_step": 423, "train_info/time_within_train_step": 27.669618368148804, "step": 423} {"train_info/time_between_train_steps": 0.00496673583984375, "step": 423} {"info/global_step": 424, "train_info/time_within_train_step": 27.767581701278687, "step": 424} {"train_info/time_between_train_steps": 0.010165929794311523, "step": 424} {"info/global_step": 425, "train_info/time_within_train_step": 27.670666694641113, "step": 425} {"train_info/time_between_train_steps": 0.009455680847167969, "step": 425} {"info/global_step": 426, "train_info/time_within_train_step": 27.67463207244873, "step": 426} {"train_info/time_between_train_steps": 0.005069732666015625, "step": 426} {"info/global_step": 427, "train_info/time_within_train_step": 27.675658464431763, "step": 427} {"train_info/time_between_train_steps": 0.005036115646362305, "step": 427} {"info/global_step": 428, "train_info/time_within_train_step": 27.673872709274292, "step": 428} {"train_info/time_between_train_steps": 0.005051612854003906, "step": 428} {"info/global_step": 429, "train_info/time_within_train_step": 27.67629361152649, "step": 429} {"train_info/time_between_train_steps": 0.00524592399597168, "step": 429} {"info/global_step": 430, "train_info/time_within_train_step": 27.681583881378174, "step": 430} {"train_info/time_between_train_steps": 0.005123615264892578, "step": 430} {"info/global_step": 431, "train_info/time_within_train_step": 27.693169593811035, "step": 431} {"train_info/time_between_train_steps": 0.005305051803588867, "step": 431} {"info/global_step": 432, "train_info/time_within_train_step": 27.69833278656006, "step": 432} {"train_info/time_between_train_steps": 0.010790348052978516, "step": 432} {"train_info/time_between_train_steps": 29.937363624572754, "step": 432} {"info/global_step": 433, "train_info/time_within_train_step": 27.687923908233643, "step": 433} {"train_info/time_between_train_steps": 0.00988459587097168, "step": 433} {"info/global_step": 434, "train_info/time_within_train_step": 27.857445001602173, "step": 434} {"train_info/time_between_train_steps": 0.009891510009765625, "step": 434} {"info/global_step": 435, "train_info/time_within_train_step": 27.67554807662964, "step": 435} {"train_info/time_between_train_steps": 0.009940624237060547, "step": 435} {"info/global_step": 436, "train_info/time_within_train_step": 27.79150629043579, "step": 436} {"train_info/time_between_train_steps": 0.009677648544311523, "step": 436} {"info/global_step": 437, "train_info/time_within_train_step": 27.675451517105103, "step": 437} {"train_info/time_between_train_steps": 0.005045413970947266, "step": 437} {"info/global_step": 438, "train_info/time_within_train_step": 27.98516273498535, "step": 438} {"train_info/time_between_train_steps": 0.0052640438079833984, "step": 438} {"info/global_step": 439, "train_info/time_within_train_step": 27.677082538604736, "step": 439} {"train_info/time_between_train_steps": 0.005086421966552734, "step": 439} {"info/global_step": 440, "train_info/time_within_train_step": 27.727195978164673, "step": 440} {"train_info/time_between_train_steps": 0.005097627639770508, "step": 440} {"info/global_step": 441, "train_info/time_within_train_step": 27.68182063102722, "step": 441} {"train_info/time_between_train_steps": 0.0049326419830322266, "step": 441} {"info/global_step": 442, "train_info/time_within_train_step": 27.665661096572876, "step": 442} {"train_info/time_between_train_steps": 0.004942655563354492, "step": 442} {"info/global_step": 443, "train_info/time_within_train_step": 27.67825198173523, "step": 443} {"train_info/time_between_train_steps": 0.004904270172119141, "step": 443} {"info/global_step": 444, "train_info/time_within_train_step": 27.681687116622925, "step": 444} {"train_info/time_between_train_steps": 0.004858255386352539, "step": 444} {"info/global_step": 445, "train_info/time_within_train_step": 29.499985456466675, "step": 445} {"train_info/time_between_train_steps": 0.005654811859130859, "step": 445} {"info/global_step": 446, "train_info/time_within_train_step": 27.797162532806396, "step": 446} {"train_info/time_between_train_steps": 0.00486445426940918, "step": 446} {"info/global_step": 447, "train_info/time_within_train_step": 27.720513582229614, "step": 447} {"train_info/time_between_train_steps": 0.004870891571044922, "step": 447} {"info/global_step": 448, "train_info/time_within_train_step": 27.697356700897217, "step": 448} {"train_info/time_between_train_steps": 0.005402088165283203, "step": 448} {"info/global_step": 449, "train_info/time_within_train_step": 27.726869106292725, "step": 449} {"train_info/time_between_train_steps": 0.00550532341003418, "step": 449} {"info/global_step": 450, "train_info/time_within_train_step": 27.684000253677368, "step": 450} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740837330, "_runtime": 13279}, "step": 450} {"logs": {"train/loss": 4.0729, "train/learning_rate": 0.00041666666666666664, "train/epoch": 16.02, "_timestamp": 1740837330, "_runtime": 13279}, "step": 450} {"train_info/time_between_train_steps": 0.025930166244506836, "step": 450} {"info/global_step": 451, "train_info/time_within_train_step": 27.73427438735962, "step": 451} {"train_info/time_between_train_steps": 0.005078315734863281, "step": 451} {"info/global_step": 452, "train_info/time_within_train_step": 27.684383153915405, "step": 452} {"train_info/time_between_train_steps": 0.004854440689086914, "step": 452} {"info/global_step": 453, "train_info/time_within_train_step": 27.677574396133423, "step": 453} {"train_info/time_between_train_steps": 0.004899740219116211, "step": 453} {"info/global_step": 454, "train_info/time_within_train_step": 27.80413317680359, "step": 454} {"train_info/time_between_train_steps": 0.005186796188354492, "step": 454} {"info/global_step": 455, "train_info/time_within_train_step": 27.690826177597046, "step": 455} {"train_info/time_between_train_steps": 0.004988193511962891, "step": 455} {"info/global_step": 456, "train_info/time_within_train_step": 27.71909523010254, "step": 456} {"train_info/time_between_train_steps": 0.004974842071533203, "step": 456} {"info/global_step": 457, "train_info/time_within_train_step": 27.686352729797363, "step": 457} {"train_info/time_between_train_steps": 0.005320072174072266, "step": 457} {"info/global_step": 458, "train_info/time_within_train_step": 27.71625781059265, "step": 458} {"train_info/time_between_train_steps": 0.005297660827636719, "step": 458} {"info/global_step": 459, "train_info/time_within_train_step": 27.711673498153687, "step": 459} {"train_info/time_between_train_steps": 0.005975008010864258, "step": 459} {"train_info/time_between_train_steps": 29.592323303222656, "step": 459} {"info/global_step": 460, "train_info/time_within_train_step": 27.677295684814453, "step": 460} {"train_info/time_between_train_steps": 0.004805803298950195, "step": 460} {"info/global_step": 461, "train_info/time_within_train_step": 27.846956729888916, "step": 461} {"train_info/time_between_train_steps": 0.005087375640869141, "step": 461} {"info/global_step": 462, "train_info/time_within_train_step": 27.69061017036438, "step": 462} {"train_info/time_between_train_steps": 0.0051424503326416016, "step": 462} {"info/global_step": 463, "train_info/time_within_train_step": 27.812079191207886, "step": 463} {"train_info/time_between_train_steps": 0.005174398422241211, "step": 463} {"info/global_step": 464, "train_info/time_within_train_step": 27.69693946838379, "step": 464} {"train_info/time_between_train_steps": 0.0055429935455322266, "step": 464} {"info/global_step": 465, "train_info/time_within_train_step": 27.84162712097168, "step": 465} {"train_info/time_between_train_steps": 0.0051915645599365234, "step": 465} {"info/global_step": 466, "train_info/time_within_train_step": 27.686394929885864, "step": 466} {"train_info/time_between_train_steps": 0.0054302215576171875, "step": 466} {"info/global_step": 467, "train_info/time_within_train_step": 27.76968502998352, "step": 467} {"train_info/time_between_train_steps": 0.005197763442993164, "step": 467} {"info/global_step": 468, "train_info/time_within_train_step": 27.7227725982666, "step": 468} {"train_info/time_between_train_steps": 0.0049970149993896484, "step": 468} {"info/global_step": 469, "train_info/time_within_train_step": 27.77405023574829, "step": 469} {"train_info/time_between_train_steps": 0.005004405975341797, "step": 469} {"info/global_step": 470, "train_info/time_within_train_step": 27.722710609436035, "step": 470} {"train_info/time_between_train_steps": 0.005176544189453125, "step": 470} {"info/global_step": 471, "train_info/time_within_train_step": 27.690796375274658, "step": 471} {"train_info/time_between_train_steps": 0.005308389663696289, "step": 471} {"info/global_step": 472, "train_info/time_within_train_step": 27.737648010253906, "step": 472} {"train_info/time_between_train_steps": 0.0050678253173828125, "step": 472} {"info/global_step": 473, "train_info/time_within_train_step": 27.690638780593872, "step": 473} {"train_info/time_between_train_steps": 0.004964113235473633, "step": 473} {"info/global_step": 474, "train_info/time_within_train_step": 27.7276713848114, "step": 474} {"train_info/time_between_train_steps": 0.005186796188354492, "step": 474} {"info/global_step": 475, "train_info/time_within_train_step": 27.677839994430542, "step": 475} {"train_info/time_between_train_steps": 0.00987553596496582, "step": 475} {"info/global_step": 476, "train_info/time_within_train_step": 27.776566982269287, "step": 476} {"train_info/time_between_train_steps": 0.005464076995849609, "step": 476} {"info/global_step": 477, "train_info/time_within_train_step": 27.699624061584473, "step": 477} {"train_info/time_between_train_steps": 0.005422830581665039, "step": 477} {"info/global_step": 478, "train_info/time_within_train_step": 27.673069715499878, "step": 478} {"train_info/time_between_train_steps": 0.005317211151123047, "step": 478} {"info/global_step": 479, "train_info/time_within_train_step": 27.68050718307495, "step": 479} {"train_info/time_between_train_steps": 0.00502777099609375, "step": 479} {"info/global_step": 480, "train_info/time_within_train_step": 27.67504906654358, "step": 480} {"train_info/time_between_train_steps": 0.005350828170776367, "step": 480} {"info/global_step": 481, "train_info/time_within_train_step": 27.692520141601562, "step": 481} {"train_info/time_between_train_steps": 0.0065155029296875, "step": 481} {"info/global_step": 482, "train_info/time_within_train_step": 27.818052291870117, "step": 482} {"train_info/time_between_train_steps": 0.014669179916381836, "step": 482} {"info/global_step": 483, "train_info/time_within_train_step": 27.7994704246521, "step": 483} {"train_info/time_between_train_steps": 0.0051119327545166016, "step": 483} {"info/global_step": 484, "train_info/time_within_train_step": 27.80413031578064, "step": 484} {"train_info/time_between_train_steps": 0.0051326751708984375, "step": 484} {"info/global_step": 485, "train_info/time_within_train_step": 27.73630380630493, "step": 485} {"train_info/time_between_train_steps": 0.005503654479980469, "step": 485} {"info/global_step": 486, "train_info/time_within_train_step": 27.70350408554077, "step": 486} {"train_info/time_between_train_steps": 0.01563715934753418, "step": 486} {"train_info/time_between_train_steps": 29.821906566619873, "step": 486} {"info/global_step": 487, "train_info/time_within_train_step": 27.707539081573486, "step": 487} {"train_info/time_between_train_steps": 0.005282163619995117, "step": 487} {"info/global_step": 488, "train_info/time_within_train_step": 27.866729974746704, "step": 488} {"train_info/time_between_train_steps": 0.0051441192626953125, "step": 488} {"info/global_step": 489, "train_info/time_within_train_step": 27.67479157447815, "step": 489} {"train_info/time_between_train_steps": 0.0051004886627197266, "step": 489} {"info/global_step": 490, "train_info/time_within_train_step": 27.8334903717041, "step": 490} {"train_info/time_between_train_steps": 0.005152463912963867, "step": 490} {"info/global_step": 491, "train_info/time_within_train_step": 27.793882131576538, "step": 491} {"train_info/time_between_train_steps": 0.005084991455078125, "step": 491} {"info/global_step": 492, "train_info/time_within_train_step": 27.805104732513428, "step": 492} {"train_info/time_between_train_steps": 0.00496673583984375, "step": 492} {"info/global_step": 493, "train_info/time_within_train_step": 27.720075845718384, "step": 493} {"train_info/time_between_train_steps": 0.007458686828613281, "step": 493} {"info/global_step": 494, "train_info/time_within_train_step": 27.76487708091736, "step": 494} {"train_info/time_between_train_steps": 0.0051152706146240234, "step": 494} {"info/global_step": 495, "train_info/time_within_train_step": 27.687869548797607, "step": 495} {"train_info/time_between_train_steps": 0.009567737579345703, "step": 495} {"info/global_step": 496, "train_info/time_within_train_step": 27.677684783935547, "step": 496} {"train_info/time_between_train_steps": 0.008967399597167969, "step": 496} {"info/global_step": 497, "train_info/time_within_train_step": 27.76382803916931, "step": 497} {"train_info/time_between_train_steps": 0.0049207210540771484, "step": 497} {"info/global_step": 498, "train_info/time_within_train_step": 27.669023275375366, "step": 498} {"train_info/time_between_train_steps": 0.005078315734863281, "step": 498} {"info/global_step": 499, "train_info/time_within_train_step": 27.763712882995605, "step": 499} {"train_info/time_between_train_steps": 0.004914760589599609, "step": 499} {"info/global_step": 500, "train_info/time_within_train_step": 27.672534942626953, "step": 500} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740838777, "_runtime": 14726}, "step": 500} {"logs": {"train/loss": 3.941, "train/learning_rate": 0.00038888888888888887, "train/epoch": 18.01, "_timestamp": 1740838777, "_runtime": 14726}, "step": 500} {"train_info/time_between_train_steps": 61.851787090301514, "step": 500} {"info/global_step": 501, "train_info/time_within_train_step": 28.538471460342407, "step": 501} {"train_info/time_between_train_steps": 0.004990816116333008, "step": 501} {"info/global_step": 502, "train_info/time_within_train_step": 27.690359354019165, "step": 502} {"train_info/time_between_train_steps": 0.0049610137939453125, "step": 502} {"info/global_step": 503, "train_info/time_within_train_step": 27.679474353790283, "step": 503} {"train_info/time_between_train_steps": 0.010022878646850586, "step": 503} {"info/global_step": 504, "train_info/time_within_train_step": 27.675956964492798, "step": 504} {"train_info/time_between_train_steps": 0.004946708679199219, "step": 504} {"info/global_step": 505, "train_info/time_within_train_step": 27.671958684921265, "step": 505} {"train_info/time_between_train_steps": 0.004989147186279297, "step": 505} {"info/global_step": 506, "train_info/time_within_train_step": 27.67660617828369, "step": 506} {"train_info/time_between_train_steps": 0.004991054534912109, "step": 506} {"info/global_step": 507, "train_info/time_within_train_step": 27.67815065383911, "step": 507} {"train_info/time_between_train_steps": 0.006908893585205078, "step": 507} {"info/global_step": 508, "train_info/time_within_train_step": 27.69458818435669, "step": 508} {"train_info/time_between_train_steps": 0.007827520370483398, "step": 508} {"info/global_step": 509, "train_info/time_within_train_step": 27.685293912887573, "step": 509} {"train_info/time_between_train_steps": 0.005198240280151367, "step": 509} {"info/global_step": 510, "train_info/time_within_train_step": 27.671449661254883, "step": 510} {"train_info/time_between_train_steps": 0.008224964141845703, "step": 510} {"info/global_step": 511, "train_info/time_within_train_step": 27.68022847175598, "step": 511} {"train_info/time_between_train_steps": 0.0051076412200927734, "step": 511} {"info/global_step": 512, "train_info/time_within_train_step": 27.683968544006348, "step": 512} {"train_info/time_between_train_steps": 0.005418539047241211, "step": 512} {"info/global_step": 513, "train_info/time_within_train_step": 27.695680379867554, "step": 513} {"train_info/time_between_train_steps": 0.005377531051635742, "step": 513} {"train_info/time_between_train_steps": 29.939750909805298, "step": 513} {"info/global_step": 514, "train_info/time_within_train_step": 27.774749040603638, "step": 514} {"train_info/time_between_train_steps": 0.009954452514648438, "step": 514} {"info/global_step": 515, "train_info/time_within_train_step": 27.82589077949524, "step": 515} {"train_info/time_between_train_steps": 0.00507044792175293, "step": 515} {"info/global_step": 516, "train_info/time_within_train_step": 27.692161798477173, "step": 516} {"train_info/time_between_train_steps": 0.005224466323852539, "step": 516} {"info/global_step": 517, "train_info/time_within_train_step": 27.851133823394775, "step": 517} {"train_info/time_between_train_steps": 0.005154848098754883, "step": 517} {"info/global_step": 518, "train_info/time_within_train_step": 27.709155559539795, "step": 518} {"train_info/time_between_train_steps": 0.005364418029785156, "step": 518} {"info/global_step": 519, "train_info/time_within_train_step": 27.838502407073975, "step": 519} {"train_info/time_between_train_steps": 0.0062253475189208984, "step": 519} {"info/global_step": 520, "train_info/time_within_train_step": 27.6978440284729, "step": 520} {"train_info/time_between_train_steps": 0.005019426345825195, "step": 520} {"info/global_step": 521, "train_info/time_within_train_step": 27.766270399093628, "step": 521} {"train_info/time_between_train_steps": 0.005234718322753906, "step": 521} {"info/global_step": 522, "train_info/time_within_train_step": 27.721823930740356, "step": 522} {"train_info/time_between_train_steps": 0.004953145980834961, "step": 522} {"info/global_step": 523, "train_info/time_within_train_step": 27.66607689857483, "step": 523} {"train_info/time_between_train_steps": 0.004929542541503906, "step": 523} {"info/global_step": 524, "train_info/time_within_train_step": 27.670429944992065, "step": 524} {"train_info/time_between_train_steps": 0.004975318908691406, "step": 524} {"info/global_step": 525, "train_info/time_within_train_step": 27.68411612510681, "step": 525} {"train_info/time_between_train_steps": 0.004883766174316406, "step": 525} {"info/global_step": 526, "train_info/time_within_train_step": 27.74719214439392, "step": 526} {"train_info/time_between_train_steps": 0.005048036575317383, "step": 526} {"info/global_step": 527, "train_info/time_within_train_step": 27.733570098876953, "step": 527} {"train_info/time_between_train_steps": 0.00487208366394043, "step": 527} {"info/global_step": 528, "train_info/time_within_train_step": 27.760092735290527, "step": 528} {"train_info/time_between_train_steps": 0.0050013065338134766, "step": 528} {"info/global_step": 529, "train_info/time_within_train_step": 27.797242164611816, "step": 529} {"train_info/time_between_train_steps": 0.0054492950439453125, "step": 529} {"info/global_step": 530, "train_info/time_within_train_step": 27.667036294937134, "step": 530} {"train_info/time_between_train_steps": 0.004889011383056641, "step": 530} {"info/global_step": 531, "train_info/time_within_train_step": 27.669853925704956, "step": 531} {"train_info/time_between_train_steps": 0.005079984664916992, "step": 531} {"info/global_step": 532, "train_info/time_within_train_step": 27.67752194404602, "step": 532} {"train_info/time_between_train_steps": 0.006651878356933594, "step": 532} {"info/global_step": 533, "train_info/time_within_train_step": 27.71123194694519, "step": 533} {"train_info/time_between_train_steps": 0.004915952682495117, "step": 533} {"info/global_step": 534, "train_info/time_within_train_step": 27.678771257400513, "step": 534} {"train_info/time_between_train_steps": 0.005084037780761719, "step": 534} {"info/global_step": 535, "train_info/time_within_train_step": 27.67933440208435, "step": 535} {"train_info/time_between_train_steps": 0.009957551956176758, "step": 535} {"info/global_step": 536, "train_info/time_within_train_step": 27.698485136032104, "step": 536} {"train_info/time_between_train_steps": 0.0051653385162353516, "step": 536} {"info/global_step": 537, "train_info/time_within_train_step": 27.695810317993164, "step": 537} {"train_info/time_between_train_steps": 0.008214950561523438, "step": 537} {"info/global_step": 538, "train_info/time_within_train_step": 27.695643186569214, "step": 538} {"train_info/time_between_train_steps": 0.005135297775268555, "step": 538} {"info/global_step": 539, "train_info/time_within_train_step": 27.757988452911377, "step": 539} {"train_info/time_between_train_steps": 0.005369663238525391, "step": 539} {"info/global_step": 540, "train_info/time_within_train_step": 27.717520475387573, "step": 540} {"train_info/time_between_train_steps": 0.010320186614990234, "step": 540} {"train_info/time_between_train_steps": 37.21029734611511, "step": 540} {"info/global_step": 541, "train_info/time_within_train_step": 28.03437066078186, "step": 541} {"train_info/time_between_train_steps": 0.005332469940185547, "step": 541} {"info/global_step": 542, "train_info/time_within_train_step": 31.623679637908936, "step": 542} {"train_info/time_between_train_steps": 0.005580425262451172, "step": 542} {"info/global_step": 543, "train_info/time_within_train_step": 28.279159784317017, "step": 543} {"train_info/time_between_train_steps": 0.010154485702514648, "step": 543} {"info/global_step": 544, "train_info/time_within_train_step": 27.9926176071167, "step": 544} {"train_info/time_between_train_steps": 0.005124092102050781, "step": 544} {"info/global_step": 545, "train_info/time_within_train_step": 27.67764401435852, "step": 545} {"train_info/time_between_train_steps": 0.005307674407958984, "step": 545} {"info/global_step": 546, "train_info/time_within_train_step": 27.866935968399048, "step": 546} {"train_info/time_between_train_steps": 0.005261898040771484, "step": 546} {"info/global_step": 547, "train_info/time_within_train_step": 27.680941104888916, "step": 547} {"train_info/time_between_train_steps": 0.005048990249633789, "step": 547} {"info/global_step": 548, "train_info/time_within_train_step": 27.812732219696045, "step": 548} {"train_info/time_between_train_steps": 0.0051500797271728516, "step": 548} {"info/global_step": 549, "train_info/time_within_train_step": 27.68227219581604, "step": 549} {"train_info/time_between_train_steps": 0.004887580871582031, "step": 549} {"info/global_step": 550, "train_info/time_within_train_step": 27.70200252532959, "step": 550} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740840303, "_runtime": 16252}, "step": 550} {"logs": {"train/loss": 3.826, "train/learning_rate": 0.0003611111111111111, "train/epoch": 20.01, "_timestamp": 1740840303, "_runtime": 16252}, "step": 550} {"train_info/time_between_train_steps": 0.0297696590423584, "step": 550} {"info/global_step": 551, "train_info/time_within_train_step": 27.68769860267639, "step": 551} {"train_info/time_between_train_steps": 0.0049915313720703125, "step": 551} {"info/global_step": 552, "train_info/time_within_train_step": 27.68511652946472, "step": 552} {"train_info/time_between_train_steps": 0.004961967468261719, "step": 552} {"info/global_step": 553, "train_info/time_within_train_step": 27.735146522521973, "step": 553} {"train_info/time_between_train_steps": 0.005128145217895508, "step": 553} {"info/global_step": 554, "train_info/time_within_train_step": 27.677552700042725, "step": 554} {"train_info/time_between_train_steps": 0.004854917526245117, "step": 554} {"info/global_step": 555, "train_info/time_within_train_step": 27.718973398208618, "step": 555} {"train_info/time_between_train_steps": 0.005406379699707031, "step": 555} {"info/global_step": 556, "train_info/time_within_train_step": 27.689841270446777, "step": 556} {"train_info/time_between_train_steps": 0.0051691532135009766, "step": 556} {"info/global_step": 557, "train_info/time_within_train_step": 27.731921434402466, "step": 557} {"train_info/time_between_train_steps": 0.005002260208129883, "step": 557} {"info/global_step": 558, "train_info/time_within_train_step": 27.695067644119263, "step": 558} {"train_info/time_between_train_steps": 0.00508427619934082, "step": 558} {"info/global_step": 559, "train_info/time_within_train_step": 27.748209238052368, "step": 559} {"train_info/time_between_train_steps": 0.004982471466064453, "step": 559} {"info/global_step": 560, "train_info/time_within_train_step": 27.767049312591553, "step": 560} {"train_info/time_between_train_steps": 0.005130767822265625, "step": 560} {"info/global_step": 561, "train_info/time_within_train_step": 27.674967765808105, "step": 561} {"train_info/time_between_train_steps": 0.005042552947998047, "step": 561} {"info/global_step": 562, "train_info/time_within_train_step": 27.689786911010742, "step": 562} {"train_info/time_between_train_steps": 0.0051746368408203125, "step": 562} {"info/global_step": 563, "train_info/time_within_train_step": 27.697322845458984, "step": 563} {"train_info/time_between_train_steps": 0.005582571029663086, "step": 563} {"info/global_step": 564, "train_info/time_within_train_step": 27.712852001190186, "step": 564} {"train_info/time_between_train_steps": 0.0050432682037353516, "step": 564} {"info/global_step": 565, "train_info/time_within_train_step": 27.697511911392212, "step": 565} {"train_info/time_between_train_steps": 0.0052607059478759766, "step": 565} {"info/global_step": 566, "train_info/time_within_train_step": 27.689690113067627, "step": 566} {"train_info/time_between_train_steps": 0.0052487850189208984, "step": 566} {"info/global_step": 567, "train_info/time_within_train_step": 27.697678089141846, "step": 567} {"train_info/time_between_train_steps": 0.005914211273193359, "step": 567} {"train_info/time_between_train_steps": 29.885384798049927, "step": 567} {"info/global_step": 568, "train_info/time_within_train_step": 27.664153575897217, "step": 568} {"train_info/time_between_train_steps": 0.009563446044921875, "step": 568} {"info/global_step": 569, "train_info/time_within_train_step": 27.828189849853516, "step": 569} {"train_info/time_between_train_steps": 0.005131721496582031, "step": 569} {"info/global_step": 570, "train_info/time_within_train_step": 27.694371223449707, "step": 570} {"train_info/time_between_train_steps": 0.005155801773071289, "step": 570} {"info/global_step": 571, "train_info/time_within_train_step": 27.818868160247803, "step": 571} {"train_info/time_between_train_steps": 0.005113840103149414, "step": 571} {"info/global_step": 572, "train_info/time_within_train_step": 27.68872094154358, "step": 572} {"train_info/time_between_train_steps": 0.005194425582885742, "step": 572} {"info/global_step": 573, "train_info/time_within_train_step": 27.789438247680664, "step": 573} {"train_info/time_between_train_steps": 0.005086660385131836, "step": 573} {"info/global_step": 574, "train_info/time_within_train_step": 27.773414134979248, "step": 574} {"train_info/time_between_train_steps": 0.005383968353271484, "step": 574} {"info/global_step": 575, "train_info/time_within_train_step": 27.775232553482056, "step": 575} {"train_info/time_between_train_steps": 0.005170583724975586, "step": 575} {"info/global_step": 576, "train_info/time_within_train_step": 27.695175170898438, "step": 576} {"train_info/time_between_train_steps": 0.004993438720703125, "step": 576} {"info/global_step": 577, "train_info/time_within_train_step": 27.665024995803833, "step": 577} {"train_info/time_between_train_steps": 0.004942178726196289, "step": 577} {"info/global_step": 578, "train_info/time_within_train_step": 27.71666145324707, "step": 578} {"train_info/time_between_train_steps": 0.009944915771484375, "step": 578} {"info/global_step": 579, "train_info/time_within_train_step": 27.67567729949951, "step": 579} {"train_info/time_between_train_steps": 0.004936933517456055, "step": 579} {"info/global_step": 580, "train_info/time_within_train_step": 27.706153631210327, "step": 580} {"train_info/time_between_train_steps": 0.005031585693359375, "step": 580} {"info/global_step": 581, "train_info/time_within_train_step": 27.674498319625854, "step": 581} {"train_info/time_between_train_steps": 0.004955768585205078, "step": 581} {"info/global_step": 582, "train_info/time_within_train_step": 27.683513164520264, "step": 582} {"train_info/time_between_train_steps": 0.005001544952392578, "step": 582} {"info/global_step": 583, "train_info/time_within_train_step": 27.67023468017578, "step": 583} {"train_info/time_between_train_steps": 0.005039691925048828, "step": 583} {"info/global_step": 584, "train_info/time_within_train_step": 27.689181804656982, "step": 584} {"train_info/time_between_train_steps": 0.004988908767700195, "step": 584} {"info/global_step": 585, "train_info/time_within_train_step": 27.685707092285156, "step": 585} {"train_info/time_between_train_steps": 0.0050334930419921875, "step": 585} {"info/global_step": 586, "train_info/time_within_train_step": 27.761868238449097, "step": 586} {"train_info/time_between_train_steps": 0.0049474239349365234, "step": 586} {"info/global_step": 587, "train_info/time_within_train_step": 27.67378544807434, "step": 587} {"train_info/time_between_train_steps": 0.0050318241119384766, "step": 587} {"info/global_step": 588, "train_info/time_within_train_step": 27.671586513519287, "step": 588} {"train_info/time_between_train_steps": 0.004948854446411133, "step": 588} {"info/global_step": 589, "train_info/time_within_train_step": 27.667776584625244, "step": 589} {"train_info/time_between_train_steps": 0.0050051212310791016, "step": 589} {"info/global_step": 590, "train_info/time_within_train_step": 27.782241582870483, "step": 590} {"train_info/time_between_train_steps": 0.0052356719970703125, "step": 590} {"info/global_step": 591, "train_info/time_within_train_step": 27.716526746749878, "step": 591} {"train_info/time_between_train_steps": 0.005022764205932617, "step": 591} {"info/global_step": 592, "train_info/time_within_train_step": 27.67828631401062, "step": 592} {"train_info/time_between_train_steps": 0.005151033401489258, "step": 592} {"info/global_step": 593, "train_info/time_within_train_step": 27.684534311294556, "step": 593} {"train_info/time_between_train_steps": 0.005425691604614258, "step": 593} {"info/global_step": 594, "train_info/time_within_train_step": 27.729870796203613, "step": 594} {"train_info/time_between_train_steps": 0.0054607391357421875, "step": 594} {"train_info/time_between_train_steps": 30.103595495224, "step": 594} {"info/global_step": 595, "train_info/time_within_train_step": 27.685643196105957, "step": 595} {"train_info/time_between_train_steps": 0.004884004592895508, "step": 595} {"info/global_step": 596, "train_info/time_within_train_step": 27.81301736831665, "step": 596} {"train_info/time_between_train_steps": 0.005746603012084961, "step": 596} {"info/global_step": 597, "train_info/time_within_train_step": 27.696244478225708, "step": 597} {"train_info/time_between_train_steps": 0.005352973937988281, "step": 597} {"info/global_step": 598, "train_info/time_within_train_step": 27.853381633758545, "step": 598} {"train_info/time_between_train_steps": 0.0050814151763916016, "step": 598} {"info/global_step": 599, "train_info/time_within_train_step": 27.68786597251892, "step": 599} {"train_info/time_between_train_steps": 0.005131959915161133, "step": 599} {"info/global_step": 600, "train_info/time_within_train_step": 27.846378564834595, "step": 600} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740841750, "_runtime": 17699}, "step": 600} {"logs": {"train/loss": 3.7276, "train/learning_rate": 0.0003333333333333333, "train/epoch": 22.0, "_timestamp": 1740841750, "_runtime": 17699}, "step": 600} {"train_info/time_between_train_steps": 57.27272868156433, "step": 600} {"info/global_step": 601, "train_info/time_within_train_step": 28.26378345489502, "step": 601} {"train_info/time_between_train_steps": 0.015015602111816406, "step": 601} {"info/global_step": 602, "train_info/time_within_train_step": 28.025111436843872, "step": 602} {"train_info/time_between_train_steps": 0.005140781402587891, "step": 602} {"info/global_step": 603, "train_info/time_within_train_step": 27.702581644058228, "step": 603} {"train_info/time_between_train_steps": 0.004887104034423828, "step": 603} {"info/global_step": 604, "train_info/time_within_train_step": 27.670287132263184, "step": 604} {"train_info/time_between_train_steps": 0.004877805709838867, "step": 604} {"info/global_step": 605, "train_info/time_within_train_step": 27.784454822540283, "step": 605} {"train_info/time_between_train_steps": 0.0052032470703125, "step": 605} {"info/global_step": 606, "train_info/time_within_train_step": 27.664655208587646, "step": 606} {"train_info/time_between_train_steps": 0.009766101837158203, "step": 606} {"info/global_step": 607, "train_info/time_within_train_step": 27.734017848968506, "step": 607} {"train_info/time_between_train_steps": 0.005088329315185547, "step": 607} {"info/global_step": 608, "train_info/time_within_train_step": 27.68215036392212, "step": 608} {"train_info/time_between_train_steps": 0.004853963851928711, "step": 608} {"info/global_step": 609, "train_info/time_within_train_step": 27.725008249282837, "step": 609} {"train_info/time_between_train_steps": 0.005091190338134766, "step": 609} {"info/global_step": 610, "train_info/time_within_train_step": 27.675264358520508, "step": 610} {"train_info/time_between_train_steps": 0.005095243453979492, "step": 610} {"info/global_step": 611, "train_info/time_within_train_step": 27.73589515686035, "step": 611} {"train_info/time_between_train_steps": 0.004917144775390625, "step": 611} {"info/global_step": 612, "train_info/time_within_train_step": 27.689215898513794, "step": 612} {"train_info/time_between_train_steps": 0.005128383636474609, "step": 612} {"info/global_step": 613, "train_info/time_within_train_step": 27.716068029403687, "step": 613} {"train_info/time_between_train_steps": 0.004960775375366211, "step": 613} {"info/global_step": 614, "train_info/time_within_train_step": 27.689669847488403, "step": 614} {"train_info/time_between_train_steps": 0.004925727844238281, "step": 614} {"info/global_step": 615, "train_info/time_within_train_step": 27.67919421195984, "step": 615} {"train_info/time_between_train_steps": 0.0050737857818603516, "step": 615} {"info/global_step": 616, "train_info/time_within_train_step": 27.668785333633423, "step": 616} {"train_info/time_between_train_steps": 0.005002260208129883, "step": 616} {"info/global_step": 617, "train_info/time_within_train_step": 27.691757440567017, "step": 617} {"train_info/time_between_train_steps": 0.005064249038696289, "step": 617} {"info/global_step": 618, "train_info/time_within_train_step": 27.677024364471436, "step": 618} {"train_info/time_between_train_steps": 0.005033254623413086, "step": 618} {"info/global_step": 619, "train_info/time_within_train_step": 27.684285163879395, "step": 619} {"train_info/time_between_train_steps": 0.005181074142456055, "step": 619} {"info/global_step": 620, "train_info/time_within_train_step": 28.08976101875305, "step": 620} {"train_info/time_between_train_steps": 0.010335206985473633, "step": 620} {"info/global_step": 621, "train_info/time_within_train_step": 27.692357063293457, "step": 621} {"train_info/time_between_train_steps": 0.005265712738037109, "step": 621} {"train_info/time_between_train_steps": 29.709611654281616, "step": 621} {"info/global_step": 622, "train_info/time_within_train_step": 27.78045415878296, "step": 622} {"train_info/time_between_train_steps": 0.006834745407104492, "step": 622} {"info/global_step": 623, "train_info/time_within_train_step": 27.885828971862793, "step": 623} {"train_info/time_between_train_steps": 0.005908966064453125, "step": 623} {"info/global_step": 624, "train_info/time_within_train_step": 27.710910081863403, "step": 624} {"train_info/time_between_train_steps": 0.005643606185913086, "step": 624} {"info/global_step": 625, "train_info/time_within_train_step": 27.92944598197937, "step": 625} {"train_info/time_between_train_steps": 0.005697727203369141, "step": 625} {"info/global_step": 626, "train_info/time_within_train_step": 27.84441876411438, "step": 626} {"train_info/time_between_train_steps": 0.005472421646118164, "step": 626} {"info/global_step": 627, "train_info/time_within_train_step": 27.876531839370728, "step": 627} {"train_info/time_between_train_steps": 0.005527973175048828, "step": 627} {"info/global_step": 628, "train_info/time_within_train_step": 27.73575735092163, "step": 628} {"train_info/time_between_train_steps": 0.0057964324951171875, "step": 628} {"info/global_step": 629, "train_info/time_within_train_step": 27.7913076877594, "step": 629} {"train_info/time_between_train_steps": 0.005209445953369141, "step": 629} {"info/global_step": 630, "train_info/time_within_train_step": 27.705824613571167, "step": 630} {"train_info/time_between_train_steps": 0.00518488883972168, "step": 630} {"info/global_step": 631, "train_info/time_within_train_step": 27.687830924987793, "step": 631} {"train_info/time_between_train_steps": 0.005135059356689453, "step": 631} {"info/global_step": 632, "train_info/time_within_train_step": 27.727758407592773, "step": 632} {"train_info/time_between_train_steps": 0.010061264038085938, "step": 632} {"info/global_step": 633, "train_info/time_within_train_step": 27.69417929649353, "step": 633} {"train_info/time_between_train_steps": 0.004924297332763672, "step": 633} {"info/global_step": 634, "train_info/time_within_train_step": 27.676318645477295, "step": 634} {"train_info/time_between_train_steps": 0.00527644157409668, "step": 634} {"info/global_step": 635, "train_info/time_within_train_step": 27.769784212112427, "step": 635} {"train_info/time_between_train_steps": 0.005064725875854492, "step": 635} {"info/global_step": 636, "train_info/time_within_train_step": 27.722774744033813, "step": 636} {"train_info/time_between_train_steps": 0.005045652389526367, "step": 636} {"info/global_step": 637, "train_info/time_within_train_step": 27.686607360839844, "step": 637} {"train_info/time_between_train_steps": 0.005286455154418945, "step": 637} {"info/global_step": 638, "train_info/time_within_train_step": 27.671982049942017, "step": 638} {"train_info/time_between_train_steps": 0.005297183990478516, "step": 638} {"info/global_step": 639, "train_info/time_within_train_step": 27.909485578536987, "step": 639} {"train_info/time_between_train_steps": 0.005059242248535156, "step": 639} {"info/global_step": 640, "train_info/time_within_train_step": 27.862473249435425, "step": 640} {"train_info/time_between_train_steps": 0.005169868469238281, "step": 640} {"info/global_step": 641, "train_info/time_within_train_step": 27.673311710357666, "step": 641} {"train_info/time_between_train_steps": 0.005018949508666992, "step": 641} {"info/global_step": 642, "train_info/time_within_train_step": 27.68473792076111, "step": 642} {"train_info/time_between_train_steps": 0.005134105682373047, "step": 642} {"info/global_step": 643, "train_info/time_within_train_step": 27.678916215896606, "step": 643} {"train_info/time_between_train_steps": 0.005121469497680664, "step": 643} {"info/global_step": 644, "train_info/time_within_train_step": 27.680357217788696, "step": 644} {"train_info/time_between_train_steps": 0.00513768196105957, "step": 644} {"info/global_step": 645, "train_info/time_within_train_step": 27.68493127822876, "step": 645} {"train_info/time_between_train_steps": 0.0050656795501708984, "step": 645} {"info/global_step": 646, "train_info/time_within_train_step": 27.70220136642456, "step": 646} {"train_info/time_between_train_steps": 0.00519108772277832, "step": 646} {"info/global_step": 647, "train_info/time_within_train_step": 27.686874389648438, "step": 647} {"train_info/time_between_train_steps": 0.005599021911621094, "step": 647} {"info/global_step": 648, "train_info/time_within_train_step": 27.701208353042603, "step": 648} {"train_info/time_between_train_steps": 0.00643157958984375, "step": 648} {"train_info/time_between_train_steps": 29.752322912216187, "step": 648} {"info/global_step": 649, "train_info/time_within_train_step": 27.783902168273926, "step": 649} {"train_info/time_between_train_steps": 0.0048749446868896484, "step": 649} {"info/global_step": 650, "train_info/time_within_train_step": 27.81309223175049, "step": 650} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740843257, "_runtime": 19206}, "step": 650} {"logs": {"train/loss": 3.6415, "train/learning_rate": 0.00030555555555555555, "train/epoch": 24.0, "_timestamp": 1740843257, "_runtime": 19206}, "step": 650} {"train_info/time_between_train_steps": 0.02568840980529785, "step": 650} {"info/global_step": 651, "train_info/time_within_train_step": 27.699673414230347, "step": 651} {"train_info/time_between_train_steps": 0.0052835941314697266, "step": 651} {"info/global_step": 652, "train_info/time_within_train_step": 27.877374172210693, "step": 652} {"train_info/time_between_train_steps": 0.005191802978515625, "step": 652} {"info/global_step": 653, "train_info/time_within_train_step": 27.68099308013916, "step": 653} {"train_info/time_between_train_steps": 0.005148887634277344, "step": 653} {"info/global_step": 654, "train_info/time_within_train_step": 27.812268018722534, "step": 654} {"train_info/time_between_train_steps": 0.005180835723876953, "step": 654} {"info/global_step": 655, "train_info/time_within_train_step": 27.721638679504395, "step": 655} {"train_info/time_between_train_steps": 0.005434989929199219, "step": 655} {"info/global_step": 656, "train_info/time_within_train_step": 27.73462200164795, "step": 656} {"train_info/time_between_train_steps": 0.0062596797943115234, "step": 656} {"info/global_step": 657, "train_info/time_within_train_step": 27.692196130752563, "step": 657} {"train_info/time_between_train_steps": 0.005011796951293945, "step": 657} {"info/global_step": 658, "train_info/time_within_train_step": 27.66310429573059, "step": 658} {"train_info/time_between_train_steps": 0.004877567291259766, "step": 658} {"info/global_step": 659, "train_info/time_within_train_step": 27.666418075561523, "step": 659} {"train_info/time_between_train_steps": 0.005001544952392578, "step": 659} {"info/global_step": 660, "train_info/time_within_train_step": 27.677677869796753, "step": 660} {"train_info/time_between_train_steps": 0.004837512969970703, "step": 660} {"info/global_step": 661, "train_info/time_within_train_step": 27.741764783859253, "step": 661} {"train_info/time_between_train_steps": 0.0049228668212890625, "step": 661} {"info/global_step": 662, "train_info/time_within_train_step": 27.67442560195923, "step": 662} {"train_info/time_between_train_steps": 0.005023479461669922, "step": 662} {"info/global_step": 663, "train_info/time_within_train_step": 27.667781829833984, "step": 663} {"train_info/time_between_train_steps": 0.0050351619720458984, "step": 663} {"info/global_step": 664, "train_info/time_within_train_step": 27.668005228042603, "step": 664} {"train_info/time_between_train_steps": 0.0049610137939453125, "step": 664} {"info/global_step": 665, "train_info/time_within_train_step": 27.79037094116211, "step": 665} {"train_info/time_between_train_steps": 0.0048980712890625, "step": 665} {"info/global_step": 666, "train_info/time_within_train_step": 27.69136643409729, "step": 666} {"train_info/time_between_train_steps": 0.0054547786712646484, "step": 666} {"info/global_step": 667, "train_info/time_within_train_step": 27.680794954299927, "step": 667} {"train_info/time_between_train_steps": 0.00494384765625, "step": 667} {"info/global_step": 668, "train_info/time_within_train_step": 27.682769298553467, "step": 668} {"train_info/time_between_train_steps": 0.005079030990600586, "step": 668} {"info/global_step": 669, "train_info/time_within_train_step": 27.683570861816406, "step": 669} {"train_info/time_between_train_steps": 0.005063772201538086, "step": 669} {"info/global_step": 670, "train_info/time_within_train_step": 27.69808602333069, "step": 670} {"train_info/time_between_train_steps": 0.005298137664794922, "step": 670} {"info/global_step": 671, "train_info/time_within_train_step": 27.71128487586975, "step": 671} {"train_info/time_between_train_steps": 0.0050067901611328125, "step": 671} {"info/global_step": 672, "train_info/time_within_train_step": 27.68874764442444, "step": 672} {"train_info/time_between_train_steps": 0.0051081180572509766, "step": 672} {"info/global_step": 673, "train_info/time_within_train_step": 27.683480739593506, "step": 673} {"train_info/time_between_train_steps": 0.005063772201538086, "step": 673} {"info/global_step": 674, "train_info/time_within_train_step": 27.74240732192993, "step": 674} {"train_info/time_between_train_steps": 0.005105018615722656, "step": 674} {"info/global_step": 675, "train_info/time_within_train_step": 27.712934494018555, "step": 675} {"train_info/time_between_train_steps": 0.005464315414428711, "step": 675} {"train_info/time_between_train_steps": 29.910584211349487, "step": 675} {"info/global_step": 676, "train_info/time_within_train_step": 27.698601007461548, "step": 676} {"train_info/time_between_train_steps": 0.004916191101074219, "step": 676} {"info/global_step": 677, "train_info/time_within_train_step": 27.857526302337646, "step": 677} {"train_info/time_between_train_steps": 0.004795551300048828, "step": 677} {"info/global_step": 678, "train_info/time_within_train_step": 27.68055295944214, "step": 678} {"train_info/time_between_train_steps": 0.0048177242279052734, "step": 678} {"info/global_step": 679, "train_info/time_within_train_step": 27.866209745407104, "step": 679} {"train_info/time_between_train_steps": 0.005165815353393555, "step": 679} {"info/global_step": 680, "train_info/time_within_train_step": 27.823453664779663, "step": 680} {"train_info/time_between_train_steps": 0.005391120910644531, "step": 680} {"info/global_step": 681, "train_info/time_within_train_step": 27.827982425689697, "step": 681} {"train_info/time_between_train_steps": 0.005140066146850586, "step": 681} {"info/global_step": 682, "train_info/time_within_train_step": 27.697964668273926, "step": 682} {"train_info/time_between_train_steps": 0.005079030990600586, "step": 682} {"info/global_step": 683, "train_info/time_within_train_step": 27.75378727912903, "step": 683} {"train_info/time_between_train_steps": 0.00513458251953125, "step": 683} {"info/global_step": 684, "train_info/time_within_train_step": 27.709417581558228, "step": 684} {"train_info/time_between_train_steps": 0.005217552185058594, "step": 684} {"info/global_step": 685, "train_info/time_within_train_step": 27.68973660469055, "step": 685} {"train_info/time_between_train_steps": 0.005190134048461914, "step": 685} {"info/global_step": 686, "train_info/time_within_train_step": 27.746852159500122, "step": 686} {"train_info/time_between_train_steps": 0.015586614608764648, "step": 686} {"info/global_step": 687, "train_info/time_within_train_step": 27.719690322875977, "step": 687} {"train_info/time_between_train_steps": 0.00505828857421875, "step": 687} {"info/global_step": 688, "train_info/time_within_train_step": 27.69042706489563, "step": 688} {"train_info/time_between_train_steps": 0.005038261413574219, "step": 688} {"info/global_step": 689, "train_info/time_within_train_step": 27.678998231887817, "step": 689} {"train_info/time_between_train_steps": 0.0060541629791259766, "step": 689} {"info/global_step": 690, "train_info/time_within_train_step": 27.75462532043457, "step": 690} {"train_info/time_between_train_steps": 0.004940032958984375, "step": 690} {"info/global_step": 691, "train_info/time_within_train_step": 27.70759153366089, "step": 691} {"train_info/time_between_train_steps": 0.005103349685668945, "step": 691} {"info/global_step": 692, "train_info/time_within_train_step": 27.72522258758545, "step": 692} {"train_info/time_between_train_steps": 0.005373477935791016, "step": 692} {"info/global_step": 693, "train_info/time_within_train_step": 27.6722252368927, "step": 693} {"train_info/time_between_train_steps": 0.004964351654052734, "step": 693} {"info/global_step": 694, "train_info/time_within_train_step": 27.697333097457886, "step": 694} {"train_info/time_between_train_steps": 0.004899740219116211, "step": 694} {"info/global_step": 695, "train_info/time_within_train_step": 27.803155660629272, "step": 695} {"train_info/time_between_train_steps": 0.00487828254699707, "step": 695} {"info/global_step": 696, "train_info/time_within_train_step": 27.68677592277527, "step": 696} {"train_info/time_between_train_steps": 0.005341768264770508, "step": 696} {"info/global_step": 697, "train_info/time_within_train_step": 27.683055639266968, "step": 697} {"train_info/time_between_train_steps": 0.0053369998931884766, "step": 697} {"info/global_step": 698, "train_info/time_within_train_step": 27.698196411132812, "step": 698} {"train_info/time_between_train_steps": 0.004990816116333008, "step": 698} {"info/global_step": 699, "train_info/time_within_train_step": 27.703386068344116, "step": 699} {"train_info/time_between_train_steps": 0.00511622428894043, "step": 699} {"info/global_step": 700, "train_info/time_within_train_step": 27.685921669006348, "step": 700} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740844675, "_runtime": 20624}, "step": 700} {"logs": {"train/loss": 3.4952, "train/learning_rate": 0.0002777777777777778, "train/epoch": 25.02, "_timestamp": 1740844675, "_runtime": 20624}, "step": 700} {"train_info/time_between_train_steps": 205.7708718776703, "step": 700} {"info/global_step": 701, "train_info/time_within_train_step": 28.254541635513306, "step": 701} {"train_info/time_between_train_steps": 0.00508427619934082, "step": 701} {"info/global_step": 702, "train_info/time_within_train_step": 27.70797324180603, "step": 702} {"train_info/time_between_train_steps": 0.0053348541259765625, "step": 702} {"train_info/time_between_train_steps": 30.087986946105957, "step": 702} {"info/global_step": 703, "train_info/time_within_train_step": 27.708192348480225, "step": 703} {"train_info/time_between_train_steps": 0.005136728286743164, "step": 703} {"info/global_step": 704, "train_info/time_within_train_step": 27.84008288383484, "step": 704} {"train_info/time_between_train_steps": 0.005040407180786133, "step": 704} {"info/global_step": 705, "train_info/time_within_train_step": 27.746328830718994, "step": 705} {"train_info/time_between_train_steps": 0.00483250617980957, "step": 705} {"info/global_step": 706, "train_info/time_within_train_step": 27.84048843383789, "step": 706} {"train_info/time_between_train_steps": 0.005275249481201172, "step": 706} {"info/global_step": 707, "train_info/time_within_train_step": 27.735986471176147, "step": 707} {"train_info/time_between_train_steps": 0.0054204463958740234, "step": 707} {"info/global_step": 708, "train_info/time_within_train_step": 27.886640310287476, "step": 708} {"train_info/time_between_train_steps": 0.005254030227661133, "step": 708} {"info/global_step": 709, "train_info/time_within_train_step": 27.687414407730103, "step": 709} {"train_info/time_between_train_steps": 0.005116939544677734, "step": 709} {"info/global_step": 710, "train_info/time_within_train_step": 27.858542442321777, "step": 710} {"train_info/time_between_train_steps": 0.005039691925048828, "step": 710} {"info/global_step": 711, "train_info/time_within_train_step": 27.702407121658325, "step": 711} {"train_info/time_between_train_steps": 0.004914999008178711, "step": 711} {"info/global_step": 712, "train_info/time_within_train_step": 27.722926139831543, "step": 712} {"train_info/time_between_train_steps": 0.006056785583496094, "step": 712} {"info/global_step": 713, "train_info/time_within_train_step": 27.683764457702637, "step": 713} {"train_info/time_between_train_steps": 0.0052797794342041016, "step": 713} {"info/global_step": 714, "train_info/time_within_train_step": 27.71592426300049, "step": 714} {"train_info/time_between_train_steps": 0.004989147186279297, "step": 714} {"info/global_step": 715, "train_info/time_within_train_step": 27.705907583236694, "step": 715} {"train_info/time_between_train_steps": 0.0049211978912353516, "step": 715} {"info/global_step": 716, "train_info/time_within_train_step": 27.700575590133667, "step": 716} {"train_info/time_between_train_steps": 0.005867958068847656, "step": 716} {"info/global_step": 717, "train_info/time_within_train_step": 27.699155807495117, "step": 717} {"train_info/time_between_train_steps": 0.005313873291015625, "step": 717} {"info/global_step": 718, "train_info/time_within_train_step": 27.73455286026001, "step": 718} {"train_info/time_between_train_steps": 0.005024433135986328, "step": 718} {"info/global_step": 719, "train_info/time_within_train_step": 27.68619132041931, "step": 719} {"train_info/time_between_train_steps": 0.004867076873779297, "step": 719} {"info/global_step": 720, "train_info/time_within_train_step": 27.702112674713135, "step": 720} {"train_info/time_between_train_steps": 0.005155086517333984, "step": 720} {"info/global_step": 721, "train_info/time_within_train_step": 27.748716831207275, "step": 721} {"train_info/time_between_train_steps": 0.005070209503173828, "step": 721} {"info/global_step": 722, "train_info/time_within_train_step": 27.686864852905273, "step": 722} {"train_info/time_between_train_steps": 0.005057573318481445, "step": 722} {"info/global_step": 723, "train_info/time_within_train_step": 27.681989908218384, "step": 723} {"train_info/time_between_train_steps": 0.005129337310791016, "step": 723} {"info/global_step": 724, "train_info/time_within_train_step": 27.71997308731079, "step": 724} {"train_info/time_between_train_steps": 0.005264759063720703, "step": 724} {"info/global_step": 725, "train_info/time_within_train_step": 27.709550142288208, "step": 725} {"train_info/time_between_train_steps": 0.005185604095458984, "step": 725} {"info/global_step": 726, "train_info/time_within_train_step": 27.773688316345215, "step": 726} {"train_info/time_between_train_steps": 0.005421876907348633, "step": 726} {"info/global_step": 727, "train_info/time_within_train_step": 27.723800897598267, "step": 727} {"train_info/time_between_train_steps": 0.0050432682037353516, "step": 727} {"info/global_step": 728, "train_info/time_within_train_step": 27.732863426208496, "step": 728} {"train_info/time_between_train_steps": 0.0052280426025390625, "step": 728} {"info/global_step": 729, "train_info/time_within_train_step": 27.782514333724976, "step": 729} {"train_info/time_between_train_steps": 0.0053691864013671875, "step": 729} {"train_info/time_between_train_steps": 29.764040231704712, "step": 729} {"info/global_step": 730, "train_info/time_within_train_step": 31.10205841064453, "step": 730} {"train_info/time_between_train_steps": 0.005063772201538086, "step": 730} {"info/global_step": 731, "train_info/time_within_train_step": 28.25043773651123, "step": 731} {"train_info/time_between_train_steps": 0.005301475524902344, "step": 731} {"info/global_step": 732, "train_info/time_within_train_step": 30.852128505706787, "step": 732} {"train_info/time_between_train_steps": 0.005167245864868164, "step": 732} {"info/global_step": 733, "train_info/time_within_train_step": 28.004018783569336, "step": 733} {"train_info/time_between_train_steps": 0.005093574523925781, "step": 733} {"info/global_step": 734, "train_info/time_within_train_step": 27.715487718582153, "step": 734} {"train_info/time_between_train_steps": 0.005473613739013672, "step": 734} {"info/global_step": 735, "train_info/time_within_train_step": 27.825292348861694, "step": 735} {"train_info/time_between_train_steps": 0.005259513854980469, "step": 735} {"info/global_step": 736, "train_info/time_within_train_step": 27.698736667633057, "step": 736} {"train_info/time_between_train_steps": 0.005049228668212891, "step": 736} {"info/global_step": 737, "train_info/time_within_train_step": 27.772340059280396, "step": 737} {"train_info/time_between_train_steps": 0.005064725875854492, "step": 737} {"info/global_step": 738, "train_info/time_within_train_step": 27.728332042694092, "step": 738} {"train_info/time_between_train_steps": 0.004832029342651367, "step": 738} {"info/global_step": 739, "train_info/time_within_train_step": 27.731085777282715, "step": 739} {"train_info/time_between_train_steps": 0.0048978328704833984, "step": 739} {"info/global_step": 740, "train_info/time_within_train_step": 27.786435842514038, "step": 740} {"train_info/time_between_train_steps": 0.00596928596496582, "step": 740} {"info/global_step": 741, "train_info/time_within_train_step": 27.7187340259552, "step": 741} {"train_info/time_between_train_steps": 0.0059778690338134766, "step": 741} {"info/global_step": 742, "train_info/time_within_train_step": 27.711377382278442, "step": 742} {"train_info/time_between_train_steps": 0.0050389766693115234, "step": 742} {"info/global_step": 743, "train_info/time_within_train_step": 27.7295925617218, "step": 743} {"train_info/time_between_train_steps": 0.004990816116333008, "step": 743} {"info/global_step": 744, "train_info/time_within_train_step": 27.69840669631958, "step": 744} {"train_info/time_between_train_steps": 0.0051081180572509766, "step": 744} {"info/global_step": 745, "train_info/time_within_train_step": 27.721356868743896, "step": 745} {"train_info/time_between_train_steps": 0.0051076412200927734, "step": 745} {"info/global_step": 746, "train_info/time_within_train_step": 27.694146394729614, "step": 746} {"train_info/time_between_train_steps": 0.0048677921295166016, "step": 746} {"info/global_step": 747, "train_info/time_within_train_step": 27.70768404006958, "step": 747} {"train_info/time_between_train_steps": 0.004968881607055664, "step": 747} {"info/global_step": 748, "train_info/time_within_train_step": 27.684829711914062, "step": 748} {"train_info/time_between_train_steps": 0.005113124847412109, "step": 748} {"info/global_step": 749, "train_info/time_within_train_step": 27.681796550750732, "step": 749} {"train_info/time_between_train_steps": 0.005017995834350586, "step": 749} {"info/global_step": 750, "train_info/time_within_train_step": 27.711034774780273, "step": 750} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740846343, "_runtime": 22292}, "step": 750} {"logs": {"train/loss": 3.4946, "train/learning_rate": 0.00025, "train/epoch": 27.02, "_timestamp": 1740846343, "_runtime": 22292}, "step": 750} {"train_info/time_between_train_steps": 0.026391029357910156, "step": 750} {"info/global_step": 751, "train_info/time_within_train_step": 27.68461775779724, "step": 751} {"train_info/time_between_train_steps": 0.006167411804199219, "step": 751} {"info/global_step": 752, "train_info/time_within_train_step": 27.696069717407227, "step": 752} {"train_info/time_between_train_steps": 0.0051271915435791016, "step": 752} {"info/global_step": 753, "train_info/time_within_train_step": 27.717214822769165, "step": 753} {"train_info/time_between_train_steps": 0.005079984664916992, "step": 753} {"info/global_step": 754, "train_info/time_within_train_step": 27.72770857810974, "step": 754} {"train_info/time_between_train_steps": 0.005025148391723633, "step": 754} {"info/global_step": 755, "train_info/time_within_train_step": 27.699385166168213, "step": 755} {"train_info/time_between_train_steps": 0.005212545394897461, "step": 755} {"info/global_step": 756, "train_info/time_within_train_step": 27.78471326828003, "step": 756} {"train_info/time_between_train_steps": 0.0056688785552978516, "step": 756} {"train_info/time_between_train_steps": 29.823610544204712, "step": 756} {"info/global_step": 757, "train_info/time_within_train_step": 27.679866313934326, "step": 757} {"train_info/time_between_train_steps": 0.00493621826171875, "step": 757} {"info/global_step": 758, "train_info/time_within_train_step": 27.8112313747406, "step": 758} {"train_info/time_between_train_steps": 0.005324363708496094, "step": 758} {"info/global_step": 759, "train_info/time_within_train_step": 27.68957543373108, "step": 759} {"train_info/time_between_train_steps": 0.0048601627349853516, "step": 759} {"info/global_step": 760, "train_info/time_within_train_step": 27.849790811538696, "step": 760} {"train_info/time_between_train_steps": 0.005031108856201172, "step": 760} {"info/global_step": 761, "train_info/time_within_train_step": 27.72820258140564, "step": 761} {"train_info/time_between_train_steps": 0.0052068233489990234, "step": 761} {"info/global_step": 762, "train_info/time_within_train_step": 27.8509202003479, "step": 762} {"train_info/time_between_train_steps": 0.0051119327545166016, "step": 762} {"info/global_step": 763, "train_info/time_within_train_step": 27.72571110725403, "step": 763} {"train_info/time_between_train_steps": 0.005269527435302734, "step": 763} {"info/global_step": 764, "train_info/time_within_train_step": 27.78406834602356, "step": 764} {"train_info/time_between_train_steps": 0.005171775817871094, "step": 764} {"info/global_step": 765, "train_info/time_within_train_step": 27.699117183685303, "step": 765} {"train_info/time_between_train_steps": 0.005185365676879883, "step": 765} {"info/global_step": 766, "train_info/time_within_train_step": 27.700966835021973, "step": 766} {"train_info/time_between_train_steps": 0.005179643630981445, "step": 766} {"info/global_step": 767, "train_info/time_within_train_step": 27.686622858047485, "step": 767} {"train_info/time_between_train_steps": 0.004982948303222656, "step": 767} {"info/global_step": 768, "train_info/time_within_train_step": 27.74769377708435, "step": 768} {"train_info/time_between_train_steps": 0.004995107650756836, "step": 768} {"info/global_step": 769, "train_info/time_within_train_step": 27.724650859832764, "step": 769} {"train_info/time_between_train_steps": 0.005130767822265625, "step": 769} {"info/global_step": 770, "train_info/time_within_train_step": 27.760494470596313, "step": 770} {"train_info/time_between_train_steps": 0.0060443878173828125, "step": 770} {"info/global_step": 771, "train_info/time_within_train_step": 27.799352407455444, "step": 771} {"train_info/time_between_train_steps": 0.004956483840942383, "step": 771} {"info/global_step": 772, "train_info/time_within_train_step": 27.706594467163086, "step": 772} {"train_info/time_between_train_steps": 0.006472110748291016, "step": 772} {"info/global_step": 773, "train_info/time_within_train_step": 27.69157338142395, "step": 773} {"train_info/time_between_train_steps": 0.0052106380462646484, "step": 773} {"info/global_step": 774, "train_info/time_within_train_step": 27.708574771881104, "step": 774} {"train_info/time_between_train_steps": 0.006930351257324219, "step": 774} {"info/global_step": 775, "train_info/time_within_train_step": 27.69233775138855, "step": 775} {"train_info/time_between_train_steps": 0.005071401596069336, "step": 775} {"info/global_step": 776, "train_info/time_within_train_step": 27.68123173713684, "step": 776} {"train_info/time_between_train_steps": 0.00507044792175293, "step": 776} {"info/global_step": 777, "train_info/time_within_train_step": 27.720924615859985, "step": 777} {"train_info/time_between_train_steps": 0.0062656402587890625, "step": 777} {"info/global_step": 778, "train_info/time_within_train_step": 27.725847005844116, "step": 778} {"train_info/time_between_train_steps": 0.004975318908691406, "step": 778} {"info/global_step": 779, "train_info/time_within_train_step": 27.736603021621704, "step": 779} {"train_info/time_between_train_steps": 0.006090641021728516, "step": 779} {"info/global_step": 780, "train_info/time_within_train_step": 27.705061435699463, "step": 780} {"train_info/time_between_train_steps": 0.005053520202636719, "step": 780} {"info/global_step": 781, "train_info/time_within_train_step": 27.730817556381226, "step": 781} {"train_info/time_between_train_steps": 0.005067348480224609, "step": 781} {"info/global_step": 782, "train_info/time_within_train_step": 27.70754909515381, "step": 782} {"train_info/time_between_train_steps": 0.00535893440246582, "step": 782} {"info/global_step": 783, "train_info/time_within_train_step": 27.706660747528076, "step": 783} {"train_info/time_between_train_steps": 0.0056362152099609375, "step": 783} {"train_info/time_between_train_steps": 29.51830768585205, "step": 783} {"info/global_step": 784, "train_info/time_within_train_step": 27.703696250915527, "step": 784} {"train_info/time_between_train_steps": 0.0057141780853271484, "step": 784} {"info/global_step": 785, "train_info/time_within_train_step": 27.95079803466797, "step": 785} {"train_info/time_between_train_steps": 0.0051479339599609375, "step": 785} {"info/global_step": 786, "train_info/time_within_train_step": 27.73789930343628, "step": 786} {"train_info/time_between_train_steps": 0.00510406494140625, "step": 786} {"info/global_step": 787, "train_info/time_within_train_step": 27.833077907562256, "step": 787} {"train_info/time_between_train_steps": 0.005252361297607422, "step": 787} {"info/global_step": 788, "train_info/time_within_train_step": 27.706275939941406, "step": 788} {"train_info/time_between_train_steps": 0.005204677581787109, "step": 788} {"info/global_step": 789, "train_info/time_within_train_step": 27.868988752365112, "step": 789} {"train_info/time_between_train_steps": 0.005631685256958008, "step": 789} {"info/global_step": 790, "train_info/time_within_train_step": 27.724032402038574, "step": 790} {"train_info/time_between_train_steps": 0.011478900909423828, "step": 790} {"info/global_step": 791, "train_info/time_within_train_step": 27.78103232383728, "step": 791} {"train_info/time_between_train_steps": 0.005250692367553711, "step": 791} {"info/global_step": 792, "train_info/time_within_train_step": 27.693026304244995, "step": 792} {"train_info/time_between_train_steps": 0.005300998687744141, "step": 792} {"info/global_step": 793, "train_info/time_within_train_step": 27.681272745132446, "step": 793} {"train_info/time_between_train_steps": 0.005112171173095703, "step": 793} {"info/global_step": 794, "train_info/time_within_train_step": 27.67368173599243, "step": 794} {"train_info/time_between_train_steps": 0.0051059722900390625, "step": 794} {"info/global_step": 795, "train_info/time_within_train_step": 27.68716335296631, "step": 795} {"train_info/time_between_train_steps": 0.0049059391021728516, "step": 795} {"info/global_step": 796, "train_info/time_within_train_step": 27.672405242919922, "step": 796} {"train_info/time_between_train_steps": 0.005040168762207031, "step": 796} {"info/global_step": 797, "train_info/time_within_train_step": 27.675934314727783, "step": 797} {"train_info/time_between_train_steps": 0.004956722259521484, "step": 797} {"info/global_step": 798, "train_info/time_within_train_step": 27.696499824523926, "step": 798} {"train_info/time_between_train_steps": 0.005181550979614258, "step": 798} {"info/global_step": 799, "train_info/time_within_train_step": 27.696920156478882, "step": 799} {"train_info/time_between_train_steps": 0.0051593780517578125, "step": 799} {"info/global_step": 800, "train_info/time_within_train_step": 27.68538737297058, "step": 800} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740847791, "_runtime": 23740}, "step": 800} {"logs": {"train/loss": 3.4295, "train/learning_rate": 0.00022222222222222218, "train/epoch": 29.01, "_timestamp": 1740847791, "_runtime": 23740}, "step": 800} {"train_info/time_between_train_steps": 45.34138894081116, "step": 800} {"info/global_step": 801, "train_info/time_within_train_step": 28.04743719100952, "step": 801} {"train_info/time_between_train_steps": 0.00522160530090332, "step": 801} {"info/global_step": 802, "train_info/time_within_train_step": 27.984935522079468, "step": 802} {"train_info/time_between_train_steps": 0.0052394866943359375, "step": 802} {"info/global_step": 803, "train_info/time_within_train_step": 27.734066247940063, "step": 803} {"train_info/time_between_train_steps": 0.005075931549072266, "step": 803} {"info/global_step": 804, "train_info/time_within_train_step": 27.705271244049072, "step": 804} {"train_info/time_between_train_steps": 0.005868196487426758, "step": 804} {"info/global_step": 805, "train_info/time_within_train_step": 27.700191020965576, "step": 805} {"train_info/time_between_train_steps": 0.005052804946899414, "step": 805} {"info/global_step": 806, "train_info/time_within_train_step": 27.703271865844727, "step": 806} {"train_info/time_between_train_steps": 0.005578279495239258, "step": 806} {"info/global_step": 807, "train_info/time_within_train_step": 27.703209400177002, "step": 807} {"train_info/time_between_train_steps": 0.005028963088989258, "step": 807} {"info/global_step": 808, "train_info/time_within_train_step": 27.72884178161621, "step": 808} {"train_info/time_between_train_steps": 0.0053598880767822266, "step": 808} {"info/global_step": 809, "train_info/time_within_train_step": 27.72204566001892, "step": 809} {"train_info/time_between_train_steps": 0.0055620670318603516, "step": 809} {"info/global_step": 810, "train_info/time_within_train_step": 27.731279611587524, "step": 810} {"train_info/time_between_train_steps": 0.006745100021362305, "step": 810} {"train_info/time_between_train_steps": 29.725592851638794, "step": 810} {"info/global_step": 811, "train_info/time_within_train_step": 27.714940547943115, "step": 811} {"train_info/time_between_train_steps": 0.005440235137939453, "step": 811} {"info/global_step": 812, "train_info/time_within_train_step": 27.8736469745636, "step": 812} {"train_info/time_between_train_steps": 0.0052759647369384766, "step": 812} {"info/global_step": 813, "train_info/time_within_train_step": 27.694947719573975, "step": 813} {"train_info/time_between_train_steps": 0.005990028381347656, "step": 813} {"info/global_step": 814, "train_info/time_within_train_step": 27.814206838607788, "step": 814} {"train_info/time_between_train_steps": 0.005049943923950195, "step": 814} {"info/global_step": 815, "train_info/time_within_train_step": 27.692090272903442, "step": 815} {"train_info/time_between_train_steps": 0.005128622055053711, "step": 815} {"info/global_step": 816, "train_info/time_within_train_step": 27.920867919921875, "step": 816} {"train_info/time_between_train_steps": 0.005758762359619141, "step": 816} {"info/global_step": 817, "train_info/time_within_train_step": 27.699326515197754, "step": 817} {"train_info/time_between_train_steps": 0.005112886428833008, "step": 817} {"info/global_step": 818, "train_info/time_within_train_step": 27.78337836265564, "step": 818} {"train_info/time_between_train_steps": 0.005307674407958984, "step": 818} {"info/global_step": 819, "train_info/time_within_train_step": 27.701679706573486, "step": 819} {"train_info/time_between_train_steps": 0.004866838455200195, "step": 819} {"info/global_step": 820, "train_info/time_within_train_step": 27.688483238220215, "step": 820} {"train_info/time_between_train_steps": 0.004977703094482422, "step": 820} {"info/global_step": 821, "train_info/time_within_train_step": 27.67960524559021, "step": 821} {"train_info/time_between_train_steps": 0.0051631927490234375, "step": 821} {"info/global_step": 822, "train_info/time_within_train_step": 27.67815113067627, "step": 822} {"train_info/time_between_train_steps": 0.009550809860229492, "step": 822} {"info/global_step": 823, "train_info/time_within_train_step": 27.675416231155396, "step": 823} {"train_info/time_between_train_steps": 0.004899740219116211, "step": 823} {"info/global_step": 824, "train_info/time_within_train_step": 27.677238702774048, "step": 824} {"train_info/time_between_train_steps": 0.009716272354125977, "step": 824} {"info/global_step": 825, "train_info/time_within_train_step": 27.677024841308594, "step": 825} {"train_info/time_between_train_steps": 0.005070209503173828, "step": 825} {"info/global_step": 826, "train_info/time_within_train_step": 27.691486120224, "step": 826} {"train_info/time_between_train_steps": 0.0050432682037353516, "step": 826} {"info/global_step": 827, "train_info/time_within_train_step": 27.742215394973755, "step": 827} {"train_info/time_between_train_steps": 0.009226322174072266, "step": 827} {"info/global_step": 828, "train_info/time_within_train_step": 27.676904678344727, "step": 828} {"train_info/time_between_train_steps": 0.01007390022277832, "step": 828} {"info/global_step": 829, "train_info/time_within_train_step": 29.15452742576599, "step": 829} {"train_info/time_between_train_steps": 0.005240201950073242, "step": 829} {"info/global_step": 830, "train_info/time_within_train_step": 27.972545385360718, "step": 830} {"train_info/time_between_train_steps": 0.004892826080322266, "step": 830} {"info/global_step": 831, "train_info/time_within_train_step": 27.798168420791626, "step": 831} {"train_info/time_between_train_steps": 0.004880428314208984, "step": 831} {"info/global_step": 832, "train_info/time_within_train_step": 27.68090796470642, "step": 832} {"train_info/time_between_train_steps": 0.004984855651855469, "step": 832} {"info/global_step": 833, "train_info/time_within_train_step": 27.693134546279907, "step": 833} {"train_info/time_between_train_steps": 0.005284547805786133, "step": 833} {"info/global_step": 834, "train_info/time_within_train_step": 27.680370330810547, "step": 834} {"train_info/time_between_train_steps": 0.004912614822387695, "step": 834} {"info/global_step": 835, "train_info/time_within_train_step": 27.69346523284912, "step": 835} {"train_info/time_between_train_steps": 0.005159616470336914, "step": 835} {"info/global_step": 836, "train_info/time_within_train_step": 27.69474506378174, "step": 836} {"train_info/time_between_train_steps": 0.005087375640869141, "step": 836} {"info/global_step": 837, "train_info/time_within_train_step": 27.715152502059937, "step": 837} {"train_info/time_between_train_steps": 0.0056650638580322266, "step": 837} {"train_info/time_between_train_steps": 29.846271276474, "step": 837} {"info/global_step": 838, "train_info/time_within_train_step": 27.688467264175415, "step": 838} {"train_info/time_between_train_steps": 0.004858255386352539, "step": 838} {"info/global_step": 839, "train_info/time_within_train_step": 27.86183524131775, "step": 839} {"train_info/time_between_train_steps": 0.005103349685668945, "step": 839} {"info/global_step": 840, "train_info/time_within_train_step": 27.69709014892578, "step": 840} {"train_info/time_between_train_steps": 0.0051958560943603516, "step": 840} {"info/global_step": 841, "train_info/time_within_train_step": 27.81467866897583, "step": 841} {"train_info/time_between_train_steps": 0.005251646041870117, "step": 841} {"info/global_step": 842, "train_info/time_within_train_step": 27.6943678855896, "step": 842} {"train_info/time_between_train_steps": 0.005115985870361328, "step": 842} {"info/global_step": 843, "train_info/time_within_train_step": 27.794877290725708, "step": 843} {"train_info/time_between_train_steps": 0.0050771236419677734, "step": 843} {"info/global_step": 844, "train_info/time_within_train_step": 27.711644887924194, "step": 844} {"train_info/time_between_train_steps": 0.005217313766479492, "step": 844} {"info/global_step": 845, "train_info/time_within_train_step": 27.818432092666626, "step": 845} {"train_info/time_between_train_steps": 0.005041837692260742, "step": 845} {"info/global_step": 846, "train_info/time_within_train_step": 27.864030599594116, "step": 846} {"train_info/time_between_train_steps": 0.004914760589599609, "step": 846} {"info/global_step": 847, "train_info/time_within_train_step": 27.690366744995117, "step": 847} {"train_info/time_between_train_steps": 0.004836559295654297, "step": 847} {"info/global_step": 848, "train_info/time_within_train_step": 27.676128149032593, "step": 848} {"train_info/time_between_train_steps": 0.005042552947998047, "step": 848} {"info/global_step": 849, "train_info/time_within_train_step": 27.66452431678772, "step": 849} {"train_info/time_between_train_steps": 0.004755258560180664, "step": 849} {"info/global_step": 850, "train_info/time_within_train_step": 27.685068607330322, "step": 850} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740849287, "_runtime": 25236}, "step": 850} {"logs": {"train/loss": 3.3698, "train/learning_rate": 0.00019444444444444443, "train/epoch": 31.01, "_timestamp": 1740849287, "_runtime": 25236}, "step": 850} {"train_info/time_between_train_steps": 0.02595996856689453, "step": 850} {"info/global_step": 851, "train_info/time_within_train_step": 27.68273949623108, "step": 851} {"train_info/time_between_train_steps": 0.005045652389526367, "step": 851} {"info/global_step": 852, "train_info/time_within_train_step": 27.74963641166687, "step": 852} {"train_info/time_between_train_steps": 0.004904508590698242, "step": 852} {"info/global_step": 853, "train_info/time_within_train_step": 27.67134380340576, "step": 853} {"train_info/time_between_train_steps": 0.004901885986328125, "step": 853} {"info/global_step": 854, "train_info/time_within_train_step": 27.672852993011475, "step": 854} {"train_info/time_between_train_steps": 0.005174160003662109, "step": 854} {"info/global_step": 855, "train_info/time_within_train_step": 27.678083419799805, "step": 855} {"train_info/time_between_train_steps": 0.005341053009033203, "step": 855} {"info/global_step": 856, "train_info/time_within_train_step": 27.68304181098938, "step": 856} {"train_info/time_between_train_steps": 0.004997730255126953, "step": 856} {"info/global_step": 857, "train_info/time_within_train_step": 27.696062803268433, "step": 857} {"train_info/time_between_train_steps": 0.004931449890136719, "step": 857} {"info/global_step": 858, "train_info/time_within_train_step": 27.744391441345215, "step": 858} {"train_info/time_between_train_steps": 0.005387067794799805, "step": 858} {"info/global_step": 859, "train_info/time_within_train_step": 27.710028409957886, "step": 859} {"train_info/time_between_train_steps": 0.005006551742553711, "step": 859} {"info/global_step": 860, "train_info/time_within_train_step": 27.673850774765015, "step": 860} {"train_info/time_between_train_steps": 0.005009651184082031, "step": 860} {"info/global_step": 861, "train_info/time_within_train_step": 27.67987632751465, "step": 861} {"train_info/time_between_train_steps": 0.0057752132415771484, "step": 861} {"info/global_step": 862, "train_info/time_within_train_step": 27.81851315498352, "step": 862} {"train_info/time_between_train_steps": 0.0054683685302734375, "step": 862} {"info/global_step": 863, "train_info/time_within_train_step": 27.84092140197754, "step": 863} {"train_info/time_between_train_steps": 0.005193948745727539, "step": 863} {"info/global_step": 864, "train_info/time_within_train_step": 27.70356583595276, "step": 864} {"train_info/time_between_train_steps": 0.005689859390258789, "step": 864} {"train_info/time_between_train_steps": 30.04367160797119, "step": 864} {"info/global_step": 865, "train_info/time_within_train_step": 27.707815885543823, "step": 865} {"train_info/time_between_train_steps": 0.0054378509521484375, "step": 865} {"info/global_step": 866, "train_info/time_within_train_step": 27.82947301864624, "step": 866} {"train_info/time_between_train_steps": 0.005258083343505859, "step": 866} {"info/global_step": 867, "train_info/time_within_train_step": 27.70136857032776, "step": 867} {"train_info/time_between_train_steps": 0.005247592926025391, "step": 867} {"info/global_step": 868, "train_info/time_within_train_step": 27.836562395095825, "step": 868} {"train_info/time_between_train_steps": 0.005228519439697266, "step": 868} {"info/global_step": 869, "train_info/time_within_train_step": 27.72334861755371, "step": 869} {"train_info/time_between_train_steps": 0.0050389766693115234, "step": 869} {"info/global_step": 870, "train_info/time_within_train_step": 27.819096326828003, "step": 870} {"train_info/time_between_train_steps": 0.005012035369873047, "step": 870} {"info/global_step": 871, "train_info/time_within_train_step": 27.717029333114624, "step": 871} {"train_info/time_between_train_steps": 0.005364894866943359, "step": 871} {"info/global_step": 872, "train_info/time_within_train_step": 27.806649684906006, "step": 872} {"train_info/time_between_train_steps": 0.0052394866943359375, "step": 872} {"info/global_step": 873, "train_info/time_within_train_step": 27.697376251220703, "step": 873} {"train_info/time_between_train_steps": 0.00490880012512207, "step": 873} {"info/global_step": 874, "train_info/time_within_train_step": 27.691839456558228, "step": 874} {"train_info/time_between_train_steps": 0.004852771759033203, "step": 874} {"info/global_step": 875, "train_info/time_within_train_step": 27.731909036636353, "step": 875} {"train_info/time_between_train_steps": 0.0049190521240234375, "step": 875} {"info/global_step": 876, "train_info/time_within_train_step": 27.80907416343689, "step": 876} {"train_info/time_between_train_steps": 0.005060434341430664, "step": 876} {"info/global_step": 877, "train_info/time_within_train_step": 27.709391117095947, "step": 877} {"train_info/time_between_train_steps": 0.005223989486694336, "step": 877} {"info/global_step": 878, "train_info/time_within_train_step": 27.696322441101074, "step": 878} {"train_info/time_between_train_steps": 0.004901409149169922, "step": 878} {"info/global_step": 879, "train_info/time_within_train_step": 27.703620433807373, "step": 879} {"train_info/time_between_train_steps": 0.005059242248535156, "step": 879} {"info/global_step": 880, "train_info/time_within_train_step": 27.715310096740723, "step": 880} {"train_info/time_between_train_steps": 0.005146980285644531, "step": 880} {"info/global_step": 881, "train_info/time_within_train_step": 27.750930547714233, "step": 881} {"train_info/time_between_train_steps": 0.005077362060546875, "step": 881} {"info/global_step": 882, "train_info/time_within_train_step": 27.681193351745605, "step": 882} {"train_info/time_between_train_steps": 0.004918575286865234, "step": 882} {"info/global_step": 883, "train_info/time_within_train_step": 27.733229875564575, "step": 883} {"train_info/time_between_train_steps": 0.009912490844726562, "step": 883} {"info/global_step": 884, "train_info/time_within_train_step": 27.683032989501953, "step": 884} {"train_info/time_between_train_steps": 0.005019187927246094, "step": 884} {"info/global_step": 885, "train_info/time_within_train_step": 27.68564009666443, "step": 885} {"train_info/time_between_train_steps": 0.005006074905395508, "step": 885} {"info/global_step": 886, "train_info/time_within_train_step": 27.719985961914062, "step": 886} {"train_info/time_between_train_steps": 0.004923582077026367, "step": 886} {"info/global_step": 887, "train_info/time_within_train_step": 27.67688298225403, "step": 887} {"train_info/time_between_train_steps": 0.005051612854003906, "step": 887} {"info/global_step": 888, "train_info/time_within_train_step": 27.680904626846313, "step": 888} {"train_info/time_between_train_steps": 0.005121469497680664, "step": 888} {"info/global_step": 889, "train_info/time_within_train_step": 27.682843685150146, "step": 889} {"train_info/time_between_train_steps": 0.005907297134399414, "step": 889} {"info/global_step": 890, "train_info/time_within_train_step": 27.68255043029785, "step": 890} {"train_info/time_between_train_steps": 0.00507044792175293, "step": 890} {"info/global_step": 891, "train_info/time_within_train_step": 27.69603943824768, "step": 891} {"train_info/time_between_train_steps": 0.005517721176147461, "step": 891} {"train_info/time_between_train_steps": 29.60942840576172, "step": 891} {"info/global_step": 892, "train_info/time_within_train_step": 27.69633412361145, "step": 892} {"train_info/time_between_train_steps": 0.004930019378662109, "step": 892} {"info/global_step": 893, "train_info/time_within_train_step": 27.82957124710083, "step": 893} {"train_info/time_between_train_steps": 0.004895210266113281, "step": 893} {"info/global_step": 894, "train_info/time_within_train_step": 27.702529191970825, "step": 894} {"train_info/time_between_train_steps": 0.004828691482543945, "step": 894} {"info/global_step": 895, "train_info/time_within_train_step": 27.80821132659912, "step": 895} {"train_info/time_between_train_steps": 0.005245208740234375, "step": 895} {"info/global_step": 896, "train_info/time_within_train_step": 27.69315457344055, "step": 896} {"train_info/time_between_train_steps": 0.0051805973052978516, "step": 896} {"info/global_step": 897, "train_info/time_within_train_step": 27.815571546554565, "step": 897} {"train_info/time_between_train_steps": 0.005429744720458984, "step": 897} {"info/global_step": 898, "train_info/time_within_train_step": 27.681856393814087, "step": 898} {"train_info/time_between_train_steps": 0.005034923553466797, "step": 898} {"info/global_step": 899, "train_info/time_within_train_step": 27.75200581550598, "step": 899} {"train_info/time_between_train_steps": 0.005106449127197266, "step": 899} {"info/global_step": 900, "train_info/time_within_train_step": 27.69036078453064, "step": 900} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740850734, "_runtime": 26683}, "step": 900} {"logs": {"train/loss": 3.3143, "train/learning_rate": 0.00016666666666666666, "train/epoch": 33.01, "_timestamp": 1740850734, "_runtime": 26683}, "step": 900} {"train_info/time_between_train_steps": 44.171876430511475, "step": 900} {"info/global_step": 901, "train_info/time_within_train_step": 27.90126132965088, "step": 901} {"train_info/time_between_train_steps": 0.005309581756591797, "step": 901} {"info/global_step": 902, "train_info/time_within_train_step": 28.000173807144165, "step": 902} {"train_info/time_between_train_steps": 0.005929231643676758, "step": 902} {"info/global_step": 903, "train_info/time_within_train_step": 27.743350505828857, "step": 903} {"train_info/time_between_train_steps": 0.006230592727661133, "step": 903} {"info/global_step": 904, "train_info/time_within_train_step": 27.69213557243347, "step": 904} {"train_info/time_between_train_steps": 0.005218982696533203, "step": 904} {"info/global_step": 905, "train_info/time_within_train_step": 27.6908016204834, "step": 905} {"train_info/time_between_train_steps": 0.005041837692260742, "step": 905} {"info/global_step": 906, "train_info/time_within_train_step": 27.697402715682983, "step": 906} {"train_info/time_between_train_steps": 0.005144834518432617, "step": 906} {"info/global_step": 907, "train_info/time_within_train_step": 27.82841181755066, "step": 907} {"train_info/time_between_train_steps": 0.005238056182861328, "step": 907} {"info/global_step": 908, "train_info/time_within_train_step": 27.710054397583008, "step": 908} {"train_info/time_between_train_steps": 0.005133152008056641, "step": 908} {"info/global_step": 909, "train_info/time_within_train_step": 27.760668992996216, "step": 909} {"train_info/time_between_train_steps": 0.0050885677337646484, "step": 909} {"info/global_step": 910, "train_info/time_within_train_step": 27.720417022705078, "step": 910} {"train_info/time_between_train_steps": 0.005059003829956055, "step": 910} {"info/global_step": 911, "train_info/time_within_train_step": 27.68888807296753, "step": 911} {"train_info/time_between_train_steps": 0.0051043033599853516, "step": 911} {"info/global_step": 912, "train_info/time_within_train_step": 27.732280731201172, "step": 912} {"train_info/time_between_train_steps": 0.006999492645263672, "step": 912} {"info/global_step": 913, "train_info/time_within_train_step": 27.718446493148804, "step": 913} {"train_info/time_between_train_steps": 0.004991054534912109, "step": 913} {"info/global_step": 914, "train_info/time_within_train_step": 27.696208715438843, "step": 914} {"train_info/time_between_train_steps": 0.0050618648529052734, "step": 914} {"info/global_step": 915, "train_info/time_within_train_step": 27.70871615409851, "step": 915} {"train_info/time_between_train_steps": 0.005080699920654297, "step": 915} {"info/global_step": 916, "train_info/time_within_train_step": 27.746038913726807, "step": 916} {"train_info/time_between_train_steps": 0.005143165588378906, "step": 916} {"info/global_step": 917, "train_info/time_within_train_step": 27.689635038375854, "step": 917} {"train_info/time_between_train_steps": 0.0054738521575927734, "step": 917} {"info/global_step": 918, "train_info/time_within_train_step": 27.698549509048462, "step": 918} {"train_info/time_between_train_steps": 0.005518913269042969, "step": 918} {"train_info/time_between_train_steps": 29.767155408859253, "step": 918} {"info/global_step": 919, "train_info/time_within_train_step": 27.719228267669678, "step": 919} {"train_info/time_between_train_steps": 0.0048389434814453125, "step": 919} {"info/global_step": 920, "train_info/time_within_train_step": 27.799683094024658, "step": 920} {"train_info/time_between_train_steps": 0.0049591064453125, "step": 920} {"info/global_step": 921, "train_info/time_within_train_step": 27.77600622177124, "step": 921} {"train_info/time_between_train_steps": 0.00482940673828125, "step": 921} {"info/global_step": 922, "train_info/time_within_train_step": 27.83393359184265, "step": 922} {"train_info/time_between_train_steps": 0.005200862884521484, "step": 922} {"info/global_step": 923, "train_info/time_within_train_step": 27.68931746482849, "step": 923} {"train_info/time_between_train_steps": 0.0054569244384765625, "step": 923} {"info/global_step": 924, "train_info/time_within_train_step": 27.79341435432434, "step": 924} {"train_info/time_between_train_steps": 0.007645130157470703, "step": 924} {"info/global_step": 925, "train_info/time_within_train_step": 29.26663827896118, "step": 925} {"train_info/time_between_train_steps": 0.005210161209106445, "step": 925} {"info/global_step": 926, "train_info/time_within_train_step": 27.76277184486389, "step": 926} {"train_info/time_between_train_steps": 0.0075664520263671875, "step": 926} {"info/global_step": 927, "train_info/time_within_train_step": 27.711672067642212, "step": 927} {"train_info/time_between_train_steps": 0.005106449127197266, "step": 927} {"info/global_step": 928, "train_info/time_within_train_step": 27.696779012680054, "step": 928} {"train_info/time_between_train_steps": 0.004862070083618164, "step": 928} {"info/global_step": 929, "train_info/time_within_train_step": 27.668912172317505, "step": 929} {"train_info/time_between_train_steps": 0.00500035285949707, "step": 929} {"info/global_step": 930, "train_info/time_within_train_step": 27.67416501045227, "step": 930} {"train_info/time_between_train_steps": 0.0050923824310302734, "step": 930} {"info/global_step": 931, "train_info/time_within_train_step": 27.712637662887573, "step": 931} {"train_info/time_between_train_steps": 0.00502777099609375, "step": 931} {"info/global_step": 932, "train_info/time_within_train_step": 27.692540884017944, "step": 932} {"train_info/time_between_train_steps": 0.005145072937011719, "step": 932} {"info/global_step": 933, "train_info/time_within_train_step": 27.68569779396057, "step": 933} {"train_info/time_between_train_steps": 0.004904747009277344, "step": 933} {"info/global_step": 934, "train_info/time_within_train_step": 27.679091930389404, "step": 934} {"train_info/time_between_train_steps": 0.005093097686767578, "step": 934} {"info/global_step": 935, "train_info/time_within_train_step": 27.677348136901855, "step": 935} {"train_info/time_between_train_steps": 0.004998445510864258, "step": 935} {"info/global_step": 936, "train_info/time_within_train_step": 27.688747882843018, "step": 936} {"train_info/time_between_train_steps": 0.005153656005859375, "step": 936} {"info/global_step": 937, "train_info/time_within_train_step": 27.796393871307373, "step": 937} {"train_info/time_between_train_steps": 0.004910469055175781, "step": 937} {"info/global_step": 938, "train_info/time_within_train_step": 27.731524229049683, "step": 938} {"train_info/time_between_train_steps": 0.005928516387939453, "step": 938} {"info/global_step": 939, "train_info/time_within_train_step": 27.67755937576294, "step": 939} {"train_info/time_between_train_steps": 0.005316495895385742, "step": 939} {"info/global_step": 940, "train_info/time_within_train_step": 27.686074256896973, "step": 940} {"train_info/time_between_train_steps": 0.005161762237548828, "step": 940} {"info/global_step": 941, "train_info/time_within_train_step": 27.701130390167236, "step": 941} {"train_info/time_between_train_steps": 0.004944562911987305, "step": 941} {"info/global_step": 942, "train_info/time_within_train_step": 27.72839379310608, "step": 942} {"train_info/time_between_train_steps": 0.005320310592651367, "step": 942} {"info/global_step": 943, "train_info/time_within_train_step": 27.738743543624878, "step": 943} {"train_info/time_between_train_steps": 0.011515378952026367, "step": 943} {"info/global_step": 944, "train_info/time_within_train_step": 27.698099851608276, "step": 944} {"train_info/time_between_train_steps": 0.005238533020019531, "step": 944} {"info/global_step": 945, "train_info/time_within_train_step": 27.722442626953125, "step": 945} {"train_info/time_between_train_steps": 0.005635738372802734, "step": 945} {"train_info/time_between_train_steps": 29.960261821746826, "step": 945} {"info/global_step": 946, "train_info/time_within_train_step": 27.686065912246704, "step": 946} {"train_info/time_between_train_steps": 0.004873991012573242, "step": 946} {"info/global_step": 947, "train_info/time_within_train_step": 27.799901962280273, "step": 947} {"train_info/time_between_train_steps": 0.00489044189453125, "step": 947} {"info/global_step": 948, "train_info/time_within_train_step": 27.677647590637207, "step": 948} {"train_info/time_between_train_steps": 0.0053136348724365234, "step": 948} {"info/global_step": 949, "train_info/time_within_train_step": 27.84376072883606, "step": 949} {"train_info/time_between_train_steps": 0.006299495697021484, "step": 949} {"info/global_step": 950, "train_info/time_within_train_step": 27.759663581848145, "step": 950} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740852229, "_runtime": 28178}, "step": 950} {"logs": {"train/loss": 3.2639, "train/learning_rate": 0.0001388888888888889, "train/epoch": 35.0, "_timestamp": 1740852229, "_runtime": 28178}, "step": 950} {"train_info/time_between_train_steps": 0.025829076766967773, "step": 950} {"info/global_step": 951, "train_info/time_within_train_step": 27.887420654296875, "step": 951} {"train_info/time_between_train_steps": 0.011326313018798828, "step": 951} {"info/global_step": 952, "train_info/time_within_train_step": 27.783405780792236, "step": 952} {"train_info/time_between_train_steps": 0.005148649215698242, "step": 952} {"info/global_step": 953, "train_info/time_within_train_step": 27.809897899627686, "step": 953} {"train_info/time_between_train_steps": 0.011486053466796875, "step": 953} {"info/global_step": 954, "train_info/time_within_train_step": 27.711515188217163, "step": 954} {"train_info/time_between_train_steps": 0.0050127506256103516, "step": 954} {"info/global_step": 955, "train_info/time_within_train_step": 27.697843551635742, "step": 955} {"train_info/time_between_train_steps": 0.005132436752319336, "step": 955} {"info/global_step": 956, "train_info/time_within_train_step": 27.754255056381226, "step": 956} {"train_info/time_between_train_steps": 0.00507044792175293, "step": 956} {"info/global_step": 957, "train_info/time_within_train_step": 27.7044677734375, "step": 957} {"train_info/time_between_train_steps": 0.00531768798828125, "step": 957} {"info/global_step": 958, "train_info/time_within_train_step": 27.72556233406067, "step": 958} {"train_info/time_between_train_steps": 0.005191802978515625, "step": 958} {"info/global_step": 959, "train_info/time_within_train_step": 27.699970960617065, "step": 959} {"train_info/time_between_train_steps": 0.004980802536010742, "step": 959} {"info/global_step": 960, "train_info/time_within_train_step": 27.704877138137817, "step": 960} {"train_info/time_between_train_steps": 0.0061206817626953125, "step": 960} {"info/global_step": 961, "train_info/time_within_train_step": 27.7079496383667, "step": 961} {"train_info/time_between_train_steps": 0.006025075912475586, "step": 961} {"info/global_step": 962, "train_info/time_within_train_step": 27.69909930229187, "step": 962} {"train_info/time_between_train_steps": 0.005297660827636719, "step": 962} {"info/global_step": 963, "train_info/time_within_train_step": 27.71964979171753, "step": 963} {"train_info/time_between_train_steps": 0.005063295364379883, "step": 963} {"info/global_step": 964, "train_info/time_within_train_step": 27.71163296699524, "step": 964} {"train_info/time_between_train_steps": 0.0050885677337646484, "step": 964} {"info/global_step": 965, "train_info/time_within_train_step": 27.719051599502563, "step": 965} {"train_info/time_between_train_steps": 0.004924774169921875, "step": 965} {"info/global_step": 966, "train_info/time_within_train_step": 27.702669143676758, "step": 966} {"train_info/time_between_train_steps": 0.005282878875732422, "step": 966} {"info/global_step": 967, "train_info/time_within_train_step": 27.768574953079224, "step": 967} {"train_info/time_between_train_steps": 0.00501704216003418, "step": 967} {"info/global_step": 968, "train_info/time_within_train_step": 27.69939923286438, "step": 968} {"train_info/time_between_train_steps": 0.0049474239349365234, "step": 968} {"info/global_step": 969, "train_info/time_within_train_step": 27.70941162109375, "step": 969} {"train_info/time_between_train_steps": 0.005654096603393555, "step": 969} {"info/global_step": 970, "train_info/time_within_train_step": 27.70650339126587, "step": 970} {"train_info/time_between_train_steps": 0.005235433578491211, "step": 970} {"info/global_step": 971, "train_info/time_within_train_step": 27.714507818222046, "step": 971} {"train_info/time_between_train_steps": 0.007652997970581055, "step": 971} {"info/global_step": 972, "train_info/time_within_train_step": 27.762444972991943, "step": 972} {"train_info/time_between_train_steps": 0.00531005859375, "step": 972} {"train_info/time_between_train_steps": 29.684876680374146, "step": 972} {"info/global_step": 973, "train_info/time_within_train_step": 27.769051551818848, "step": 973} {"train_info/time_between_train_steps": 0.005354642868041992, "step": 973} {"info/global_step": 974, "train_info/time_within_train_step": 27.832839727401733, "step": 974} {"train_info/time_between_train_steps": 0.005819082260131836, "step": 974} {"info/global_step": 975, "train_info/time_within_train_step": 27.714015007019043, "step": 975} {"train_info/time_between_train_steps": 0.005135774612426758, "step": 975} {"info/global_step": 976, "train_info/time_within_train_step": 27.804633617401123, "step": 976} {"train_info/time_between_train_steps": 0.005151271820068359, "step": 976} {"info/global_step": 977, "train_info/time_within_train_step": 27.736013889312744, "step": 977} {"train_info/time_between_train_steps": 0.006240129470825195, "step": 977} {"info/global_step": 978, "train_info/time_within_train_step": 27.83270764350891, "step": 978} {"train_info/time_between_train_steps": 0.0052607059478759766, "step": 978} {"info/global_step": 979, "train_info/time_within_train_step": 27.715281009674072, "step": 979} {"train_info/time_between_train_steps": 0.005099296569824219, "step": 979} {"info/global_step": 980, "train_info/time_within_train_step": 27.756693840026855, "step": 980} {"train_info/time_between_train_steps": 0.005257129669189453, "step": 980} {"info/global_step": 981, "train_info/time_within_train_step": 27.740006923675537, "step": 981} {"train_info/time_between_train_steps": 0.005687713623046875, "step": 981} {"info/global_step": 982, "train_info/time_within_train_step": 27.797641038894653, "step": 982} {"train_info/time_between_train_steps": 0.0050182342529296875, "step": 982} {"info/global_step": 983, "train_info/time_within_train_step": 27.716996669769287, "step": 983} {"train_info/time_between_train_steps": 0.0049076080322265625, "step": 983} {"info/global_step": 984, "train_info/time_within_train_step": 27.695619821548462, "step": 984} {"train_info/time_between_train_steps": 0.004867076873779297, "step": 984} {"info/global_step": 985, "train_info/time_within_train_step": 27.722055196762085, "step": 985} {"train_info/time_between_train_steps": 0.004982471466064453, "step": 985} {"info/global_step": 986, "train_info/time_within_train_step": 27.721017837524414, "step": 986} {"train_info/time_between_train_steps": 0.00493931770324707, "step": 986} {"info/global_step": 987, "train_info/time_within_train_step": 27.699114322662354, "step": 987} {"train_info/time_between_train_steps": 0.006012916564941406, "step": 987} {"info/global_step": 988, "train_info/time_within_train_step": 27.74301791191101, "step": 988} {"train_info/time_between_train_steps": 0.005124807357788086, "step": 988} {"info/global_step": 989, "train_info/time_within_train_step": 27.71071743965149, "step": 989} {"train_info/time_between_train_steps": 0.005101442337036133, "step": 989} {"info/global_step": 990, "train_info/time_within_train_step": 27.737481355667114, "step": 990} {"train_info/time_between_train_steps": 0.00513458251953125, "step": 990} {"info/global_step": 991, "train_info/time_within_train_step": 27.729920148849487, "step": 991} {"train_info/time_between_train_steps": 0.005026817321777344, "step": 991} {"info/global_step": 992, "train_info/time_within_train_step": 27.68966317176819, "step": 992} {"train_info/time_between_train_steps": 0.0060498714447021484, "step": 992} {"info/global_step": 993, "train_info/time_within_train_step": 27.695364952087402, "step": 993} {"train_info/time_between_train_steps": 0.005030393600463867, "step": 993} {"info/global_step": 994, "train_info/time_within_train_step": 27.706636905670166, "step": 994} {"train_info/time_between_train_steps": 0.006405353546142578, "step": 994} {"info/global_step": 995, "train_info/time_within_train_step": 27.69776749610901, "step": 995} {"train_info/time_between_train_steps": 0.009327173233032227, "step": 995} {"info/global_step": 996, "train_info/time_within_train_step": 27.715208768844604, "step": 996} {"train_info/time_between_train_steps": 0.004992008209228516, "step": 996} {"info/global_step": 997, "train_info/time_within_train_step": 27.7818500995636, "step": 997} {"train_info/time_between_train_steps": 0.0069026947021484375, "step": 997} {"info/global_step": 998, "train_info/time_within_train_step": 27.731788635253906, "step": 998} {"train_info/time_between_train_steps": 0.005379676818847656, "step": 998} {"info/global_step": 999, "train_info/time_within_train_step": 27.74721884727478, "step": 999} {"train_info/time_between_train_steps": 0.00545048713684082, "step": 999} {"train_info/time_between_train_steps": 29.724198818206787, "step": 999} {"info/global_step": 1000, "train_info/time_within_train_step": 27.688565254211426, "step": 1000} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740853676, "_runtime": 29625}, "step": 1000} {"logs": {"train/loss": 3.2163, "train/learning_rate": 0.00011111111111111109, "train/epoch": 37.0, "_timestamp": 1740853676, "_runtime": 29625}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740853680, "_runtime": 29629}, "step": 1000} {"logs": {"eval/loss": 4.151810169219971, "eval/runtime": 4.074, "eval/samples_per_second": 49.828, "eval/steps_per_second": 3.191, "train/epoch": 37.0, "_timestamp": 1740853680, "_runtime": 29629}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740853680, "_runtime": 29629}, "step": 1000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.151810169219971, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 63.548930563193956, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.074, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 49.828, "train/epoch": 37.0, "_timestamp": 1740853680, "_runtime": 29629}, "step": 1000} {"train_info/time_between_train_steps": 43.36605477333069, "step": 1000} {"info/global_step": 1001, "train_info/time_within_train_step": 28.000293493270874, "step": 1001} {"train_info/time_between_train_steps": 0.005351066589355469, "step": 1001} {"info/global_step": 1002, "train_info/time_within_train_step": 27.870596408843994, "step": 1002} {"train_info/time_between_train_steps": 0.0053098201751708984, "step": 1002} {"info/global_step": 1003, "train_info/time_within_train_step": 27.874591827392578, "step": 1003} {"train_info/time_between_train_steps": 0.009335756301879883, "step": 1003} {"info/global_step": 1004, "train_info/time_within_train_step": 27.702943086624146, "step": 1004} {"train_info/time_between_train_steps": 0.005999088287353516, "step": 1004} {"info/global_step": 1005, "train_info/time_within_train_step": 27.81688404083252, "step": 1005} {"train_info/time_between_train_steps": 0.0051996707916259766, "step": 1005} {"info/global_step": 1006, "train_info/time_within_train_step": 27.708719730377197, "step": 1006} {"train_info/time_between_train_steps": 0.005308866500854492, "step": 1006} {"info/global_step": 1007, "train_info/time_within_train_step": 27.78282356262207, "step": 1007} {"train_info/time_between_train_steps": 0.005166292190551758, "step": 1007} {"info/global_step": 1008, "train_info/time_within_train_step": 27.686821460723877, "step": 1008} {"train_info/time_between_train_steps": 0.004780292510986328, "step": 1008} {"info/global_step": 1009, "train_info/time_within_train_step": 27.703312635421753, "step": 1009} {"train_info/time_between_train_steps": 0.004992961883544922, "step": 1009} {"info/global_step": 1010, "train_info/time_within_train_step": 27.69071125984192, "step": 1010} {"train_info/time_between_train_steps": 0.005003690719604492, "step": 1010} {"info/global_step": 1011, "train_info/time_within_train_step": 27.71597695350647, "step": 1011} {"train_info/time_between_train_steps": 0.005227804183959961, "step": 1011} {"info/global_step": 1012, "train_info/time_within_train_step": 27.79442286491394, "step": 1012} {"train_info/time_between_train_steps": 0.005912303924560547, "step": 1012} {"info/global_step": 1013, "train_info/time_within_train_step": 27.686455965042114, "step": 1013} {"train_info/time_between_train_steps": 0.004822969436645508, "step": 1013} {"info/global_step": 1014, "train_info/time_within_train_step": 27.681681871414185, "step": 1014} {"train_info/time_between_train_steps": 0.00495147705078125, "step": 1014} {"info/global_step": 1015, "train_info/time_within_train_step": 27.703522443771362, "step": 1015} {"train_info/time_between_train_steps": 0.005167484283447266, "step": 1015} {"info/global_step": 1016, "train_info/time_within_train_step": 27.712687730789185, "step": 1016} {"train_info/time_between_train_steps": 0.004875898361206055, "step": 1016} {"info/global_step": 1017, "train_info/time_within_train_step": 27.671220064163208, "step": 1017} {"train_info/time_between_train_steps": 0.0050661563873291016, "step": 1017} {"info/global_step": 1018, "train_info/time_within_train_step": 27.696019649505615, "step": 1018} {"train_info/time_between_train_steps": 0.005045175552368164, "step": 1018} {"info/global_step": 1019, "train_info/time_within_train_step": 27.684862852096558, "step": 1019} {"train_info/time_between_train_steps": 0.01546478271484375, "step": 1019} {"info/global_step": 1020, "train_info/time_within_train_step": 27.67762017250061, "step": 1020} {"train_info/time_between_train_steps": 0.004844188690185547, "step": 1020} {"info/global_step": 1021, "train_info/time_within_train_step": 27.676417350769043, "step": 1021} {"train_info/time_between_train_steps": 0.004984378814697266, "step": 1021} {"info/global_step": 1022, "train_info/time_within_train_step": 27.695767879486084, "step": 1022} {"train_info/time_between_train_steps": 0.005397319793701172, "step": 1022} {"info/global_step": 1023, "train_info/time_within_train_step": 27.93650460243225, "step": 1023} {"train_info/time_between_train_steps": 0.00986337661743164, "step": 1023} {"info/global_step": 1024, "train_info/time_within_train_step": 27.712936878204346, "step": 1024} {"train_info/time_between_train_steps": 0.004930257797241211, "step": 1024} {"info/global_step": 1025, "train_info/time_within_train_step": 27.69081473350525, "step": 1025} {"train_info/time_between_train_steps": 0.0051648616790771484, "step": 1025} {"info/global_step": 1026, "train_info/time_within_train_step": 27.696756839752197, "step": 1026} {"train_info/time_between_train_steps": 0.005416393280029297, "step": 1026} {"train_info/time_between_train_steps": 29.801055431365967, "step": 1026} {"info/global_step": 1027, "train_info/time_within_train_step": 27.76788592338562, "step": 1027} {"train_info/time_between_train_steps": 0.005841255187988281, "step": 1027} {"info/global_step": 1028, "train_info/time_within_train_step": 27.792548656463623, "step": 1028} {"train_info/time_between_train_steps": 0.005135297775268555, "step": 1028} {"info/global_step": 1029, "train_info/time_within_train_step": 27.68139624595642, "step": 1029} {"train_info/time_between_train_steps": 0.004940986633300781, "step": 1029} {"info/global_step": 1030, "train_info/time_within_train_step": 27.79544425010681, "step": 1030} {"train_info/time_between_train_steps": 0.005193471908569336, "step": 1030} {"info/global_step": 1031, "train_info/time_within_train_step": 27.697800874710083, "step": 1031} {"train_info/time_between_train_steps": 0.005063295364379883, "step": 1031} {"info/global_step": 1032, "train_info/time_within_train_step": 27.871296405792236, "step": 1032} {"train_info/time_between_train_steps": 0.005288362503051758, "step": 1032} {"info/global_step": 1033, "train_info/time_within_train_step": 27.69260001182556, "step": 1033} {"train_info/time_between_train_steps": 0.005006074905395508, "step": 1033} {"info/global_step": 1034, "train_info/time_within_train_step": 27.757064819335938, "step": 1034} {"train_info/time_between_train_steps": 0.005165815353393555, "step": 1034} {"info/global_step": 1035, "train_info/time_within_train_step": 27.699219703674316, "step": 1035} {"train_info/time_between_train_steps": 0.004901885986328125, "step": 1035} {"info/global_step": 1036, "train_info/time_within_train_step": 27.716142654418945, "step": 1036} {"train_info/time_between_train_steps": 0.0048732757568359375, "step": 1036} {"info/global_step": 1037, "train_info/time_within_train_step": 27.704490423202515, "step": 1037} {"train_info/time_between_train_steps": 0.0050661563873291016, "step": 1037} {"info/global_step": 1038, "train_info/time_within_train_step": 27.6817569732666, "step": 1038} {"train_info/time_between_train_steps": 0.004983425140380859, "step": 1038} {"info/global_step": 1039, "train_info/time_within_train_step": 27.70174527168274, "step": 1039} {"train_info/time_between_train_steps": 0.005151033401489258, "step": 1039} {"info/global_step": 1040, "train_info/time_within_train_step": 27.68877911567688, "step": 1040} {"train_info/time_between_train_steps": 0.0049610137939453125, "step": 1040} {"info/global_step": 1041, "train_info/time_within_train_step": 27.72638511657715, "step": 1041} {"train_info/time_between_train_steps": 0.004918813705444336, "step": 1041} {"info/global_step": 1042, "train_info/time_within_train_step": 27.801883459091187, "step": 1042} {"train_info/time_between_train_steps": 0.0051496028900146484, "step": 1042} {"info/global_step": 1043, "train_info/time_within_train_step": 27.683640480041504, "step": 1043} {"train_info/time_between_train_steps": 0.004891872406005859, "step": 1043} {"info/global_step": 1044, "train_info/time_within_train_step": 27.679919004440308, "step": 1044} {"train_info/time_between_train_steps": 0.005937337875366211, "step": 1044} {"info/global_step": 1045, "train_info/time_within_train_step": 27.736676692962646, "step": 1045} {"train_info/time_between_train_steps": 0.005287647247314453, "step": 1045} {"info/global_step": 1046, "train_info/time_within_train_step": 27.70685315132141, "step": 1046} {"train_info/time_between_train_steps": 0.0052416324615478516, "step": 1046} {"info/global_step": 1047, "train_info/time_within_train_step": 27.70112657546997, "step": 1047} {"train_info/time_between_train_steps": 0.0051839351654052734, "step": 1047} {"info/global_step": 1048, "train_info/time_within_train_step": 27.70680546760559, "step": 1048} {"train_info/time_between_train_steps": 0.004974842071533203, "step": 1048} {"info/global_step": 1049, "train_info/time_within_train_step": 27.696149349212646, "step": 1049} {"train_info/time_between_train_steps": 0.005005836486816406, "step": 1049} {"info/global_step": 1050, "train_info/time_within_train_step": 27.69243288040161, "step": 1050} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740855138, "_runtime": 31087}, "step": 1050} {"logs": {"train/loss": 3.1173, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 38.02, "_timestamp": 1740855138, "_runtime": 31087}, "step": 1050} {"train_info/time_between_train_steps": 0.025829792022705078, "step": 1050} {"info/global_step": 1051, "train_info/time_within_train_step": 27.74435567855835, "step": 1051} {"train_info/time_between_train_steps": 0.005174160003662109, "step": 1051} {"info/global_step": 1052, "train_info/time_within_train_step": 27.74781060218811, "step": 1052} {"train_info/time_between_train_steps": 0.005259513854980469, "step": 1052} {"info/global_step": 1053, "train_info/time_within_train_step": 27.70914363861084, "step": 1053} {"train_info/time_between_train_steps": 0.005623340606689453, "step": 1053} {"train_info/time_between_train_steps": 29.710018396377563, "step": 1053} {"info/global_step": 1054, "train_info/time_within_train_step": 27.71225118637085, "step": 1054} {"train_info/time_between_train_steps": 0.0052947998046875, "step": 1054} {"info/global_step": 1055, "train_info/time_within_train_step": 27.84862518310547, "step": 1055} {"train_info/time_between_train_steps": 0.005180835723876953, "step": 1055} {"info/global_step": 1056, "train_info/time_within_train_step": 27.730132341384888, "step": 1056} {"train_info/time_between_train_steps": 0.005624055862426758, "step": 1056} {"info/global_step": 1057, "train_info/time_within_train_step": 27.94749617576599, "step": 1057} {"train_info/time_between_train_steps": 0.005332469940185547, "step": 1057} {"info/global_step": 1058, "train_info/time_within_train_step": 27.698956727981567, "step": 1058} {"train_info/time_between_train_steps": 0.005093812942504883, "step": 1058} {"info/global_step": 1059, "train_info/time_within_train_step": 27.832836151123047, "step": 1059} {"train_info/time_between_train_steps": 0.0049669742584228516, "step": 1059} {"info/global_step": 1060, "train_info/time_within_train_step": 27.70452380180359, "step": 1060} {"train_info/time_between_train_steps": 0.005288839340209961, "step": 1060} {"info/global_step": 1061, "train_info/time_within_train_step": 27.786941051483154, "step": 1061} {"train_info/time_between_train_steps": 0.0068171024322509766, "step": 1061} {"info/global_step": 1062, "train_info/time_within_train_step": 27.69574999809265, "step": 1062} {"train_info/time_between_train_steps": 0.005157470703125, "step": 1062} {"info/global_step": 1063, "train_info/time_within_train_step": 27.67673635482788, "step": 1063} {"train_info/time_between_train_steps": 0.0049746036529541016, "step": 1063} {"info/global_step": 1064, "train_info/time_within_train_step": 27.685830116271973, "step": 1064} {"train_info/time_between_train_steps": 0.004913806915283203, "step": 1064} {"info/global_step": 1065, "train_info/time_within_train_step": 27.69575810432434, "step": 1065} {"train_info/time_between_train_steps": 0.005175113677978516, "step": 1065} {"info/global_step": 1066, "train_info/time_within_train_step": 27.695711851119995, "step": 1066} {"train_info/time_between_train_steps": 0.004931211471557617, "step": 1066} {"info/global_step": 1067, "train_info/time_within_train_step": 27.954797983169556, "step": 1067} {"train_info/time_between_train_steps": 0.0048999786376953125, "step": 1067} {"info/global_step": 1068, "train_info/time_within_train_step": 27.712567806243896, "step": 1068} {"train_info/time_between_train_steps": 0.005145072937011719, "step": 1068} {"info/global_step": 1069, "train_info/time_within_train_step": 27.703584671020508, "step": 1069} {"train_info/time_between_train_steps": 0.005635499954223633, "step": 1069} {"info/global_step": 1070, "train_info/time_within_train_step": 27.741321563720703, "step": 1070} {"train_info/time_between_train_steps": 0.005042552947998047, "step": 1070} {"info/global_step": 1071, "train_info/time_within_train_step": 27.694608449935913, "step": 1071} {"train_info/time_between_train_steps": 0.005138874053955078, "step": 1071} {"info/global_step": 1072, "train_info/time_within_train_step": 27.73574995994568, "step": 1072} {"train_info/time_between_train_steps": 0.00514674186706543, "step": 1072} {"info/global_step": 1073, "train_info/time_within_train_step": 27.812591314315796, "step": 1073} {"train_info/time_between_train_steps": 0.004973649978637695, "step": 1073} {"info/global_step": 1074, "train_info/time_within_train_step": 27.69587540626526, "step": 1074} {"train_info/time_between_train_steps": 0.0050046443939208984, "step": 1074} {"info/global_step": 1075, "train_info/time_within_train_step": 27.730485439300537, "step": 1075} {"train_info/time_between_train_steps": 0.0048961639404296875, "step": 1075} {"info/global_step": 1076, "train_info/time_within_train_step": 27.696619033813477, "step": 1076} {"train_info/time_between_train_steps": 0.0049173831939697266, "step": 1076} {"info/global_step": 1077, "train_info/time_within_train_step": 27.674572706222534, "step": 1077} {"train_info/time_between_train_steps": 0.005046367645263672, "step": 1077} {"info/global_step": 1078, "train_info/time_within_train_step": 27.7299907207489, "step": 1078} {"train_info/time_between_train_steps": 0.005077838897705078, "step": 1078} {"info/global_step": 1079, "train_info/time_within_train_step": 27.712668657302856, "step": 1079} {"train_info/time_between_train_steps": 0.005385875701904297, "step": 1079} {"info/global_step": 1080, "train_info/time_within_train_step": 27.72298789024353, "step": 1080} {"train_info/time_between_train_steps": 0.005451202392578125, "step": 1080} {"train_info/time_between_train_steps": 29.762459993362427, "step": 1080} {"info/global_step": 1081, "train_info/time_within_train_step": 27.740341663360596, "step": 1081} {"train_info/time_between_train_steps": 0.005019426345825195, "step": 1081} {"info/global_step": 1082, "train_info/time_within_train_step": 27.85689353942871, "step": 1082} {"train_info/time_between_train_steps": 0.004942417144775391, "step": 1082} {"info/global_step": 1083, "train_info/time_within_train_step": 27.691681385040283, "step": 1083} {"train_info/time_between_train_steps": 0.005137443542480469, "step": 1083} {"info/global_step": 1084, "train_info/time_within_train_step": 27.83687734603882, "step": 1084} {"train_info/time_between_train_steps": 0.005265951156616211, "step": 1084} {"info/global_step": 1085, "train_info/time_within_train_step": 27.727338075637817, "step": 1085} {"train_info/time_between_train_steps": 0.00560760498046875, "step": 1085} {"info/global_step": 1086, "train_info/time_within_train_step": 27.904183626174927, "step": 1086} {"train_info/time_between_train_steps": 0.005445718765258789, "step": 1086} {"info/global_step": 1087, "train_info/time_within_train_step": 27.834667205810547, "step": 1087} {"train_info/time_between_train_steps": 0.0051877498626708984, "step": 1087} {"info/global_step": 1088, "train_info/time_within_train_step": 27.77045726776123, "step": 1088} {"train_info/time_between_train_steps": 0.0052182674407958984, "step": 1088} {"info/global_step": 1089, "train_info/time_within_train_step": 27.71987748146057, "step": 1089} {"train_info/time_between_train_steps": 0.00492405891418457, "step": 1089} {"info/global_step": 1090, "train_info/time_within_train_step": 27.695985794067383, "step": 1090} {"train_info/time_between_train_steps": 0.005131721496582031, "step": 1090} {"info/global_step": 1091, "train_info/time_within_train_step": 27.71149778366089, "step": 1091} {"train_info/time_between_train_steps": 0.00494837760925293, "step": 1091} {"info/global_step": 1092, "train_info/time_within_train_step": 27.738033294677734, "step": 1092} {"train_info/time_between_train_steps": 0.0054056644439697266, "step": 1092} {"info/global_step": 1093, "train_info/time_within_train_step": 27.685067892074585, "step": 1093} {"train_info/time_between_train_steps": 0.005060911178588867, "step": 1093} {"info/global_step": 1094, "train_info/time_within_train_step": 27.7299382686615, "step": 1094} {"train_info/time_between_train_steps": 0.004908561706542969, "step": 1094} {"info/global_step": 1095, "train_info/time_within_train_step": 27.68550181388855, "step": 1095} {"train_info/time_between_train_steps": 0.00502467155456543, "step": 1095} {"info/global_step": 1096, "train_info/time_within_train_step": 27.68264651298523, "step": 1096} {"train_info/time_between_train_steps": 0.005059242248535156, "step": 1096} {"info/global_step": 1097, "train_info/time_within_train_step": 27.719717979431152, "step": 1097} {"train_info/time_between_train_steps": 0.0051422119140625, "step": 1097} {"info/global_step": 1098, "train_info/time_within_train_step": 27.69098711013794, "step": 1098} {"train_info/time_between_train_steps": 0.005074501037597656, "step": 1098} {"info/global_step": 1099, "train_info/time_within_train_step": 27.68382740020752, "step": 1099} {"train_info/time_between_train_steps": 0.004937410354614258, "step": 1099} {"info/global_step": 1100, "train_info/time_within_train_step": 27.683674812316895, "step": 1100} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740856586, "_runtime": 32535}, "step": 1100} {"logs": {"train/loss": 3.142, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 40.02, "_timestamp": 1740856586, "_runtime": 32535}, "step": 1100} {"train_info/time_between_train_steps": 41.02827215194702, "step": 1100} {"info/global_step": 1101, "train_info/time_within_train_step": 27.998775243759155, "step": 1101} {"train_info/time_between_train_steps": 0.0052111148834228516, "step": 1101} {"info/global_step": 1102, "train_info/time_within_train_step": 28.6092848777771, "step": 1102} {"train_info/time_between_train_steps": 0.005062580108642578, "step": 1102} {"info/global_step": 1103, "train_info/time_within_train_step": 27.798083305358887, "step": 1103} {"train_info/time_between_train_steps": 0.005140781402587891, "step": 1103} {"info/global_step": 1104, "train_info/time_within_train_step": 27.723987579345703, "step": 1104} {"train_info/time_between_train_steps": 0.005644559860229492, "step": 1104} {"info/global_step": 1105, "train_info/time_within_train_step": 27.713963985443115, "step": 1105} {"train_info/time_between_train_steps": 0.005319833755493164, "step": 1105} {"info/global_step": 1106, "train_info/time_within_train_step": 27.74254536628723, "step": 1106} {"train_info/time_between_train_steps": 0.005207538604736328, "step": 1106} {"info/global_step": 1107, "train_info/time_within_train_step": 27.734828233718872, "step": 1107} {"train_info/time_between_train_steps": 0.005782604217529297, "step": 1107} {"train_info/time_between_train_steps": 30.005472898483276, "step": 1107} {"info/global_step": 1108, "train_info/time_within_train_step": 27.70647621154785, "step": 1108} {"train_info/time_between_train_steps": 0.004958391189575195, "step": 1108} {"info/global_step": 1109, "train_info/time_within_train_step": 27.84903049468994, "step": 1109} {"train_info/time_between_train_steps": 0.004988670349121094, "step": 1109} {"info/global_step": 1110, "train_info/time_within_train_step": 27.687151432037354, "step": 1110} {"train_info/time_between_train_steps": 0.004788398742675781, "step": 1110} {"info/global_step": 1111, "train_info/time_within_train_step": 27.840144395828247, "step": 1111} {"train_info/time_between_train_steps": 0.005113840103149414, "step": 1111} {"info/global_step": 1112, "train_info/time_within_train_step": 27.70552897453308, "step": 1112} {"train_info/time_between_train_steps": 0.005121946334838867, "step": 1112} {"info/global_step": 1113, "train_info/time_within_train_step": 27.824426651000977, "step": 1113} {"train_info/time_between_train_steps": 0.0052623748779296875, "step": 1113} {"info/global_step": 1114, "train_info/time_within_train_step": 27.709877490997314, "step": 1114} {"train_info/time_between_train_steps": 0.005372047424316406, "step": 1114} {"info/global_step": 1115, "train_info/time_within_train_step": 27.772328853607178, "step": 1115} {"train_info/time_between_train_steps": 0.0052165985107421875, "step": 1115} {"info/global_step": 1116, "train_info/time_within_train_step": 27.696478843688965, "step": 1116} {"train_info/time_between_train_steps": 0.005136966705322266, "step": 1116} {"info/global_step": 1117, "train_info/time_within_train_step": 27.686715126037598, "step": 1117} {"train_info/time_between_train_steps": 0.005037546157836914, "step": 1117} {"info/global_step": 1118, "train_info/time_within_train_step": 27.836971521377563, "step": 1118} {"train_info/time_between_train_steps": 0.005316734313964844, "step": 1118} {"info/global_step": 1119, "train_info/time_within_train_step": 28.03602147102356, "step": 1119} {"train_info/time_between_train_steps": 0.004899740219116211, "step": 1119} {"info/global_step": 1120, "train_info/time_within_train_step": 28.90098738670349, "step": 1120} {"train_info/time_between_train_steps": 0.005036354064941406, "step": 1120} {"info/global_step": 1121, "train_info/time_within_train_step": 27.708167552947998, "step": 1121} {"train_info/time_between_train_steps": 0.004911184310913086, "step": 1121} {"info/global_step": 1122, "train_info/time_within_train_step": 27.735175848007202, "step": 1122} {"train_info/time_between_train_steps": 0.005074501037597656, "step": 1122} {"info/global_step": 1123, "train_info/time_within_train_step": 27.688118934631348, "step": 1123} {"train_info/time_between_train_steps": 0.005179405212402344, "step": 1123} {"info/global_step": 1124, "train_info/time_within_train_step": 27.746726989746094, "step": 1124} {"train_info/time_between_train_steps": 0.0060520172119140625, "step": 1124} {"info/global_step": 1125, "train_info/time_within_train_step": 27.70869493484497, "step": 1125} {"train_info/time_between_train_steps": 0.004938364028930664, "step": 1125} {"info/global_step": 1126, "train_info/time_within_train_step": 27.744354724884033, "step": 1126} {"train_info/time_between_train_steps": 0.005226850509643555, "step": 1126} {"info/global_step": 1127, "train_info/time_within_train_step": 27.699812173843384, "step": 1127} {"train_info/time_between_train_steps": 0.005067110061645508, "step": 1127} {"info/global_step": 1128, "train_info/time_within_train_step": 27.692742109298706, "step": 1128} {"train_info/time_between_train_steps": 0.00508880615234375, "step": 1128} {"info/global_step": 1129, "train_info/time_within_train_step": 27.738450288772583, "step": 1129} {"train_info/time_between_train_steps": 0.0048291683197021484, "step": 1129} {"info/global_step": 1130, "train_info/time_within_train_step": 27.684617042541504, "step": 1130} {"train_info/time_between_train_steps": 0.005114078521728516, "step": 1130} {"info/global_step": 1131, "train_info/time_within_train_step": 27.7275333404541, "step": 1131} {"train_info/time_between_train_steps": 0.005097627639770508, "step": 1131} {"info/global_step": 1132, "train_info/time_within_train_step": 27.714468479156494, "step": 1132} {"train_info/time_between_train_steps": 0.005156040191650391, "step": 1132} {"info/global_step": 1133, "train_info/time_within_train_step": 27.846184015274048, "step": 1133} {"train_info/time_between_train_steps": 0.00514531135559082, "step": 1133} {"info/global_step": 1134, "train_info/time_within_train_step": 27.755210876464844, "step": 1134} {"train_info/time_between_train_steps": 0.005201578140258789, "step": 1134} {"train_info/time_between_train_steps": 29.83916997909546, "step": 1134} {"info/global_step": 1135, "train_info/time_within_train_step": 27.697821140289307, "step": 1135} {"train_info/time_between_train_steps": 0.005738019943237305, "step": 1135} {"info/global_step": 1136, "train_info/time_within_train_step": 27.847658395767212, "step": 1136} {"train_info/time_between_train_steps": 0.00481104850769043, "step": 1136} {"info/global_step": 1137, "train_info/time_within_train_step": 27.68674087524414, "step": 1137} {"train_info/time_between_train_steps": 0.004817008972167969, "step": 1137} {"info/global_step": 1138, "train_info/time_within_train_step": 27.867809534072876, "step": 1138} {"train_info/time_between_train_steps": 0.0051021575927734375, "step": 1138} {"info/global_step": 1139, "train_info/time_within_train_step": 27.762470483779907, "step": 1139} {"train_info/time_between_train_steps": 0.005422830581665039, "step": 1139} {"info/global_step": 1140, "train_info/time_within_train_step": 27.887553453445435, "step": 1140} {"train_info/time_between_train_steps": 0.01693558692932129, "step": 1140} {"info/global_step": 1141, "train_info/time_within_train_step": 27.73496985435486, "step": 1141} {"train_info/time_between_train_steps": 0.005130767822265625, "step": 1141} {"info/global_step": 1142, "train_info/time_within_train_step": 27.759283781051636, "step": 1142} {"train_info/time_between_train_steps": 0.0051577091217041016, "step": 1142} {"info/global_step": 1143, "train_info/time_within_train_step": 27.710222959518433, "step": 1143} {"train_info/time_between_train_steps": 0.004961252212524414, "step": 1143} {"info/global_step": 1144, "train_info/time_within_train_step": 27.687845945358276, "step": 1144} {"train_info/time_between_train_steps": 0.0058765411376953125, "step": 1144} {"info/global_step": 1145, "train_info/time_within_train_step": 27.707916736602783, "step": 1145} {"train_info/time_between_train_steps": 0.004926919937133789, "step": 1145} {"info/global_step": 1146, "train_info/time_within_train_step": 27.685908555984497, "step": 1146} {"train_info/time_between_train_steps": 0.00485682487487793, "step": 1146} {"info/global_step": 1147, "train_info/time_within_train_step": 27.72572922706604, "step": 1147} {"train_info/time_between_train_steps": 0.004899263381958008, "step": 1147} {"info/global_step": 1148, "train_info/time_within_train_step": 27.76492977142334, "step": 1148} {"train_info/time_between_train_steps": 0.009741544723510742, "step": 1148} {"info/global_step": 1149, "train_info/time_within_train_step": 27.723357439041138, "step": 1149} {"train_info/time_between_train_steps": 0.004979610443115234, "step": 1149} {"info/global_step": 1150, "train_info/time_within_train_step": 27.695191621780396, "step": 1150} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740858080, "_runtime": 34029}, "step": 1150} {"logs": {"train/loss": 3.1114, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 42.01, "_timestamp": 1740858080, "_runtime": 34029}, "step": 1150} {"train_info/time_between_train_steps": 0.02635049819946289, "step": 1150} {"info/global_step": 1151, "train_info/time_within_train_step": 27.67681336402893, "step": 1151} {"train_info/time_between_train_steps": 0.004891157150268555, "step": 1151} {"info/global_step": 1152, "train_info/time_within_train_step": 27.693902492523193, "step": 1152} {"train_info/time_between_train_steps": 0.00596928596496582, "step": 1152} {"info/global_step": 1153, "train_info/time_within_train_step": 27.69721508026123, "step": 1153} {"train_info/time_between_train_steps": 0.00495457649230957, "step": 1153} {"info/global_step": 1154, "train_info/time_within_train_step": 27.68316340446472, "step": 1154} {"train_info/time_between_train_steps": 0.005010843276977539, "step": 1154} {"info/global_step": 1155, "train_info/time_within_train_step": 27.68389368057251, "step": 1155} {"train_info/time_between_train_steps": 0.005175352096557617, "step": 1155} {"info/global_step": 1156, "train_info/time_within_train_step": 27.734208583831787, "step": 1156} {"train_info/time_between_train_steps": 0.005148887634277344, "step": 1156} {"info/global_step": 1157, "train_info/time_within_train_step": 27.703547716140747, "step": 1157} {"train_info/time_between_train_steps": 0.005231618881225586, "step": 1157} {"info/global_step": 1158, "train_info/time_within_train_step": 27.72550940513611, "step": 1158} {"train_info/time_between_train_steps": 0.005006551742553711, "step": 1158} {"info/global_step": 1159, "train_info/time_within_train_step": 27.690680503845215, "step": 1159} {"train_info/time_between_train_steps": 0.0054171085357666016, "step": 1159} {"info/global_step": 1160, "train_info/time_within_train_step": 27.73633646965027, "step": 1160} {"train_info/time_between_train_steps": 0.0052683353424072266, "step": 1160} {"info/global_step": 1161, "train_info/time_within_train_step": 27.72842502593994, "step": 1161} {"train_info/time_between_train_steps": 0.005506992340087891, "step": 1161} {"train_info/time_between_train_steps": 29.790043115615845, "step": 1161} {"info/global_step": 1162, "train_info/time_within_train_step": 27.7026150226593, "step": 1162} {"train_info/time_between_train_steps": 0.004858493804931641, "step": 1162} {"info/global_step": 1163, "train_info/time_within_train_step": 27.970237731933594, "step": 1163} {"train_info/time_between_train_steps": 0.00524449348449707, "step": 1163} {"info/global_step": 1164, "train_info/time_within_train_step": 27.69316864013672, "step": 1164} {"train_info/time_between_train_steps": 0.005135774612426758, "step": 1164} {"info/global_step": 1165, "train_info/time_within_train_step": 27.819489002227783, "step": 1165} {"train_info/time_between_train_steps": 0.0052144527435302734, "step": 1165} {"info/global_step": 1166, "train_info/time_within_train_step": 27.705933332443237, "step": 1166} {"train_info/time_between_train_steps": 0.004927158355712891, "step": 1166} {"info/global_step": 1167, "train_info/time_within_train_step": 27.819119453430176, "step": 1167} {"train_info/time_between_train_steps": 0.00518345832824707, "step": 1167} {"info/global_step": 1168, "train_info/time_within_train_step": 27.758617877960205, "step": 1168} {"train_info/time_between_train_steps": 0.00533294677734375, "step": 1168} {"info/global_step": 1169, "train_info/time_within_train_step": 27.79144310951233, "step": 1169} {"train_info/time_between_train_steps": 0.005267620086669922, "step": 1169} {"info/global_step": 1170, "train_info/time_within_train_step": 27.737929582595825, "step": 1170} {"train_info/time_between_train_steps": 0.0057294368743896484, "step": 1170} {"info/global_step": 1171, "train_info/time_within_train_step": 27.70017671585083, "step": 1171} {"train_info/time_between_train_steps": 0.0049936771392822266, "step": 1171} {"info/global_step": 1172, "train_info/time_within_train_step": 27.740699291229248, "step": 1172} {"train_info/time_between_train_steps": 0.004912614822387695, "step": 1172} {"info/global_step": 1173, "train_info/time_within_train_step": 27.68489980697632, "step": 1173} {"train_info/time_between_train_steps": 0.004923343658447266, "step": 1173} {"info/global_step": 1174, "train_info/time_within_train_step": 27.72490406036377, "step": 1174} {"train_info/time_between_train_steps": 0.005075931549072266, "step": 1174} {"info/global_step": 1175, "train_info/time_within_train_step": 27.68814754486084, "step": 1175} {"train_info/time_between_train_steps": 0.004799604415893555, "step": 1175} {"info/global_step": 1176, "train_info/time_within_train_step": 27.722071409225464, "step": 1176} {"train_info/time_between_train_steps": 0.0052225589752197266, "step": 1176} {"info/global_step": 1177, "train_info/time_within_train_step": 27.688185453414917, "step": 1177} {"train_info/time_between_train_steps": 0.0050847530364990234, "step": 1177} {"info/global_step": 1178, "train_info/time_within_train_step": 27.769520044326782, "step": 1178} {"train_info/time_between_train_steps": 0.0049211978912353516, "step": 1178} {"info/global_step": 1179, "train_info/time_within_train_step": 27.696720123291016, "step": 1179} {"train_info/time_between_train_steps": 0.0050046443939208984, "step": 1179} {"info/global_step": 1180, "train_info/time_within_train_step": 27.69837260246277, "step": 1180} {"train_info/time_between_train_steps": 0.005074024200439453, "step": 1180} {"info/global_step": 1181, "train_info/time_within_train_step": 27.717630863189697, "step": 1181} {"train_info/time_between_train_steps": 0.004993915557861328, "step": 1181} {"info/global_step": 1182, "train_info/time_within_train_step": 27.69912576675415, "step": 1182} {"train_info/time_between_train_steps": 0.005126476287841797, "step": 1182} {"info/global_step": 1183, "train_info/time_within_train_step": 27.730365753173828, "step": 1183} {"train_info/time_between_train_steps": 0.004946470260620117, "step": 1183} {"info/global_step": 1184, "train_info/time_within_train_step": 27.701728343963623, "step": 1184} {"train_info/time_between_train_steps": 0.004911899566650391, "step": 1184} {"info/global_step": 1185, "train_info/time_within_train_step": 27.73612904548645, "step": 1185} {"train_info/time_between_train_steps": 0.00519871711730957, "step": 1185} {"info/global_step": 1186, "train_info/time_within_train_step": 27.694844245910645, "step": 1186} {"train_info/time_between_train_steps": 0.005022287368774414, "step": 1186} {"info/global_step": 1187, "train_info/time_within_train_step": 27.734578132629395, "step": 1187} {"train_info/time_between_train_steps": 0.005408287048339844, "step": 1187} {"info/global_step": 1188, "train_info/time_within_train_step": 27.711532592773438, "step": 1188} {"train_info/time_between_train_steps": 0.0056231021881103516, "step": 1188} {"train_info/time_between_train_steps": 29.976243495941162, "step": 1188} {"info/global_step": 1189, "train_info/time_within_train_step": 27.691545724868774, "step": 1189} {"train_info/time_between_train_steps": 0.005637168884277344, "step": 1189} {"info/global_step": 1190, "train_info/time_within_train_step": 27.8354971408844, "step": 1190} {"train_info/time_between_train_steps": 0.005497455596923828, "step": 1190} {"info/global_step": 1191, "train_info/time_within_train_step": 27.717230081558228, "step": 1191} {"train_info/time_between_train_steps": 0.005144596099853516, "step": 1191} {"info/global_step": 1192, "train_info/time_within_train_step": 27.81442618370056, "step": 1192} {"train_info/time_between_train_steps": 0.00510406494140625, "step": 1192} {"info/global_step": 1193, "train_info/time_within_train_step": 27.837268829345703, "step": 1193} {"train_info/time_between_train_steps": 0.005037784576416016, "step": 1193} {"info/global_step": 1194, "train_info/time_within_train_step": 27.85683298110962, "step": 1194} {"train_info/time_between_train_steps": 0.005466461181640625, "step": 1194} {"info/global_step": 1195, "train_info/time_within_train_step": 27.75145387649536, "step": 1195} {"train_info/time_between_train_steps": 0.00521087646484375, "step": 1195} {"info/global_step": 1196, "train_info/time_within_train_step": 27.760989904403687, "step": 1196} {"train_info/time_between_train_steps": 0.005158662796020508, "step": 1196} {"info/global_step": 1197, "train_info/time_within_train_step": 27.6898353099823, "step": 1197} {"train_info/time_between_train_steps": 0.004963874816894531, "step": 1197} {"info/global_step": 1198, "train_info/time_within_train_step": 27.672107458114624, "step": 1198} {"train_info/time_between_train_steps": 0.004807233810424805, "step": 1198} {"info/global_step": 1199, "train_info/time_within_train_step": 27.719714641571045, "step": 1199} {"train_info/time_between_train_steps": 0.00517582893371582, "step": 1199} {"info/global_step": 1200, "train_info/time_within_train_step": 27.68014931678772, "step": 1200} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859528, "_runtime": 35477}, "step": 1200} {"logs": {"train/loss": 3.0867, "train/learning_rate": 0.0, "train/epoch": 44.01, "_timestamp": 1740859528, "_runtime": 35477}, "step": 1200} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859569, "_runtime": 35518}, "step": 1200} {"logs": {"train/train_runtime": 35519.5303, "train/train_samples_per_second": 17.298, "train/train_steps_per_second": 0.034, "train/total_flos": 3.32296573943808e+17, "train/train_loss": 4.049262095292409, "train/epoch": 44.01, "_timestamp": 1740859569, "_runtime": 35518}, "step": 1200} {"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859599, "_runtime": 35548}, "step": 1200} {"logs": {"eval/loss": 4.187204837799072, "eval/runtime": 5.6239, "eval/samples_per_second": 36.096, "eval/steps_per_second": 2.312, "train/epoch": 44.01, "_timestamp": 1740859599, "_runtime": 35548}, "step": 1200} {"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859600, "_runtime": 35549}, "step": 1200} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.187204837799072, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 65.83850422635916, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.6239, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.096, "train/epoch": 44.01, "_timestamp": 1740859600, "_runtime": 35549}, "step": 1200}