{"num_parameters": 108882432, "trainable_parameters": 108882432, "step": 0} {"train_info/time_between_train_steps": 2.2687289714813232, "step": 0} {"info/global_step": 1, "train_info/time_within_train_step": 4.450688362121582, "step": 1} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 4412.87744140625, "train_info/memory_reserved": 4642.0, "train_info/memory_max_reserved": 4642.0, "_timestamp": 1746311867, "_runtime": 23}, "step": 1} {"logs": {"train/loss": 10.3518, "train/learning_rate": 2e-06, "train/epoch": 0.0, "_timestamp": 1746311867, "_runtime": 23}, "step": 1} {"train_info/time_between_train_steps": 0.02458953857421875, "step": 1} {"info/global_step": 2, "train_info/time_within_train_step": 2.444490671157837, "step": 2} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 2} {"info/global_step": 3, "train_info/time_within_train_step": 2.447488307952881, "step": 3} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 3} {"info/global_step": 4, "train_info/time_within_train_step": 2.4509081840515137, "step": 4} {"train_info/time_between_train_steps": 0.003231048583984375, "step": 4} {"info/global_step": 5, "train_info/time_within_train_step": 2.4579179286956787, "step": 5} {"train_info/time_between_train_steps": 0.0033996105194091797, "step": 5} {"info/global_step": 6, "train_info/time_within_train_step": 2.456939220428467, "step": 6} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 6} {"info/global_step": 7, "train_info/time_within_train_step": 2.459333658218384, "step": 7} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 7} {"info/global_step": 8, "train_info/time_within_train_step": 2.4784884452819824, "step": 8} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 8} {"info/global_step": 9, "train_info/time_within_train_step": 2.6297953128814697, "step": 9} {"train_info/time_between_train_steps": 0.0032851696014404297, "step": 9} {"info/global_step": 10, "train_info/time_within_train_step": 2.6784520149230957, "step": 10} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 10} {"info/global_step": 11, "train_info/time_within_train_step": 2.6772584915161133, "step": 11} {"train_info/time_between_train_steps": 0.0032634735107421875, "step": 11} {"info/global_step": 12, "train_info/time_within_train_step": 2.679006338119507, "step": 12} {"train_info/time_between_train_steps": 0.003650188446044922, "step": 12} {"info/global_step": 13, "train_info/time_within_train_step": 2.6789443492889404, "step": 13} {"train_info/time_between_train_steps": 0.003649473190307617, "step": 13} {"info/global_step": 14, "train_info/time_within_train_step": 2.679755926132202, "step": 14} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 14} {"info/global_step": 15, "train_info/time_within_train_step": 2.680030345916748, "step": 15} {"train_info/time_between_train_steps": 0.003512859344482422, "step": 15} {"info/global_step": 16, "train_info/time_within_train_step": 2.6820530891418457, "step": 16} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 16} {"info/global_step": 17, "train_info/time_within_train_step": 2.6812615394592285, "step": 17} {"train_info/time_between_train_steps": 0.003633737564086914, "step": 17} {"info/global_step": 18, "train_info/time_within_train_step": 2.6828012466430664, "step": 18} {"train_info/time_between_train_steps": 0.0035521984100341797, "step": 18} {"info/global_step": 19, "train_info/time_within_train_step": 2.687525749206543, "step": 19} {"train_info/time_between_train_steps": 0.003512144088745117, "step": 19} {"info/global_step": 20, "train_info/time_within_train_step": 2.6830384731292725, "step": 20} {"train_info/time_between_train_steps": 0.0034072399139404297, "step": 20} {"info/global_step": 21, "train_info/time_within_train_step": 2.6835975646972656, "step": 21} {"train_info/time_between_train_steps": 0.0035772323608398438, "step": 21} {"info/global_step": 22, "train_info/time_within_train_step": 2.91353178024292, "step": 22} {"train_info/time_between_train_steps": 0.0035445690155029297, "step": 22} {"info/global_step": 23, "train_info/time_within_train_step": 2.6826841831207275, "step": 23} {"train_info/time_between_train_steps": 0.0034456253051757812, "step": 23} {"info/global_step": 24, "train_info/time_within_train_step": 2.6833250522613525, "step": 24} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 24} {"info/global_step": 25, "train_info/time_within_train_step": 2.6818835735321045, "step": 25} {"train_info/time_between_train_steps": 0.003414630889892578, "step": 25} {"info/global_step": 26, "train_info/time_within_train_step": 2.6822826862335205, "step": 26} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 26} {"info/global_step": 27, "train_info/time_within_train_step": 2.6820168495178223, "step": 27} {"train_info/time_between_train_steps": 0.0033698081970214844, "step": 27} {"info/global_step": 28, "train_info/time_within_train_step": 2.6818833351135254, "step": 28} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 28} {"info/global_step": 29, "train_info/time_within_train_step": 2.682904005050659, "step": 29} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 29} {"info/global_step": 30, "train_info/time_within_train_step": 2.6823830604553223, "step": 30} {"train_info/time_between_train_steps": 0.0034558773040771484, "step": 30} {"info/global_step": 31, "train_info/time_within_train_step": 2.68233585357666, "step": 31} {"train_info/time_between_train_steps": 0.003389596939086914, "step": 31} {"info/global_step": 32, "train_info/time_within_train_step": 2.6824910640716553, "step": 32} {"train_info/time_between_train_steps": 0.0034089088439941406, "step": 32} {"info/global_step": 33, "train_info/time_within_train_step": 2.692337989807129, "step": 33} {"train_info/time_between_train_steps": 0.0034661293029785156, "step": 33} {"info/global_step": 34, "train_info/time_within_train_step": 2.682961940765381, "step": 34} {"train_info/time_between_train_steps": 0.003421783447265625, "step": 34} {"info/global_step": 35, "train_info/time_within_train_step": 2.682058811187744, "step": 35} {"train_info/time_between_train_steps": 0.0034286975860595703, "step": 35} {"info/global_step": 36, "train_info/time_within_train_step": 2.682705879211426, "step": 36} {"train_info/time_between_train_steps": 0.0034170150756835938, "step": 36} {"info/global_step": 37, "train_info/time_within_train_step": 2.682347059249878, "step": 37} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 37} {"info/global_step": 38, "train_info/time_within_train_step": 2.683103322982788, "step": 38} {"train_info/time_between_train_steps": 0.003438234329223633, "step": 38} {"info/global_step": 39, "train_info/time_within_train_step": 2.6888391971588135, "step": 39} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 39} {"info/global_step": 40, "train_info/time_within_train_step": 2.6824162006378174, "step": 40} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 40} {"info/global_step": 41, "train_info/time_within_train_step": 2.6969661712646484, "step": 41} {"train_info/time_between_train_steps": 0.003313302993774414, "step": 41} {"info/global_step": 42, "train_info/time_within_train_step": 2.6829845905303955, "step": 42} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 42} {"info/global_step": 43, "train_info/time_within_train_step": 2.6825218200683594, "step": 43} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 43} {"info/global_step": 44, "train_info/time_within_train_step": 2.683629274368286, "step": 44} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 44} {"info/global_step": 45, "train_info/time_within_train_step": 2.6832804679870605, "step": 45} {"train_info/time_between_train_steps": 0.0034008026123046875, "step": 45} {"info/global_step": 46, "train_info/time_within_train_step": 2.6836254596710205, "step": 46} {"train_info/time_between_train_steps": 0.0034160614013671875, "step": 46} {"info/global_step": 47, "train_info/time_within_train_step": 2.6827309131622314, "step": 47} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 47} {"info/global_step": 48, "train_info/time_within_train_step": 2.684028148651123, "step": 48} {"train_info/time_between_train_steps": 0.00362396240234375, "step": 48} {"info/global_step": 49, "train_info/time_within_train_step": 2.6836016178131104, "step": 49} {"train_info/time_between_train_steps": 0.0034728050231933594, "step": 49} {"info/global_step": 50, "train_info/time_within_train_step": 2.684372663497925, "step": 50} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746311998, "_runtime": 154}, "step": 50} {"logs": {"train/loss": 8.4064, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 0.02, "_timestamp": 1746311998, "_runtime": 154}, "step": 50} {"train_info/time_between_train_steps": 0.024333477020263672, "step": 50} {"info/global_step": 51, "train_info/time_within_train_step": 2.6836965084075928, "step": 51} {"train_info/time_between_train_steps": 0.003586292266845703, "step": 51} {"info/global_step": 52, "train_info/time_within_train_step": 2.6836977005004883, "step": 52} {"train_info/time_between_train_steps": 0.0036554336547851562, "step": 52} {"info/global_step": 53, "train_info/time_within_train_step": 2.6832923889160156, "step": 53} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 53} {"info/global_step": 54, "train_info/time_within_train_step": 2.682316541671753, "step": 54} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 54} {"info/global_step": 55, "train_info/time_within_train_step": 2.6833786964416504, "step": 55} {"train_info/time_between_train_steps": 0.003565073013305664, "step": 55} {"info/global_step": 56, "train_info/time_within_train_step": 2.6837446689605713, "step": 56} {"train_info/time_between_train_steps": 0.0036094188690185547, "step": 56} {"info/global_step": 57, "train_info/time_within_train_step": 2.683642625808716, "step": 57} {"train_info/time_between_train_steps": 0.003412008285522461, "step": 57} {"info/global_step": 58, "train_info/time_within_train_step": 2.6813061237335205, "step": 58} {"train_info/time_between_train_steps": 0.0033736228942871094, "step": 58} {"info/global_step": 59, "train_info/time_within_train_step": 2.680297374725342, "step": 59} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 59} {"info/global_step": 60, "train_info/time_within_train_step": 2.6812734603881836, "step": 60} {"train_info/time_between_train_steps": 0.0035364627838134766, "step": 60} {"info/global_step": 61, "train_info/time_within_train_step": 2.6816625595092773, "step": 61} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 61} {"info/global_step": 62, "train_info/time_within_train_step": 2.6816253662109375, "step": 62} {"train_info/time_between_train_steps": 0.0034568309783935547, "step": 62} {"info/global_step": 63, "train_info/time_within_train_step": 2.8097527027130127, "step": 63} {"train_info/time_between_train_steps": 0.0035545825958251953, "step": 63} {"info/global_step": 64, "train_info/time_within_train_step": 2.6822543144226074, "step": 64} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 64} {"info/global_step": 65, "train_info/time_within_train_step": 2.6814420223236084, "step": 65} {"train_info/time_between_train_steps": 0.003639698028564453, "step": 65} {"info/global_step": 66, "train_info/time_within_train_step": 2.682969331741333, "step": 66} {"train_info/time_between_train_steps": 0.0035445690155029297, "step": 66} {"info/global_step": 67, "train_info/time_within_train_step": 2.6822853088378906, "step": 67} {"train_info/time_between_train_steps": 0.0034983158111572266, "step": 67} {"info/global_step": 68, "train_info/time_within_train_step": 2.6881399154663086, "step": 68} {"train_info/time_between_train_steps": 0.0036034584045410156, "step": 68} {"info/global_step": 69, "train_info/time_within_train_step": 2.6830811500549316, "step": 69} {"train_info/time_between_train_steps": 0.0035157203674316406, "step": 69} {"info/global_step": 70, "train_info/time_within_train_step": 2.6829004287719727, "step": 70} {"train_info/time_between_train_steps": 0.003569364547729492, "step": 70} {"info/global_step": 71, "train_info/time_within_train_step": 2.6833081245422363, "step": 71} {"train_info/time_between_train_steps": 0.003541707992553711, "step": 71} {"info/global_step": 72, "train_info/time_within_train_step": 2.683074712753296, "step": 72} {"train_info/time_between_train_steps": 0.0035190582275390625, "step": 72} {"info/global_step": 73, "train_info/time_within_train_step": 2.6835997104644775, "step": 73} {"train_info/time_between_train_steps": 0.0035390853881835938, "step": 73} {"info/global_step": 74, "train_info/time_within_train_step": 2.683166265487671, "step": 74} {"train_info/time_between_train_steps": 0.0035104751586914062, "step": 74} {"info/global_step": 75, "train_info/time_within_train_step": 2.7047102451324463, "step": 75} {"train_info/time_between_train_steps": 0.0035257339477539062, "step": 75} {"info/global_step": 76, "train_info/time_within_train_step": 2.682401180267334, "step": 76} {"train_info/time_between_train_steps": 0.003503561019897461, "step": 76} {"info/global_step": 77, "train_info/time_within_train_step": 2.6827023029327393, "step": 77} {"train_info/time_between_train_steps": 0.00359344482421875, "step": 77} {"info/global_step": 78, "train_info/time_within_train_step": 2.6834540367126465, "step": 78} {"train_info/time_between_train_steps": 0.003570079803466797, "step": 78} {"info/global_step": 79, "train_info/time_within_train_step": 2.6835083961486816, "step": 79} {"train_info/time_between_train_steps": 0.003489255905151367, "step": 79} {"info/global_step": 80, "train_info/time_within_train_step": 2.6832454204559326, "step": 80} {"train_info/time_between_train_steps": 0.0035283565521240234, "step": 80} {"info/global_step": 81, "train_info/time_within_train_step": 2.6832501888275146, "step": 81} {"train_info/time_between_train_steps": 0.003598451614379883, "step": 81} {"info/global_step": 82, "train_info/time_within_train_step": 2.6844065189361572, "step": 82} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 82} {"info/global_step": 83, "train_info/time_within_train_step": 2.683021306991577, "step": 83} {"train_info/time_between_train_steps": 0.0035071372985839844, "step": 83} {"info/global_step": 84, "train_info/time_within_train_step": 2.683457612991333, "step": 84} {"train_info/time_between_train_steps": 0.0034720897674560547, "step": 84} {"info/global_step": 85, "train_info/time_within_train_step": 2.6836047172546387, "step": 85} {"train_info/time_between_train_steps": 0.0034325122833251953, "step": 85} {"info/global_step": 86, "train_info/time_within_train_step": 2.6840121746063232, "step": 86} {"train_info/time_between_train_steps": 0.0035414695739746094, "step": 86} {"info/global_step": 87, "train_info/time_within_train_step": 2.6828620433807373, "step": 87} {"train_info/time_between_train_steps": 0.0035064220428466797, "step": 87} {"info/global_step": 88, "train_info/time_within_train_step": 2.682786464691162, "step": 88} {"train_info/time_between_train_steps": 0.0035037994384765625, "step": 88} {"info/global_step": 89, "train_info/time_within_train_step": 2.6851508617401123, "step": 89} {"train_info/time_between_train_steps": 0.0035440921783447266, "step": 89} {"info/global_step": 90, "train_info/time_within_train_step": 2.682860851287842, "step": 90} {"train_info/time_between_train_steps": 0.0035212039947509766, "step": 90} {"info/global_step": 91, "train_info/time_within_train_step": 2.6834144592285156, "step": 91} {"train_info/time_between_train_steps": 0.003574371337890625, "step": 91} {"info/global_step": 92, "train_info/time_within_train_step": 2.6836886405944824, "step": 92} {"train_info/time_between_train_steps": 0.0034983158111572266, "step": 92} {"info/global_step": 93, "train_info/time_within_train_step": 2.683241605758667, "step": 93} {"train_info/time_between_train_steps": 0.0035059452056884766, "step": 93} {"info/global_step": 94, "train_info/time_within_train_step": 2.6836507320404053, "step": 94} {"train_info/time_between_train_steps": 0.003493070602416992, "step": 94} {"info/global_step": 95, "train_info/time_within_train_step": 2.6828978061676025, "step": 95} {"train_info/time_between_train_steps": 0.003490924835205078, "step": 95} {"info/global_step": 96, "train_info/time_within_train_step": 2.6827845573425293, "step": 96} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 96} {"info/global_step": 97, "train_info/time_within_train_step": 2.6840217113494873, "step": 97} {"train_info/time_between_train_steps": 0.0034894943237304688, "step": 97} {"info/global_step": 98, "train_info/time_within_train_step": 2.6861133575439453, "step": 98} {"train_info/time_between_train_steps": 0.0036928653717041016, "step": 98} {"info/global_step": 99, "train_info/time_within_train_step": 2.6855361461639404, "step": 99} {"train_info/time_between_train_steps": 0.003642559051513672, "step": 99} {"info/global_step": 100, "train_info/time_within_train_step": 2.685563325881958, "step": 100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746312133, "_runtime": 289}, "step": 100} {"logs": {"train/loss": 7.0031, "train/learning_rate": 0.00019999999999999998, "train/epoch": 0.03, "_timestamp": 1746312133, "_runtime": 289}, "step": 100} {"train_info/time_between_train_steps": 21.68894386291504, "step": 100} {"info/global_step": 101, "train_info/time_within_train_step": 2.479458808898926, "step": 101} {"train_info/time_between_train_steps": 0.003629446029663086, "step": 101} {"info/global_step": 102, "train_info/time_within_train_step": 2.475579261779785, "step": 102} {"train_info/time_between_train_steps": 0.003651857376098633, "step": 102} {"info/global_step": 103, "train_info/time_within_train_step": 3.006054162979126, "step": 103} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 103} {"info/global_step": 104, "train_info/time_within_train_step": 2.6816635131835938, "step": 104} {"train_info/time_between_train_steps": 0.0033588409423828125, "step": 104} {"info/global_step": 105, "train_info/time_within_train_step": 2.6810784339904785, "step": 105} {"train_info/time_between_train_steps": 0.0032625198364257812, "step": 105} {"info/global_step": 106, "train_info/time_within_train_step": 2.680999755859375, "step": 106} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 106} {"info/global_step": 107, "train_info/time_within_train_step": 2.6817843914031982, "step": 107} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 107} {"info/global_step": 108, "train_info/time_within_train_step": 2.6816513538360596, "step": 108} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 108} {"info/global_step": 109, "train_info/time_within_train_step": 2.681941270828247, "step": 109} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 109} {"info/global_step": 110, "train_info/time_within_train_step": 2.683006763458252, "step": 110} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 110} {"info/global_step": 111, "train_info/time_within_train_step": 2.6826577186584473, "step": 111} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 111} {"info/global_step": 112, "train_info/time_within_train_step": 2.683171510696411, "step": 112} {"train_info/time_between_train_steps": 0.0034248828887939453, "step": 112} {"info/global_step": 113, "train_info/time_within_train_step": 2.682640790939331, "step": 113} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 113} {"info/global_step": 114, "train_info/time_within_train_step": 2.683241844177246, "step": 114} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 114} {"info/global_step": 115, "train_info/time_within_train_step": 2.6829679012298584, "step": 115} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 115} {"info/global_step": 116, "train_info/time_within_train_step": 2.695716381072998, "step": 116} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 116} {"info/global_step": 117, "train_info/time_within_train_step": 2.7277374267578125, "step": 117} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 117} {"info/global_step": 118, "train_info/time_within_train_step": 2.740018367767334, "step": 118} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 118} {"info/global_step": 119, "train_info/time_within_train_step": 2.688718557357788, "step": 119} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 119} {"info/global_step": 120, "train_info/time_within_train_step": 2.690502405166626, "step": 120} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 120} {"info/global_step": 121, "train_info/time_within_train_step": 2.7126543521881104, "step": 121} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 121} {"info/global_step": 122, "train_info/time_within_train_step": 2.6988682746887207, "step": 122} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 122} {"info/global_step": 123, "train_info/time_within_train_step": 2.6831138134002686, "step": 123} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 123} {"info/global_step": 124, "train_info/time_within_train_step": 2.69785213470459, "step": 124} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 124} {"info/global_step": 125, "train_info/time_within_train_step": 2.7201755046844482, "step": 125} {"train_info/time_between_train_steps": 0.1253643035888672, "step": 125} {"info/global_step": 126, "train_info/time_within_train_step": 2.6837596893310547, "step": 126} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 126} {"info/global_step": 127, "train_info/time_within_train_step": 2.6879727840423584, "step": 127} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 127} {"info/global_step": 128, "train_info/time_within_train_step": 2.68228816986084, "step": 128} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 128} {"info/global_step": 129, "train_info/time_within_train_step": 2.6831114292144775, "step": 129} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 129} {"info/global_step": 130, "train_info/time_within_train_step": 2.68351674079895, "step": 130} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 130} {"info/global_step": 131, "train_info/time_within_train_step": 2.690915107727051, "step": 131} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 131} {"info/global_step": 132, "train_info/time_within_train_step": 2.7218399047851562, "step": 132} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 132} {"info/global_step": 133, "train_info/time_within_train_step": 2.691594362258911, "step": 133} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 133} {"info/global_step": 134, "train_info/time_within_train_step": 2.7005865573883057, "step": 134} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 134} {"info/global_step": 135, "train_info/time_within_train_step": 2.684008836746216, "step": 135} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 135} {"info/global_step": 136, "train_info/time_within_train_step": 2.6828620433807373, "step": 136} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 136} {"info/global_step": 137, "train_info/time_within_train_step": 2.6833624839782715, "step": 137} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 137} {"info/global_step": 138, "train_info/time_within_train_step": 2.6843574047088623, "step": 138} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 138} {"info/global_step": 139, "train_info/time_within_train_step": 2.6852893829345703, "step": 139} {"train_info/time_between_train_steps": 0.00392460823059082, "step": 139} {"info/global_step": 140, "train_info/time_within_train_step": 2.6823160648345947, "step": 140} {"train_info/time_between_train_steps": 0.003558635711669922, "step": 140} {"info/global_step": 141, "train_info/time_within_train_step": 2.7096681594848633, "step": 141} {"train_info/time_between_train_steps": 0.003551006317138672, "step": 141} {"info/global_step": 142, "train_info/time_within_train_step": 2.720864772796631, "step": 142} {"train_info/time_between_train_steps": 0.003606557846069336, "step": 142} {"info/global_step": 143, "train_info/time_within_train_step": 2.684069871902466, "step": 143} {"train_info/time_between_train_steps": 0.0035448074340820312, "step": 143} {"info/global_step": 144, "train_info/time_within_train_step": 2.685476303100586, "step": 144} {"train_info/time_between_train_steps": 0.0035190582275390625, "step": 144} {"info/global_step": 145, "train_info/time_within_train_step": 2.686746597290039, "step": 145} {"train_info/time_between_train_steps": 0.0036764144897460938, "step": 145} {"info/global_step": 146, "train_info/time_within_train_step": 2.683403730392456, "step": 146} {"train_info/time_between_train_steps": 0.003574848175048828, "step": 146} {"info/global_step": 147, "train_info/time_within_train_step": 2.6834609508514404, "step": 147} {"train_info/time_between_train_steps": 0.003650665283203125, "step": 147} {"info/global_step": 148, "train_info/time_within_train_step": 2.6836302280426025, "step": 148} {"train_info/time_between_train_steps": 0.003613710403442383, "step": 148} {"info/global_step": 149, "train_info/time_within_train_step": 2.689486026763916, "step": 149} {"train_info/time_between_train_steps": 0.0035552978515625, "step": 149} {"info/global_step": 150, "train_info/time_within_train_step": 2.6952695846557617, "step": 150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746312291, "_runtime": 447}, "step": 150} {"logs": {"train/loss": 6.591, "train/learning_rate": 0.0003, "train/epoch": 0.05, "_timestamp": 1746312291, "_runtime": 447}, "step": 150} {"train_info/time_between_train_steps": 0.024293899536132812, "step": 150} {"info/global_step": 151, "train_info/time_within_train_step": 2.688544511795044, "step": 151} {"train_info/time_between_train_steps": 0.0037958621978759766, "step": 151} {"info/global_step": 152, "train_info/time_within_train_step": 2.6864359378814697, "step": 152} {"train_info/time_between_train_steps": 0.0037097930908203125, "step": 152} {"info/global_step": 153, "train_info/time_within_train_step": 2.6860365867614746, "step": 153} {"train_info/time_between_train_steps": 0.0035665035247802734, "step": 153} {"info/global_step": 154, "train_info/time_within_train_step": 2.6846189498901367, "step": 154} {"train_info/time_between_train_steps": 0.003512859344482422, "step": 154} {"info/global_step": 155, "train_info/time_within_train_step": 2.683631658554077, "step": 155} {"train_info/time_between_train_steps": 0.0035364627838134766, "step": 155} {"info/global_step": 156, "train_info/time_within_train_step": 2.7074756622314453, "step": 156} {"train_info/time_between_train_steps": 0.0036001205444335938, "step": 156} {"info/global_step": 157, "train_info/time_within_train_step": 2.68450927734375, "step": 157} {"train_info/time_between_train_steps": 0.0035240650177001953, "step": 157} {"info/global_step": 158, "train_info/time_within_train_step": 2.684915781021118, "step": 158} {"train_info/time_between_train_steps": 0.0036177635192871094, "step": 158} {"info/global_step": 159, "train_info/time_within_train_step": 2.685006618499756, "step": 159} {"train_info/time_between_train_steps": 0.003559589385986328, "step": 159} {"info/global_step": 160, "train_info/time_within_train_step": 2.6850087642669678, "step": 160} {"train_info/time_between_train_steps": 0.0035593509674072266, "step": 160} {"info/global_step": 161, "train_info/time_within_train_step": 2.684356927871704, "step": 161} {"train_info/time_between_train_steps": 0.0035135746002197266, "step": 161} {"info/global_step": 162, "train_info/time_within_train_step": 2.684502363204956, "step": 162} {"train_info/time_between_train_steps": 0.003629922866821289, "step": 162} {"info/global_step": 163, "train_info/time_within_train_step": 2.6834354400634766, "step": 163} {"train_info/time_between_train_steps": 0.0035283565521240234, "step": 163} {"info/global_step": 164, "train_info/time_within_train_step": 2.6845266819000244, "step": 164} {"train_info/time_between_train_steps": 0.003567218780517578, "step": 164} {"info/global_step": 165, "train_info/time_within_train_step": 2.683286190032959, "step": 165} {"train_info/time_between_train_steps": 0.0035483837127685547, "step": 165} {"info/global_step": 166, "train_info/time_within_train_step": 2.6841320991516113, "step": 166} {"train_info/time_between_train_steps": 0.0035467147827148438, "step": 166} {"info/global_step": 167, "train_info/time_within_train_step": 2.6853480339050293, "step": 167} {"train_info/time_between_train_steps": 0.003534555435180664, "step": 167} {"info/global_step": 168, "train_info/time_within_train_step": 2.684033155441284, "step": 168} {"train_info/time_between_train_steps": 0.003574848175048828, "step": 168} {"info/global_step": 169, "train_info/time_within_train_step": 2.6847901344299316, "step": 169} {"train_info/time_between_train_steps": 0.0037069320678710938, "step": 169} {"info/global_step": 170, "train_info/time_within_train_step": 2.6858162879943848, "step": 170} {"train_info/time_between_train_steps": 0.0038290023803710938, "step": 170} {"info/global_step": 171, "train_info/time_within_train_step": 2.68760085105896, "step": 171} {"train_info/time_between_train_steps": 0.003720998764038086, "step": 171} {"info/global_step": 172, "train_info/time_within_train_step": 2.687086343765259, "step": 172} {"train_info/time_between_train_steps": 0.003682851791381836, "step": 172} {"info/global_step": 173, "train_info/time_within_train_step": 2.6885712146759033, "step": 173} {"train_info/time_between_train_steps": 0.0037393569946289062, "step": 173} {"info/global_step": 174, "train_info/time_within_train_step": 2.6850485801696777, "step": 174} {"train_info/time_between_train_steps": 0.003597736358642578, "step": 174} {"info/global_step": 175, "train_info/time_within_train_step": 2.6842730045318604, "step": 175} {"train_info/time_between_train_steps": 0.0036051273345947266, "step": 175} {"info/global_step": 176, "train_info/time_within_train_step": 2.6847386360168457, "step": 176} {"train_info/time_between_train_steps": 0.0035552978515625, "step": 176} {"info/global_step": 177, "train_info/time_within_train_step": 2.6837191581726074, "step": 177} {"train_info/time_between_train_steps": 0.003559112548828125, "step": 177} {"info/global_step": 178, "train_info/time_within_train_step": 2.6828389167785645, "step": 178} {"train_info/time_between_train_steps": 0.003532886505126953, "step": 178} {"info/global_step": 179, "train_info/time_within_train_step": 2.6838881969451904, "step": 179} {"train_info/time_between_train_steps": 0.0035719871520996094, "step": 179} {"info/global_step": 180, "train_info/time_within_train_step": 2.6843554973602295, "step": 180} {"train_info/time_between_train_steps": 0.0035126209259033203, "step": 180} {"info/global_step": 181, "train_info/time_within_train_step": 2.68320894241333, "step": 181} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 181} {"info/global_step": 182, "train_info/time_within_train_step": 2.682584285736084, "step": 182} {"train_info/time_between_train_steps": 0.003627777099609375, "step": 182} {"info/global_step": 183, "train_info/time_within_train_step": 2.682711124420166, "step": 183} {"train_info/time_between_train_steps": 0.0035827159881591797, "step": 183} {"info/global_step": 184, "train_info/time_within_train_step": 2.68387508392334, "step": 184} {"train_info/time_between_train_steps": 0.0036001205444335938, "step": 184} {"info/global_step": 185, "train_info/time_within_train_step": 2.6843392848968506, "step": 185} {"train_info/time_between_train_steps": 0.003584146499633789, "step": 185} {"info/global_step": 186, "train_info/time_within_train_step": 3.0362656116485596, "step": 186} {"train_info/time_between_train_steps": 0.0034132003784179688, "step": 186} {"info/global_step": 187, "train_info/time_within_train_step": 2.68639874458313, "step": 187} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 187} {"info/global_step": 188, "train_info/time_within_train_step": 2.8357765674591064, "step": 188} {"train_info/time_between_train_steps": 0.0034456253051757812, "step": 188} {"info/global_step": 189, "train_info/time_within_train_step": 2.684114933013916, "step": 189} {"train_info/time_between_train_steps": 0.0033864974975585938, "step": 189} {"info/global_step": 190, "train_info/time_within_train_step": 2.68540096282959, "step": 190} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 190} {"info/global_step": 191, "train_info/time_within_train_step": 2.6841373443603516, "step": 191} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 191} {"info/global_step": 192, "train_info/time_within_train_step": 2.6847853660583496, "step": 192} {"train_info/time_between_train_steps": 0.003410816192626953, "step": 192} {"info/global_step": 193, "train_info/time_within_train_step": 2.684333086013794, "step": 193} {"train_info/time_between_train_steps": 0.0033833980560302734, "step": 193} {"info/global_step": 194, "train_info/time_within_train_step": 2.6877214908599854, "step": 194} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 194} {"info/global_step": 195, "train_info/time_within_train_step": 2.684835910797119, "step": 195} {"train_info/time_between_train_steps": 0.003590822219848633, "step": 195} {"info/global_step": 196, "train_info/time_within_train_step": 2.6845638751983643, "step": 196} {"train_info/time_between_train_steps": 0.003359079360961914, "step": 196} {"info/global_step": 197, "train_info/time_within_train_step": 2.684990644454956, "step": 197} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 197} {"info/global_step": 198, "train_info/time_within_train_step": 2.6858134269714355, "step": 198} {"train_info/time_between_train_steps": 0.003448486328125, "step": 198} {"info/global_step": 199, "train_info/time_within_train_step": 2.685344696044922, "step": 199} {"train_info/time_between_train_steps": 0.0033960342407226562, "step": 199} {"info/global_step": 200, "train_info/time_within_train_step": 2.6840343475341797, "step": 200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746312427, "_runtime": 583}, "step": 200} {"logs": {"train/loss": 6.3213, "train/learning_rate": 0.00039999999999999996, "train/epoch": 0.07, "_timestamp": 1746312427, "_runtime": 583}, "step": 200} {"train_info/time_between_train_steps": 20.914541006088257, "step": 200} {"info/global_step": 201, "train_info/time_within_train_step": 2.486384391784668, "step": 201} {"train_info/time_between_train_steps": 0.0034058094024658203, "step": 201} {"info/global_step": 202, "train_info/time_within_train_step": 2.479203462600708, "step": 202} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 202} {"info/global_step": 203, "train_info/time_within_train_step": 2.667409658432007, "step": 203} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 203} {"info/global_step": 204, "train_info/time_within_train_step": 2.6770918369293213, "step": 204} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 204} {"info/global_step": 205, "train_info/time_within_train_step": 2.6799728870391846, "step": 205} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 205} {"info/global_step": 206, "train_info/time_within_train_step": 2.6810359954833984, "step": 206} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 206} {"info/global_step": 207, "train_info/time_within_train_step": 2.682150363922119, "step": 207} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 207} {"info/global_step": 208, "train_info/time_within_train_step": 2.6909096240997314, "step": 208} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 208} {"info/global_step": 209, "train_info/time_within_train_step": 2.680835723876953, "step": 209} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 209} {"info/global_step": 210, "train_info/time_within_train_step": 2.681232452392578, "step": 210} {"train_info/time_between_train_steps": 0.003265380859375, "step": 210} {"info/global_step": 211, "train_info/time_within_train_step": 2.6820623874664307, "step": 211} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 211} {"info/global_step": 212, "train_info/time_within_train_step": 2.68377685546875, "step": 212} {"train_info/time_between_train_steps": 0.003621339797973633, "step": 212} {"info/global_step": 213, "train_info/time_within_train_step": 2.6840240955352783, "step": 213} {"train_info/time_between_train_steps": 0.0036101341247558594, "step": 213} {"info/global_step": 214, "train_info/time_within_train_step": 2.716519594192505, "step": 214} {"train_info/time_between_train_steps": 0.003631114959716797, "step": 214} {"info/global_step": 215, "train_info/time_within_train_step": 2.8006606101989746, "step": 215} {"train_info/time_between_train_steps": 0.0036530494689941406, "step": 215} {"info/global_step": 216, "train_info/time_within_train_step": 2.7390389442443848, "step": 216} {"train_info/time_between_train_steps": 0.0036056041717529297, "step": 216} {"info/global_step": 217, "train_info/time_within_train_step": 2.7413032054901123, "step": 217} {"train_info/time_between_train_steps": 0.0035805702209472656, "step": 217} {"info/global_step": 218, "train_info/time_within_train_step": 2.733710289001465, "step": 218} {"train_info/time_between_train_steps": 0.003592967987060547, "step": 218} {"info/global_step": 219, "train_info/time_within_train_step": 2.7015297412872314, "step": 219} {"train_info/time_between_train_steps": 0.003561258316040039, "step": 219} {"info/global_step": 220, "train_info/time_within_train_step": 2.7275943756103516, "step": 220} {"train_info/time_between_train_steps": 0.0035810470581054688, "step": 220} {"info/global_step": 221, "train_info/time_within_train_step": 2.7011373043060303, "step": 221} {"train_info/time_between_train_steps": 0.003571748733520508, "step": 221} {"info/global_step": 222, "train_info/time_within_train_step": 2.690380573272705, "step": 222} {"train_info/time_between_train_steps": 0.0036008358001708984, "step": 222} {"info/global_step": 223, "train_info/time_within_train_step": 2.723234176635742, "step": 223} {"train_info/time_between_train_steps": 0.003556966781616211, "step": 223} {"info/global_step": 224, "train_info/time_within_train_step": 2.7139601707458496, "step": 224} {"train_info/time_between_train_steps": 0.0036551952362060547, "step": 224} {"info/global_step": 225, "train_info/time_within_train_step": 2.714925765991211, "step": 225} {"train_info/time_between_train_steps": 0.003611326217651367, "step": 225} {"info/global_step": 226, "train_info/time_within_train_step": 2.701268434524536, "step": 226} {"train_info/time_between_train_steps": 0.0036118030548095703, "step": 226} {"info/global_step": 227, "train_info/time_within_train_step": 2.7117819786071777, "step": 227} {"train_info/time_between_train_steps": 0.0036401748657226562, "step": 227} {"info/global_step": 228, "train_info/time_within_train_step": 3.051964044570923, "step": 228} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 228} {"info/global_step": 229, "train_info/time_within_train_step": 2.6835360527038574, "step": 229} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 229} {"info/global_step": 230, "train_info/time_within_train_step": 2.682572364807129, "step": 230} {"train_info/time_between_train_steps": 0.003263711929321289, "step": 230} {"info/global_step": 231, "train_info/time_within_train_step": 2.6840436458587646, "step": 231} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 231} {"info/global_step": 232, "train_info/time_within_train_step": 2.683887243270874, "step": 232} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 232} {"info/global_step": 233, "train_info/time_within_train_step": 2.699718713760376, "step": 233} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 233} {"info/global_step": 234, "train_info/time_within_train_step": 2.7065916061401367, "step": 234} {"train_info/time_between_train_steps": 0.0033216476440429688, "step": 234} {"info/global_step": 235, "train_info/time_within_train_step": 2.7046024799346924, "step": 235} {"train_info/time_between_train_steps": 0.0036401748657226562, "step": 235} {"info/global_step": 236, "train_info/time_within_train_step": 2.6859254837036133, "step": 236} {"train_info/time_between_train_steps": 0.0034160614013671875, "step": 236} {"info/global_step": 237, "train_info/time_within_train_step": 2.7014319896698, "step": 237} {"train_info/time_between_train_steps": 0.003587961196899414, "step": 237} {"info/global_step": 238, "train_info/time_within_train_step": 2.7231359481811523, "step": 238} {"train_info/time_between_train_steps": 0.0036191940307617188, "step": 238} {"info/global_step": 239, "train_info/time_within_train_step": 2.7043604850769043, "step": 239} {"train_info/time_between_train_steps": 0.0035886764526367188, "step": 239} {"info/global_step": 240, "train_info/time_within_train_step": 2.6999826431274414, "step": 240} {"train_info/time_between_train_steps": 0.0035958290100097656, "step": 240} {"info/global_step": 241, "train_info/time_within_train_step": 2.715510606765747, "step": 241} {"train_info/time_between_train_steps": 0.0035631656646728516, "step": 241} {"info/global_step": 242, "train_info/time_within_train_step": 2.685762882232666, "step": 242} {"train_info/time_between_train_steps": 0.0035686492919921875, "step": 242} {"info/global_step": 243, "train_info/time_within_train_step": 2.6841650009155273, "step": 243} {"train_info/time_between_train_steps": 0.003561735153198242, "step": 243} {"info/global_step": 244, "train_info/time_within_train_step": 2.692290782928467, "step": 244} {"train_info/time_between_train_steps": 0.0035409927368164062, "step": 244} {"info/global_step": 245, "train_info/time_within_train_step": 2.70078706741333, "step": 245} {"train_info/time_between_train_steps": 0.003554821014404297, "step": 245} {"info/global_step": 246, "train_info/time_within_train_step": 2.6849565505981445, "step": 246} {"train_info/time_between_train_steps": 0.003587484359741211, "step": 246} {"info/global_step": 247, "train_info/time_within_train_step": 2.6974880695343018, "step": 247} {"train_info/time_between_train_steps": 0.0035119056701660156, "step": 247} {"info/global_step": 248, "train_info/time_within_train_step": 2.7037675380706787, "step": 248} {"train_info/time_between_train_steps": 0.0035657882690429688, "step": 248} {"info/global_step": 249, "train_info/time_within_train_step": 2.694199800491333, "step": 249} {"train_info/time_between_train_steps": 0.003593921661376953, "step": 249} {"info/global_step": 250, "train_info/time_within_train_step": 3.5051164627075195, "step": 250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746312585, "_runtime": 741}, "step": 250} {"logs": {"train/loss": 6.0723, "train/learning_rate": 0.0005, "train/epoch": 0.08, "_timestamp": 1746312585, "_runtime": 741}, "step": 250} {"train_info/time_between_train_steps": 0.1924750804901123, "step": 250} {"info/global_step": 251, "train_info/time_within_train_step": 2.6842148303985596, "step": 251} {"train_info/time_between_train_steps": 0.00341796875, "step": 251} {"info/global_step": 252, "train_info/time_within_train_step": 2.6828482151031494, "step": 252} {"train_info/time_between_train_steps": 0.003377199172973633, "step": 252} {"info/global_step": 253, "train_info/time_within_train_step": 2.683389902114868, "step": 253} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 253} {"info/global_step": 254, "train_info/time_within_train_step": 2.6834161281585693, "step": 254} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 254} {"info/global_step": 255, "train_info/time_within_train_step": 2.6832306385040283, "step": 255} {"train_info/time_between_train_steps": 0.0036551952362060547, "step": 255} {"info/global_step": 256, "train_info/time_within_train_step": 2.682337999343872, "step": 256} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 256} {"info/global_step": 257, "train_info/time_within_train_step": 2.682157278060913, "step": 257} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 257} {"info/global_step": 258, "train_info/time_within_train_step": 2.6831982135772705, "step": 258} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 258} {"info/global_step": 259, "train_info/time_within_train_step": 2.6832406520843506, "step": 259} {"train_info/time_between_train_steps": 0.003297090530395508, "step": 259} {"info/global_step": 260, "train_info/time_within_train_step": 2.6818044185638428, "step": 260} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 260} {"info/global_step": 261, "train_info/time_within_train_step": 2.6821486949920654, "step": 261} {"train_info/time_between_train_steps": 0.0032989978790283203, "step": 261} {"info/global_step": 262, "train_info/time_within_train_step": 2.681776762008667, "step": 262} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 262} {"info/global_step": 263, "train_info/time_within_train_step": 2.681696891784668, "step": 263} {"train_info/time_between_train_steps": 0.003627777099609375, "step": 263} {"info/global_step": 264, "train_info/time_within_train_step": 2.682823896408081, "step": 264} {"train_info/time_between_train_steps": 0.0035164356231689453, "step": 264} {"info/global_step": 265, "train_info/time_within_train_step": 2.682671308517456, "step": 265} {"train_info/time_between_train_steps": 0.003507375717163086, "step": 265} {"info/global_step": 266, "train_info/time_within_train_step": 2.6822896003723145, "step": 266} {"train_info/time_between_train_steps": 0.0035085678100585938, "step": 266} {"info/global_step": 267, "train_info/time_within_train_step": 2.6826748847961426, "step": 267} {"train_info/time_between_train_steps": 0.0037522315979003906, "step": 267} {"info/global_step": 268, "train_info/time_within_train_step": 2.6843128204345703, "step": 268} {"train_info/time_between_train_steps": 0.0036864280700683594, "step": 268} {"info/global_step": 269, "train_info/time_within_train_step": 2.684530019760132, "step": 269} {"train_info/time_between_train_steps": 0.003824949264526367, "step": 269} {"info/global_step": 270, "train_info/time_within_train_step": 2.684979200363159, "step": 270} {"train_info/time_between_train_steps": 0.0037183761596679688, "step": 270} {"info/global_step": 271, "train_info/time_within_train_step": 2.6843109130859375, "step": 271} {"train_info/time_between_train_steps": 0.004243373870849609, "step": 271} {"info/global_step": 272, "train_info/time_within_train_step": 2.6837093830108643, "step": 272} {"train_info/time_between_train_steps": 0.0035178661346435547, "step": 272} {"info/global_step": 273, "train_info/time_within_train_step": 2.6827030181884766, "step": 273} {"train_info/time_between_train_steps": 0.0034842491149902344, "step": 273} {"info/global_step": 274, "train_info/time_within_train_step": 2.68257474899292, "step": 274} {"train_info/time_between_train_steps": 0.0034744739532470703, "step": 274} {"info/global_step": 275, "train_info/time_within_train_step": 2.682401180267334, "step": 275} {"train_info/time_between_train_steps": 0.003463268280029297, "step": 275} {"info/global_step": 276, "train_info/time_within_train_step": 2.6823041439056396, "step": 276} {"train_info/time_between_train_steps": 0.0035474300384521484, "step": 276} {"info/global_step": 277, "train_info/time_within_train_step": 2.6838815212249756, "step": 277} {"train_info/time_between_train_steps": 0.0035448074340820312, "step": 277} {"info/global_step": 278, "train_info/time_within_train_step": 2.684110164642334, "step": 278} {"train_info/time_between_train_steps": 0.0036003589630126953, "step": 278} {"info/global_step": 279, "train_info/time_within_train_step": 2.683919906616211, "step": 279} {"train_info/time_between_train_steps": 0.0036115646362304688, "step": 279} {"info/global_step": 280, "train_info/time_within_train_step": 2.6837880611419678, "step": 280} {"train_info/time_between_train_steps": 0.003750324249267578, "step": 280} {"info/global_step": 281, "train_info/time_within_train_step": 2.686202049255371, "step": 281} {"train_info/time_between_train_steps": 0.003794431686401367, "step": 281} {"info/global_step": 282, "train_info/time_within_train_step": 2.6846470832824707, "step": 282} {"train_info/time_between_train_steps": 0.003715038299560547, "step": 282} {"info/global_step": 283, "train_info/time_within_train_step": 2.6849217414855957, "step": 283} {"train_info/time_between_train_steps": 0.0037262439727783203, "step": 283} {"info/global_step": 284, "train_info/time_within_train_step": 2.6866343021392822, "step": 284} {"train_info/time_between_train_steps": 0.003687143325805664, "step": 284} {"info/global_step": 285, "train_info/time_within_train_step": 2.6847877502441406, "step": 285} {"train_info/time_between_train_steps": 0.0036950111389160156, "step": 285} {"info/global_step": 286, "train_info/time_within_train_step": 2.685159206390381, "step": 286} {"train_info/time_between_train_steps": 0.003740549087524414, "step": 286} {"info/global_step": 287, "train_info/time_within_train_step": 2.6849915981292725, "step": 287} {"train_info/time_between_train_steps": 0.0036687850952148438, "step": 287} {"info/global_step": 288, "train_info/time_within_train_step": 2.685418128967285, "step": 288} {"train_info/time_between_train_steps": 0.0036542415618896484, "step": 288} {"info/global_step": 289, "train_info/time_within_train_step": 2.6851391792297363, "step": 289} {"train_info/time_between_train_steps": 0.003736734390258789, "step": 289} {"info/global_step": 290, "train_info/time_within_train_step": 2.685711145401001, "step": 290} {"train_info/time_between_train_steps": 0.003640890121459961, "step": 290} {"info/global_step": 291, "train_info/time_within_train_step": 2.685296058654785, "step": 291} {"train_info/time_between_train_steps": 0.0036242008209228516, "step": 291} {"info/global_step": 292, "train_info/time_within_train_step": 2.6851308345794678, "step": 292} {"train_info/time_between_train_steps": 0.003669261932373047, "step": 292} {"info/global_step": 293, "train_info/time_within_train_step": 2.6841845512390137, "step": 293} {"train_info/time_between_train_steps": 0.0036377906799316406, "step": 293} {"info/global_step": 294, "train_info/time_within_train_step": 2.684034824371338, "step": 294} {"train_info/time_between_train_steps": 0.003675699234008789, "step": 294} {"info/global_step": 295, "train_info/time_within_train_step": 2.6829986572265625, "step": 295} {"train_info/time_between_train_steps": 0.0034542083740234375, "step": 295} {"info/global_step": 296, "train_info/time_within_train_step": 2.6825177669525146, "step": 296} {"train_info/time_between_train_steps": 0.003536701202392578, "step": 296} {"info/global_step": 297, "train_info/time_within_train_step": 2.683666706085205, "step": 297} {"train_info/time_between_train_steps": 0.0035049915313720703, "step": 297} {"info/global_step": 298, "train_info/time_within_train_step": 2.680788040161133, "step": 298} {"train_info/time_between_train_steps": 0.0035157203674316406, "step": 298} {"info/global_step": 299, "train_info/time_within_train_step": 2.682241201400757, "step": 299} {"train_info/time_between_train_steps": 0.003490924835205078, "step": 299} {"info/global_step": 300, "train_info/time_within_train_step": 2.682021379470825, "step": 300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746312720, "_runtime": 876}, "step": 300} {"logs": {"train/loss": 5.9222, "train/learning_rate": 0.0006, "train/epoch": 0.1, "_timestamp": 1746312720, "_runtime": 876}, "step": 300} {"train_info/time_between_train_steps": 17.92772912979126, "step": 300} {"info/global_step": 301, "train_info/time_within_train_step": 2.475663423538208, "step": 301} {"train_info/time_between_train_steps": 0.003465890884399414, "step": 301} {"info/global_step": 302, "train_info/time_within_train_step": 2.478307008743286, "step": 302} {"train_info/time_between_train_steps": 0.003694772720336914, "step": 302} {"info/global_step": 303, "train_info/time_within_train_step": 2.67340087890625, "step": 303} {"train_info/time_between_train_steps": 0.0035982131958007812, "step": 303} {"info/global_step": 304, "train_info/time_within_train_step": 2.680415153503418, "step": 304} {"train_info/time_between_train_steps": 0.003519296646118164, "step": 304} {"info/global_step": 305, "train_info/time_within_train_step": 2.6804542541503906, "step": 305} {"train_info/time_between_train_steps": 0.0035135746002197266, "step": 305} {"info/global_step": 306, "train_info/time_within_train_step": 2.991041421890259, "step": 306} {"train_info/time_between_train_steps": 0.0034182071685791016, "step": 306} {"info/global_step": 307, "train_info/time_within_train_step": 2.681281566619873, "step": 307} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 307} {"info/global_step": 308, "train_info/time_within_train_step": 2.6812219619750977, "step": 308} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 308} {"info/global_step": 309, "train_info/time_within_train_step": 2.6802446842193604, "step": 309} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 309} {"info/global_step": 310, "train_info/time_within_train_step": 2.6807844638824463, "step": 310} {"train_info/time_between_train_steps": 0.0034291744232177734, "step": 310} {"info/global_step": 311, "train_info/time_within_train_step": 2.6815004348754883, "step": 311} {"train_info/time_between_train_steps": 0.0033347606658935547, "step": 311} {"info/global_step": 312, "train_info/time_within_train_step": 2.6814873218536377, "step": 312} {"train_info/time_between_train_steps": 0.003531932830810547, "step": 312} {"info/global_step": 313, "train_info/time_within_train_step": 2.8110830783843994, "step": 313} {"train_info/time_between_train_steps": 0.003406047821044922, "step": 313} {"info/global_step": 314, "train_info/time_within_train_step": 2.731940746307373, "step": 314} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 314} {"info/global_step": 315, "train_info/time_within_train_step": 2.7301313877105713, "step": 315} {"train_info/time_between_train_steps": 0.0034508705139160156, "step": 315} {"info/global_step": 316, "train_info/time_within_train_step": 2.7886698246002197, "step": 316} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 316} {"info/global_step": 317, "train_info/time_within_train_step": 2.7768146991729736, "step": 317} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 317} {"info/global_step": 318, "train_info/time_within_train_step": 2.7063424587249756, "step": 318} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 318} {"info/global_step": 319, "train_info/time_within_train_step": 2.7186901569366455, "step": 319} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 319} {"info/global_step": 320, "train_info/time_within_train_step": 2.7330222129821777, "step": 320} {"train_info/time_between_train_steps": 0.0036001205444335938, "step": 320} {"info/global_step": 321, "train_info/time_within_train_step": 2.688812494277954, "step": 321} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 321} {"info/global_step": 322, "train_info/time_within_train_step": 2.732999324798584, "step": 322} {"train_info/time_between_train_steps": 0.00366973876953125, "step": 322} {"info/global_step": 323, "train_info/time_within_train_step": 2.7128257751464844, "step": 323} {"train_info/time_between_train_steps": 0.0035805702209472656, "step": 323} {"info/global_step": 324, "train_info/time_within_train_step": 2.7187023162841797, "step": 324} {"train_info/time_between_train_steps": 0.003564596176147461, "step": 324} {"info/global_step": 325, "train_info/time_within_train_step": 2.7194368839263916, "step": 325} {"train_info/time_between_train_steps": 0.003490447998046875, "step": 325} {"info/global_step": 326, "train_info/time_within_train_step": 2.695143938064575, "step": 326} {"train_info/time_between_train_steps": 0.003545522689819336, "step": 326} {"info/global_step": 327, "train_info/time_within_train_step": 2.7047228813171387, "step": 327} {"train_info/time_between_train_steps": 0.0034313201904296875, "step": 327} {"info/global_step": 328, "train_info/time_within_train_step": 2.733598232269287, "step": 328} {"train_info/time_between_train_steps": 0.003472566604614258, "step": 328} {"info/global_step": 329, "train_info/time_within_train_step": 2.7220985889434814, "step": 329} {"train_info/time_between_train_steps": 0.003507852554321289, "step": 329} {"info/global_step": 330, "train_info/time_within_train_step": 2.7085518836975098, "step": 330} {"train_info/time_between_train_steps": 0.0035119056701660156, "step": 330} {"info/global_step": 331, "train_info/time_within_train_step": 2.7069365978240967, "step": 331} {"train_info/time_between_train_steps": 0.0034978389739990234, "step": 331} {"info/global_step": 332, "train_info/time_within_train_step": 2.6899354457855225, "step": 332} {"train_info/time_between_train_steps": 0.003465414047241211, "step": 332} {"info/global_step": 333, "train_info/time_within_train_step": 2.722155809402466, "step": 333} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 333} {"info/global_step": 334, "train_info/time_within_train_step": 2.7035562992095947, "step": 334} {"train_info/time_between_train_steps": 0.0035097599029541016, "step": 334} {"info/global_step": 335, "train_info/time_within_train_step": 2.7140331268310547, "step": 335} {"train_info/time_between_train_steps": 0.0035724639892578125, "step": 335} {"info/global_step": 336, "train_info/time_within_train_step": 2.7128565311431885, "step": 336} {"train_info/time_between_train_steps": 0.003517627716064453, "step": 336} {"info/global_step": 337, "train_info/time_within_train_step": 2.710059404373169, "step": 337} {"train_info/time_between_train_steps": 0.0036051273345947266, "step": 337} {"info/global_step": 338, "train_info/time_within_train_step": 2.6828126907348633, "step": 338} {"train_info/time_between_train_steps": 0.0035400390625, "step": 338} {"info/global_step": 339, "train_info/time_within_train_step": 2.708526849746704, "step": 339} {"train_info/time_between_train_steps": 0.0035219192504882812, "step": 339} {"info/global_step": 340, "train_info/time_within_train_step": 2.705273151397705, "step": 340} {"train_info/time_between_train_steps": 0.003589153289794922, "step": 340} {"info/global_step": 341, "train_info/time_within_train_step": 2.7089385986328125, "step": 341} {"train_info/time_between_train_steps": 0.0035622119903564453, "step": 341} {"info/global_step": 342, "train_info/time_within_train_step": 2.7042417526245117, "step": 342} {"train_info/time_between_train_steps": 0.003572702407836914, "step": 342} {"info/global_step": 343, "train_info/time_within_train_step": 2.7021424770355225, "step": 343} {"train_info/time_between_train_steps": 0.0035445690155029297, "step": 343} {"info/global_step": 344, "train_info/time_within_train_step": 3.022218942642212, "step": 344} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 344} {"info/global_step": 345, "train_info/time_within_train_step": 2.684813976287842, "step": 345} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 345} {"info/global_step": 346, "train_info/time_within_train_step": 2.6844468116760254, "step": 346} {"train_info/time_between_train_steps": 0.0036411285400390625, "step": 346} {"info/global_step": 347, "train_info/time_within_train_step": 2.6829833984375, "step": 347} {"train_info/time_between_train_steps": 0.0036568641662597656, "step": 347} {"info/global_step": 348, "train_info/time_within_train_step": 2.6839194297790527, "step": 348} {"train_info/time_between_train_steps": 0.0035572052001953125, "step": 348} {"info/global_step": 349, "train_info/time_within_train_step": 2.699770927429199, "step": 349} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 349} {"info/global_step": 350, "train_info/time_within_train_step": 2.70680570602417, "step": 350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746312875, "_runtime": 1031}, "step": 350} {"logs": {"train/loss": 5.7894, "train/learning_rate": 0.0005888888888888889, "train/epoch": 0.12, "_timestamp": 1746312875, "_runtime": 1031}, "step": 350} {"train_info/time_between_train_steps": 0.025051355361938477, "step": 350} {"info/global_step": 351, "train_info/time_within_train_step": 2.702678680419922, "step": 351} {"train_info/time_between_train_steps": 0.0034513473510742188, "step": 351} {"info/global_step": 352, "train_info/time_within_train_step": 2.682830810546875, "step": 352} {"train_info/time_between_train_steps": 0.0036194324493408203, "step": 352} {"info/global_step": 353, "train_info/time_within_train_step": 2.6834371089935303, "step": 353} {"train_info/time_between_train_steps": 0.003479480743408203, "step": 353} {"info/global_step": 354, "train_info/time_within_train_step": 2.6865334510803223, "step": 354} {"train_info/time_between_train_steps": 0.003509998321533203, "step": 354} {"info/global_step": 355, "train_info/time_within_train_step": 2.702054023742676, "step": 355} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 355} {"info/global_step": 356, "train_info/time_within_train_step": 2.685427665710449, "step": 356} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 356} {"info/global_step": 357, "train_info/time_within_train_step": 2.694227695465088, "step": 357} {"train_info/time_between_train_steps": 0.0035881996154785156, "step": 357} {"info/global_step": 358, "train_info/time_within_train_step": 2.7116053104400635, "step": 358} {"train_info/time_between_train_steps": 0.0034508705139160156, "step": 358} {"info/global_step": 359, "train_info/time_within_train_step": 2.6919429302215576, "step": 359} {"train_info/time_between_train_steps": 0.003464221954345703, "step": 359} {"info/global_step": 360, "train_info/time_within_train_step": 2.692033529281616, "step": 360} {"train_info/time_between_train_steps": 0.003452777862548828, "step": 360} {"info/global_step": 361, "train_info/time_within_train_step": 2.6849100589752197, "step": 361} {"train_info/time_between_train_steps": 0.0036101341247558594, "step": 361} {"info/global_step": 362, "train_info/time_within_train_step": 2.712268829345703, "step": 362} {"train_info/time_between_train_steps": 0.0034918785095214844, "step": 362} {"info/global_step": 363, "train_info/time_within_train_step": 2.70028018951416, "step": 363} {"train_info/time_between_train_steps": 0.003587961196899414, "step": 363} {"info/global_step": 364, "train_info/time_within_train_step": 2.6916112899780273, "step": 364} {"train_info/time_between_train_steps": 0.0035736560821533203, "step": 364} {"info/global_step": 365, "train_info/time_within_train_step": 2.683861255645752, "step": 365} {"train_info/time_between_train_steps": 0.003535747528076172, "step": 365} {"info/global_step": 366, "train_info/time_within_train_step": 2.7084224224090576, "step": 366} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 366} {"info/global_step": 367, "train_info/time_within_train_step": 2.6878085136413574, "step": 367} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 367} {"info/global_step": 368, "train_info/time_within_train_step": 2.686361074447632, "step": 368} {"train_info/time_between_train_steps": 0.0034351348876953125, "step": 368} {"info/global_step": 369, "train_info/time_within_train_step": 2.689176321029663, "step": 369} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 369} {"info/global_step": 370, "train_info/time_within_train_step": 2.6818621158599854, "step": 370} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 370} {"info/global_step": 371, "train_info/time_within_train_step": 2.6824657917022705, "step": 371} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 371} {"info/global_step": 372, "train_info/time_within_train_step": 2.682590961456299, "step": 372} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 372} {"info/global_step": 373, "train_info/time_within_train_step": 2.6839423179626465, "step": 373} {"train_info/time_between_train_steps": 0.00327301025390625, "step": 373} {"info/global_step": 374, "train_info/time_within_train_step": 2.683218002319336, "step": 374} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 374} {"info/global_step": 375, "train_info/time_within_train_step": 2.682382106781006, "step": 375} {"train_info/time_between_train_steps": 0.13315844535827637, "step": 375} {"info/global_step": 376, "train_info/time_within_train_step": 2.6824536323547363, "step": 376} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 376} {"info/global_step": 377, "train_info/time_within_train_step": 2.6813583374023438, "step": 377} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 377} {"info/global_step": 378, "train_info/time_within_train_step": 2.692894220352173, "step": 378} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 378} {"info/global_step": 379, "train_info/time_within_train_step": 2.6809470653533936, "step": 379} {"train_info/time_between_train_steps": 0.0033783912658691406, "step": 379} {"info/global_step": 380, "train_info/time_within_train_step": 2.683802366256714, "step": 380} {"train_info/time_between_train_steps": 0.0035505294799804688, "step": 380} {"info/global_step": 381, "train_info/time_within_train_step": 2.684574842453003, "step": 381} {"train_info/time_between_train_steps": 0.003500699996948242, "step": 381} {"info/global_step": 382, "train_info/time_within_train_step": 2.9843943119049072, "step": 382} {"train_info/time_between_train_steps": 0.003489255905151367, "step": 382} {"info/global_step": 383, "train_info/time_within_train_step": 2.683298110961914, "step": 383} {"train_info/time_between_train_steps": 0.0034143924713134766, "step": 383} {"info/global_step": 384, "train_info/time_within_train_step": 2.688386917114258, "step": 384} {"train_info/time_between_train_steps": 0.0034143924713134766, "step": 384} {"info/global_step": 385, "train_info/time_within_train_step": 2.683570623397827, "step": 385} {"train_info/time_between_train_steps": 0.003428936004638672, "step": 385} {"info/global_step": 386, "train_info/time_within_train_step": 2.6823983192443848, "step": 386} {"train_info/time_between_train_steps": 0.0033712387084960938, "step": 386} {"info/global_step": 387, "train_info/time_within_train_step": 2.6830332279205322, "step": 387} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 387} {"info/global_step": 388, "train_info/time_within_train_step": 2.7069244384765625, "step": 388} {"train_info/time_between_train_steps": 0.0034978389739990234, "step": 388} {"info/global_step": 389, "train_info/time_within_train_step": 2.683378219604492, "step": 389} {"train_info/time_between_train_steps": 0.0036242008209228516, "step": 389} {"info/global_step": 390, "train_info/time_within_train_step": 2.683333396911621, "step": 390} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 390} {"info/global_step": 391, "train_info/time_within_train_step": 2.6824240684509277, "step": 391} {"train_info/time_between_train_steps": 0.003431081771850586, "step": 391} {"info/global_step": 392, "train_info/time_within_train_step": 2.6825108528137207, "step": 392} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 392} {"info/global_step": 393, "train_info/time_within_train_step": 2.6834983825683594, "step": 393} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 393} {"info/global_step": 394, "train_info/time_within_train_step": 2.6828248500823975, "step": 394} {"train_info/time_between_train_steps": 0.003347635269165039, "step": 394} {"info/global_step": 395, "train_info/time_within_train_step": 2.6829116344451904, "step": 395} {"train_info/time_between_train_steps": 0.003402233123779297, "step": 395} {"info/global_step": 396, "train_info/time_within_train_step": 2.6832287311553955, "step": 396} {"train_info/time_between_train_steps": 0.0035288333892822266, "step": 396} {"info/global_step": 397, "train_info/time_within_train_step": 2.682500123977661, "step": 397} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 397} {"info/global_step": 398, "train_info/time_within_train_step": 2.6876087188720703, "step": 398} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 398} {"info/global_step": 399, "train_info/time_within_train_step": 2.6828160285949707, "step": 399} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 399} {"info/global_step": 400, "train_info/time_within_train_step": 2.682687520980835, "step": 400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746313011, "_runtime": 1167}, "step": 400} {"logs": {"train/loss": 5.6661, "train/learning_rate": 0.0005777777777777776, "train/epoch": 0.13, "_timestamp": 1746313011, "_runtime": 1167}, "step": 400} {"train_info/time_between_train_steps": 13.187009811401367, "step": 400} {"info/global_step": 401, "train_info/time_within_train_step": 2.4696717262268066, "step": 401} {"train_info/time_between_train_steps": 0.0033774375915527344, "step": 401} {"info/global_step": 402, "train_info/time_within_train_step": 2.515638828277588, "step": 402} {"train_info/time_between_train_steps": 0.0036656856536865234, "step": 402} {"info/global_step": 403, "train_info/time_within_train_step": 2.678760528564453, "step": 403} {"train_info/time_between_train_steps": 0.003701448440551758, "step": 403} {"info/global_step": 404, "train_info/time_within_train_step": 2.679264783859253, "step": 404} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 404} {"info/global_step": 405, "train_info/time_within_train_step": 2.6802992820739746, "step": 405} {"train_info/time_between_train_steps": 0.003791332244873047, "step": 405} {"info/global_step": 406, "train_info/time_within_train_step": 2.6807470321655273, "step": 406} {"train_info/time_between_train_steps": 0.0035982131958007812, "step": 406} {"info/global_step": 407, "train_info/time_within_train_step": 2.681833267211914, "step": 407} {"train_info/time_between_train_steps": 0.003493070602416992, "step": 407} {"info/global_step": 408, "train_info/time_within_train_step": 2.681443929672241, "step": 408} {"train_info/time_between_train_steps": 0.0035686492919921875, "step": 408} {"info/global_step": 409, "train_info/time_within_train_step": 2.6806304454803467, "step": 409} {"train_info/time_between_train_steps": 0.003550291061401367, "step": 409} {"info/global_step": 410, "train_info/time_within_train_step": 2.681852340698242, "step": 410} {"train_info/time_between_train_steps": 0.0034868717193603516, "step": 410} {"info/global_step": 411, "train_info/time_within_train_step": 2.6815125942230225, "step": 411} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 411} {"info/global_step": 412, "train_info/time_within_train_step": 2.6814284324645996, "step": 412} {"train_info/time_between_train_steps": 0.0035276412963867188, "step": 412} {"info/global_step": 413, "train_info/time_within_train_step": 2.684828996658325, "step": 413} {"train_info/time_between_train_steps": 0.003761768341064453, "step": 413} {"info/global_step": 414, "train_info/time_within_train_step": 2.846806526184082, "step": 414} {"train_info/time_between_train_steps": 0.003583192825317383, "step": 414} {"info/global_step": 415, "train_info/time_within_train_step": 2.8410537242889404, "step": 415} {"train_info/time_between_train_steps": 0.003567934036254883, "step": 415} {"info/global_step": 416, "train_info/time_within_train_step": 2.7339625358581543, "step": 416} {"train_info/time_between_train_steps": 0.003639698028564453, "step": 416} {"info/global_step": 417, "train_info/time_within_train_step": 2.721428871154785, "step": 417} {"train_info/time_between_train_steps": 0.0034172534942626953, "step": 417} {"info/global_step": 418, "train_info/time_within_train_step": 2.7173640727996826, "step": 418} {"train_info/time_between_train_steps": 0.0034859180450439453, "step": 418} {"info/global_step": 419, "train_info/time_within_train_step": 2.7476420402526855, "step": 419} {"train_info/time_between_train_steps": 0.0036776065826416016, "step": 419} {"info/global_step": 420, "train_info/time_within_train_step": 2.7091474533081055, "step": 420} {"train_info/time_between_train_steps": 0.0034596920013427734, "step": 420} {"info/global_step": 421, "train_info/time_within_train_step": 2.7064208984375, "step": 421} {"train_info/time_between_train_steps": 0.0034499168395996094, "step": 421} {"info/global_step": 422, "train_info/time_within_train_step": 2.7386772632598877, "step": 422} {"train_info/time_between_train_steps": 0.0034766197204589844, "step": 422} {"info/global_step": 423, "train_info/time_within_train_step": 2.6947784423828125, "step": 423} {"train_info/time_between_train_steps": 0.003740072250366211, "step": 423} {"info/global_step": 424, "train_info/time_within_train_step": 2.717144250869751, "step": 424} {"train_info/time_between_train_steps": 0.0039052963256835938, "step": 424} {"info/global_step": 425, "train_info/time_within_train_step": 2.7256276607513428, "step": 425} {"train_info/time_between_train_steps": 0.0038154125213623047, "step": 425} {"info/global_step": 426, "train_info/time_within_train_step": 2.721473455429077, "step": 426} {"train_info/time_between_train_steps": 0.003791332244873047, "step": 426} {"info/global_step": 427, "train_info/time_within_train_step": 2.7233941555023193, "step": 427} {"train_info/time_between_train_steps": 0.003751039505004883, "step": 427} {"info/global_step": 428, "train_info/time_within_train_step": 2.688692569732666, "step": 428} {"train_info/time_between_train_steps": 0.0036487579345703125, "step": 428} {"info/global_step": 429, "train_info/time_within_train_step": 3.0214004516601562, "step": 429} {"train_info/time_between_train_steps": 0.0037856101989746094, "step": 429} {"info/global_step": 430, "train_info/time_within_train_step": 2.68562388420105, "step": 430} {"train_info/time_between_train_steps": 0.0035927295684814453, "step": 430} {"info/global_step": 431, "train_info/time_within_train_step": 2.684938430786133, "step": 431} {"train_info/time_between_train_steps": 0.0035805702209472656, "step": 431} {"info/global_step": 432, "train_info/time_within_train_step": 2.695936918258667, "step": 432} {"train_info/time_between_train_steps": 0.0034062862396240234, "step": 432} {"info/global_step": 433, "train_info/time_within_train_step": 2.702176332473755, "step": 433} {"train_info/time_between_train_steps": 0.0033354759216308594, "step": 433} {"info/global_step": 434, "train_info/time_within_train_step": 2.695389747619629, "step": 434} {"train_info/time_between_train_steps": 0.0033714771270751953, "step": 434} {"info/global_step": 435, "train_info/time_within_train_step": 2.724985122680664, "step": 435} {"train_info/time_between_train_steps": 0.0034677982330322266, "step": 435} {"info/global_step": 436, "train_info/time_within_train_step": 2.715233564376831, "step": 436} {"train_info/time_between_train_steps": 0.0034046173095703125, "step": 436} {"info/global_step": 437, "train_info/time_within_train_step": 2.703791618347168, "step": 437} {"train_info/time_between_train_steps": 0.0034782886505126953, "step": 437} {"info/global_step": 438, "train_info/time_within_train_step": 2.8283708095550537, "step": 438} {"train_info/time_between_train_steps": 0.0034055709838867188, "step": 438} {"info/global_step": 439, "train_info/time_within_train_step": 2.683915853500366, "step": 439} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 439} {"info/global_step": 440, "train_info/time_within_train_step": 2.7012596130371094, "step": 440} {"train_info/time_between_train_steps": 0.0035724639892578125, "step": 440} {"info/global_step": 441, "train_info/time_within_train_step": 2.6963508129119873, "step": 441} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 441} {"info/global_step": 442, "train_info/time_within_train_step": 2.6845388412475586, "step": 442} {"train_info/time_between_train_steps": 0.0036020278930664062, "step": 442} {"info/global_step": 443, "train_info/time_within_train_step": 2.7067275047302246, "step": 443} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 443} {"info/global_step": 444, "train_info/time_within_train_step": 2.7072205543518066, "step": 444} {"train_info/time_between_train_steps": 0.0033721923828125, "step": 444} {"info/global_step": 445, "train_info/time_within_train_step": 2.690321922302246, "step": 445} {"train_info/time_between_train_steps": 0.0033562183380126953, "step": 445} {"info/global_step": 446, "train_info/time_within_train_step": 2.7206854820251465, "step": 446} {"train_info/time_between_train_steps": 0.003618955612182617, "step": 446} {"info/global_step": 447, "train_info/time_within_train_step": 2.6852142810821533, "step": 447} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 447} {"info/global_step": 448, "train_info/time_within_train_step": 2.6938538551330566, "step": 448} {"train_info/time_between_train_steps": 0.0035750865936279297, "step": 448} {"info/global_step": 449, "train_info/time_within_train_step": 2.713351011276245, "step": 449} {"train_info/time_between_train_steps": 0.0035398006439208984, "step": 449} {"info/global_step": 450, "train_info/time_within_train_step": 2.681309223175049, "step": 450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746313161, "_runtime": 1317}, "step": 450} {"logs": {"train/loss": 5.5614, "train/learning_rate": 0.0005666666666666666, "train/epoch": 0.15, "_timestamp": 1746313161, "_runtime": 1317}, "step": 450} {"train_info/time_between_train_steps": 0.023989200592041016, "step": 450} {"info/global_step": 451, "train_info/time_within_train_step": 2.68213152885437, "step": 451} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 451} {"info/global_step": 452, "train_info/time_within_train_step": 2.690548896789551, "step": 452} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 452} {"info/global_step": 453, "train_info/time_within_train_step": 2.701108455657959, "step": 453} {"train_info/time_between_train_steps": 0.0032575130462646484, "step": 453} {"info/global_step": 454, "train_info/time_within_train_step": 2.7040891647338867, "step": 454} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 454} {"info/global_step": 455, "train_info/time_within_train_step": 2.683777332305908, "step": 455} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 455} {"info/global_step": 456, "train_info/time_within_train_step": 2.7112677097320557, "step": 456} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 456} {"info/global_step": 457, "train_info/time_within_train_step": 2.7054803371429443, "step": 457} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 457} {"info/global_step": 458, "train_info/time_within_train_step": 2.6844117641448975, "step": 458} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 458} {"info/global_step": 459, "train_info/time_within_train_step": 2.6858582496643066, "step": 459} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 459} {"info/global_step": 460, "train_info/time_within_train_step": 2.702507972717285, "step": 460} {"train_info/time_between_train_steps": 0.0034105777740478516, "step": 460} {"info/global_step": 461, "train_info/time_within_train_step": 2.6927895545959473, "step": 461} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 461} {"info/global_step": 462, "train_info/time_within_train_step": 2.6928458213806152, "step": 462} {"train_info/time_between_train_steps": 0.003450632095336914, "step": 462} {"info/global_step": 463, "train_info/time_within_train_step": 2.7071659564971924, "step": 463} {"train_info/time_between_train_steps": 0.003405332565307617, "step": 463} {"info/global_step": 464, "train_info/time_within_train_step": 2.6841468811035156, "step": 464} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 464} {"info/global_step": 465, "train_info/time_within_train_step": 2.6908750534057617, "step": 465} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 465} {"info/global_step": 466, "train_info/time_within_train_step": 2.6845552921295166, "step": 466} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 466} {"info/global_step": 467, "train_info/time_within_train_step": 2.6906814575195312, "step": 467} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 467} {"info/global_step": 468, "train_info/time_within_train_step": 2.709689140319824, "step": 468} {"train_info/time_between_train_steps": 0.0036177635192871094, "step": 468} {"info/global_step": 469, "train_info/time_within_train_step": 2.6851630210876465, "step": 469} {"train_info/time_between_train_steps": 0.003603219985961914, "step": 469} {"info/global_step": 470, "train_info/time_within_train_step": 2.685615062713623, "step": 470} {"train_info/time_between_train_steps": 0.003534555435180664, "step": 470} {"info/global_step": 471, "train_info/time_within_train_step": 2.686626672744751, "step": 471} {"train_info/time_between_train_steps": 0.0036995410919189453, "step": 471} {"info/global_step": 472, "train_info/time_within_train_step": 2.684842824935913, "step": 472} {"train_info/time_between_train_steps": 0.003742694854736328, "step": 472} {"info/global_step": 473, "train_info/time_within_train_step": 2.6863155364990234, "step": 473} {"train_info/time_between_train_steps": 0.0036835670471191406, "step": 473} {"info/global_step": 474, "train_info/time_within_train_step": 2.685750722885132, "step": 474} {"train_info/time_between_train_steps": 0.003538370132446289, "step": 474} {"info/global_step": 475, "train_info/time_within_train_step": 2.6830973625183105, "step": 475} {"train_info/time_between_train_steps": 0.0034627914428710938, "step": 475} {"info/global_step": 476, "train_info/time_within_train_step": 2.6840131282806396, "step": 476} {"train_info/time_between_train_steps": 0.00350189208984375, "step": 476} {"info/global_step": 477, "train_info/time_within_train_step": 2.6845805644989014, "step": 477} {"train_info/time_between_train_steps": 0.0034296512603759766, "step": 477} {"info/global_step": 478, "train_info/time_within_train_step": 2.68371844291687, "step": 478} {"train_info/time_between_train_steps": 0.0034804344177246094, "step": 478} {"info/global_step": 479, "train_info/time_within_train_step": 2.6830432415008545, "step": 479} {"train_info/time_between_train_steps": 0.0034189224243164062, "step": 479} {"info/global_step": 480, "train_info/time_within_train_step": 2.681920051574707, "step": 480} {"train_info/time_between_train_steps": 0.0034999847412109375, "step": 480} {"info/global_step": 481, "train_info/time_within_train_step": 2.6832380294799805, "step": 481} {"train_info/time_between_train_steps": 0.0035104751586914062, "step": 481} {"info/global_step": 482, "train_info/time_within_train_step": 2.68412709236145, "step": 482} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 482} {"info/global_step": 483, "train_info/time_within_train_step": 2.6821861267089844, "step": 483} {"train_info/time_between_train_steps": 0.003443002700805664, "step": 483} {"info/global_step": 484, "train_info/time_within_train_step": 2.683730125427246, "step": 484} {"train_info/time_between_train_steps": 0.0034809112548828125, "step": 484} {"info/global_step": 485, "train_info/time_within_train_step": 2.6823513507843018, "step": 485} {"train_info/time_between_train_steps": 0.003504514694213867, "step": 485} {"info/global_step": 486, "train_info/time_within_train_step": 2.683739185333252, "step": 486} {"train_info/time_between_train_steps": 0.0034744739532470703, "step": 486} {"info/global_step": 487, "train_info/time_within_train_step": 2.6834874153137207, "step": 487} {"train_info/time_between_train_steps": 0.0034928321838378906, "step": 487} {"info/global_step": 488, "train_info/time_within_train_step": 2.68315052986145, "step": 488} {"train_info/time_between_train_steps": 0.0034019947052001953, "step": 488} {"info/global_step": 489, "train_info/time_within_train_step": 2.684370994567871, "step": 489} {"train_info/time_between_train_steps": 0.003520488739013672, "step": 489} {"info/global_step": 490, "train_info/time_within_train_step": 2.6831014156341553, "step": 490} {"train_info/time_between_train_steps": 0.0034825801849365234, "step": 490} {"info/global_step": 491, "train_info/time_within_train_step": 2.683314323425293, "step": 491} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 491} {"info/global_step": 492, "train_info/time_within_train_step": 2.6843302249908447, "step": 492} {"train_info/time_between_train_steps": 0.0034542083740234375, "step": 492} {"info/global_step": 493, "train_info/time_within_train_step": 2.6837596893310547, "step": 493} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 493} {"info/global_step": 494, "train_info/time_within_train_step": 2.682854413986206, "step": 494} {"train_info/time_between_train_steps": 0.0033915042877197266, "step": 494} {"info/global_step": 495, "train_info/time_within_train_step": 2.683544158935547, "step": 495} {"train_info/time_between_train_steps": 0.0034325122833251953, "step": 495} {"info/global_step": 496, "train_info/time_within_train_step": 2.68347430229187, "step": 496} {"train_info/time_between_train_steps": 0.0035517215728759766, "step": 496} {"info/global_step": 497, "train_info/time_within_train_step": 2.683924674987793, "step": 497} {"train_info/time_between_train_steps": 0.003425121307373047, "step": 497} {"info/global_step": 498, "train_info/time_within_train_step": 2.683483600616455, "step": 498} {"train_info/time_between_train_steps": 0.0034890174865722656, "step": 498} {"info/global_step": 499, "train_info/time_within_train_step": 2.683837652206421, "step": 499} {"train_info/time_between_train_steps": 0.0035152435302734375, "step": 499} {"info/global_step": 500, "train_info/time_within_train_step": 3.2170186042785645, "step": 500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746313297, "_runtime": 1453}, "step": 500} {"logs": {"train/loss": 5.4909, "train/learning_rate": 0.0005555555555555556, "train/epoch": 0.17, "_timestamp": 1746313297, "_runtime": 1453}, "step": 500} {"train_info/time_between_train_steps": 13.257297277450562, "step": 500} {"info/global_step": 501, "train_info/time_within_train_step": 2.4876699447631836, "step": 501} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 501} {"info/global_step": 502, "train_info/time_within_train_step": 2.4960029125213623, "step": 502} {"train_info/time_between_train_steps": 0.0033233165740966797, "step": 502} {"info/global_step": 503, "train_info/time_within_train_step": 2.6797361373901367, "step": 503} {"train_info/time_between_train_steps": 0.0033385753631591797, "step": 503} {"info/global_step": 504, "train_info/time_within_train_step": 2.680206060409546, "step": 504} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 504} {"info/global_step": 505, "train_info/time_within_train_step": 2.6824729442596436, "step": 505} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 505} {"info/global_step": 506, "train_info/time_within_train_step": 2.681429386138916, "step": 506} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 506} {"info/global_step": 507, "train_info/time_within_train_step": 2.6817421913146973, "step": 507} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 507} {"info/global_step": 508, "train_info/time_within_train_step": 2.9473578929901123, "step": 508} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 508} {"info/global_step": 509, "train_info/time_within_train_step": 2.681849956512451, "step": 509} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 509} {"info/global_step": 510, "train_info/time_within_train_step": 2.6817378997802734, "step": 510} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 510} {"info/global_step": 511, "train_info/time_within_train_step": 2.684014081954956, "step": 511} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 511} {"info/global_step": 512, "train_info/time_within_train_step": 2.6829910278320312, "step": 512} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 512} {"info/global_step": 513, "train_info/time_within_train_step": 2.7135672569274902, "step": 513} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 513} {"info/global_step": 514, "train_info/time_within_train_step": 2.8892083168029785, "step": 514} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 514} {"info/global_step": 515, "train_info/time_within_train_step": 2.7744274139404297, "step": 515} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 515} {"info/global_step": 516, "train_info/time_within_train_step": 2.745964765548706, "step": 516} {"train_info/time_between_train_steps": 0.0037376880645751953, "step": 516} {"info/global_step": 517, "train_info/time_within_train_step": 2.712918519973755, "step": 517} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 517} {"info/global_step": 518, "train_info/time_within_train_step": 2.7268753051757812, "step": 518} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 518} {"info/global_step": 519, "train_info/time_within_train_step": 2.7614595890045166, "step": 519} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 519} {"info/global_step": 520, "train_info/time_within_train_step": 2.7058467864990234, "step": 520} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 520} {"info/global_step": 521, "train_info/time_within_train_step": 2.7062063217163086, "step": 521} {"train_info/time_between_train_steps": 0.0035247802734375, "step": 521} {"info/global_step": 522, "train_info/time_within_train_step": 2.7307610511779785, "step": 522} {"train_info/time_between_train_steps": 0.0033707618713378906, "step": 522} {"info/global_step": 523, "train_info/time_within_train_step": 2.728337287902832, "step": 523} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 523} {"info/global_step": 524, "train_info/time_within_train_step": 2.704833984375, "step": 524} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 524} {"info/global_step": 525, "train_info/time_within_train_step": 2.7435171604156494, "step": 525} {"train_info/time_between_train_steps": 0.0033507347106933594, "step": 525} {"info/global_step": 526, "train_info/time_within_train_step": 2.686688184738159, "step": 526} {"train_info/time_between_train_steps": 0.0033483505249023438, "step": 526} {"info/global_step": 527, "train_info/time_within_train_step": 2.7244279384613037, "step": 527} {"train_info/time_between_train_steps": 0.003352642059326172, "step": 527} {"info/global_step": 528, "train_info/time_within_train_step": 2.7338383197784424, "step": 528} {"train_info/time_between_train_steps": 0.003439188003540039, "step": 528} {"info/global_step": 529, "train_info/time_within_train_step": 2.6912248134613037, "step": 529} {"train_info/time_between_train_steps": 0.0034186840057373047, "step": 529} {"info/global_step": 530, "train_info/time_within_train_step": 2.7147815227508545, "step": 530} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 530} {"info/global_step": 531, "train_info/time_within_train_step": 2.7061803340911865, "step": 531} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 531} {"info/global_step": 532, "train_info/time_within_train_step": 2.7091856002807617, "step": 532} {"train_info/time_between_train_steps": 0.0034093856811523438, "step": 532} {"info/global_step": 533, "train_info/time_within_train_step": 2.7026185989379883, "step": 533} {"train_info/time_between_train_steps": 0.0033791065216064453, "step": 533} {"info/global_step": 534, "train_info/time_within_train_step": 2.7127676010131836, "step": 534} {"train_info/time_between_train_steps": 0.003393888473510742, "step": 534} {"info/global_step": 535, "train_info/time_within_train_step": 2.7055788040161133, "step": 535} {"train_info/time_between_train_steps": 0.0036470890045166016, "step": 535} {"info/global_step": 536, "train_info/time_within_train_step": 2.7121505737304688, "step": 536} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 536} {"info/global_step": 537, "train_info/time_within_train_step": 2.6947383880615234, "step": 537} {"train_info/time_between_train_steps": 0.0033767223358154297, "step": 537} {"info/global_step": 538, "train_info/time_within_train_step": 2.7142701148986816, "step": 538} {"train_info/time_between_train_steps": 0.003469705581665039, "step": 538} {"info/global_step": 539, "train_info/time_within_train_step": 2.70563006401062, "step": 539} {"train_info/time_between_train_steps": 0.003326416015625, "step": 539} {"info/global_step": 540, "train_info/time_within_train_step": 2.707777976989746, "step": 540} {"train_info/time_between_train_steps": 0.003328561782836914, "step": 540} {"info/global_step": 541, "train_info/time_within_train_step": 2.745025873184204, "step": 541} {"train_info/time_between_train_steps": 0.026518583297729492, "step": 541} {"info/global_step": 542, "train_info/time_within_train_step": 2.682694911956787, "step": 542} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 542} {"info/global_step": 543, "train_info/time_within_train_step": 2.7038931846618652, "step": 543} {"train_info/time_between_train_steps": 0.0030367374420166016, "step": 543} {"info/global_step": 544, "train_info/time_within_train_step": 2.6862945556640625, "step": 544} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 544} {"info/global_step": 545, "train_info/time_within_train_step": 2.7270023822784424, "step": 545} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 545} {"info/global_step": 546, "train_info/time_within_train_step": 2.9315011501312256, "step": 546} {"train_info/time_between_train_steps": 0.0030870437622070312, "step": 546} {"info/global_step": 547, "train_info/time_within_train_step": 2.682664155960083, "step": 547} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 547} {"info/global_step": 548, "train_info/time_within_train_step": 2.6825995445251465, "step": 548} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 548} {"info/global_step": 549, "train_info/time_within_train_step": 2.682081937789917, "step": 549} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 549} {"info/global_step": 550, "train_info/time_within_train_step": 2.681947946548462, "step": 550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746313447, "_runtime": 1603}, "step": 550} {"logs": {"train/loss": 5.4158, "train/learning_rate": 0.0005444444444444444, "train/epoch": 0.18, "_timestamp": 1746313447, "_runtime": 1603}, "step": 550} {"train_info/time_between_train_steps": 0.02494025230407715, "step": 550} {"info/global_step": 551, "train_info/time_within_train_step": 2.683459520339966, "step": 551} {"train_info/time_between_train_steps": 0.002966642379760742, "step": 551} {"info/global_step": 552, "train_info/time_within_train_step": 2.6935551166534424, "step": 552} {"train_info/time_between_train_steps": 0.002847909927368164, "step": 552} {"info/global_step": 553, "train_info/time_within_train_step": 2.713109016418457, "step": 553} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 553} {"info/global_step": 554, "train_info/time_within_train_step": 2.7009029388427734, "step": 554} {"train_info/time_between_train_steps": 0.0028417110443115234, "step": 554} {"info/global_step": 555, "train_info/time_within_train_step": 2.6892216205596924, "step": 555} {"train_info/time_between_train_steps": 0.0030236244201660156, "step": 555} {"info/global_step": 556, "train_info/time_within_train_step": 2.685537099838257, "step": 556} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 556} {"info/global_step": 557, "train_info/time_within_train_step": 2.695756673812866, "step": 557} {"train_info/time_between_train_steps": 0.003088712692260742, "step": 557} {"info/global_step": 558, "train_info/time_within_train_step": 2.6928818225860596, "step": 558} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 558} {"info/global_step": 559, "train_info/time_within_train_step": 2.693881034851074, "step": 559} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 559} {"info/global_step": 560, "train_info/time_within_train_step": 2.6993954181671143, "step": 560} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 560} {"info/global_step": 561, "train_info/time_within_train_step": 2.6841704845428467, "step": 561} {"train_info/time_between_train_steps": 0.0029337406158447266, "step": 561} {"info/global_step": 562, "train_info/time_within_train_step": 2.6871414184570312, "step": 562} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 562} {"info/global_step": 563, "train_info/time_within_train_step": 2.752511501312256, "step": 563} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 563} {"info/global_step": 564, "train_info/time_within_train_step": 2.6840968132019043, "step": 564} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 564} {"info/global_step": 565, "train_info/time_within_train_step": 2.6875858306884766, "step": 565} {"train_info/time_between_train_steps": 0.002972126007080078, "step": 565} {"info/global_step": 566, "train_info/time_within_train_step": 2.6829640865325928, "step": 566} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 566} {"info/global_step": 567, "train_info/time_within_train_step": 2.6995339393615723, "step": 567} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 567} {"info/global_step": 568, "train_info/time_within_train_step": 2.682291269302368, "step": 568} {"train_info/time_between_train_steps": 0.002944469451904297, "step": 568} {"info/global_step": 569, "train_info/time_within_train_step": 2.6825170516967773, "step": 569} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 569} {"info/global_step": 570, "train_info/time_within_train_step": 2.681720495223999, "step": 570} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 570} {"info/global_step": 571, "train_info/time_within_train_step": 2.689638137817383, "step": 571} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 571} {"info/global_step": 572, "train_info/time_within_train_step": 2.69738507270813, "step": 572} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 572} {"info/global_step": 573, "train_info/time_within_train_step": 2.6874942779541016, "step": 573} {"train_info/time_between_train_steps": 0.003509521484375, "step": 573} {"info/global_step": 574, "train_info/time_within_train_step": 2.6861681938171387, "step": 574} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 574} {"info/global_step": 575, "train_info/time_within_train_step": 2.6942381858825684, "step": 575} {"train_info/time_between_train_steps": 0.0029554367065429688, "step": 575} {"info/global_step": 576, "train_info/time_within_train_step": 2.6841700077056885, "step": 576} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 576} {"info/global_step": 577, "train_info/time_within_train_step": 2.682967185974121, "step": 577} {"train_info/time_between_train_steps": 0.0029168128967285156, "step": 577} {"info/global_step": 578, "train_info/time_within_train_step": 2.68342924118042, "step": 578} {"train_info/time_between_train_steps": 0.0029866695404052734, "step": 578} {"info/global_step": 579, "train_info/time_within_train_step": 2.683617353439331, "step": 579} {"train_info/time_between_train_steps": 0.003053426742553711, "step": 579} {"info/global_step": 580, "train_info/time_within_train_step": 2.6835622787475586, "step": 580} {"train_info/time_between_train_steps": 0.003008127212524414, "step": 580} {"info/global_step": 581, "train_info/time_within_train_step": 2.6826841831207275, "step": 581} {"train_info/time_between_train_steps": 0.0029802322387695312, "step": 581} {"info/global_step": 582, "train_info/time_within_train_step": 2.6830811500549316, "step": 582} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 582} {"info/global_step": 583, "train_info/time_within_train_step": 2.6833689212799072, "step": 583} {"train_info/time_between_train_steps": 0.002986431121826172, "step": 583} {"info/global_step": 584, "train_info/time_within_train_step": 2.681907892227173, "step": 584} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 584} {"info/global_step": 585, "train_info/time_within_train_step": 2.6822729110717773, "step": 585} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 585} {"info/global_step": 586, "train_info/time_within_train_step": 2.6812736988067627, "step": 586} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 586} {"info/global_step": 587, "train_info/time_within_train_step": 2.682286500930786, "step": 587} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 587} {"info/global_step": 588, "train_info/time_within_train_step": 2.6821889877319336, "step": 588} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 588} {"info/global_step": 589, "train_info/time_within_train_step": 2.6817851066589355, "step": 589} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 589} {"info/global_step": 590, "train_info/time_within_train_step": 2.6834049224853516, "step": 590} {"train_info/time_between_train_steps": 0.0029823780059814453, "step": 590} {"info/global_step": 591, "train_info/time_within_train_step": 2.682591438293457, "step": 591} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 591} {"info/global_step": 592, "train_info/time_within_train_step": 2.6822569370269775, "step": 592} {"train_info/time_between_train_steps": 0.0029740333557128906, "step": 592} {"info/global_step": 593, "train_info/time_within_train_step": 2.6818466186523438, "step": 593} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 593} {"info/global_step": 594, "train_info/time_within_train_step": 2.683103084564209, "step": 594} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 594} {"info/global_step": 595, "train_info/time_within_train_step": 2.6831142902374268, "step": 595} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 595} {"info/global_step": 596, "train_info/time_within_train_step": 2.6828699111938477, "step": 596} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 596} {"info/global_step": 597, "train_info/time_within_train_step": 2.682565927505493, "step": 597} {"train_info/time_between_train_steps": 0.0030341148376464844, "step": 597} {"info/global_step": 598, "train_info/time_within_train_step": 2.683588743209839, "step": 598} {"train_info/time_between_train_steps": 0.0029668807983398438, "step": 598} {"info/global_step": 599, "train_info/time_within_train_step": 2.681666851043701, "step": 599} {"train_info/time_between_train_steps": 0.0029795169830322266, "step": 599} {"info/global_step": 600, "train_info/time_within_train_step": 2.68200945854187, "step": 600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746313582, "_runtime": 1738}, "step": 600} {"logs": {"train/loss": 5.3499, "train/learning_rate": 0.0005333333333333333, "train/epoch": 0.2, "_timestamp": 1746313582, "_runtime": 1738}, "step": 600} {"train_info/time_between_train_steps": 13.071470022201538, "step": 600} {"info/global_step": 601, "train_info/time_within_train_step": 2.485992908477783, "step": 601} {"train_info/time_between_train_steps": 0.0029113292694091797, "step": 601} {"info/global_step": 602, "train_info/time_within_train_step": 2.541644811630249, "step": 602} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 602} {"info/global_step": 603, "train_info/time_within_train_step": 2.677135467529297, "step": 603} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 603} {"info/global_step": 604, "train_info/time_within_train_step": 2.6776974201202393, "step": 604} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 604} {"info/global_step": 605, "train_info/time_within_train_step": 2.68096923828125, "step": 605} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 605} {"info/global_step": 606, "train_info/time_within_train_step": 2.6799604892730713, "step": 606} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 606} {"info/global_step": 607, "train_info/time_within_train_step": 2.680145740509033, "step": 607} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 607} {"info/global_step": 608, "train_info/time_within_train_step": 2.680131435394287, "step": 608} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 608} {"info/global_step": 609, "train_info/time_within_train_step": 2.6833603382110596, "step": 609} {"train_info/time_between_train_steps": 0.0028867721557617188, "step": 609} {"info/global_step": 610, "train_info/time_within_train_step": 2.681596040725708, "step": 610} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 610} {"info/global_step": 611, "train_info/time_within_train_step": 2.682718515396118, "step": 611} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 611} {"info/global_step": 612, "train_info/time_within_train_step": 2.6820225715637207, "step": 612} {"train_info/time_between_train_steps": 0.002903461456298828, "step": 612} {"info/global_step": 613, "train_info/time_within_train_step": 2.719475030899048, "step": 613} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 613} {"info/global_step": 614, "train_info/time_within_train_step": 2.882146120071411, "step": 614} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 614} {"info/global_step": 615, "train_info/time_within_train_step": 2.816563367843628, "step": 615} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 615} {"info/global_step": 616, "train_info/time_within_train_step": 2.7773759365081787, "step": 616} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 616} {"info/global_step": 617, "train_info/time_within_train_step": 2.7075629234313965, "step": 617} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 617} {"info/global_step": 618, "train_info/time_within_train_step": 2.717772960662842, "step": 618} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 618} {"info/global_step": 619, "train_info/time_within_train_step": 2.8640384674072266, "step": 619} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 619} {"info/global_step": 620, "train_info/time_within_train_step": 2.7108659744262695, "step": 620} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 620} {"info/global_step": 621, "train_info/time_within_train_step": 2.7082505226135254, "step": 621} {"train_info/time_between_train_steps": 0.0028693675994873047, "step": 621} {"info/global_step": 622, "train_info/time_within_train_step": 2.7559971809387207, "step": 622} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 622} {"info/global_step": 623, "train_info/time_within_train_step": 2.6932730674743652, "step": 623} {"train_info/time_between_train_steps": 0.002963542938232422, "step": 623} {"info/global_step": 624, "train_info/time_within_train_step": 2.7213613986968994, "step": 624} {"train_info/time_between_train_steps": 0.003005504608154297, "step": 624} {"info/global_step": 625, "train_info/time_within_train_step": 2.709451675415039, "step": 625} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 625} {"info/global_step": 626, "train_info/time_within_train_step": 2.6997745037078857, "step": 626} {"train_info/time_between_train_steps": 0.002871990203857422, "step": 626} {"info/global_step": 627, "train_info/time_within_train_step": 2.7122018337249756, "step": 627} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 627} {"info/global_step": 628, "train_info/time_within_train_step": 2.716677665710449, "step": 628} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 628} {"info/global_step": 629, "train_info/time_within_train_step": 2.7045516967773438, "step": 629} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 629} {"info/global_step": 630, "train_info/time_within_train_step": 2.7038681507110596, "step": 630} {"train_info/time_between_train_steps": 0.0031232833862304688, "step": 630} {"info/global_step": 631, "train_info/time_within_train_step": 2.7194130420684814, "step": 631} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 631} {"info/global_step": 632, "train_info/time_within_train_step": 2.7127976417541504, "step": 632} {"train_info/time_between_train_steps": 0.0028362274169921875, "step": 632} {"info/global_step": 633, "train_info/time_within_train_step": 2.6998775005340576, "step": 633} {"train_info/time_between_train_steps": 0.003086566925048828, "step": 633} {"info/global_step": 634, "train_info/time_within_train_step": 2.709111213684082, "step": 634} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 634} {"info/global_step": 635, "train_info/time_within_train_step": 2.71368145942688, "step": 635} {"train_info/time_between_train_steps": 0.0028412342071533203, "step": 635} {"info/global_step": 636, "train_info/time_within_train_step": 2.7083516120910645, "step": 636} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 636} {"info/global_step": 637, "train_info/time_within_train_step": 2.7020883560180664, "step": 637} {"train_info/time_between_train_steps": 0.0028586387634277344, "step": 637} {"info/global_step": 638, "train_info/time_within_train_step": 2.698834180831909, "step": 638} {"train_info/time_between_train_steps": 0.0029668807983398438, "step": 638} {"info/global_step": 639, "train_info/time_within_train_step": 2.703594923019409, "step": 639} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 639} {"info/global_step": 640, "train_info/time_within_train_step": 2.7218198776245117, "step": 640} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 640} {"info/global_step": 641, "train_info/time_within_train_step": 2.693199634552002, "step": 641} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 641} {"info/global_step": 642, "train_info/time_within_train_step": 2.6992294788360596, "step": 642} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 642} {"info/global_step": 643, "train_info/time_within_train_step": 2.7063710689544678, "step": 643} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 643} {"info/global_step": 644, "train_info/time_within_train_step": 2.7198469638824463, "step": 644} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 644} {"info/global_step": 645, "train_info/time_within_train_step": 2.7101645469665527, "step": 645} {"train_info/time_between_train_steps": 0.002918720245361328, "step": 645} {"info/global_step": 646, "train_info/time_within_train_step": 2.706392765045166, "step": 646} {"train_info/time_between_train_steps": 0.002936124801635742, "step": 646} {"info/global_step": 647, "train_info/time_within_train_step": 2.6882266998291016, "step": 647} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 647} {"info/global_step": 648, "train_info/time_within_train_step": 2.702613115310669, "step": 648} {"train_info/time_between_train_steps": 0.002910614013671875, "step": 648} {"info/global_step": 649, "train_info/time_within_train_step": 2.7112107276916504, "step": 649} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 649} {"info/global_step": 650, "train_info/time_within_train_step": 2.681762218475342, "step": 650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746313732, "_runtime": 1888}, "step": 650} {"logs": {"train/loss": 5.2595, "train/learning_rate": 0.0005222222222222222, "train/epoch": 0.22, "_timestamp": 1746313732, "_runtime": 1888}, "step": 650} {"train_info/time_between_train_steps": 0.02452254295349121, "step": 650} {"info/global_step": 651, "train_info/time_within_train_step": 2.6814746856689453, "step": 651} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 651} {"info/global_step": 652, "train_info/time_within_train_step": 2.6944942474365234, "step": 652} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 652} {"info/global_step": 653, "train_info/time_within_train_step": 2.693350076675415, "step": 653} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 653} {"info/global_step": 654, "train_info/time_within_train_step": 2.68365478515625, "step": 654} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 654} {"info/global_step": 655, "train_info/time_within_train_step": 2.70932936668396, "step": 655} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 655} {"info/global_step": 656, "train_info/time_within_train_step": 2.700282573699951, "step": 656} {"train_info/time_between_train_steps": 0.0029168128967285156, "step": 656} {"info/global_step": 657, "train_info/time_within_train_step": 2.6830992698669434, "step": 657} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 657} {"info/global_step": 658, "train_info/time_within_train_step": 2.684058427810669, "step": 658} {"train_info/time_between_train_steps": 0.0028748512268066406, "step": 658} {"info/global_step": 659, "train_info/time_within_train_step": 2.701227903366089, "step": 659} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 659} {"info/global_step": 660, "train_info/time_within_train_step": 2.7030344009399414, "step": 660} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 660} {"info/global_step": 661, "train_info/time_within_train_step": 2.6901464462280273, "step": 661} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 661} {"info/global_step": 662, "train_info/time_within_train_step": 2.6958067417144775, "step": 662} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 662} {"info/global_step": 663, "train_info/time_within_train_step": 2.702880620956421, "step": 663} {"train_info/time_between_train_steps": 0.0029213428497314453, "step": 663} {"info/global_step": 664, "train_info/time_within_train_step": 2.6928582191467285, "step": 664} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 664} {"info/global_step": 665, "train_info/time_within_train_step": 2.682215929031372, "step": 665} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 665} {"info/global_step": 666, "train_info/time_within_train_step": 2.6810734272003174, "step": 666} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 666} {"info/global_step": 667, "train_info/time_within_train_step": 2.690727710723877, "step": 667} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 667} {"info/global_step": 668, "train_info/time_within_train_step": 2.695768356323242, "step": 668} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 668} {"info/global_step": 669, "train_info/time_within_train_step": 2.7449190616607666, "step": 669} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 669} {"info/global_step": 670, "train_info/time_within_train_step": 2.680748224258423, "step": 670} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 670} {"info/global_step": 671, "train_info/time_within_train_step": 2.6867830753326416, "step": 671} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 671} {"info/global_step": 672, "train_info/time_within_train_step": 2.682394027709961, "step": 672} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 672} {"info/global_step": 673, "train_info/time_within_train_step": 2.6905882358551025, "step": 673} {"train_info/time_between_train_steps": 0.0028867721557617188, "step": 673} {"info/global_step": 674, "train_info/time_within_train_step": 2.6807453632354736, "step": 674} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 674} {"info/global_step": 675, "train_info/time_within_train_step": 2.6819276809692383, "step": 675} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 675} {"info/global_step": 676, "train_info/time_within_train_step": 2.6947245597839355, "step": 676} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 676} {"info/global_step": 677, "train_info/time_within_train_step": 2.6886038780212402, "step": 677} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 677} {"info/global_step": 678, "train_info/time_within_train_step": 2.682252883911133, "step": 678} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 678} {"info/global_step": 679, "train_info/time_within_train_step": 2.6864709854125977, "step": 679} {"train_info/time_between_train_steps": 0.002869844436645508, "step": 679} {"info/global_step": 680, "train_info/time_within_train_step": 2.6823596954345703, "step": 680} {"train_info/time_between_train_steps": 0.0028743743896484375, "step": 680} {"info/global_step": 681, "train_info/time_within_train_step": 2.6815526485443115, "step": 681} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 681} {"info/global_step": 682, "train_info/time_within_train_step": 2.68272066116333, "step": 682} {"train_info/time_between_train_steps": 0.002863645553588867, "step": 682} {"info/global_step": 683, "train_info/time_within_train_step": 2.6827638149261475, "step": 683} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 683} {"info/global_step": 684, "train_info/time_within_train_step": 2.68280029296875, "step": 684} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 684} {"info/global_step": 685, "train_info/time_within_train_step": 2.6828737258911133, "step": 685} {"train_info/time_between_train_steps": 0.0029172897338867188, "step": 685} {"info/global_step": 686, "train_info/time_within_train_step": 2.6825685501098633, "step": 686} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 686} {"info/global_step": 687, "train_info/time_within_train_step": 2.68291974067688, "step": 687} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 687} {"info/global_step": 688, "train_info/time_within_train_step": 2.6827003955841064, "step": 688} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 688} {"info/global_step": 689, "train_info/time_within_train_step": 2.683549404144287, "step": 689} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 689} {"info/global_step": 690, "train_info/time_within_train_step": 2.682407855987549, "step": 690} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 690} {"info/global_step": 691, "train_info/time_within_train_step": 2.6831624507904053, "step": 691} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 691} {"info/global_step": 692, "train_info/time_within_train_step": 2.6828136444091797, "step": 692} {"train_info/time_between_train_steps": 0.0029449462890625, "step": 692} {"info/global_step": 693, "train_info/time_within_train_step": 2.6838459968566895, "step": 693} {"train_info/time_between_train_steps": 0.003047943115234375, "step": 693} {"info/global_step": 694, "train_info/time_within_train_step": 2.68222975730896, "step": 694} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 694} {"info/global_step": 695, "train_info/time_within_train_step": 2.6829848289489746, "step": 695} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 695} {"info/global_step": 696, "train_info/time_within_train_step": 2.6819515228271484, "step": 696} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 696} {"info/global_step": 697, "train_info/time_within_train_step": 2.6826624870300293, "step": 697} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 697} {"info/global_step": 698, "train_info/time_within_train_step": 2.680586814880371, "step": 698} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 698} {"info/global_step": 699, "train_info/time_within_train_step": 2.68178391456604, "step": 699} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 699} {"info/global_step": 700, "train_info/time_within_train_step": 2.682776689529419, "step": 700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746313868, "_runtime": 2024}, "step": 700} {"logs": {"train/loss": 5.1877, "train/learning_rate": 0.0005111111111111111, "train/epoch": 0.23, "_timestamp": 1746313868, "_runtime": 2024}, "step": 700} {"train_info/time_between_train_steps": 14.097192287445068, "step": 700} {"info/global_step": 701, "train_info/time_within_train_step": 2.5082085132598877, "step": 701} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 701} {"info/global_step": 702, "train_info/time_within_train_step": 2.5019145011901855, "step": 702} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 702} {"info/global_step": 703, "train_info/time_within_train_step": 2.680102825164795, "step": 703} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 703} {"info/global_step": 704, "train_info/time_within_train_step": 2.678605556488037, "step": 704} {"train_info/time_between_train_steps": 0.002931356430053711, "step": 704} {"info/global_step": 705, "train_info/time_within_train_step": 2.679884195327759, "step": 705} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 705} {"info/global_step": 706, "train_info/time_within_train_step": 2.679886817932129, "step": 706} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 706} {"info/global_step": 707, "train_info/time_within_train_step": 2.793133497238159, "step": 707} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 707} {"info/global_step": 708, "train_info/time_within_train_step": 2.6791248321533203, "step": 708} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 708} {"info/global_step": 709, "train_info/time_within_train_step": 2.6798107624053955, "step": 709} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 709} {"info/global_step": 710, "train_info/time_within_train_step": 2.679772138595581, "step": 710} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 710} {"info/global_step": 711, "train_info/time_within_train_step": 2.680436611175537, "step": 711} {"train_info/time_between_train_steps": 0.002956390380859375, "step": 711} {"info/global_step": 712, "train_info/time_within_train_step": 2.6796069145202637, "step": 712} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 712} {"info/global_step": 713, "train_info/time_within_train_step": 2.7214741706848145, "step": 713} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 713} {"info/global_step": 714, "train_info/time_within_train_step": 2.834320306777954, "step": 714} {"train_info/time_between_train_steps": 0.002939462661743164, "step": 714} {"info/global_step": 715, "train_info/time_within_train_step": 2.7656993865966797, "step": 715} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 715} {"info/global_step": 716, "train_info/time_within_train_step": 2.752859592437744, "step": 716} {"train_info/time_between_train_steps": 0.00296783447265625, "step": 716} {"info/global_step": 717, "train_info/time_within_train_step": 2.7216265201568604, "step": 717} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 717} {"info/global_step": 718, "train_info/time_within_train_step": 2.7381930351257324, "step": 718} {"train_info/time_between_train_steps": 0.002919912338256836, "step": 718} {"info/global_step": 719, "train_info/time_within_train_step": 2.754626750946045, "step": 719} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 719} {"info/global_step": 720, "train_info/time_within_train_step": 2.717982292175293, "step": 720} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 720} {"info/global_step": 721, "train_info/time_within_train_step": 2.6997692584991455, "step": 721} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 721} {"info/global_step": 722, "train_info/time_within_train_step": 2.712415933609009, "step": 722} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 722} {"info/global_step": 723, "train_info/time_within_train_step": 2.7364068031311035, "step": 723} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 723} {"info/global_step": 724, "train_info/time_within_train_step": 2.7217087745666504, "step": 724} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 724} {"info/global_step": 725, "train_info/time_within_train_step": 2.7029569149017334, "step": 725} {"train_info/time_between_train_steps": 0.002944469451904297, "step": 725} {"info/global_step": 726, "train_info/time_within_train_step": 2.702228546142578, "step": 726} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 726} {"info/global_step": 727, "train_info/time_within_train_step": 2.6932990550994873, "step": 727} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 727} {"info/global_step": 728, "train_info/time_within_train_step": 2.6824800968170166, "step": 728} {"train_info/time_between_train_steps": 0.00284576416015625, "step": 728} {"info/global_step": 729, "train_info/time_within_train_step": 2.7279844284057617, "step": 729} {"train_info/time_between_train_steps": 0.0030570030212402344, "step": 729} {"info/global_step": 730, "train_info/time_within_train_step": 2.712299108505249, "step": 730} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 730} {"info/global_step": 731, "train_info/time_within_train_step": 2.7086246013641357, "step": 731} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 731} {"info/global_step": 732, "train_info/time_within_train_step": 2.7185986042022705, "step": 732} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 732} {"info/global_step": 733, "train_info/time_within_train_step": 2.6879024505615234, "step": 733} {"train_info/time_between_train_steps": 0.002866983413696289, "step": 733} {"info/global_step": 734, "train_info/time_within_train_step": 2.7058377265930176, "step": 734} {"train_info/time_between_train_steps": 0.002875089645385742, "step": 734} {"info/global_step": 735, "train_info/time_within_train_step": 2.7080540657043457, "step": 735} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 735} {"info/global_step": 736, "train_info/time_within_train_step": 2.713078498840332, "step": 736} {"train_info/time_between_train_steps": 0.0030469894409179688, "step": 736} {"info/global_step": 737, "train_info/time_within_train_step": 2.7011892795562744, "step": 737} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 737} {"info/global_step": 738, "train_info/time_within_train_step": 2.7039687633514404, "step": 738} {"train_info/time_between_train_steps": 0.0036597251892089844, "step": 738} {"info/global_step": 739, "train_info/time_within_train_step": 2.7025887966156006, "step": 739} {"train_info/time_between_train_steps": 0.0028536319732666016, "step": 739} {"info/global_step": 740, "train_info/time_within_train_step": 2.706397533416748, "step": 740} {"train_info/time_between_train_steps": 0.003031015396118164, "step": 740} {"info/global_step": 741, "train_info/time_within_train_step": 2.706226348876953, "step": 741} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 741} {"info/global_step": 742, "train_info/time_within_train_step": 2.6834583282470703, "step": 742} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 742} {"info/global_step": 743, "train_info/time_within_train_step": 2.6967086791992188, "step": 743} {"train_info/time_between_train_steps": 0.003092050552368164, "step": 743} {"info/global_step": 744, "train_info/time_within_train_step": 2.7235732078552246, "step": 744} {"train_info/time_between_train_steps": 0.0031092166900634766, "step": 744} {"info/global_step": 745, "train_info/time_within_train_step": 2.837923049926758, "step": 745} {"train_info/time_between_train_steps": 0.0028748512268066406, "step": 745} {"info/global_step": 746, "train_info/time_within_train_step": 2.6898951530456543, "step": 746} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 746} {"info/global_step": 747, "train_info/time_within_train_step": 2.682093858718872, "step": 747} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 747} {"info/global_step": 748, "train_info/time_within_train_step": 2.6945347785949707, "step": 748} {"train_info/time_between_train_steps": 0.0030760765075683594, "step": 748} {"info/global_step": 749, "train_info/time_within_train_step": 2.724581480026245, "step": 749} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 749} {"info/global_step": 750, "train_info/time_within_train_step": 3.175031900405884, "step": 750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746314019, "_runtime": 2175}, "step": 750} {"logs": {"train/loss": 5.1092, "train/learning_rate": 0.0005, "train/epoch": 0.25, "_timestamp": 1746314019, "_runtime": 2175}, "step": 750} {"train_info/time_between_train_steps": 0.024426937103271484, "step": 750} {"info/global_step": 751, "train_info/time_within_train_step": 2.6806328296661377, "step": 751} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 751} {"info/global_step": 752, "train_info/time_within_train_step": 2.68174147605896, "step": 752} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 752} {"info/global_step": 753, "train_info/time_within_train_step": 2.6817264556884766, "step": 753} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 753} {"info/global_step": 754, "train_info/time_within_train_step": 2.682365655899048, "step": 754} {"train_info/time_between_train_steps": 0.0030410289764404297, "step": 754} {"info/global_step": 755, "train_info/time_within_train_step": 2.6810033321380615, "step": 755} {"train_info/time_between_train_steps": 0.0028548240661621094, "step": 755} {"info/global_step": 756, "train_info/time_within_train_step": 2.6815781593322754, "step": 756} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 756} {"info/global_step": 757, "train_info/time_within_train_step": 2.6823954582214355, "step": 757} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 757} {"info/global_step": 758, "train_info/time_within_train_step": 2.6828036308288574, "step": 758} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 758} {"info/global_step": 759, "train_info/time_within_train_step": 2.682384490966797, "step": 759} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 759} {"info/global_step": 760, "train_info/time_within_train_step": 2.6811342239379883, "step": 760} {"train_info/time_between_train_steps": 0.003081083297729492, "step": 760} {"info/global_step": 761, "train_info/time_within_train_step": 2.691012382507324, "step": 761} {"train_info/time_between_train_steps": 0.0028600692749023438, "step": 761} {"info/global_step": 762, "train_info/time_within_train_step": 2.6944315433502197, "step": 762} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 762} {"info/global_step": 763, "train_info/time_within_train_step": 2.704808235168457, "step": 763} {"train_info/time_between_train_steps": 0.003043651580810547, "step": 763} {"info/global_step": 764, "train_info/time_within_train_step": 2.688793897628784, "step": 764} {"train_info/time_between_train_steps": 0.0029468536376953125, "step": 764} {"info/global_step": 765, "train_info/time_within_train_step": 2.6826066970825195, "step": 765} {"train_info/time_between_train_steps": 0.002872943878173828, "step": 765} {"info/global_step": 766, "train_info/time_within_train_step": 2.684988498687744, "step": 766} {"train_info/time_between_train_steps": 0.002974271774291992, "step": 766} {"info/global_step": 767, "train_info/time_within_train_step": 2.7227585315704346, "step": 767} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 767} {"info/global_step": 768, "train_info/time_within_train_step": 2.7013328075408936, "step": 768} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 768} {"info/global_step": 769, "train_info/time_within_train_step": 2.681384801864624, "step": 769} {"train_info/time_between_train_steps": 0.0031011104583740234, "step": 769} {"info/global_step": 770, "train_info/time_within_train_step": 2.6825642585754395, "step": 770} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 770} {"info/global_step": 771, "train_info/time_within_train_step": 2.6826682090759277, "step": 771} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 771} {"info/global_step": 772, "train_info/time_within_train_step": 2.680878162384033, "step": 772} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 772} {"info/global_step": 773, "train_info/time_within_train_step": 2.681318759918213, "step": 773} {"train_info/time_between_train_steps": 0.003079652786254883, "step": 773} {"info/global_step": 774, "train_info/time_within_train_step": 2.6816651821136475, "step": 774} {"train_info/time_between_train_steps": 0.0028960704803466797, "step": 774} {"info/global_step": 775, "train_info/time_within_train_step": 2.6811933517456055, "step": 775} {"train_info/time_between_train_steps": 0.002931356430053711, "step": 775} {"info/global_step": 776, "train_info/time_within_train_step": 2.6807281970977783, "step": 776} {"train_info/time_between_train_steps": 0.0030815601348876953, "step": 776} {"info/global_step": 777, "train_info/time_within_train_step": 2.680483102798462, "step": 777} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 777} {"info/global_step": 778, "train_info/time_within_train_step": 2.68037748336792, "step": 778} {"train_info/time_between_train_steps": 0.002835512161254883, "step": 778} {"info/global_step": 779, "train_info/time_within_train_step": 2.681375741958618, "step": 779} {"train_info/time_between_train_steps": 0.0028886795043945312, "step": 779} {"info/global_step": 780, "train_info/time_within_train_step": 2.681546449661255, "step": 780} {"train_info/time_between_train_steps": 0.0028367042541503906, "step": 780} {"info/global_step": 781, "train_info/time_within_train_step": 2.681133985519409, "step": 781} {"train_info/time_between_train_steps": 0.0030410289764404297, "step": 781} {"info/global_step": 782, "train_info/time_within_train_step": 2.6799705028533936, "step": 782} {"train_info/time_between_train_steps": 0.003040790557861328, "step": 782} {"info/global_step": 783, "train_info/time_within_train_step": 2.681340217590332, "step": 783} {"train_info/time_between_train_steps": 0.0028705596923828125, "step": 783} {"info/global_step": 784, "train_info/time_within_train_step": 2.6818015575408936, "step": 784} {"train_info/time_between_train_steps": 0.0029528141021728516, "step": 784} {"info/global_step": 785, "train_info/time_within_train_step": 2.6829569339752197, "step": 785} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 785} {"info/global_step": 786, "train_info/time_within_train_step": 2.6822428703308105, "step": 786} {"train_info/time_between_train_steps": 0.003110170364379883, "step": 786} {"info/global_step": 787, "train_info/time_within_train_step": 2.6808409690856934, "step": 787} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 787} {"info/global_step": 788, "train_info/time_within_train_step": 2.680734634399414, "step": 788} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 788} {"info/global_step": 789, "train_info/time_within_train_step": 2.683297634124756, "step": 789} {"train_info/time_between_train_steps": 0.003095388412475586, "step": 789} {"info/global_step": 790, "train_info/time_within_train_step": 2.682750940322876, "step": 790} {"train_info/time_between_train_steps": 0.002947568893432617, "step": 790} {"info/global_step": 791, "train_info/time_within_train_step": 2.6831376552581787, "step": 791} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 791} {"info/global_step": 792, "train_info/time_within_train_step": 2.6823928356170654, "step": 792} {"train_info/time_between_train_steps": 0.002983570098876953, "step": 792} {"info/global_step": 793, "train_info/time_within_train_step": 2.683682918548584, "step": 793} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 793} {"info/global_step": 794, "train_info/time_within_train_step": 2.683535099029541, "step": 794} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 794} {"info/global_step": 795, "train_info/time_within_train_step": 2.682981014251709, "step": 795} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 795} {"info/global_step": 796, "train_info/time_within_train_step": 2.6820592880249023, "step": 796} {"train_info/time_between_train_steps": 0.0029740333557128906, "step": 796} {"info/global_step": 797, "train_info/time_within_train_step": 2.6820881366729736, "step": 797} {"train_info/time_between_train_steps": 0.002983570098876953, "step": 797} {"info/global_step": 798, "train_info/time_within_train_step": 2.682713747024536, "step": 798} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 798} {"info/global_step": 799, "train_info/time_within_train_step": 2.6815803050994873, "step": 799} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 799} {"info/global_step": 800, "train_info/time_within_train_step": 2.6822738647460938, "step": 800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746314154, "_runtime": 2310}, "step": 800} {"logs": {"train/loss": 5.0435, "train/learning_rate": 0.0004888888888888889, "train/epoch": 0.27, "_timestamp": 1746314154, "_runtime": 2310}, "step": 800} {"train_info/time_between_train_steps": 15.550905704498291, "step": 800} {"info/global_step": 801, "train_info/time_within_train_step": 2.4839529991149902, "step": 801} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 801} {"info/global_step": 802, "train_info/time_within_train_step": 2.4838225841522217, "step": 802} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 802} {"info/global_step": 803, "train_info/time_within_train_step": 2.6722519397735596, "step": 803} {"train_info/time_between_train_steps": 0.002966642379760742, "step": 803} {"info/global_step": 804, "train_info/time_within_train_step": 2.677910089492798, "step": 804} {"train_info/time_between_train_steps": 0.0029714107513427734, "step": 804} {"info/global_step": 805, "train_info/time_within_train_step": 2.6796162128448486, "step": 805} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 805} {"info/global_step": 806, "train_info/time_within_train_step": 2.7027323246002197, "step": 806} {"train_info/time_between_train_steps": 0.0030269622802734375, "step": 806} {"info/global_step": 807, "train_info/time_within_train_step": 2.6804633140563965, "step": 807} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 807} {"info/global_step": 808, "train_info/time_within_train_step": 2.682126998901367, "step": 808} {"train_info/time_between_train_steps": 0.003058910369873047, "step": 808} {"info/global_step": 809, "train_info/time_within_train_step": 2.6800732612609863, "step": 809} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 809} {"info/global_step": 810, "train_info/time_within_train_step": 2.6818690299987793, "step": 810} {"train_info/time_between_train_steps": 0.0030202865600585938, "step": 810} {"info/global_step": 811, "train_info/time_within_train_step": 2.691405773162842, "step": 811} {"train_info/time_between_train_steps": 0.0030469894409179688, "step": 811} {"info/global_step": 812, "train_info/time_within_train_step": 2.680948495864868, "step": 812} {"train_info/time_between_train_steps": 0.003052234649658203, "step": 812} {"info/global_step": 813, "train_info/time_within_train_step": 2.696096658706665, "step": 813} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 813} {"info/global_step": 814, "train_info/time_within_train_step": 2.85416579246521, "step": 814} {"train_info/time_between_train_steps": 0.0030913352966308594, "step": 814} {"info/global_step": 815, "train_info/time_within_train_step": 2.813891649246216, "step": 815} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 815} {"info/global_step": 816, "train_info/time_within_train_step": 2.7298061847686768, "step": 816} {"train_info/time_between_train_steps": 0.002880096435546875, "step": 816} {"info/global_step": 817, "train_info/time_within_train_step": 2.7102484703063965, "step": 817} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 817} {"info/global_step": 818, "train_info/time_within_train_step": 2.722543716430664, "step": 818} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 818} {"info/global_step": 819, "train_info/time_within_train_step": 2.72163987159729, "step": 819} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 819} {"info/global_step": 820, "train_info/time_within_train_step": 2.6987926959991455, "step": 820} {"train_info/time_between_train_steps": 0.003078937530517578, "step": 820} {"info/global_step": 821, "train_info/time_within_train_step": 2.7069942951202393, "step": 821} {"train_info/time_between_train_steps": 0.003094196319580078, "step": 821} {"info/global_step": 822, "train_info/time_within_train_step": 2.719754457473755, "step": 822} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 822} {"info/global_step": 823, "train_info/time_within_train_step": 2.6990928649902344, "step": 823} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 823} {"info/global_step": 824, "train_info/time_within_train_step": 2.688812732696533, "step": 824} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 824} {"info/global_step": 825, "train_info/time_within_train_step": 2.7442264556884766, "step": 825} {"train_info/time_between_train_steps": 0.003039836883544922, "step": 825} {"info/global_step": 826, "train_info/time_within_train_step": 2.70220685005188, "step": 826} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 826} {"info/global_step": 827, "train_info/time_within_train_step": 2.7105250358581543, "step": 827} {"train_info/time_between_train_steps": 0.0031211376190185547, "step": 827} {"info/global_step": 828, "train_info/time_within_train_step": 2.7302889823913574, "step": 828} {"train_info/time_between_train_steps": 0.002941131591796875, "step": 828} {"info/global_step": 829, "train_info/time_within_train_step": 2.6926534175872803, "step": 829} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 829} {"info/global_step": 830, "train_info/time_within_train_step": 2.7433791160583496, "step": 830} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 830} {"info/global_step": 831, "train_info/time_within_train_step": 2.742619514465332, "step": 831} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 831} {"info/global_step": 832, "train_info/time_within_train_step": 2.704807758331299, "step": 832} {"train_info/time_between_train_steps": 0.0031027793884277344, "step": 832} {"info/global_step": 833, "train_info/time_within_train_step": 2.698291778564453, "step": 833} {"train_info/time_between_train_steps": 0.0030510425567626953, "step": 833} {"info/global_step": 834, "train_info/time_within_train_step": 2.6939940452575684, "step": 834} {"train_info/time_between_train_steps": 0.0029468536376953125, "step": 834} {"info/global_step": 835, "train_info/time_within_train_step": 2.7485103607177734, "step": 835} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 835} {"info/global_step": 836, "train_info/time_within_train_step": 2.696894407272339, "step": 836} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 836} {"info/global_step": 837, "train_info/time_within_train_step": 2.7125163078308105, "step": 837} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 837} {"info/global_step": 838, "train_info/time_within_train_step": 2.7103469371795654, "step": 838} {"train_info/time_between_train_steps": 0.0030956268310546875, "step": 838} {"info/global_step": 839, "train_info/time_within_train_step": 2.691713571548462, "step": 839} {"train_info/time_between_train_steps": 0.003103971481323242, "step": 839} {"info/global_step": 840, "train_info/time_within_train_step": 2.685631036758423, "step": 840} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 840} {"info/global_step": 841, "train_info/time_within_train_step": 2.7096197605133057, "step": 841} {"train_info/time_between_train_steps": 0.0033524036407470703, "step": 841} {"info/global_step": 842, "train_info/time_within_train_step": 2.704284191131592, "step": 842} {"train_info/time_between_train_steps": 0.003108501434326172, "step": 842} {"info/global_step": 843, "train_info/time_within_train_step": 2.6950631141662598, "step": 843} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 843} {"info/global_step": 844, "train_info/time_within_train_step": 2.699955701828003, "step": 844} {"train_info/time_between_train_steps": 0.0035941600799560547, "step": 844} {"info/global_step": 845, "train_info/time_within_train_step": 2.701474905014038, "step": 845} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 845} {"info/global_step": 846, "train_info/time_within_train_step": 2.7079527378082275, "step": 846} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 846} {"info/global_step": 847, "train_info/time_within_train_step": 2.711054801940918, "step": 847} {"train_info/time_between_train_steps": 0.003269195556640625, "step": 847} {"info/global_step": 848, "train_info/time_within_train_step": 2.7002410888671875, "step": 848} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 848} {"info/global_step": 849, "train_info/time_within_train_step": 2.6915879249572754, "step": 849} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 849} {"info/global_step": 850, "train_info/time_within_train_step": 2.70654034614563, "step": 850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746314306, "_runtime": 2462}, "step": 850} {"logs": {"train/loss": 4.9746, "train/learning_rate": 0.0004777777777777777, "train/epoch": 0.28, "_timestamp": 1746314306, "_runtime": 2462}, "step": 850} {"train_info/time_between_train_steps": 0.025279998779296875, "step": 850} {"info/global_step": 851, "train_info/time_within_train_step": 2.702747344970703, "step": 851} {"train_info/time_between_train_steps": 0.003515958786010742, "step": 851} {"info/global_step": 852, "train_info/time_within_train_step": 2.684265375137329, "step": 852} {"train_info/time_between_train_steps": 0.003470897674560547, "step": 852} {"info/global_step": 853, "train_info/time_within_train_step": 2.7129032611846924, "step": 853} {"train_info/time_between_train_steps": 0.0035266876220703125, "step": 853} {"train_info/time_between_train_steps": 3.4276583194732666, "step": 853} {"info/global_step": 854, "train_info/time_within_train_step": 2.680428981781006, "step": 854} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 854} {"info/global_step": 855, "train_info/time_within_train_step": 2.681293487548828, "step": 855} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 855} {"info/global_step": 856, "train_info/time_within_train_step": 2.6811745166778564, "step": 856} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 856} {"info/global_step": 857, "train_info/time_within_train_step": 2.680980682373047, "step": 857} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 857} {"info/global_step": 858, "train_info/time_within_train_step": 2.6817710399627686, "step": 858} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 858} {"info/global_step": 859, "train_info/time_within_train_step": 2.680243492126465, "step": 859} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 859} {"info/global_step": 860, "train_info/time_within_train_step": 2.680565357208252, "step": 860} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 860} {"info/global_step": 861, "train_info/time_within_train_step": 2.681434392929077, "step": 861} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 861} {"info/global_step": 862, "train_info/time_within_train_step": 2.681036949157715, "step": 862} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 862} {"info/global_step": 863, "train_info/time_within_train_step": 2.6813535690307617, "step": 863} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 863} {"info/global_step": 864, "train_info/time_within_train_step": 2.6814165115356445, "step": 864} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 864} {"info/global_step": 865, "train_info/time_within_train_step": 2.6817638874053955, "step": 865} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 865} {"info/global_step": 866, "train_info/time_within_train_step": 2.682469129562378, "step": 866} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 866} {"info/global_step": 867, "train_info/time_within_train_step": 2.68137788772583, "step": 867} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 867} {"info/global_step": 868, "train_info/time_within_train_step": 2.6819894313812256, "step": 868} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 868} {"info/global_step": 869, "train_info/time_within_train_step": 2.6817967891693115, "step": 869} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 869} {"info/global_step": 870, "train_info/time_within_train_step": 2.6831324100494385, "step": 870} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 870} {"info/global_step": 871, "train_info/time_within_train_step": 2.7054977416992188, "step": 871} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 871} {"info/global_step": 872, "train_info/time_within_train_step": 2.683331251144409, "step": 872} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 872} {"info/global_step": 873, "train_info/time_within_train_step": 2.681795597076416, "step": 873} {"train_info/time_between_train_steps": 0.0033795833587646484, "step": 873} {"info/global_step": 874, "train_info/time_within_train_step": 2.6807315349578857, "step": 874} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 874} {"info/global_step": 875, "train_info/time_within_train_step": 2.6808390617370605, "step": 875} {"train_info/time_between_train_steps": 0.0033600330352783203, "step": 875} {"info/global_step": 876, "train_info/time_within_train_step": 2.681183099746704, "step": 876} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 876} {"info/global_step": 877, "train_info/time_within_train_step": 2.6804354190826416, "step": 877} {"train_info/time_between_train_steps": 0.0033915042877197266, "step": 877} {"info/global_step": 878, "train_info/time_within_train_step": 2.681051254272461, "step": 878} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 878} {"info/global_step": 879, "train_info/time_within_train_step": 2.681563138961792, "step": 879} {"train_info/time_between_train_steps": 0.0033659934997558594, "step": 879} {"info/global_step": 880, "train_info/time_within_train_step": 2.682791233062744, "step": 880} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 880} {"info/global_step": 881, "train_info/time_within_train_step": 2.6818604469299316, "step": 881} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 881} {"info/global_step": 882, "train_info/time_within_train_step": 2.682420253753662, "step": 882} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 882} {"info/global_step": 883, "train_info/time_within_train_step": 2.6821889877319336, "step": 883} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 883} {"info/global_step": 884, "train_info/time_within_train_step": 2.6816656589508057, "step": 884} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 884} {"info/global_step": 885, "train_info/time_within_train_step": 2.682684898376465, "step": 885} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 885} {"info/global_step": 886, "train_info/time_within_train_step": 2.6820993423461914, "step": 886} {"train_info/time_between_train_steps": 0.003120899200439453, "step": 886} {"info/global_step": 887, "train_info/time_within_train_step": 2.682509183883667, "step": 887} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 887} {"info/global_step": 888, "train_info/time_within_train_step": 2.682323694229126, "step": 888} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 888} {"info/global_step": 889, "train_info/time_within_train_step": 2.6815924644470215, "step": 889} {"train_info/time_between_train_steps": 0.003387451171875, "step": 889} {"info/global_step": 890, "train_info/time_within_train_step": 2.6814627647399902, "step": 890} {"train_info/time_between_train_steps": 0.0037767887115478516, "step": 890} {"info/global_step": 891, "train_info/time_within_train_step": 2.681910514831543, "step": 891} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 891} {"info/global_step": 892, "train_info/time_within_train_step": 2.682058095932007, "step": 892} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 892} {"info/global_step": 893, "train_info/time_within_train_step": 2.681830883026123, "step": 893} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 893} {"info/global_step": 894, "train_info/time_within_train_step": 2.682236909866333, "step": 894} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 894} {"info/global_step": 895, "train_info/time_within_train_step": 2.682871103286743, "step": 895} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 895} {"info/global_step": 896, "train_info/time_within_train_step": 2.681814432144165, "step": 896} {"train_info/time_between_train_steps": 0.003359079360961914, "step": 896} {"info/global_step": 897, "train_info/time_within_train_step": 2.6809184551239014, "step": 897} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 897} {"info/global_step": 898, "train_info/time_within_train_step": 2.682756185531616, "step": 898} {"train_info/time_between_train_steps": 0.0033600330352783203, "step": 898} {"info/global_step": 899, "train_info/time_within_train_step": 2.6817126274108887, "step": 899} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 899} {"info/global_step": 900, "train_info/time_within_train_step": 2.6808221340179443, "step": 900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746314444, "_runtime": 2600}, "step": 900} {"logs": {"train/loss": 4.9723, "train/learning_rate": 0.0004666666666666666, "train/epoch": 1.02, "_timestamp": 1746314444, "_runtime": 2600}, "step": 900} {"train_info/time_between_train_steps": 14.357206106185913, "step": 900} {"info/global_step": 901, "train_info/time_within_train_step": 2.4778950214385986, "step": 901} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 901} {"info/global_step": 902, "train_info/time_within_train_step": 2.4924092292785645, "step": 902} {"train_info/time_between_train_steps": 0.0031075477600097656, "step": 902} {"info/global_step": 903, "train_info/time_within_train_step": 2.6762101650238037, "step": 903} {"train_info/time_between_train_steps": 0.003093719482421875, "step": 903} {"info/global_step": 904, "train_info/time_within_train_step": 2.677027702331543, "step": 904} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 904} {"info/global_step": 905, "train_info/time_within_train_step": 2.6781299114227295, "step": 905} {"train_info/time_between_train_steps": 0.003272533416748047, "step": 905} {"info/global_step": 906, "train_info/time_within_train_step": 2.684131622314453, "step": 906} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 906} {"info/global_step": 907, "train_info/time_within_train_step": 2.67989444732666, "step": 907} {"train_info/time_between_train_steps": 0.0031080245971679688, "step": 907} {"info/global_step": 908, "train_info/time_within_train_step": 2.6793406009674072, "step": 908} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 908} {"info/global_step": 909, "train_info/time_within_train_step": 2.6804404258728027, "step": 909} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 909} {"info/global_step": 910, "train_info/time_within_train_step": 2.680166244506836, "step": 910} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 910} {"info/global_step": 911, "train_info/time_within_train_step": 2.682067632675171, "step": 911} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 911} {"info/global_step": 912, "train_info/time_within_train_step": 2.6817281246185303, "step": 912} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 912} {"info/global_step": 913, "train_info/time_within_train_step": 2.7173330783843994, "step": 913} {"train_info/time_between_train_steps": 0.0033495426177978516, "step": 913} {"info/global_step": 914, "train_info/time_within_train_step": 2.814796209335327, "step": 914} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 914} {"info/global_step": 915, "train_info/time_within_train_step": 2.764676809310913, "step": 915} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 915} {"info/global_step": 916, "train_info/time_within_train_step": 2.8419833183288574, "step": 916} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 916} {"info/global_step": 917, "train_info/time_within_train_step": 2.7142412662506104, "step": 917} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 917} {"info/global_step": 918, "train_info/time_within_train_step": 2.9209423065185547, "step": 918} {"train_info/time_between_train_steps": 0.0034797191619873047, "step": 918} {"info/global_step": 919, "train_info/time_within_train_step": 2.6883609294891357, "step": 919} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 919} {"info/global_step": 920, "train_info/time_within_train_step": 2.697284698486328, "step": 920} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 920} {"info/global_step": 921, "train_info/time_within_train_step": 2.7157745361328125, "step": 921} {"train_info/time_between_train_steps": 0.0033495426177978516, "step": 921} {"info/global_step": 922, "train_info/time_within_train_step": 2.7207915782928467, "step": 922} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 922} {"info/global_step": 923, "train_info/time_within_train_step": 2.690756320953369, "step": 923} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 923} {"info/global_step": 924, "train_info/time_within_train_step": 2.693912982940674, "step": 924} {"train_info/time_between_train_steps": 0.003916501998901367, "step": 924} {"info/global_step": 925, "train_info/time_within_train_step": 2.7230372428894043, "step": 925} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 925} {"info/global_step": 926, "train_info/time_within_train_step": 2.713878631591797, "step": 926} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 926} {"info/global_step": 927, "train_info/time_within_train_step": 2.708066701889038, "step": 927} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 927} {"info/global_step": 928, "train_info/time_within_train_step": 2.7136106491088867, "step": 928} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 928} {"info/global_step": 929, "train_info/time_within_train_step": 2.6883885860443115, "step": 929} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 929} {"info/global_step": 930, "train_info/time_within_train_step": 2.6943719387054443, "step": 930} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 930} {"info/global_step": 931, "train_info/time_within_train_step": 2.7120437622070312, "step": 931} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 931} {"info/global_step": 932, "train_info/time_within_train_step": 2.7109904289245605, "step": 932} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 932} {"info/global_step": 933, "train_info/time_within_train_step": 2.6865251064300537, "step": 933} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 933} {"info/global_step": 934, "train_info/time_within_train_step": 2.713944911956787, "step": 934} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 934} {"info/global_step": 935, "train_info/time_within_train_step": 2.6993086338043213, "step": 935} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 935} {"info/global_step": 936, "train_info/time_within_train_step": 2.699814796447754, "step": 936} {"train_info/time_between_train_steps": 0.0031232833862304688, "step": 936} {"info/global_step": 937, "train_info/time_within_train_step": 2.71754789352417, "step": 937} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 937} {"info/global_step": 938, "train_info/time_within_train_step": 2.711024045944214, "step": 938} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 938} {"info/global_step": 939, "train_info/time_within_train_step": 2.6925768852233887, "step": 939} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 939} {"info/global_step": 940, "train_info/time_within_train_step": 2.7093071937561035, "step": 940} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 940} {"info/global_step": 941, "train_info/time_within_train_step": 2.7205488681793213, "step": 941} {"train_info/time_between_train_steps": 0.003114461898803711, "step": 941} {"info/global_step": 942, "train_info/time_within_train_step": 2.6822879314422607, "step": 942} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 942} {"info/global_step": 943, "train_info/time_within_train_step": 2.6942384243011475, "step": 943} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 943} {"info/global_step": 944, "train_info/time_within_train_step": 2.710228204727173, "step": 944} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 944} {"info/global_step": 945, "train_info/time_within_train_step": 2.684373140335083, "step": 945} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 945} {"info/global_step": 946, "train_info/time_within_train_step": 2.713505983352661, "step": 946} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 946} {"info/global_step": 947, "train_info/time_within_train_step": 2.691885232925415, "step": 947} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 947} {"info/global_step": 948, "train_info/time_within_train_step": 2.7068629264831543, "step": 948} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 948} {"info/global_step": 949, "train_info/time_within_train_step": 2.70487904548645, "step": 949} {"train_info/time_between_train_steps": 0.003396272659301758, "step": 949} {"info/global_step": 950, "train_info/time_within_train_step": 2.6944026947021484, "step": 950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746314595, "_runtime": 2751}, "step": 950} {"logs": {"train/loss": 4.8626, "train/learning_rate": 0.00045555555555555556, "train/epoch": 1.03, "_timestamp": 1746314595, "_runtime": 2751}, "step": 950} {"train_info/time_between_train_steps": 0.024641036987304688, "step": 950} {"info/global_step": 951, "train_info/time_within_train_step": 2.690859317779541, "step": 951} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 951} {"info/global_step": 952, "train_info/time_within_train_step": 2.6841654777526855, "step": 952} {"train_info/time_between_train_steps": 0.0034286975860595703, "step": 952} {"info/global_step": 953, "train_info/time_within_train_step": 2.683222532272339, "step": 953} {"train_info/time_between_train_steps": 0.003409147262573242, "step": 953} {"info/global_step": 954, "train_info/time_within_train_step": 2.700683116912842, "step": 954} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 954} {"info/global_step": 955, "train_info/time_within_train_step": 2.7032933235168457, "step": 955} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 955} {"info/global_step": 956, "train_info/time_within_train_step": 2.683845281600952, "step": 956} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 956} {"info/global_step": 957, "train_info/time_within_train_step": 2.9099388122558594, "step": 957} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 957} {"info/global_step": 958, "train_info/time_within_train_step": 2.683096170425415, "step": 958} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 958} {"info/global_step": 959, "train_info/time_within_train_step": 2.6920249462127686, "step": 959} {"train_info/time_between_train_steps": 0.00331878662109375, "step": 959} {"info/global_step": 960, "train_info/time_within_train_step": 2.6832680702209473, "step": 960} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 960} {"info/global_step": 961, "train_info/time_within_train_step": 2.6841931343078613, "step": 961} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 961} {"info/global_step": 962, "train_info/time_within_train_step": 2.6820693016052246, "step": 962} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 962} {"info/global_step": 963, "train_info/time_within_train_step": 2.682513475418091, "step": 963} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 963} {"info/global_step": 964, "train_info/time_within_train_step": 2.6833996772766113, "step": 964} {"train_info/time_between_train_steps": 0.003323793411254883, "step": 964} {"info/global_step": 965, "train_info/time_within_train_step": 2.6817753314971924, "step": 965} {"train_info/time_between_train_steps": 0.003367185592651367, "step": 965} {"info/global_step": 966, "train_info/time_within_train_step": 2.681872844696045, "step": 966} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 966} {"info/global_step": 967, "train_info/time_within_train_step": 2.682206153869629, "step": 967} {"train_info/time_between_train_steps": 0.0033884048461914062, "step": 967} {"info/global_step": 968, "train_info/time_within_train_step": 2.6831154823303223, "step": 968} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 968} {"info/global_step": 969, "train_info/time_within_train_step": 2.681915760040283, "step": 969} {"train_info/time_between_train_steps": 0.003265380859375, "step": 969} {"info/global_step": 970, "train_info/time_within_train_step": 2.682408571243286, "step": 970} {"train_info/time_between_train_steps": 0.003106355667114258, "step": 970} {"info/global_step": 971, "train_info/time_within_train_step": 2.6830554008483887, "step": 971} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 971} {"info/global_step": 972, "train_info/time_within_train_step": 2.681886672973633, "step": 972} {"train_info/time_between_train_steps": 0.0036516189575195312, "step": 972} {"info/global_step": 973, "train_info/time_within_train_step": 2.682739496231079, "step": 973} {"train_info/time_between_train_steps": 0.0033757686614990234, "step": 973} {"info/global_step": 974, "train_info/time_within_train_step": 2.682241201400757, "step": 974} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 974} {"info/global_step": 975, "train_info/time_within_train_step": 2.683702230453491, "step": 975} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 975} {"info/global_step": 976, "train_info/time_within_train_step": 2.684183359146118, "step": 976} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 976} {"info/global_step": 977, "train_info/time_within_train_step": 2.7050840854644775, "step": 977} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 977} {"info/global_step": 978, "train_info/time_within_train_step": 2.6817829608917236, "step": 978} {"train_info/time_between_train_steps": 0.12566280364990234, "step": 978} {"info/global_step": 979, "train_info/time_within_train_step": 2.6833114624023438, "step": 979} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 979} {"info/global_step": 980, "train_info/time_within_train_step": 2.6836047172546387, "step": 980} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 980} {"info/global_step": 981, "train_info/time_within_train_step": 2.6822009086608887, "step": 981} {"train_info/time_between_train_steps": 0.0032355785369873047, "step": 981} {"info/global_step": 982, "train_info/time_within_train_step": 2.6830475330352783, "step": 982} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 982} {"info/global_step": 983, "train_info/time_within_train_step": 2.6826565265655518, "step": 983} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 983} {"info/global_step": 984, "train_info/time_within_train_step": 2.6817595958709717, "step": 984} {"train_info/time_between_train_steps": 0.0033850669860839844, "step": 984} {"info/global_step": 985, "train_info/time_within_train_step": 2.6820032596588135, "step": 985} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 985} {"info/global_step": 986, "train_info/time_within_train_step": 2.682267665863037, "step": 986} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 986} {"info/global_step": 987, "train_info/time_within_train_step": 2.681135892868042, "step": 987} {"train_info/time_between_train_steps": 0.0033321380615234375, "step": 987} {"info/global_step": 988, "train_info/time_within_train_step": 2.6824452877044678, "step": 988} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 988} {"info/global_step": 989, "train_info/time_within_train_step": 2.682426691055298, "step": 989} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 989} {"info/global_step": 990, "train_info/time_within_train_step": 2.6835923194885254, "step": 990} {"train_info/time_between_train_steps": 0.0037190914154052734, "step": 990} {"info/global_step": 991, "train_info/time_within_train_step": 2.6827125549316406, "step": 991} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 991} {"info/global_step": 992, "train_info/time_within_train_step": 2.682676076889038, "step": 992} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 992} {"info/global_step": 993, "train_info/time_within_train_step": 2.6829185485839844, "step": 993} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 993} {"info/global_step": 994, "train_info/time_within_train_step": 2.6830332279205322, "step": 994} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 994} {"info/global_step": 995, "train_info/time_within_train_step": 2.6833784580230713, "step": 995} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 995} {"info/global_step": 996, "train_info/time_within_train_step": 2.683509349822998, "step": 996} {"train_info/time_between_train_steps": 0.0032913684844970703, "step": 996} {"info/global_step": 997, "train_info/time_within_train_step": 2.683581590652466, "step": 997} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 997} {"info/global_step": 998, "train_info/time_within_train_step": 2.682774066925049, "step": 998} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 998} {"info/global_step": 999, "train_info/time_within_train_step": 2.683692693710327, "step": 999} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 999} {"info/global_step": 1000, "train_info/time_within_train_step": 3.204343557357788, "step": 1000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746314732, "_runtime": 2888}, "step": 1000} {"logs": {"train/loss": 4.8166, "train/learning_rate": 0.00044444444444444436, "train/epoch": 1.05, "_timestamp": 1746314732, "_runtime": 2888}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746314737, "_runtime": 2893}, "step": 1000} {"logs": {"eval/loss": 5.194957256317139, "eval/runtime": 5.2722, "eval/samples_per_second": 36.038, "eval/steps_per_second": 1.138, "train/epoch": 1.05, "_timestamp": 1746314737, "_runtime": 2893}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746314737, "_runtime": 2893}, "step": 1000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 5.194957256317139, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 180.3604333630817, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.2722, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.038, "train/epoch": 1.05, "_timestamp": 1746314737, "_runtime": 2893}, "step": 1000} {"train_info/time_between_train_steps": 20.37800669670105, "step": 1000} {"info/global_step": 1001, "train_info/time_within_train_step": 2.47357439994812, "step": 1001} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1001} {"info/global_step": 1002, "train_info/time_within_train_step": 2.4958457946777344, "step": 1002} {"train_info/time_between_train_steps": 0.0039577484130859375, "step": 1002} {"info/global_step": 1003, "train_info/time_within_train_step": 2.6772098541259766, "step": 1003} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 1003} {"info/global_step": 1004, "train_info/time_within_train_step": 2.6870555877685547, "step": 1004} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 1004} {"info/global_step": 1005, "train_info/time_within_train_step": 2.6798317432403564, "step": 1005} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 1005} {"info/global_step": 1006, "train_info/time_within_train_step": 2.681694269180298, "step": 1006} {"train_info/time_between_train_steps": 0.0034902095794677734, "step": 1006} {"info/global_step": 1007, "train_info/time_within_train_step": 2.681654691696167, "step": 1007} {"train_info/time_between_train_steps": 0.0033745765686035156, "step": 1007} {"info/global_step": 1008, "train_info/time_within_train_step": 2.6820292472839355, "step": 1008} {"train_info/time_between_train_steps": 0.0032880306243896484, "step": 1008} {"info/global_step": 1009, "train_info/time_within_train_step": 2.681396484375, "step": 1009} {"train_info/time_between_train_steps": 0.0033915042877197266, "step": 1009} {"info/global_step": 1010, "train_info/time_within_train_step": 2.681823492050171, "step": 1010} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 1010} {"info/global_step": 1011, "train_info/time_within_train_step": 2.6827988624572754, "step": 1011} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 1011} {"info/global_step": 1012, "train_info/time_within_train_step": 2.6823041439056396, "step": 1012} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 1012} {"info/global_step": 1013, "train_info/time_within_train_step": 2.7089316844940186, "step": 1013} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 1013} {"info/global_step": 1014, "train_info/time_within_train_step": 2.7762348651885986, "step": 1014} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 1014} {"info/global_step": 1015, "train_info/time_within_train_step": 2.7729990482330322, "step": 1015} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 1015} {"info/global_step": 1016, "train_info/time_within_train_step": 2.751573324203491, "step": 1016} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 1016} {"info/global_step": 1017, "train_info/time_within_train_step": 2.7329609394073486, "step": 1017} {"train_info/time_between_train_steps": 0.003371000289916992, "step": 1017} {"info/global_step": 1018, "train_info/time_within_train_step": 2.7142090797424316, "step": 1018} {"train_info/time_between_train_steps": 0.0036172866821289062, "step": 1018} {"info/global_step": 1019, "train_info/time_within_train_step": 2.7363717555999756, "step": 1019} {"train_info/time_between_train_steps": 0.0035932064056396484, "step": 1019} {"info/global_step": 1020, "train_info/time_within_train_step": 2.7067556381225586, "step": 1020} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 1020} {"info/global_step": 1021, "train_info/time_within_train_step": 2.7051827907562256, "step": 1021} {"train_info/time_between_train_steps": 0.003816843032836914, "step": 1021} {"info/global_step": 1022, "train_info/time_within_train_step": 2.7136693000793457, "step": 1022} {"train_info/time_between_train_steps": 0.0034034252166748047, "step": 1022} {"info/global_step": 1023, "train_info/time_within_train_step": 2.7150511741638184, "step": 1023} {"train_info/time_between_train_steps": 0.0036613941192626953, "step": 1023} {"info/global_step": 1024, "train_info/time_within_train_step": 3.0297651290893555, "step": 1024} {"train_info/time_between_train_steps": 0.0033881664276123047, "step": 1024} {"info/global_step": 1025, "train_info/time_within_train_step": 2.685739517211914, "step": 1025} {"train_info/time_between_train_steps": 0.0034291744232177734, "step": 1025} {"info/global_step": 1026, "train_info/time_within_train_step": 2.684152364730835, "step": 1026} {"train_info/time_between_train_steps": 0.003628969192504883, "step": 1026} {"info/global_step": 1027, "train_info/time_within_train_step": 2.71221661567688, "step": 1027} {"train_info/time_between_train_steps": 0.003596067428588867, "step": 1027} {"info/global_step": 1028, "train_info/time_within_train_step": 2.71990704536438, "step": 1028} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 1028} {"info/global_step": 1029, "train_info/time_within_train_step": 2.7087833881378174, "step": 1029} {"train_info/time_between_train_steps": 0.003328084945678711, "step": 1029} {"info/global_step": 1030, "train_info/time_within_train_step": 2.717522144317627, "step": 1030} {"train_info/time_between_train_steps": 0.003568410873413086, "step": 1030} {"info/global_step": 1031, "train_info/time_within_train_step": 2.7054431438446045, "step": 1031} {"train_info/time_between_train_steps": 0.0035915374755859375, "step": 1031} {"info/global_step": 1032, "train_info/time_within_train_step": 2.6838808059692383, "step": 1032} {"train_info/time_between_train_steps": 0.0033872127532958984, "step": 1032} {"info/global_step": 1033, "train_info/time_within_train_step": 2.7161006927490234, "step": 1033} {"train_info/time_between_train_steps": 0.0034558773040771484, "step": 1033} {"info/global_step": 1034, "train_info/time_within_train_step": 2.713792085647583, "step": 1034} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 1034} {"info/global_step": 1035, "train_info/time_within_train_step": 2.694281578063965, "step": 1035} {"train_info/time_between_train_steps": 0.003508329391479492, "step": 1035} {"info/global_step": 1036, "train_info/time_within_train_step": 2.7173516750335693, "step": 1036} {"train_info/time_between_train_steps": 0.0035212039947509766, "step": 1036} {"info/global_step": 1037, "train_info/time_within_train_step": 2.70458722114563, "step": 1037} {"train_info/time_between_train_steps": 0.0035774707794189453, "step": 1037} {"info/global_step": 1038, "train_info/time_within_train_step": 2.7117719650268555, "step": 1038} {"train_info/time_between_train_steps": 0.0034945011138916016, "step": 1038} {"info/global_step": 1039, "train_info/time_within_train_step": 2.700476884841919, "step": 1039} {"train_info/time_between_train_steps": 0.003734588623046875, "step": 1039} {"info/global_step": 1040, "train_info/time_within_train_step": 2.706529378890991, "step": 1040} {"train_info/time_between_train_steps": 0.003509044647216797, "step": 1040} {"info/global_step": 1041, "train_info/time_within_train_step": 2.854771852493286, "step": 1041} {"train_info/time_between_train_steps": 0.0032854080200195312, "step": 1041} {"info/global_step": 1042, "train_info/time_within_train_step": 2.6863248348236084, "step": 1042} {"train_info/time_between_train_steps": 0.0035538673400878906, "step": 1042} {"info/global_step": 1043, "train_info/time_within_train_step": 2.7114198207855225, "step": 1043} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 1043} {"info/global_step": 1044, "train_info/time_within_train_step": 2.7446866035461426, "step": 1044} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 1044} {"info/global_step": 1045, "train_info/time_within_train_step": 2.689829111099243, "step": 1045} {"train_info/time_between_train_steps": 0.0039560794830322266, "step": 1045} {"info/global_step": 1046, "train_info/time_within_train_step": 2.696340322494507, "step": 1046} {"train_info/time_between_train_steps": 0.003259420394897461, "step": 1046} {"info/global_step": 1047, "train_info/time_within_train_step": 2.691908836364746, "step": 1047} {"train_info/time_between_train_steps": 0.0034492015838623047, "step": 1047} {"info/global_step": 1048, "train_info/time_within_train_step": 2.686025381088257, "step": 1048} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 1048} {"info/global_step": 1049, "train_info/time_within_train_step": 2.720693588256836, "step": 1049} {"train_info/time_between_train_steps": 0.003493785858154297, "step": 1049} {"info/global_step": 1050, "train_info/time_within_train_step": 2.7007410526275635, "step": 1050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746314888, "_runtime": 3044}, "step": 1050} {"logs": {"train/loss": 4.7761, "train/learning_rate": 0.0004333333333333333, "train/epoch": 1.07, "_timestamp": 1746314888, "_runtime": 3044}, "step": 1050} {"train_info/time_between_train_steps": 0.025368928909301758, "step": 1050} {"info/global_step": 1051, "train_info/time_within_train_step": 2.6836516857147217, "step": 1051} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 1051} {"info/global_step": 1052, "train_info/time_within_train_step": 2.702976703643799, "step": 1052} {"train_info/time_between_train_steps": 0.0032813549041748047, "step": 1052} {"info/global_step": 1053, "train_info/time_within_train_step": 2.7115418910980225, "step": 1053} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 1053} {"info/global_step": 1054, "train_info/time_within_train_step": 2.690519094467163, "step": 1054} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 1054} {"info/global_step": 1055, "train_info/time_within_train_step": 2.694244146347046, "step": 1055} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 1055} {"info/global_step": 1056, "train_info/time_within_train_step": 2.6949946880340576, "step": 1056} {"train_info/time_between_train_steps": 0.003477811813354492, "step": 1056} {"info/global_step": 1057, "train_info/time_within_train_step": 2.7054531574249268, "step": 1057} {"train_info/time_between_train_steps": 0.003416299819946289, "step": 1057} {"info/global_step": 1058, "train_info/time_within_train_step": 2.6836190223693848, "step": 1058} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 1058} {"info/global_step": 1059, "train_info/time_within_train_step": 2.697805643081665, "step": 1059} {"train_info/time_between_train_steps": 0.0033690929412841797, "step": 1059} {"info/global_step": 1060, "train_info/time_within_train_step": 2.704763412475586, "step": 1060} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 1060} {"info/global_step": 1061, "train_info/time_within_train_step": 2.6899428367614746, "step": 1061} {"train_info/time_between_train_steps": 0.003477811813354492, "step": 1061} {"info/global_step": 1062, "train_info/time_within_train_step": 2.6834022998809814, "step": 1062} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 1062} {"info/global_step": 1063, "train_info/time_within_train_step": 2.692314624786377, "step": 1063} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 1063} {"info/global_step": 1064, "train_info/time_within_train_step": 2.683704137802124, "step": 1064} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 1064} {"info/global_step": 1065, "train_info/time_within_train_step": 2.6837117671966553, "step": 1065} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 1065} {"info/global_step": 1066, "train_info/time_within_train_step": 2.684515953063965, "step": 1066} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 1066} {"info/global_step": 1067, "train_info/time_within_train_step": 2.6832385063171387, "step": 1067} {"train_info/time_between_train_steps": 0.003480672836303711, "step": 1067} {"info/global_step": 1068, "train_info/time_within_train_step": 2.6844747066497803, "step": 1068} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 1068} {"info/global_step": 1069, "train_info/time_within_train_step": 2.7042596340179443, "step": 1069} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 1069} {"info/global_step": 1070, "train_info/time_within_train_step": 2.6934680938720703, "step": 1070} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 1070} {"info/global_step": 1071, "train_info/time_within_train_step": 2.6849124431610107, "step": 1071} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 1071} {"info/global_step": 1072, "train_info/time_within_train_step": 2.6828269958496094, "step": 1072} {"train_info/time_between_train_steps": 0.003267526626586914, "step": 1072} {"info/global_step": 1073, "train_info/time_within_train_step": 2.6841492652893066, "step": 1073} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 1073} {"info/global_step": 1074, "train_info/time_within_train_step": 2.683678150177002, "step": 1074} {"train_info/time_between_train_steps": 0.0035080909729003906, "step": 1074} {"info/global_step": 1075, "train_info/time_within_train_step": 2.684262990951538, "step": 1075} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 1075} {"info/global_step": 1076, "train_info/time_within_train_step": 2.6837384700775146, "step": 1076} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 1076} {"info/global_step": 1077, "train_info/time_within_train_step": 2.942603588104248, "step": 1077} {"train_info/time_between_train_steps": 0.0034530162811279297, "step": 1077} {"info/global_step": 1078, "train_info/time_within_train_step": 2.6831507682800293, "step": 1078} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 1078} {"info/global_step": 1079, "train_info/time_within_train_step": 2.6830427646636963, "step": 1079} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1079} {"info/global_step": 1080, "train_info/time_within_train_step": 2.7074317932128906, "step": 1080} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 1080} {"info/global_step": 1081, "train_info/time_within_train_step": 2.683896541595459, "step": 1081} {"train_info/time_between_train_steps": 0.003282308578491211, "step": 1081} {"info/global_step": 1082, "train_info/time_within_train_step": 2.6840012073516846, "step": 1082} {"train_info/time_between_train_steps": 0.003255605697631836, "step": 1082} {"info/global_step": 1083, "train_info/time_within_train_step": 2.683609962463379, "step": 1083} {"train_info/time_between_train_steps": 0.003545045852661133, "step": 1083} {"info/global_step": 1084, "train_info/time_within_train_step": 2.6832151412963867, "step": 1084} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 1084} {"info/global_step": 1085, "train_info/time_within_train_step": 2.6837122440338135, "step": 1085} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 1085} {"info/global_step": 1086, "train_info/time_within_train_step": 2.6840896606445312, "step": 1086} {"train_info/time_between_train_steps": 0.0032930374145507812, "step": 1086} {"info/global_step": 1087, "train_info/time_within_train_step": 2.682802200317383, "step": 1087} {"train_info/time_between_train_steps": 0.0034837722778320312, "step": 1087} {"info/global_step": 1088, "train_info/time_within_train_step": 2.682899236679077, "step": 1088} {"train_info/time_between_train_steps": 0.0035867691040039062, "step": 1088} {"info/global_step": 1089, "train_info/time_within_train_step": 2.6873273849487305, "step": 1089} {"train_info/time_between_train_steps": 0.0035169124603271484, "step": 1089} {"info/global_step": 1090, "train_info/time_within_train_step": 2.6827211380004883, "step": 1090} {"train_info/time_between_train_steps": 0.003510713577270508, "step": 1090} {"info/global_step": 1091, "train_info/time_within_train_step": 2.6831793785095215, "step": 1091} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 1091} {"info/global_step": 1092, "train_info/time_within_train_step": 2.684903621673584, "step": 1092} {"train_info/time_between_train_steps": 0.0035467147827148438, "step": 1092} {"info/global_step": 1093, "train_info/time_within_train_step": 2.6827645301818848, "step": 1093} {"train_info/time_between_train_steps": 0.003291606903076172, "step": 1093} {"info/global_step": 1094, "train_info/time_within_train_step": 2.683427333831787, "step": 1094} {"train_info/time_between_train_steps": 0.003520488739013672, "step": 1094} {"info/global_step": 1095, "train_info/time_within_train_step": 2.6826231479644775, "step": 1095} {"train_info/time_between_train_steps": 0.003425121307373047, "step": 1095} {"info/global_step": 1096, "train_info/time_within_train_step": 2.6834001541137695, "step": 1096} {"train_info/time_between_train_steps": 0.0032525062561035156, "step": 1096} {"info/global_step": 1097, "train_info/time_within_train_step": 2.6871819496154785, "step": 1097} {"train_info/time_between_train_steps": 0.003462076187133789, "step": 1097} {"info/global_step": 1098, "train_info/time_within_train_step": 2.6835029125213623, "step": 1098} {"train_info/time_between_train_steps": 0.003634214401245117, "step": 1098} {"info/global_step": 1099, "train_info/time_within_train_step": 2.6834256649017334, "step": 1099} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 1099} {"info/global_step": 1100, "train_info/time_within_train_step": 2.6841089725494385, "step": 1100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746315024, "_runtime": 3180}, "step": 1100} {"logs": {"train/loss": 4.7231, "train/learning_rate": 0.0004222222222222222, "train/epoch": 1.08, "_timestamp": 1746315024, "_runtime": 3180}, "step": 1100} {"train_info/time_between_train_steps": 18.52305555343628, "step": 1100} {"info/global_step": 1101, "train_info/time_within_train_step": 2.4889211654663086, "step": 1101} {"train_info/time_between_train_steps": 0.0033435821533203125, "step": 1101} {"info/global_step": 1102, "train_info/time_within_train_step": 2.490827798843384, "step": 1102} {"train_info/time_between_train_steps": 0.0033037662506103516, "step": 1102} {"info/global_step": 1103, "train_info/time_within_train_step": 2.6762032508850098, "step": 1103} {"train_info/time_between_train_steps": 0.1484391689300537, "step": 1103} {"info/global_step": 1104, "train_info/time_within_train_step": 2.6803486347198486, "step": 1104} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 1104} {"info/global_step": 1105, "train_info/time_within_train_step": 2.682013988494873, "step": 1105} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 1105} {"info/global_step": 1106, "train_info/time_within_train_step": 2.6815178394317627, "step": 1106} {"train_info/time_between_train_steps": 0.0035746097564697266, "step": 1106} {"info/global_step": 1107, "train_info/time_within_train_step": 2.682363271713257, "step": 1107} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 1107} {"info/global_step": 1108, "train_info/time_within_train_step": 2.6832566261291504, "step": 1108} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 1108} {"info/global_step": 1109, "train_info/time_within_train_step": 2.683316469192505, "step": 1109} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 1109} {"info/global_step": 1110, "train_info/time_within_train_step": 2.683424711227417, "step": 1110} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 1110} {"info/global_step": 1111, "train_info/time_within_train_step": 2.684730052947998, "step": 1111} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 1111} {"info/global_step": 1112, "train_info/time_within_train_step": 2.684579372406006, "step": 1112} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 1112} {"info/global_step": 1113, "train_info/time_within_train_step": 2.6848790645599365, "step": 1113} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 1113} {"info/global_step": 1114, "train_info/time_within_train_step": 2.744237184524536, "step": 1114} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 1114} {"info/global_step": 1115, "train_info/time_within_train_step": 2.8765454292297363, "step": 1115} {"train_info/time_between_train_steps": 0.003503084182739258, "step": 1115} {"info/global_step": 1116, "train_info/time_within_train_step": 2.7806808948516846, "step": 1116} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 1116} {"info/global_step": 1117, "train_info/time_within_train_step": 2.7118685245513916, "step": 1117} {"train_info/time_between_train_steps": 0.0035369396209716797, "step": 1117} {"info/global_step": 1118, "train_info/time_within_train_step": 2.706549644470215, "step": 1118} {"train_info/time_between_train_steps": 0.0035729408264160156, "step": 1118} {"info/global_step": 1119, "train_info/time_within_train_step": 2.711533546447754, "step": 1119} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 1119} {"info/global_step": 1120, "train_info/time_within_train_step": 2.7178895473480225, "step": 1120} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 1120} {"info/global_step": 1121, "train_info/time_within_train_step": 2.7324514389038086, "step": 1121} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 1121} {"info/global_step": 1122, "train_info/time_within_train_step": 2.713860273361206, "step": 1122} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 1122} {"info/global_step": 1123, "train_info/time_within_train_step": 2.698268413543701, "step": 1123} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 1123} {"info/global_step": 1124, "train_info/time_within_train_step": 2.7279181480407715, "step": 1124} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 1124} {"info/global_step": 1125, "train_info/time_within_train_step": 2.727515935897827, "step": 1125} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 1125} {"info/global_step": 1126, "train_info/time_within_train_step": 2.6980888843536377, "step": 1126} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 1126} {"info/global_step": 1127, "train_info/time_within_train_step": 2.7067389488220215, "step": 1127} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 1127} {"info/global_step": 1128, "train_info/time_within_train_step": 2.717388153076172, "step": 1128} {"train_info/time_between_train_steps": 0.0032758712768554688, "step": 1128} {"info/global_step": 1129, "train_info/time_within_train_step": 2.7160916328430176, "step": 1129} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 1129} {"info/global_step": 1130, "train_info/time_within_train_step": 2.7008016109466553, "step": 1130} {"train_info/time_between_train_steps": 0.0032699108123779297, "step": 1130} {"info/global_step": 1131, "train_info/time_within_train_step": 2.708486318588257, "step": 1131} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 1131} {"info/global_step": 1132, "train_info/time_within_train_step": 2.7031960487365723, "step": 1132} {"train_info/time_between_train_steps": 0.0033173561096191406, "step": 1132} {"info/global_step": 1133, "train_info/time_within_train_step": 2.7075958251953125, "step": 1133} {"train_info/time_between_train_steps": 0.003323078155517578, "step": 1133} {"info/global_step": 1134, "train_info/time_within_train_step": 2.6895270347595215, "step": 1134} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 1134} {"info/global_step": 1135, "train_info/time_within_train_step": 2.7074379920959473, "step": 1135} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 1135} {"info/global_step": 1136, "train_info/time_within_train_step": 2.70639705657959, "step": 1136} {"train_info/time_between_train_steps": 0.0032689571380615234, "step": 1136} {"info/global_step": 1137, "train_info/time_within_train_step": 2.6938164234161377, "step": 1137} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 1137} {"info/global_step": 1138, "train_info/time_within_train_step": 2.69329833984375, "step": 1138} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 1138} {"info/global_step": 1139, "train_info/time_within_train_step": 2.6924712657928467, "step": 1139} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 1139} {"info/global_step": 1140, "train_info/time_within_train_step": 2.720080614089966, "step": 1140} {"train_info/time_between_train_steps": 0.0033898353576660156, "step": 1140} {"info/global_step": 1141, "train_info/time_within_train_step": 2.6909255981445312, "step": 1141} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 1141} {"info/global_step": 1142, "train_info/time_within_train_step": 2.7046186923980713, "step": 1142} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 1142} {"info/global_step": 1143, "train_info/time_within_train_step": 2.7114484310150146, "step": 1143} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 1143} {"info/global_step": 1144, "train_info/time_within_train_step": 2.686584711074829, "step": 1144} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 1144} {"info/global_step": 1145, "train_info/time_within_train_step": 2.69897198677063, "step": 1145} {"train_info/time_between_train_steps": 0.003549337387084961, "step": 1145} {"info/global_step": 1146, "train_info/time_within_train_step": 2.702197790145874, "step": 1146} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 1146} {"info/global_step": 1147, "train_info/time_within_train_step": 2.945970058441162, "step": 1147} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 1147} {"info/global_step": 1148, "train_info/time_within_train_step": 2.6860475540161133, "step": 1148} {"train_info/time_between_train_steps": 0.0033686161041259766, "step": 1148} {"info/global_step": 1149, "train_info/time_within_train_step": 2.6850087642669678, "step": 1149} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 1149} {"info/global_step": 1150, "train_info/time_within_train_step": 2.6845812797546387, "step": 1150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746315179, "_runtime": 3335}, "step": 1150} {"logs": {"train/loss": 4.6821, "train/learning_rate": 0.0004111111111111111, "train/epoch": 1.1, "_timestamp": 1746315179, "_runtime": 3335}, "step": 1150} {"train_info/time_between_train_steps": 0.02462005615234375, "step": 1150} {"info/global_step": 1151, "train_info/time_within_train_step": 2.685094118118286, "step": 1151} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 1151} {"info/global_step": 1152, "train_info/time_within_train_step": 2.684873580932617, "step": 1152} {"train_info/time_between_train_steps": 0.0034952163696289062, "step": 1152} {"info/global_step": 1153, "train_info/time_within_train_step": 2.6845149993896484, "step": 1153} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 1153} {"info/global_step": 1154, "train_info/time_within_train_step": 2.6852896213531494, "step": 1154} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 1154} {"info/global_step": 1155, "train_info/time_within_train_step": 2.6851751804351807, "step": 1155} {"train_info/time_between_train_steps": 0.0032854080200195312, "step": 1155} {"info/global_step": 1156, "train_info/time_within_train_step": 2.6849353313446045, "step": 1156} {"train_info/time_between_train_steps": 0.003445148468017578, "step": 1156} {"info/global_step": 1157, "train_info/time_within_train_step": 2.6850922107696533, "step": 1157} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 1157} {"info/global_step": 1158, "train_info/time_within_train_step": 2.6849241256713867, "step": 1158} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 1158} {"info/global_step": 1159, "train_info/time_within_train_step": 2.685081720352173, "step": 1159} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 1159} {"info/global_step": 1160, "train_info/time_within_train_step": 2.6844193935394287, "step": 1160} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 1160} {"info/global_step": 1161, "train_info/time_within_train_step": 2.684126853942871, "step": 1161} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 1161} {"info/global_step": 1162, "train_info/time_within_train_step": 2.6843831539154053, "step": 1162} {"train_info/time_between_train_steps": 0.0033469200134277344, "step": 1162} {"info/global_step": 1163, "train_info/time_within_train_step": 2.68414044380188, "step": 1163} {"train_info/time_between_train_steps": 0.003331422805786133, "step": 1163} {"info/global_step": 1164, "train_info/time_within_train_step": 2.6827638149261475, "step": 1164} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 1164} {"info/global_step": 1165, "train_info/time_within_train_step": 2.684030055999756, "step": 1165} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 1165} {"info/global_step": 1166, "train_info/time_within_train_step": 2.810209274291992, "step": 1166} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 1166} {"info/global_step": 1167, "train_info/time_within_train_step": 2.6842706203460693, "step": 1167} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1167} {"info/global_step": 1168, "train_info/time_within_train_step": 2.684035539627075, "step": 1168} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 1168} {"info/global_step": 1169, "train_info/time_within_train_step": 2.6848204135894775, "step": 1169} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 1169} {"info/global_step": 1170, "train_info/time_within_train_step": 2.7356276512145996, "step": 1170} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 1170} {"info/global_step": 1171, "train_info/time_within_train_step": 2.684382915496826, "step": 1171} {"train_info/time_between_train_steps": 0.0034360885620117188, "step": 1171} {"info/global_step": 1172, "train_info/time_within_train_step": 2.684734344482422, "step": 1172} {"train_info/time_between_train_steps": 0.0038077831268310547, "step": 1172} {"info/global_step": 1173, "train_info/time_within_train_step": 2.684319019317627, "step": 1173} {"train_info/time_between_train_steps": 0.0034575462341308594, "step": 1173} {"info/global_step": 1174, "train_info/time_within_train_step": 2.684687614440918, "step": 1174} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 1174} {"info/global_step": 1175, "train_info/time_within_train_step": 2.6834065914154053, "step": 1175} {"train_info/time_between_train_steps": 0.003503561019897461, "step": 1175} {"info/global_step": 1176, "train_info/time_within_train_step": 2.684892177581787, "step": 1176} {"train_info/time_between_train_steps": 0.0032651424407958984, "step": 1176} {"info/global_step": 1177, "train_info/time_within_train_step": 2.684292793273926, "step": 1177} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 1177} {"info/global_step": 1178, "train_info/time_within_train_step": 2.6840620040893555, "step": 1178} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 1178} {"info/global_step": 1179, "train_info/time_within_train_step": 2.683419942855835, "step": 1179} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 1179} {"info/global_step": 1180, "train_info/time_within_train_step": 2.683694839477539, "step": 1180} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 1180} {"info/global_step": 1181, "train_info/time_within_train_step": 2.6830408573150635, "step": 1181} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 1181} {"info/global_step": 1182, "train_info/time_within_train_step": 2.6835334300994873, "step": 1182} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 1182} {"info/global_step": 1183, "train_info/time_within_train_step": 2.683880090713501, "step": 1183} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 1183} {"info/global_step": 1184, "train_info/time_within_train_step": 2.7068839073181152, "step": 1184} {"train_info/time_between_train_steps": 0.0033168792724609375, "step": 1184} {"info/global_step": 1185, "train_info/time_within_train_step": 2.685905933380127, "step": 1185} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 1185} {"info/global_step": 1186, "train_info/time_within_train_step": 2.6840903759002686, "step": 1186} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 1186} {"info/global_step": 1187, "train_info/time_within_train_step": 2.6846935749053955, "step": 1187} {"train_info/time_between_train_steps": 0.0034546852111816406, "step": 1187} {"info/global_step": 1188, "train_info/time_within_train_step": 2.684938430786133, "step": 1188} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 1188} {"info/global_step": 1189, "train_info/time_within_train_step": 2.694704294204712, "step": 1189} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 1189} {"info/global_step": 1190, "train_info/time_within_train_step": 2.684964656829834, "step": 1190} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 1190} {"info/global_step": 1191, "train_info/time_within_train_step": 2.684546709060669, "step": 1191} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1191} {"info/global_step": 1192, "train_info/time_within_train_step": 2.6848666667938232, "step": 1192} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 1192} {"info/global_step": 1193, "train_info/time_within_train_step": 2.6840248107910156, "step": 1193} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 1193} {"info/global_step": 1194, "train_info/time_within_train_step": 2.6845762729644775, "step": 1194} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 1194} {"info/global_step": 1195, "train_info/time_within_train_step": 2.6838624477386475, "step": 1195} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 1195} {"info/global_step": 1196, "train_info/time_within_train_step": 2.6831696033477783, "step": 1196} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 1196} {"info/global_step": 1197, "train_info/time_within_train_step": 2.6834425926208496, "step": 1197} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 1197} {"info/global_step": 1198, "train_info/time_within_train_step": 2.6825361251831055, "step": 1198} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1198} {"info/global_step": 1199, "train_info/time_within_train_step": 2.6831939220428467, "step": 1199} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 1199} {"info/global_step": 1200, "train_info/time_within_train_step": 2.9399220943450928, "step": 1200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746315315, "_runtime": 3471}, "step": 1200} {"logs": {"train/loss": 4.6516, "train/learning_rate": 0.00039999999999999996, "train/epoch": 1.12, "_timestamp": 1746315315, "_runtime": 3471}, "step": 1200} {"train_info/time_between_train_steps": 18.432607650756836, "step": 1200} {"info/global_step": 1201, "train_info/time_within_train_step": 2.483076572418213, "step": 1201} {"train_info/time_between_train_steps": 0.003253459930419922, "step": 1201} {"info/global_step": 1202, "train_info/time_within_train_step": 2.469752788543701, "step": 1202} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 1202} {"info/global_step": 1203, "train_info/time_within_train_step": 2.660717725753784, "step": 1203} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 1203} {"info/global_step": 1204, "train_info/time_within_train_step": 2.681211471557617, "step": 1204} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 1204} {"info/global_step": 1205, "train_info/time_within_train_step": 2.682368755340576, "step": 1205} {"train_info/time_between_train_steps": 0.003231048583984375, "step": 1205} {"info/global_step": 1206, "train_info/time_within_train_step": 2.6843695640563965, "step": 1206} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 1206} {"info/global_step": 1207, "train_info/time_within_train_step": 2.6841237545013428, "step": 1207} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 1207} {"info/global_step": 1208, "train_info/time_within_train_step": 2.6831748485565186, "step": 1208} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 1208} {"info/global_step": 1209, "train_info/time_within_train_step": 2.683911085128784, "step": 1209} {"train_info/time_between_train_steps": 0.003435850143432617, "step": 1209} {"info/global_step": 1210, "train_info/time_within_train_step": 2.6832454204559326, "step": 1210} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 1210} {"info/global_step": 1211, "train_info/time_within_train_step": 2.683779001235962, "step": 1211} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1211} {"info/global_step": 1212, "train_info/time_within_train_step": 2.684105634689331, "step": 1212} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 1212} {"info/global_step": 1213, "train_info/time_within_train_step": 2.6862950325012207, "step": 1213} {"train_info/time_between_train_steps": 0.0034825801849365234, "step": 1213} {"info/global_step": 1214, "train_info/time_within_train_step": 2.795642614364624, "step": 1214} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 1214} {"info/global_step": 1215, "train_info/time_within_train_step": 2.745152235031128, "step": 1215} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 1215} {"info/global_step": 1216, "train_info/time_within_train_step": 2.736459493637085, "step": 1216} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1216} {"info/global_step": 1217, "train_info/time_within_train_step": 2.718080997467041, "step": 1217} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 1217} {"info/global_step": 1218, "train_info/time_within_train_step": 2.7271883487701416, "step": 1218} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 1218} {"info/global_step": 1219, "train_info/time_within_train_step": 2.715182065963745, "step": 1219} {"train_info/time_between_train_steps": 0.0032355785369873047, "step": 1219} {"info/global_step": 1220, "train_info/time_within_train_step": 2.7242443561553955, "step": 1220} {"train_info/time_between_train_steps": 0.003434419631958008, "step": 1220} {"info/global_step": 1221, "train_info/time_within_train_step": 2.7225515842437744, "step": 1221} {"train_info/time_between_train_steps": 0.003350973129272461, "step": 1221} {"info/global_step": 1222, "train_info/time_within_train_step": 2.693329334259033, "step": 1222} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1222} {"info/global_step": 1223, "train_info/time_within_train_step": 2.696028470993042, "step": 1223} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 1223} {"info/global_step": 1224, "train_info/time_within_train_step": 2.710122585296631, "step": 1224} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 1224} {"info/global_step": 1225, "train_info/time_within_train_step": 2.7245495319366455, "step": 1225} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 1225} {"info/global_step": 1226, "train_info/time_within_train_step": 2.716975450515747, "step": 1226} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 1226} {"info/global_step": 1227, "train_info/time_within_train_step": 2.7343828678131104, "step": 1227} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 1227} {"info/global_step": 1228, "train_info/time_within_train_step": 2.695478677749634, "step": 1228} {"train_info/time_between_train_steps": 0.13211464881896973, "step": 1228} {"info/global_step": 1229, "train_info/time_within_train_step": 2.68574595451355, "step": 1229} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 1229} {"info/global_step": 1230, "train_info/time_within_train_step": 2.68560791015625, "step": 1230} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 1230} {"info/global_step": 1231, "train_info/time_within_train_step": 2.7023568153381348, "step": 1231} {"train_info/time_between_train_steps": 0.003428936004638672, "step": 1231} {"info/global_step": 1232, "train_info/time_within_train_step": 2.704333782196045, "step": 1232} {"train_info/time_between_train_steps": 0.0034101009368896484, "step": 1232} {"info/global_step": 1233, "train_info/time_within_train_step": 2.690688371658325, "step": 1233} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 1233} {"info/global_step": 1234, "train_info/time_within_train_step": 2.7209155559539795, "step": 1234} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 1234} {"info/global_step": 1235, "train_info/time_within_train_step": 2.7355988025665283, "step": 1235} {"train_info/time_between_train_steps": 0.003388643264770508, "step": 1235} {"info/global_step": 1236, "train_info/time_within_train_step": 2.6896631717681885, "step": 1236} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 1236} {"info/global_step": 1237, "train_info/time_within_train_step": 2.7010560035705566, "step": 1237} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 1237} {"info/global_step": 1238, "train_info/time_within_train_step": 2.712367057800293, "step": 1238} {"train_info/time_between_train_steps": 0.003475666046142578, "step": 1238} {"info/global_step": 1239, "train_info/time_within_train_step": 2.7087273597717285, "step": 1239} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 1239} {"info/global_step": 1240, "train_info/time_within_train_step": 2.71366548538208, "step": 1240} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 1240} {"info/global_step": 1241, "train_info/time_within_train_step": 2.7000226974487305, "step": 1241} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 1241} {"info/global_step": 1242, "train_info/time_within_train_step": 2.6860239505767822, "step": 1242} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 1242} {"info/global_step": 1243, "train_info/time_within_train_step": 2.6839542388916016, "step": 1243} {"train_info/time_between_train_steps": 0.0033922195434570312, "step": 1243} {"info/global_step": 1244, "train_info/time_within_train_step": 2.700857400894165, "step": 1244} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 1244} {"info/global_step": 1245, "train_info/time_within_train_step": 2.6957690715789795, "step": 1245} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 1245} {"info/global_step": 1246, "train_info/time_within_train_step": 2.686771869659424, "step": 1246} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 1246} {"info/global_step": 1247, "train_info/time_within_train_step": 2.7075719833374023, "step": 1247} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 1247} {"info/global_step": 1248, "train_info/time_within_train_step": 2.692704916000366, "step": 1248} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 1248} {"info/global_step": 1249, "train_info/time_within_train_step": 2.6889266967773438, "step": 1249} {"train_info/time_between_train_steps": 0.0035064220428466797, "step": 1249} {"info/global_step": 1250, "train_info/time_within_train_step": 3.249206066131592, "step": 1250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746315470, "_runtime": 3626}, "step": 1250} {"logs": {"train/loss": 4.6196, "train/learning_rate": 0.00038888888888888887, "train/epoch": 1.13, "_timestamp": 1746315470, "_runtime": 3626}, "step": 1250} {"train_info/time_between_train_steps": 0.02502131462097168, "step": 1250} {"info/global_step": 1251, "train_info/time_within_train_step": 2.6850616931915283, "step": 1251} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 1251} {"info/global_step": 1252, "train_info/time_within_train_step": 2.6845245361328125, "step": 1252} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 1252} {"info/global_step": 1253, "train_info/time_within_train_step": 2.6840438842773438, "step": 1253} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 1253} {"info/global_step": 1254, "train_info/time_within_train_step": 2.6847970485687256, "step": 1254} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 1254} {"info/global_step": 1255, "train_info/time_within_train_step": 2.684405565261841, "step": 1255} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 1255} {"info/global_step": 1256, "train_info/time_within_train_step": 2.684070587158203, "step": 1256} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 1256} {"info/global_step": 1257, "train_info/time_within_train_step": 2.6843159198760986, "step": 1257} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 1257} {"info/global_step": 1258, "train_info/time_within_train_step": 2.6835203170776367, "step": 1258} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 1258} {"info/global_step": 1259, "train_info/time_within_train_step": 2.6834182739257812, "step": 1259} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 1259} {"info/global_step": 1260, "train_info/time_within_train_step": 2.6839206218719482, "step": 1260} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 1260} {"info/global_step": 1261, "train_info/time_within_train_step": 2.6848294734954834, "step": 1261} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 1261} {"info/global_step": 1262, "train_info/time_within_train_step": 2.6857259273529053, "step": 1262} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 1262} {"info/global_step": 1263, "train_info/time_within_train_step": 2.6857492923736572, "step": 1263} {"train_info/time_between_train_steps": 0.003282308578491211, "step": 1263} {"info/global_step": 1264, "train_info/time_within_train_step": 2.685739517211914, "step": 1264} {"train_info/time_between_train_steps": 0.0032699108123779297, "step": 1264} {"info/global_step": 1265, "train_info/time_within_train_step": 2.6846349239349365, "step": 1265} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 1265} {"info/global_step": 1266, "train_info/time_within_train_step": 2.686713457107544, "step": 1266} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 1266} {"info/global_step": 1267, "train_info/time_within_train_step": 2.68461012840271, "step": 1267} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 1267} {"info/global_step": 1268, "train_info/time_within_train_step": 2.6840856075286865, "step": 1268} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 1268} {"info/global_step": 1269, "train_info/time_within_train_step": 2.6833739280700684, "step": 1269} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 1269} {"info/global_step": 1270, "train_info/time_within_train_step": 2.6827268600463867, "step": 1270} {"train_info/time_between_train_steps": 0.003358602523803711, "step": 1270} {"info/global_step": 1271, "train_info/time_within_train_step": 2.6840767860412598, "step": 1271} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 1271} {"info/global_step": 1272, "train_info/time_within_train_step": 2.6831746101379395, "step": 1272} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 1272} {"info/global_step": 1273, "train_info/time_within_train_step": 2.6825313568115234, "step": 1273} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 1273} {"info/global_step": 1274, "train_info/time_within_train_step": 2.6825294494628906, "step": 1274} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 1274} {"info/global_step": 1275, "train_info/time_within_train_step": 2.6830387115478516, "step": 1275} {"train_info/time_between_train_steps": 0.0033588409423828125, "step": 1275} {"info/global_step": 1276, "train_info/time_within_train_step": 2.682537317276001, "step": 1276} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 1276} {"info/global_step": 1277, "train_info/time_within_train_step": 2.6841368675231934, "step": 1277} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 1277} {"info/global_step": 1278, "train_info/time_within_train_step": 2.6826772689819336, "step": 1278} {"train_info/time_between_train_steps": 0.0034770965576171875, "step": 1278} {"info/global_step": 1279, "train_info/time_within_train_step": 2.6854050159454346, "step": 1279} {"train_info/time_between_train_steps": 0.003344297409057617, "step": 1279} {"info/global_step": 1280, "train_info/time_within_train_step": 2.684556007385254, "step": 1280} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 1280} {"info/global_step": 1281, "train_info/time_within_train_step": 2.6847927570343018, "step": 1281} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 1281} {"info/global_step": 1282, "train_info/time_within_train_step": 2.6847352981567383, "step": 1282} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 1282} {"info/global_step": 1283, "train_info/time_within_train_step": 2.685094118118286, "step": 1283} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 1283} {"info/global_step": 1284, "train_info/time_within_train_step": 2.683910369873047, "step": 1284} {"train_info/time_between_train_steps": 0.003468036651611328, "step": 1284} {"info/global_step": 1285, "train_info/time_within_train_step": 2.950695514678955, "step": 1285} {"train_info/time_between_train_steps": 0.0034935474395751953, "step": 1285} {"info/global_step": 1286, "train_info/time_within_train_step": 2.683863639831543, "step": 1286} {"train_info/time_between_train_steps": 0.0034339427947998047, "step": 1286} {"info/global_step": 1287, "train_info/time_within_train_step": 2.6836845874786377, "step": 1287} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 1287} {"info/global_step": 1288, "train_info/time_within_train_step": 2.6831533908843994, "step": 1288} {"train_info/time_between_train_steps": 0.003371000289916992, "step": 1288} {"info/global_step": 1289, "train_info/time_within_train_step": 2.6832659244537354, "step": 1289} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 1289} {"info/global_step": 1290, "train_info/time_within_train_step": 2.683915853500366, "step": 1290} {"train_info/time_between_train_steps": 0.003397226333618164, "step": 1290} {"info/global_step": 1291, "train_info/time_within_train_step": 2.839862585067749, "step": 1291} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 1291} {"info/global_step": 1292, "train_info/time_within_train_step": 2.6829450130462646, "step": 1292} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 1292} {"info/global_step": 1293, "train_info/time_within_train_step": 2.6829798221588135, "step": 1293} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 1293} {"info/global_step": 1294, "train_info/time_within_train_step": 2.6831679344177246, "step": 1294} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 1294} {"info/global_step": 1295, "train_info/time_within_train_step": 2.6849653720855713, "step": 1295} {"train_info/time_between_train_steps": 0.0034818649291992188, "step": 1295} {"info/global_step": 1296, "train_info/time_within_train_step": 2.6835148334503174, "step": 1296} {"train_info/time_between_train_steps": 0.003490447998046875, "step": 1296} {"info/global_step": 1297, "train_info/time_within_train_step": 2.688795328140259, "step": 1297} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 1297} {"info/global_step": 1298, "train_info/time_within_train_step": 2.6849024295806885, "step": 1298} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 1298} {"info/global_step": 1299, "train_info/time_within_train_step": 2.6846811771392822, "step": 1299} {"train_info/time_between_train_steps": 0.0034673213958740234, "step": 1299} {"info/global_step": 1300, "train_info/time_within_train_step": 2.683448314666748, "step": 1300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746315606, "_runtime": 3762}, "step": 1300} {"logs": {"train/loss": 4.5693, "train/learning_rate": 0.00037777777777777777, "train/epoch": 1.15, "_timestamp": 1746315606, "_runtime": 3762}, "step": 1300} {"train_info/time_between_train_steps": 15.374024629592896, "step": 1300} {"info/global_step": 1301, "train_info/time_within_train_step": 2.4801042079925537, "step": 1301} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 1301} {"info/global_step": 1302, "train_info/time_within_train_step": 2.484654664993286, "step": 1302} {"train_info/time_between_train_steps": 0.003462076187133789, "step": 1302} {"info/global_step": 1303, "train_info/time_within_train_step": 2.673718214035034, "step": 1303} {"train_info/time_between_train_steps": 0.0034770965576171875, "step": 1303} {"info/global_step": 1304, "train_info/time_within_train_step": 2.6819818019866943, "step": 1304} {"train_info/time_between_train_steps": 0.0034770965576171875, "step": 1304} {"info/global_step": 1305, "train_info/time_within_train_step": 2.6820757389068604, "step": 1305} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 1305} {"info/global_step": 1306, "train_info/time_within_train_step": 2.6824166774749756, "step": 1306} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 1306} {"info/global_step": 1307, "train_info/time_within_train_step": 2.6832571029663086, "step": 1307} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 1307} {"info/global_step": 1308, "train_info/time_within_train_step": 2.682600498199463, "step": 1308} {"train_info/time_between_train_steps": 0.003378152847290039, "step": 1308} {"info/global_step": 1309, "train_info/time_within_train_step": 2.6813392639160156, "step": 1309} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 1309} {"info/global_step": 1310, "train_info/time_within_train_step": 2.6815593242645264, "step": 1310} {"train_info/time_between_train_steps": 0.0034897327423095703, "step": 1310} {"info/global_step": 1311, "train_info/time_within_train_step": 2.6821541786193848, "step": 1311} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 1311} {"info/global_step": 1312, "train_info/time_within_train_step": 2.6823439598083496, "step": 1312} {"train_info/time_between_train_steps": 0.003460407257080078, "step": 1312} {"info/global_step": 1313, "train_info/time_within_train_step": 2.682358980178833, "step": 1313} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 1313} {"info/global_step": 1314, "train_info/time_within_train_step": 2.725231170654297, "step": 1314} {"train_info/time_between_train_steps": 0.0034339427947998047, "step": 1314} {"info/global_step": 1315, "train_info/time_within_train_step": 2.811917304992676, "step": 1315} {"train_info/time_between_train_steps": 0.003266572952270508, "step": 1315} {"info/global_step": 1316, "train_info/time_within_train_step": 2.757145881652832, "step": 1316} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 1316} {"info/global_step": 1317, "train_info/time_within_train_step": 2.704089641571045, "step": 1317} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 1317} {"info/global_step": 1318, "train_info/time_within_train_step": 2.728334903717041, "step": 1318} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 1318} {"info/global_step": 1319, "train_info/time_within_train_step": 2.713792085647583, "step": 1319} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 1319} {"info/global_step": 1320, "train_info/time_within_train_step": 2.7197022438049316, "step": 1320} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 1320} {"info/global_step": 1321, "train_info/time_within_train_step": 2.7192039489746094, "step": 1321} {"train_info/time_between_train_steps": 0.0037615299224853516, "step": 1321} {"info/global_step": 1322, "train_info/time_within_train_step": 2.692993640899658, "step": 1322} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 1322} {"info/global_step": 1323, "train_info/time_within_train_step": 2.7113375663757324, "step": 1323} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 1323} {"info/global_step": 1324, "train_info/time_within_train_step": 2.7062652111053467, "step": 1324} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 1324} {"info/global_step": 1325, "train_info/time_within_train_step": 2.7090187072753906, "step": 1325} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 1325} {"info/global_step": 1326, "train_info/time_within_train_step": 2.7007687091827393, "step": 1326} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 1326} {"info/global_step": 1327, "train_info/time_within_train_step": 2.6962685585021973, "step": 1327} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 1327} {"info/global_step": 1328, "train_info/time_within_train_step": 2.6970834732055664, "step": 1328} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 1328} {"info/global_step": 1329, "train_info/time_within_train_step": 2.71897554397583, "step": 1329} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 1329} {"info/global_step": 1330, "train_info/time_within_train_step": 2.701098680496216, "step": 1330} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 1330} {"info/global_step": 1331, "train_info/time_within_train_step": 2.6847214698791504, "step": 1331} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 1331} {"info/global_step": 1332, "train_info/time_within_train_step": 2.685610771179199, "step": 1332} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 1332} {"info/global_step": 1333, "train_info/time_within_train_step": 2.702127456665039, "step": 1333} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 1333} {"info/global_step": 1334, "train_info/time_within_train_step": 2.705518960952759, "step": 1334} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 1334} {"info/global_step": 1335, "train_info/time_within_train_step": 2.6866660118103027, "step": 1335} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 1335} {"info/global_step": 1336, "train_info/time_within_train_step": 2.7252330780029297, "step": 1336} {"train_info/time_between_train_steps": 0.003434896469116211, "step": 1336} {"info/global_step": 1337, "train_info/time_within_train_step": 2.7409117221832275, "step": 1337} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 1337} {"info/global_step": 1338, "train_info/time_within_train_step": 2.6829450130462646, "step": 1338} {"train_info/time_between_train_steps": 0.0034418106079101562, "step": 1338} {"info/global_step": 1339, "train_info/time_within_train_step": 2.6920108795166016, "step": 1339} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 1339} {"info/global_step": 1340, "train_info/time_within_train_step": 2.7134437561035156, "step": 1340} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 1340} {"info/global_step": 1341, "train_info/time_within_train_step": 2.6915082931518555, "step": 1341} {"train_info/time_between_train_steps": 0.003470182418823242, "step": 1341} {"info/global_step": 1342, "train_info/time_within_train_step": 2.6973989009857178, "step": 1342} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 1342} {"info/global_step": 1343, "train_info/time_within_train_step": 2.6951963901519775, "step": 1343} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 1343} {"info/global_step": 1344, "train_info/time_within_train_step": 2.6844828128814697, "step": 1344} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 1344} {"info/global_step": 1345, "train_info/time_within_train_step": 2.6838338375091553, "step": 1345} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 1345} {"info/global_step": 1346, "train_info/time_within_train_step": 2.69684100151062, "step": 1346} {"train_info/time_between_train_steps": 0.0034258365631103516, "step": 1346} {"info/global_step": 1347, "train_info/time_within_train_step": 2.6959691047668457, "step": 1347} {"train_info/time_between_train_steps": 0.0034360885620117188, "step": 1347} {"info/global_step": 1348, "train_info/time_within_train_step": 2.6909422874450684, "step": 1348} {"train_info/time_between_train_steps": 0.003373384475708008, "step": 1348} {"info/global_step": 1349, "train_info/time_within_train_step": 2.684272050857544, "step": 1349} {"train_info/time_between_train_steps": 0.003362894058227539, "step": 1349} {"info/global_step": 1350, "train_info/time_within_train_step": 2.6890523433685303, "step": 1350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746315757, "_runtime": 3913}, "step": 1350} {"logs": {"train/loss": 4.5494, "train/learning_rate": 0.00036666666666666667, "train/epoch": 1.17, "_timestamp": 1746315757, "_runtime": 3913}, "step": 1350} {"train_info/time_between_train_steps": 0.0241091251373291, "step": 1350} {"info/global_step": 1351, "train_info/time_within_train_step": 2.6915082931518555, "step": 1351} {"train_info/time_between_train_steps": 0.0033562183380126953, "step": 1351} {"info/global_step": 1352, "train_info/time_within_train_step": 2.699483871459961, "step": 1352} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 1352} {"info/global_step": 1353, "train_info/time_within_train_step": 2.7049591541290283, "step": 1353} {"train_info/time_between_train_steps": 0.0962071418762207, "step": 1353} {"info/global_step": 1354, "train_info/time_within_train_step": 2.6860647201538086, "step": 1354} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 1354} {"info/global_step": 1355, "train_info/time_within_train_step": 2.682832956314087, "step": 1355} {"train_info/time_between_train_steps": 0.003476858139038086, "step": 1355} {"info/global_step": 1356, "train_info/time_within_train_step": 2.681509017944336, "step": 1356} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 1356} {"info/global_step": 1357, "train_info/time_within_train_step": 2.6835691928863525, "step": 1357} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 1357} {"info/global_step": 1358, "train_info/time_within_train_step": 2.6834850311279297, "step": 1358} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 1358} {"info/global_step": 1359, "train_info/time_within_train_step": 2.6836764812469482, "step": 1359} {"train_info/time_between_train_steps": 0.003455638885498047, "step": 1359} {"info/global_step": 1360, "train_info/time_within_train_step": 2.683377265930176, "step": 1360} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 1360} {"info/global_step": 1361, "train_info/time_within_train_step": 2.946192741394043, "step": 1361} {"train_info/time_between_train_steps": 0.003412008285522461, "step": 1361} {"info/global_step": 1362, "train_info/time_within_train_step": 2.6836581230163574, "step": 1362} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 1362} {"info/global_step": 1363, "train_info/time_within_train_step": 2.6829171180725098, "step": 1363} {"train_info/time_between_train_steps": 0.003421306610107422, "step": 1363} {"info/global_step": 1364, "train_info/time_within_train_step": 2.6831798553466797, "step": 1364} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 1364} {"info/global_step": 1365, "train_info/time_within_train_step": 2.683239221572876, "step": 1365} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 1365} {"info/global_step": 1366, "train_info/time_within_train_step": 2.682760000228882, "step": 1366} {"train_info/time_between_train_steps": 0.003362894058227539, "step": 1366} {"info/global_step": 1367, "train_info/time_within_train_step": 2.6845505237579346, "step": 1367} {"train_info/time_between_train_steps": 0.003463268280029297, "step": 1367} {"info/global_step": 1368, "train_info/time_within_train_step": 2.6832289695739746, "step": 1368} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 1368} {"info/global_step": 1369, "train_info/time_within_train_step": 2.683209180831909, "step": 1369} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 1369} {"info/global_step": 1370, "train_info/time_within_train_step": 2.6839542388916016, "step": 1370} {"train_info/time_between_train_steps": 0.0032796859741210938, "step": 1370} {"info/global_step": 1371, "train_info/time_within_train_step": 2.6825435161590576, "step": 1371} {"train_info/time_between_train_steps": 0.0033702850341796875, "step": 1371} {"info/global_step": 1372, "train_info/time_within_train_step": 2.6839518547058105, "step": 1372} {"train_info/time_between_train_steps": 0.003452301025390625, "step": 1372} {"info/global_step": 1373, "train_info/time_within_train_step": 2.6833977699279785, "step": 1373} {"train_info/time_between_train_steps": 0.0034809112548828125, "step": 1373} {"info/global_step": 1374, "train_info/time_within_train_step": 2.683312177658081, "step": 1374} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 1374} {"info/global_step": 1375, "train_info/time_within_train_step": 2.683535099029541, "step": 1375} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 1375} {"info/global_step": 1376, "train_info/time_within_train_step": 2.6924242973327637, "step": 1376} {"train_info/time_between_train_steps": 0.0032501220703125, "step": 1376} {"info/global_step": 1377, "train_info/time_within_train_step": 2.6837973594665527, "step": 1377} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 1377} {"info/global_step": 1378, "train_info/time_within_train_step": 2.6836001873016357, "step": 1378} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1378} {"info/global_step": 1379, "train_info/time_within_train_step": 2.682239532470703, "step": 1379} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 1379} {"info/global_step": 1380, "train_info/time_within_train_step": 2.687685251235962, "step": 1380} {"train_info/time_between_train_steps": 0.0034110546112060547, "step": 1380} {"info/global_step": 1381, "train_info/time_within_train_step": 2.6835365295410156, "step": 1381} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 1381} {"info/global_step": 1382, "train_info/time_within_train_step": 2.6834404468536377, "step": 1382} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 1382} {"info/global_step": 1383, "train_info/time_within_train_step": 2.6831140518188477, "step": 1383} {"train_info/time_between_train_steps": 0.0034949779510498047, "step": 1383} {"info/global_step": 1384, "train_info/time_within_train_step": 2.6824347972869873, "step": 1384} {"train_info/time_between_train_steps": 0.0034263134002685547, "step": 1384} {"info/global_step": 1385, "train_info/time_within_train_step": 2.68251895904541, "step": 1385} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 1385} {"info/global_step": 1386, "train_info/time_within_train_step": 2.6836905479431152, "step": 1386} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 1386} {"info/global_step": 1387, "train_info/time_within_train_step": 2.683029890060425, "step": 1387} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 1387} {"info/global_step": 1388, "train_info/time_within_train_step": 2.682643413543701, "step": 1388} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 1388} {"info/global_step": 1389, "train_info/time_within_train_step": 2.6822214126586914, "step": 1389} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 1389} {"info/global_step": 1390, "train_info/time_within_train_step": 2.6835246086120605, "step": 1390} {"train_info/time_between_train_steps": 0.0034122467041015625, "step": 1390} {"info/global_step": 1391, "train_info/time_within_train_step": 2.6834144592285156, "step": 1391} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 1391} {"info/global_step": 1392, "train_info/time_within_train_step": 2.6834065914154053, "step": 1392} {"train_info/time_between_train_steps": 0.003585338592529297, "step": 1392} {"info/global_step": 1393, "train_info/time_within_train_step": 2.683014392852783, "step": 1393} {"train_info/time_between_train_steps": 0.003474712371826172, "step": 1393} {"info/global_step": 1394, "train_info/time_within_train_step": 2.6837964057922363, "step": 1394} {"train_info/time_between_train_steps": 0.020938396453857422, "step": 1394} {"info/global_step": 1395, "train_info/time_within_train_step": 2.683346748352051, "step": 1395} {"train_info/time_between_train_steps": 0.0030050277709960938, "step": 1395} {"info/global_step": 1396, "train_info/time_within_train_step": 2.6821389198303223, "step": 1396} {"train_info/time_between_train_steps": 0.003020763397216797, "step": 1396} {"info/global_step": 1397, "train_info/time_within_train_step": 2.68283748626709, "step": 1397} {"train_info/time_between_train_steps": 0.002873659133911133, "step": 1397} {"info/global_step": 1398, "train_info/time_within_train_step": 2.6830902099609375, "step": 1398} {"train_info/time_between_train_steps": 0.0029668807983398438, "step": 1398} {"info/global_step": 1399, "train_info/time_within_train_step": 2.6824002265930176, "step": 1399} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 1399} {"info/global_step": 1400, "train_info/time_within_train_step": 2.683051824569702, "step": 1400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746315893, "_runtime": 4049}, "step": 1400} {"logs": {"train/loss": 4.534, "train/learning_rate": 0.0003555555555555555, "train/epoch": 1.18, "_timestamp": 1746315893, "_runtime": 4049}, "step": 1400} {"train_info/time_between_train_steps": 13.732973098754883, "step": 1400} {"info/global_step": 1401, "train_info/time_within_train_step": 2.4858479499816895, "step": 1401} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 1401} {"info/global_step": 1402, "train_info/time_within_train_step": 2.5107531547546387, "step": 1402} {"train_info/time_between_train_steps": 0.0029172897338867188, "step": 1402} {"info/global_step": 1403, "train_info/time_within_train_step": 2.678395986557007, "step": 1403} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 1403} {"info/global_step": 1404, "train_info/time_within_train_step": 2.680389642715454, "step": 1404} {"train_info/time_between_train_steps": 0.002941131591796875, "step": 1404} {"info/global_step": 1405, "train_info/time_within_train_step": 2.6811225414276123, "step": 1405} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 1405} {"info/global_step": 1406, "train_info/time_within_train_step": 2.6813907623291016, "step": 1406} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 1406} {"info/global_step": 1407, "train_info/time_within_train_step": 2.6819334030151367, "step": 1407} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 1407} {"info/global_step": 1408, "train_info/time_within_train_step": 2.682551622390747, "step": 1408} {"train_info/time_between_train_steps": 0.002938985824584961, "step": 1408} {"info/global_step": 1409, "train_info/time_within_train_step": 2.683279275894165, "step": 1409} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 1409} {"info/global_step": 1410, "train_info/time_within_train_step": 2.68380069732666, "step": 1410} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 1410} {"info/global_step": 1411, "train_info/time_within_train_step": 2.6832094192504883, "step": 1411} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 1411} {"info/global_step": 1412, "train_info/time_within_train_step": 2.6833789348602295, "step": 1412} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 1412} {"info/global_step": 1413, "train_info/time_within_train_step": 2.6825900077819824, "step": 1413} {"train_info/time_between_train_steps": 0.0029566287994384766, "step": 1413} {"info/global_step": 1414, "train_info/time_within_train_step": 2.7397003173828125, "step": 1414} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 1414} {"info/global_step": 1415, "train_info/time_within_train_step": 2.7979722023010254, "step": 1415} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 1415} {"info/global_step": 1416, "train_info/time_within_train_step": 2.9244706630706787, "step": 1416} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 1416} {"info/global_step": 1417, "train_info/time_within_train_step": 2.707817554473877, "step": 1417} {"train_info/time_between_train_steps": 0.0034253597259521484, "step": 1417} {"info/global_step": 1418, "train_info/time_within_train_step": 2.710796594619751, "step": 1418} {"train_info/time_between_train_steps": 0.0031058788299560547, "step": 1418} {"info/global_step": 1419, "train_info/time_within_train_step": 2.749555826187134, "step": 1419} {"train_info/time_between_train_steps": 0.002918720245361328, "step": 1419} {"info/global_step": 1420, "train_info/time_within_train_step": 2.741826057434082, "step": 1420} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 1420} {"info/global_step": 1421, "train_info/time_within_train_step": 2.713273286819458, "step": 1421} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 1421} {"info/global_step": 1422, "train_info/time_within_train_step": 2.722825527191162, "step": 1422} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 1422} {"info/global_step": 1423, "train_info/time_within_train_step": 2.7014236450195312, "step": 1423} {"train_info/time_between_train_steps": 0.0030374526977539062, "step": 1423} {"info/global_step": 1424, "train_info/time_within_train_step": 2.70994234085083, "step": 1424} {"train_info/time_between_train_steps": 0.003009796142578125, "step": 1424} {"info/global_step": 1425, "train_info/time_within_train_step": 2.712498188018799, "step": 1425} {"train_info/time_between_train_steps": 0.0030295848846435547, "step": 1425} {"info/global_step": 1426, "train_info/time_within_train_step": 2.6922109127044678, "step": 1426} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 1426} {"info/global_step": 1427, "train_info/time_within_train_step": 2.718998432159424, "step": 1427} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 1427} {"info/global_step": 1428, "train_info/time_within_train_step": 2.704324245452881, "step": 1428} {"train_info/time_between_train_steps": 0.002931356430053711, "step": 1428} {"info/global_step": 1429, "train_info/time_within_train_step": 2.6951911449432373, "step": 1429} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 1429} {"info/global_step": 1430, "train_info/time_within_train_step": 2.6886537075042725, "step": 1430} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 1430} {"info/global_step": 1431, "train_info/time_within_train_step": 2.7102692127227783, "step": 1431} {"train_info/time_between_train_steps": 0.0030927658081054688, "step": 1431} {"info/global_step": 1432, "train_info/time_within_train_step": 2.6915082931518555, "step": 1432} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 1432} {"info/global_step": 1433, "train_info/time_within_train_step": 2.7186367511749268, "step": 1433} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 1433} {"info/global_step": 1434, "train_info/time_within_train_step": 2.745452404022217, "step": 1434} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 1434} {"info/global_step": 1435, "train_info/time_within_train_step": 2.6893045902252197, "step": 1435} {"train_info/time_between_train_steps": 0.0030028820037841797, "step": 1435} {"info/global_step": 1436, "train_info/time_within_train_step": 2.683750867843628, "step": 1436} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 1436} {"info/global_step": 1437, "train_info/time_within_train_step": 2.68789005279541, "step": 1437} {"train_info/time_between_train_steps": 0.00293731689453125, "step": 1437} {"info/global_step": 1438, "train_info/time_within_train_step": 2.713923454284668, "step": 1438} {"train_info/time_between_train_steps": 0.003444671630859375, "step": 1438} {"info/global_step": 1439, "train_info/time_within_train_step": 2.703122138977051, "step": 1439} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1439} {"info/global_step": 1440, "train_info/time_within_train_step": 2.6968026161193848, "step": 1440} {"train_info/time_between_train_steps": 0.0029325485229492188, "step": 1440} {"info/global_step": 1441, "train_info/time_within_train_step": 2.7510077953338623, "step": 1441} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 1441} {"info/global_step": 1442, "train_info/time_within_train_step": 2.6824800968170166, "step": 1442} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 1442} {"info/global_step": 1443, "train_info/time_within_train_step": 2.6912457942962646, "step": 1443} {"train_info/time_between_train_steps": 0.0030875205993652344, "step": 1443} {"info/global_step": 1444, "train_info/time_within_train_step": 2.71282696723938, "step": 1444} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 1444} {"info/global_step": 1445, "train_info/time_within_train_step": 2.7003695964813232, "step": 1445} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 1445} {"info/global_step": 1446, "train_info/time_within_train_step": 2.6866447925567627, "step": 1446} {"train_info/time_between_train_steps": 0.0030722618103027344, "step": 1446} {"info/global_step": 1447, "train_info/time_within_train_step": 2.724520683288574, "step": 1447} {"train_info/time_between_train_steps": 0.003002643585205078, "step": 1447} {"info/global_step": 1448, "train_info/time_within_train_step": 2.6844029426574707, "step": 1448} {"train_info/time_between_train_steps": 0.0029320716857910156, "step": 1448} {"info/global_step": 1449, "train_info/time_within_train_step": 2.6837358474731445, "step": 1449} {"train_info/time_between_train_steps": 0.0030143260955810547, "step": 1449} {"info/global_step": 1450, "train_info/time_within_train_step": 2.6834144592285156, "step": 1450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746316043, "_runtime": 4199}, "step": 1450} {"logs": {"train/loss": 4.5103, "train/learning_rate": 0.0003444444444444444, "train/epoch": 1.2, "_timestamp": 1746316043, "_runtime": 4199}, "step": 1450} {"train_info/time_between_train_steps": 0.02471613883972168, "step": 1450} {"info/global_step": 1451, "train_info/time_within_train_step": 2.6833267211914062, "step": 1451} {"train_info/time_between_train_steps": 0.0030684471130371094, "step": 1451} {"info/global_step": 1452, "train_info/time_within_train_step": 2.6847658157348633, "step": 1452} {"train_info/time_between_train_steps": 0.0030252933502197266, "step": 1452} {"info/global_step": 1453, "train_info/time_within_train_step": 2.682382345199585, "step": 1453} {"train_info/time_between_train_steps": 0.0029768943786621094, "step": 1453} {"info/global_step": 1454, "train_info/time_within_train_step": 2.6820120811462402, "step": 1454} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 1454} {"info/global_step": 1455, "train_info/time_within_train_step": 2.693204641342163, "step": 1455} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 1455} {"info/global_step": 1456, "train_info/time_within_train_step": 2.7080304622650146, "step": 1456} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 1456} {"info/global_step": 1457, "train_info/time_within_train_step": 2.8884572982788086, "step": 1457} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 1457} {"info/global_step": 1458, "train_info/time_within_train_step": 2.6835312843322754, "step": 1458} {"train_info/time_between_train_steps": 0.002859830856323242, "step": 1458} {"info/global_step": 1459, "train_info/time_within_train_step": 2.6840975284576416, "step": 1459} {"train_info/time_between_train_steps": 0.003005504608154297, "step": 1459} {"info/global_step": 1460, "train_info/time_within_train_step": 2.6827149391174316, "step": 1460} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 1460} {"info/global_step": 1461, "train_info/time_within_train_step": 2.6826043128967285, "step": 1461} {"train_info/time_between_train_steps": 0.0029039382934570312, "step": 1461} {"info/global_step": 1462, "train_info/time_within_train_step": 2.682737112045288, "step": 1462} {"train_info/time_between_train_steps": 0.003004312515258789, "step": 1462} {"info/global_step": 1463, "train_info/time_within_train_step": 2.6823322772979736, "step": 1463} {"train_info/time_between_train_steps": 0.002880096435546875, "step": 1463} {"info/global_step": 1464, "train_info/time_within_train_step": 2.6838691234588623, "step": 1464} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 1464} {"info/global_step": 1465, "train_info/time_within_train_step": 2.6825268268585205, "step": 1465} {"train_info/time_between_train_steps": 0.0029451847076416016, "step": 1465} {"info/global_step": 1466, "train_info/time_within_train_step": 2.683168888092041, "step": 1466} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 1466} {"info/global_step": 1467, "train_info/time_within_train_step": 2.683762788772583, "step": 1467} {"train_info/time_between_train_steps": 0.002969980239868164, "step": 1467} {"info/global_step": 1468, "train_info/time_within_train_step": 2.6830222606658936, "step": 1468} {"train_info/time_between_train_steps": 0.0029790401458740234, "step": 1468} {"info/global_step": 1469, "train_info/time_within_train_step": 2.682826280593872, "step": 1469} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 1469} {"info/global_step": 1470, "train_info/time_within_train_step": 2.6836965084075928, "step": 1470} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 1470} {"info/global_step": 1471, "train_info/time_within_train_step": 2.6842212677001953, "step": 1471} {"train_info/time_between_train_steps": 0.003072500228881836, "step": 1471} {"info/global_step": 1472, "train_info/time_within_train_step": 2.6830976009368896, "step": 1472} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 1472} {"info/global_step": 1473, "train_info/time_within_train_step": 2.6829748153686523, "step": 1473} {"train_info/time_between_train_steps": 0.0031142234802246094, "step": 1473} {"info/global_step": 1474, "train_info/time_within_train_step": 2.682812213897705, "step": 1474} {"train_info/time_between_train_steps": 0.002979278564453125, "step": 1474} {"info/global_step": 1475, "train_info/time_within_train_step": 2.681725263595581, "step": 1475} {"train_info/time_between_train_steps": 0.0029039382934570312, "step": 1475} {"info/global_step": 1476, "train_info/time_within_train_step": 2.6817851066589355, "step": 1476} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 1476} {"info/global_step": 1477, "train_info/time_within_train_step": 2.6844115257263184, "step": 1477} {"train_info/time_between_train_steps": 0.0029168128967285156, "step": 1477} {"info/global_step": 1478, "train_info/time_within_train_step": 2.6825850009918213, "step": 1478} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 1478} {"info/global_step": 1479, "train_info/time_within_train_step": 2.683549642562866, "step": 1479} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 1479} {"info/global_step": 1480, "train_info/time_within_train_step": 2.6831514835357666, "step": 1480} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 1480} {"info/global_step": 1481, "train_info/time_within_train_step": 2.681736469268799, "step": 1481} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 1481} {"info/global_step": 1482, "train_info/time_within_train_step": 2.682548999786377, "step": 1482} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 1482} {"info/global_step": 1483, "train_info/time_within_train_step": 2.682480573654175, "step": 1483} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 1483} {"info/global_step": 1484, "train_info/time_within_train_step": 2.682135820388794, "step": 1484} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 1484} {"info/global_step": 1485, "train_info/time_within_train_step": 2.683356523513794, "step": 1485} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 1485} {"info/global_step": 1486, "train_info/time_within_train_step": 2.6842293739318848, "step": 1486} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 1486} {"info/global_step": 1487, "train_info/time_within_train_step": 2.6838784217834473, "step": 1487} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 1487} {"info/global_step": 1488, "train_info/time_within_train_step": 2.684267997741699, "step": 1488} {"train_info/time_between_train_steps": 0.0029227733612060547, "step": 1488} {"info/global_step": 1489, "train_info/time_within_train_step": 2.6845314502716064, "step": 1489} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 1489} {"info/global_step": 1490, "train_info/time_within_train_step": 2.684292793273926, "step": 1490} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 1490} {"info/global_step": 1491, "train_info/time_within_train_step": 2.6836166381835938, "step": 1491} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 1491} {"info/global_step": 1492, "train_info/time_within_train_step": 2.6837055683135986, "step": 1492} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 1492} {"info/global_step": 1493, "train_info/time_within_train_step": 2.681596279144287, "step": 1493} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 1493} {"info/global_step": 1494, "train_info/time_within_train_step": 2.682636260986328, "step": 1494} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 1494} {"info/global_step": 1495, "train_info/time_within_train_step": 2.6821517944335938, "step": 1495} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 1495} {"info/global_step": 1496, "train_info/time_within_train_step": 2.6828854084014893, "step": 1496} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 1496} {"info/global_step": 1497, "train_info/time_within_train_step": 2.681565046310425, "step": 1497} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 1497} {"info/global_step": 1498, "train_info/time_within_train_step": 2.682384490966797, "step": 1498} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 1498} {"info/global_step": 1499, "train_info/time_within_train_step": 2.68202543258667, "step": 1499} {"train_info/time_between_train_steps": 0.0030901432037353516, "step": 1499} {"info/global_step": 1500, "train_info/time_within_train_step": 3.2667794227600098, "step": 1500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746316179, "_runtime": 4335}, "step": 1500} {"logs": {"train/loss": 4.4729, "train/learning_rate": 0.0003333333333333333, "train/epoch": 1.22, "_timestamp": 1746316179, "_runtime": 4335}, "step": 1500} {"train_info/time_between_train_steps": 14.162846565246582, "step": 1500} {"info/global_step": 1501, "train_info/time_within_train_step": 2.4812138080596924, "step": 1501} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 1501} {"info/global_step": 1502, "train_info/time_within_train_step": 2.5013861656188965, "step": 1502} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 1502} {"info/global_step": 1503, "train_info/time_within_train_step": 2.6793506145477295, "step": 1503} {"train_info/time_between_train_steps": 0.0029370784759521484, "step": 1503} {"info/global_step": 1504, "train_info/time_within_train_step": 2.6796462535858154, "step": 1504} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 1504} {"info/global_step": 1505, "train_info/time_within_train_step": 2.680225372314453, "step": 1505} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 1505} {"info/global_step": 1506, "train_info/time_within_train_step": 2.6822500228881836, "step": 1506} {"train_info/time_between_train_steps": 0.0030660629272460938, "step": 1506} {"info/global_step": 1507, "train_info/time_within_train_step": 2.68196439743042, "step": 1507} {"train_info/time_between_train_steps": 0.002899169921875, "step": 1507} {"info/global_step": 1508, "train_info/time_within_train_step": 2.6810648441314697, "step": 1508} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 1508} {"info/global_step": 1509, "train_info/time_within_train_step": 2.681594133377075, "step": 1509} {"train_info/time_between_train_steps": 0.0030670166015625, "step": 1509} {"info/global_step": 1510, "train_info/time_within_train_step": 2.6826343536376953, "step": 1510} {"train_info/time_between_train_steps": 0.003089427947998047, "step": 1510} {"info/global_step": 1511, "train_info/time_within_train_step": 2.682285785675049, "step": 1511} {"train_info/time_between_train_steps": 0.0029735565185546875, "step": 1511} {"info/global_step": 1512, "train_info/time_within_train_step": 2.6823863983154297, "step": 1512} {"train_info/time_between_train_steps": 0.002981424331665039, "step": 1512} {"info/global_step": 1513, "train_info/time_within_train_step": 2.6833884716033936, "step": 1513} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 1513} {"info/global_step": 1514, "train_info/time_within_train_step": 2.7569737434387207, "step": 1514} {"train_info/time_between_train_steps": 0.0030622482299804688, "step": 1514} {"info/global_step": 1515, "train_info/time_within_train_step": 2.8712329864501953, "step": 1515} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 1515} {"info/global_step": 1516, "train_info/time_within_train_step": 2.8180527687072754, "step": 1516} {"train_info/time_between_train_steps": 0.0030660629272460938, "step": 1516} {"info/global_step": 1517, "train_info/time_within_train_step": 2.7026331424713135, "step": 1517} {"train_info/time_between_train_steps": 0.0031032562255859375, "step": 1517} {"info/global_step": 1518, "train_info/time_within_train_step": 2.7046899795532227, "step": 1518} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 1518} {"info/global_step": 1519, "train_info/time_within_train_step": 2.7051844596862793, "step": 1519} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 1519} {"info/global_step": 1520, "train_info/time_within_train_step": 2.7082748413085938, "step": 1520} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 1520} {"info/global_step": 1521, "train_info/time_within_train_step": 2.73203706741333, "step": 1521} {"train_info/time_between_train_steps": 0.002979278564453125, "step": 1521} {"info/global_step": 1522, "train_info/time_within_train_step": 2.711061954498291, "step": 1522} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 1522} {"info/global_step": 1523, "train_info/time_within_train_step": 2.6948437690734863, "step": 1523} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 1523} {"info/global_step": 1524, "train_info/time_within_train_step": 2.7240829467773438, "step": 1524} {"train_info/time_between_train_steps": 0.0031249523162841797, "step": 1524} {"info/global_step": 1525, "train_info/time_within_train_step": 2.6927108764648438, "step": 1525} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 1525} {"info/global_step": 1526, "train_info/time_within_train_step": 2.692073345184326, "step": 1526} {"train_info/time_between_train_steps": 0.0031032562255859375, "step": 1526} {"info/global_step": 1527, "train_info/time_within_train_step": 2.707616090774536, "step": 1527} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 1527} {"info/global_step": 1528, "train_info/time_within_train_step": 2.6959705352783203, "step": 1528} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 1528} {"info/global_step": 1529, "train_info/time_within_train_step": 2.7046875953674316, "step": 1529} {"train_info/time_between_train_steps": 0.0030281543731689453, "step": 1529} {"info/global_step": 1530, "train_info/time_within_train_step": 2.687692165374756, "step": 1530} {"train_info/time_between_train_steps": 0.0030214786529541016, "step": 1530} {"info/global_step": 1531, "train_info/time_within_train_step": 2.8652472496032715, "step": 1531} {"train_info/time_between_train_steps": 0.0030128955841064453, "step": 1531} {"info/global_step": 1532, "train_info/time_within_train_step": 2.6843507289886475, "step": 1532} {"train_info/time_between_train_steps": 0.003069162368774414, "step": 1532} {"info/global_step": 1533, "train_info/time_within_train_step": 2.68477725982666, "step": 1533} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 1533} {"info/global_step": 1534, "train_info/time_within_train_step": 2.6839420795440674, "step": 1534} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 1534} {"info/global_step": 1535, "train_info/time_within_train_step": 2.686350107192993, "step": 1535} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 1535} {"info/global_step": 1536, "train_info/time_within_train_step": 2.7238571643829346, "step": 1536} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 1536} {"info/global_step": 1537, "train_info/time_within_train_step": 2.69655704498291, "step": 1537} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 1537} {"info/global_step": 1538, "train_info/time_within_train_step": 2.6972296237945557, "step": 1538} {"train_info/time_between_train_steps": 0.0030608177185058594, "step": 1538} {"info/global_step": 1539, "train_info/time_within_train_step": 2.6925928592681885, "step": 1539} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 1539} {"info/global_step": 1540, "train_info/time_within_train_step": 2.699136734008789, "step": 1540} {"train_info/time_between_train_steps": 0.0029032230377197266, "step": 1540} {"info/global_step": 1541, "train_info/time_within_train_step": 2.722724676132202, "step": 1541} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 1541} {"info/global_step": 1542, "train_info/time_within_train_step": 2.7048323154449463, "step": 1542} {"train_info/time_between_train_steps": 0.003061532974243164, "step": 1542} {"info/global_step": 1543, "train_info/time_within_train_step": 2.6855127811431885, "step": 1543} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 1543} {"info/global_step": 1544, "train_info/time_within_train_step": 2.6845309734344482, "step": 1544} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 1544} {"info/global_step": 1545, "train_info/time_within_train_step": 2.6873929500579834, "step": 1545} {"train_info/time_between_train_steps": 0.0030624866485595703, "step": 1545} {"info/global_step": 1546, "train_info/time_within_train_step": 2.7144131660461426, "step": 1546} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 1546} {"info/global_step": 1547, "train_info/time_within_train_step": 2.707834243774414, "step": 1547} {"train_info/time_between_train_steps": 0.0030755996704101562, "step": 1547} {"info/global_step": 1548, "train_info/time_within_train_step": 2.701946258544922, "step": 1548} {"train_info/time_between_train_steps": 0.0030889511108398438, "step": 1548} {"info/global_step": 1549, "train_info/time_within_train_step": 2.696669340133667, "step": 1549} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 1549} {"info/global_step": 1550, "train_info/time_within_train_step": 2.684056043624878, "step": 1550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746316329, "_runtime": 4485}, "step": 1550} {"logs": {"train/loss": 4.4497, "train/learning_rate": 0.0003222222222222222, "train/epoch": 1.23, "_timestamp": 1746316329, "_runtime": 4485}, "step": 1550} {"train_info/time_between_train_steps": 0.02486896514892578, "step": 1550} {"info/global_step": 1551, "train_info/time_within_train_step": 2.6837308406829834, "step": 1551} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 1551} {"info/global_step": 1552, "train_info/time_within_train_step": 2.684255361557007, "step": 1552} {"train_info/time_between_train_steps": 0.00301361083984375, "step": 1552} {"info/global_step": 1553, "train_info/time_within_train_step": 2.6829802989959717, "step": 1553} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 1553} {"info/global_step": 1554, "train_info/time_within_train_step": 2.682539224624634, "step": 1554} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 1554} {"info/global_step": 1555, "train_info/time_within_train_step": 2.6876423358917236, "step": 1555} {"train_info/time_between_train_steps": 0.0028715133666992188, "step": 1555} {"info/global_step": 1556, "train_info/time_within_train_step": 2.683009147644043, "step": 1556} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 1556} {"info/global_step": 1557, "train_info/time_within_train_step": 2.682976007461548, "step": 1557} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 1557} {"info/global_step": 1558, "train_info/time_within_train_step": 2.6990764141082764, "step": 1558} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 1558} {"info/global_step": 1559, "train_info/time_within_train_step": 2.684180974960327, "step": 1559} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 1559} {"info/global_step": 1560, "train_info/time_within_train_step": 2.6834499835968018, "step": 1560} {"train_info/time_between_train_steps": 0.0030481815338134766, "step": 1560} {"info/global_step": 1561, "train_info/time_within_train_step": 2.7017176151275635, "step": 1561} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 1561} {"info/global_step": 1562, "train_info/time_within_train_step": 2.6841213703155518, "step": 1562} {"train_info/time_between_train_steps": 0.002912282943725586, "step": 1562} {"info/global_step": 1563, "train_info/time_within_train_step": 2.6824216842651367, "step": 1563} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 1563} {"info/global_step": 1564, "train_info/time_within_train_step": 2.6829047203063965, "step": 1564} {"train_info/time_between_train_steps": 0.0028982162475585938, "step": 1564} {"info/global_step": 1565, "train_info/time_within_train_step": 2.68353009223938, "step": 1565} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 1565} {"info/global_step": 1566, "train_info/time_within_train_step": 2.6849119663238525, "step": 1566} {"train_info/time_between_train_steps": 0.003061532974243164, "step": 1566} {"info/global_step": 1567, "train_info/time_within_train_step": 2.683912515640259, "step": 1567} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 1567} {"info/global_step": 1568, "train_info/time_within_train_step": 2.684056282043457, "step": 1568} {"train_info/time_between_train_steps": 0.003010272979736328, "step": 1568} {"info/global_step": 1569, "train_info/time_within_train_step": 2.6948764324188232, "step": 1569} {"train_info/time_between_train_steps": 0.003082275390625, "step": 1569} {"info/global_step": 1570, "train_info/time_within_train_step": 2.683652877807617, "step": 1570} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 1570} {"info/global_step": 1571, "train_info/time_within_train_step": 2.8146111965179443, "step": 1571} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 1571} {"info/global_step": 1572, "train_info/time_within_train_step": 2.683220386505127, "step": 1572} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 1572} {"info/global_step": 1573, "train_info/time_within_train_step": 2.6838648319244385, "step": 1573} {"train_info/time_between_train_steps": 0.0029544830322265625, "step": 1573} {"info/global_step": 1574, "train_info/time_within_train_step": 2.683927059173584, "step": 1574} {"train_info/time_between_train_steps": 0.002960205078125, "step": 1574} {"info/global_step": 1575, "train_info/time_within_train_step": 2.6826484203338623, "step": 1575} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 1575} {"info/global_step": 1576, "train_info/time_within_train_step": 2.6833746433258057, "step": 1576} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 1576} {"info/global_step": 1577, "train_info/time_within_train_step": 2.683539390563965, "step": 1577} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 1577} {"info/global_step": 1578, "train_info/time_within_train_step": 2.6829802989959717, "step": 1578} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 1578} {"info/global_step": 1579, "train_info/time_within_train_step": 2.6842782497406006, "step": 1579} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 1579} {"info/global_step": 1580, "train_info/time_within_train_step": 2.6831769943237305, "step": 1580} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 1580} {"info/global_step": 1581, "train_info/time_within_train_step": 2.6837596893310547, "step": 1581} {"train_info/time_between_train_steps": 0.003074169158935547, "step": 1581} {"info/global_step": 1582, "train_info/time_within_train_step": 2.6831634044647217, "step": 1582} {"train_info/time_between_train_steps": 0.002987384796142578, "step": 1582} {"info/global_step": 1583, "train_info/time_within_train_step": 2.6886532306671143, "step": 1583} {"train_info/time_between_train_steps": 0.003016948699951172, "step": 1583} {"info/global_step": 1584, "train_info/time_within_train_step": 2.6822657585144043, "step": 1584} {"train_info/time_between_train_steps": 0.0028829574584960938, "step": 1584} {"info/global_step": 1585, "train_info/time_within_train_step": 2.682945966720581, "step": 1585} {"train_info/time_between_train_steps": 0.0037119388580322266, "step": 1585} {"info/global_step": 1586, "train_info/time_within_train_step": 2.6833550930023193, "step": 1586} {"train_info/time_between_train_steps": 0.003063201904296875, "step": 1586} {"info/global_step": 1587, "train_info/time_within_train_step": 2.683655261993408, "step": 1587} {"train_info/time_between_train_steps": 0.002956390380859375, "step": 1587} {"info/global_step": 1588, "train_info/time_within_train_step": 2.6831068992614746, "step": 1588} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 1588} {"info/global_step": 1589, "train_info/time_within_train_step": 2.682851552963257, "step": 1589} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 1589} {"info/global_step": 1590, "train_info/time_within_train_step": 2.6829404830932617, "step": 1590} {"train_info/time_between_train_steps": 0.0029914379119873047, "step": 1590} {"info/global_step": 1591, "train_info/time_within_train_step": 2.6837751865386963, "step": 1591} {"train_info/time_between_train_steps": 0.003119945526123047, "step": 1591} {"info/global_step": 1592, "train_info/time_within_train_step": 2.6839723587036133, "step": 1592} {"train_info/time_between_train_steps": 0.0030841827392578125, "step": 1592} {"info/global_step": 1593, "train_info/time_within_train_step": 2.684467315673828, "step": 1593} {"train_info/time_between_train_steps": 0.00305938720703125, "step": 1593} {"info/global_step": 1594, "train_info/time_within_train_step": 2.6839964389801025, "step": 1594} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 1594} {"info/global_step": 1595, "train_info/time_within_train_step": 2.6833181381225586, "step": 1595} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 1595} {"info/global_step": 1596, "train_info/time_within_train_step": 2.6833903789520264, "step": 1596} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 1596} {"info/global_step": 1597, "train_info/time_within_train_step": 2.683551549911499, "step": 1597} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 1597} {"info/global_step": 1598, "train_info/time_within_train_step": 2.681833505630493, "step": 1598} {"train_info/time_between_train_steps": 0.0030918121337890625, "step": 1598} {"info/global_step": 1599, "train_info/time_within_train_step": 2.6836092472076416, "step": 1599} {"train_info/time_between_train_steps": 0.0030074119567871094, "step": 1599} {"info/global_step": 1600, "train_info/time_within_train_step": 2.6832993030548096, "step": 1600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746316465, "_runtime": 4621}, "step": 1600} {"logs": {"train/loss": 4.4262, "train/learning_rate": 0.00031111111111111107, "train/epoch": 1.25, "_timestamp": 1746316465, "_runtime": 4621}, "step": 1600} {"train_info/time_between_train_steps": 14.762100219726562, "step": 1600} {"info/global_step": 1601, "train_info/time_within_train_step": 2.483966827392578, "step": 1601} {"train_info/time_between_train_steps": 0.0030901432037353516, "step": 1601} {"info/global_step": 1602, "train_info/time_within_train_step": 2.4857091903686523, "step": 1602} {"train_info/time_between_train_steps": 0.003032684326171875, "step": 1602} {"info/global_step": 1603, "train_info/time_within_train_step": 2.675157070159912, "step": 1603} {"train_info/time_between_train_steps": 0.0029802322387695312, "step": 1603} {"info/global_step": 1604, "train_info/time_within_train_step": 2.679835796356201, "step": 1604} {"train_info/time_between_train_steps": 0.0030159950256347656, "step": 1604} {"info/global_step": 1605, "train_info/time_within_train_step": 2.6805965900421143, "step": 1605} {"train_info/time_between_train_steps": 0.0030210018157958984, "step": 1605} {"info/global_step": 1606, "train_info/time_within_train_step": 2.682204246520996, "step": 1606} {"train_info/time_between_train_steps": 0.0031042098999023438, "step": 1606} {"info/global_step": 1607, "train_info/time_within_train_step": 2.6819310188293457, "step": 1607} {"train_info/time_between_train_steps": 0.003072023391723633, "step": 1607} {"info/global_step": 1608, "train_info/time_within_train_step": 2.6867964267730713, "step": 1608} {"train_info/time_between_train_steps": 0.0030829906463623047, "step": 1608} {"info/global_step": 1609, "train_info/time_within_train_step": 2.6820359230041504, "step": 1609} {"train_info/time_between_train_steps": 0.0030531883239746094, "step": 1609} {"info/global_step": 1610, "train_info/time_within_train_step": 2.6820642948150635, "step": 1610} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 1610} {"info/global_step": 1611, "train_info/time_within_train_step": 2.793930768966675, "step": 1611} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 1611} {"info/global_step": 1612, "train_info/time_within_train_step": 2.6827380657196045, "step": 1612} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 1612} {"info/global_step": 1613, "train_info/time_within_train_step": 2.6829349994659424, "step": 1613} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 1613} {"info/global_step": 1614, "train_info/time_within_train_step": 2.70174241065979, "step": 1614} {"train_info/time_between_train_steps": 0.0030066967010498047, "step": 1614} {"info/global_step": 1615, "train_info/time_within_train_step": 2.798280954360962, "step": 1615} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 1615} {"info/global_step": 1616, "train_info/time_within_train_step": 2.772077798843384, "step": 1616} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 1616} {"info/global_step": 1617, "train_info/time_within_train_step": 2.7181830406188965, "step": 1617} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 1617} {"info/global_step": 1618, "train_info/time_within_train_step": 2.717240571975708, "step": 1618} {"train_info/time_between_train_steps": 0.003052949905395508, "step": 1618} {"info/global_step": 1619, "train_info/time_within_train_step": 2.7171359062194824, "step": 1619} {"train_info/time_between_train_steps": 0.003016948699951172, "step": 1619} {"info/global_step": 1620, "train_info/time_within_train_step": 2.711092710494995, "step": 1620} {"train_info/time_between_train_steps": 0.0031158924102783203, "step": 1620} {"info/global_step": 1621, "train_info/time_within_train_step": 2.706542491912842, "step": 1621} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 1621} {"info/global_step": 1622, "train_info/time_within_train_step": 2.71157169342041, "step": 1622} {"train_info/time_between_train_steps": 0.003004312515258789, "step": 1622} {"info/global_step": 1623, "train_info/time_within_train_step": 2.721644401550293, "step": 1623} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 1623} {"info/global_step": 1624, "train_info/time_within_train_step": 2.689873218536377, "step": 1624} {"train_info/time_between_train_steps": 0.002899169921875, "step": 1624} {"info/global_step": 1625, "train_info/time_within_train_step": 2.733954906463623, "step": 1625} {"train_info/time_between_train_steps": 0.0031061172485351562, "step": 1625} {"info/global_step": 1626, "train_info/time_within_train_step": 2.698387622833252, "step": 1626} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 1626} {"info/global_step": 1627, "train_info/time_within_train_step": 2.685288429260254, "step": 1627} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 1627} {"info/global_step": 1628, "train_info/time_within_train_step": 2.6913249492645264, "step": 1628} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 1628} {"info/global_step": 1629, "train_info/time_within_train_step": 2.724112033843994, "step": 1629} {"train_info/time_between_train_steps": 0.0030481815338134766, "step": 1629} {"info/global_step": 1630, "train_info/time_within_train_step": 2.7079503536224365, "step": 1630} {"train_info/time_between_train_steps": 0.0030660629272460938, "step": 1630} {"info/global_step": 1631, "train_info/time_within_train_step": 2.6905839443206787, "step": 1631} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 1631} {"info/global_step": 1632, "train_info/time_within_train_step": 2.710771083831787, "step": 1632} {"train_info/time_between_train_steps": 0.002889871597290039, "step": 1632} {"info/global_step": 1633, "train_info/time_within_train_step": 2.709967613220215, "step": 1633} {"train_info/time_between_train_steps": 0.003110647201538086, "step": 1633} {"info/global_step": 1634, "train_info/time_within_train_step": 2.690337657928467, "step": 1634} {"train_info/time_between_train_steps": 0.0028886795043945312, "step": 1634} {"info/global_step": 1635, "train_info/time_within_train_step": 2.706935405731201, "step": 1635} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 1635} {"info/global_step": 1636, "train_info/time_within_train_step": 2.7043404579162598, "step": 1636} {"train_info/time_between_train_steps": 0.0035400390625, "step": 1636} {"info/global_step": 1637, "train_info/time_within_train_step": 2.6863088607788086, "step": 1637} {"train_info/time_between_train_steps": 0.003000020980834961, "step": 1637} {"info/global_step": 1638, "train_info/time_within_train_step": 2.701725482940674, "step": 1638} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 1638} {"info/global_step": 1639, "train_info/time_within_train_step": 2.702134132385254, "step": 1639} {"train_info/time_between_train_steps": 0.0030863285064697266, "step": 1639} {"info/global_step": 1640, "train_info/time_within_train_step": 2.685065507888794, "step": 1640} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 1640} {"info/global_step": 1641, "train_info/time_within_train_step": 2.686924934387207, "step": 1641} {"train_info/time_between_train_steps": 0.0030241012573242188, "step": 1641} {"info/global_step": 1642, "train_info/time_within_train_step": 2.713128089904785, "step": 1642} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 1642} {"info/global_step": 1643, "train_info/time_within_train_step": 2.73240327835083, "step": 1643} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 1643} {"info/global_step": 1644, "train_info/time_within_train_step": 2.6814863681793213, "step": 1644} {"train_info/time_between_train_steps": 0.003027677536010742, "step": 1644} {"info/global_step": 1645, "train_info/time_within_train_step": 2.6821208000183105, "step": 1645} {"train_info/time_between_train_steps": 0.002929210662841797, "step": 1645} {"info/global_step": 1646, "train_info/time_within_train_step": 2.6931419372558594, "step": 1646} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 1646} {"info/global_step": 1647, "train_info/time_within_train_step": 2.683377265930176, "step": 1647} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 1647} {"info/global_step": 1648, "train_info/time_within_train_step": 2.757683038711548, "step": 1648} {"train_info/time_between_train_steps": 0.0030395984649658203, "step": 1648} {"info/global_step": 1649, "train_info/time_within_train_step": 2.684706926345825, "step": 1649} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 1649} {"info/global_step": 1650, "train_info/time_within_train_step": 2.6835687160491943, "step": 1650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746316616, "_runtime": 4772}, "step": 1650} {"logs": {"train/loss": 4.4028, "train/learning_rate": 0.0003, "train/epoch": 1.27, "_timestamp": 1746316616, "_runtime": 4772}, "step": 1650} {"train_info/time_between_train_steps": 0.024969816207885742, "step": 1650} {"info/global_step": 1651, "train_info/time_within_train_step": 2.6839241981506348, "step": 1651} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 1651} {"info/global_step": 1652, "train_info/time_within_train_step": 2.743368625640869, "step": 1652} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 1652} {"info/global_step": 1653, "train_info/time_within_train_step": 2.6838276386260986, "step": 1653} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 1653} {"info/global_step": 1654, "train_info/time_within_train_step": 2.6833670139312744, "step": 1654} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 1654} {"info/global_step": 1655, "train_info/time_within_train_step": 2.683803081512451, "step": 1655} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 1655} {"info/global_step": 1656, "train_info/time_within_train_step": 2.683591365814209, "step": 1656} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 1656} {"info/global_step": 1657, "train_info/time_within_train_step": 2.683596134185791, "step": 1657} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 1657} {"info/global_step": 1658, "train_info/time_within_train_step": 2.6846415996551514, "step": 1658} {"train_info/time_between_train_steps": 0.0030744075775146484, "step": 1658} {"info/global_step": 1659, "train_info/time_within_train_step": 2.6827595233917236, "step": 1659} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 1659} {"info/global_step": 1660, "train_info/time_within_train_step": 2.6833298206329346, "step": 1660} {"train_info/time_between_train_steps": 0.0033996105194091797, "step": 1660} {"info/global_step": 1661, "train_info/time_within_train_step": 2.683868169784546, "step": 1661} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 1661} {"info/global_step": 1662, "train_info/time_within_train_step": 2.683318853378296, "step": 1662} {"train_info/time_between_train_steps": 0.003485441207885742, "step": 1662} {"info/global_step": 1663, "train_info/time_within_train_step": 2.6839756965637207, "step": 1663} {"train_info/time_between_train_steps": 0.003462553024291992, "step": 1663} {"info/global_step": 1664, "train_info/time_within_train_step": 2.684094190597534, "step": 1664} {"train_info/time_between_train_steps": 0.003523588180541992, "step": 1664} {"info/global_step": 1665, "train_info/time_within_train_step": 2.683023452758789, "step": 1665} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 1665} {"info/global_step": 1666, "train_info/time_within_train_step": 2.684255361557007, "step": 1666} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 1666} {"info/global_step": 1667, "train_info/time_within_train_step": 2.6844046115875244, "step": 1667} {"train_info/time_between_train_steps": 0.003411531448364258, "step": 1667} {"info/global_step": 1668, "train_info/time_within_train_step": 2.6838531494140625, "step": 1668} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 1668} {"info/global_step": 1669, "train_info/time_within_train_step": 2.683638572692871, "step": 1669} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 1669} {"info/global_step": 1670, "train_info/time_within_train_step": 2.6837809085845947, "step": 1670} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 1670} {"info/global_step": 1671, "train_info/time_within_train_step": 2.6842331886291504, "step": 1671} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 1671} {"info/global_step": 1672, "train_info/time_within_train_step": 2.693451404571533, "step": 1672} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 1672} {"info/global_step": 1673, "train_info/time_within_train_step": 2.6828153133392334, "step": 1673} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 1673} {"info/global_step": 1674, "train_info/time_within_train_step": 2.682915687561035, "step": 1674} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 1674} {"info/global_step": 1675, "train_info/time_within_train_step": 2.682312250137329, "step": 1675} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 1675} {"info/global_step": 1676, "train_info/time_within_train_step": 2.6836373805999756, "step": 1676} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 1676} {"info/global_step": 1677, "train_info/time_within_train_step": 2.683443069458008, "step": 1677} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 1677} {"info/global_step": 1678, "train_info/time_within_train_step": 2.6816444396972656, "step": 1678} {"train_info/time_between_train_steps": 0.0035915374755859375, "step": 1678} {"info/global_step": 1679, "train_info/time_within_train_step": 2.68318510055542, "step": 1679} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 1679} {"info/global_step": 1680, "train_info/time_within_train_step": 2.6834027767181396, "step": 1680} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 1680} {"info/global_step": 1681, "train_info/time_within_train_step": 2.6832287311553955, "step": 1681} {"train_info/time_between_train_steps": 0.003084421157836914, "step": 1681} {"info/global_step": 1682, "train_info/time_within_train_step": 2.6827752590179443, "step": 1682} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 1682} {"info/global_step": 1683, "train_info/time_within_train_step": 2.6844241619110107, "step": 1683} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 1683} {"info/global_step": 1684, "train_info/time_within_train_step": 2.6840977668762207, "step": 1684} {"train_info/time_between_train_steps": 0.0033960342407226562, "step": 1684} {"info/global_step": 1685, "train_info/time_within_train_step": 2.6837637424468994, "step": 1685} {"train_info/time_between_train_steps": 0.003564596176147461, "step": 1685} {"info/global_step": 1686, "train_info/time_within_train_step": 2.6841909885406494, "step": 1686} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 1686} {"info/global_step": 1687, "train_info/time_within_train_step": 2.6840879917144775, "step": 1687} {"train_info/time_between_train_steps": 0.003415822982788086, "step": 1687} {"info/global_step": 1688, "train_info/time_within_train_step": 2.6853318214416504, "step": 1688} {"train_info/time_between_train_steps": 0.00336456298828125, "step": 1688} {"info/global_step": 1689, "train_info/time_within_train_step": 2.685133695602417, "step": 1689} {"train_info/time_between_train_steps": 0.0034546852111816406, "step": 1689} {"info/global_step": 1690, "train_info/time_within_train_step": 2.683009386062622, "step": 1690} {"train_info/time_between_train_steps": 0.003668546676635742, "step": 1690} {"info/global_step": 1691, "train_info/time_within_train_step": 2.6835405826568604, "step": 1691} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 1691} {"info/global_step": 1692, "train_info/time_within_train_step": 2.6834216117858887, "step": 1692} {"train_info/time_between_train_steps": 0.003638744354248047, "step": 1692} {"info/global_step": 1693, "train_info/time_within_train_step": 2.6844403743743896, "step": 1693} {"train_info/time_between_train_steps": 0.0035431385040283203, "step": 1693} {"info/global_step": 1694, "train_info/time_within_train_step": 2.6845810413360596, "step": 1694} {"train_info/time_between_train_steps": 0.003873109817504883, "step": 1694} {"info/global_step": 1695, "train_info/time_within_train_step": 2.684473752975464, "step": 1695} {"train_info/time_between_train_steps": 0.003335714340209961, "step": 1695} {"info/global_step": 1696, "train_info/time_within_train_step": 2.6839547157287598, "step": 1696} {"train_info/time_between_train_steps": 0.0035092830657958984, "step": 1696} {"info/global_step": 1697, "train_info/time_within_train_step": 2.683964967727661, "step": 1697} {"train_info/time_between_train_steps": 0.003481626510620117, "step": 1697} {"info/global_step": 1698, "train_info/time_within_train_step": 2.6833057403564453, "step": 1698} {"train_info/time_between_train_steps": 0.003493785858154297, "step": 1698} {"info/global_step": 1699, "train_info/time_within_train_step": 2.6839451789855957, "step": 1699} {"train_info/time_between_train_steps": 0.004012107849121094, "step": 1699} {"info/global_step": 1700, "train_info/time_within_train_step": 2.6845269203186035, "step": 1700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746316751, "_runtime": 4907}, "step": 1700} {"logs": {"train/loss": 4.3792, "train/learning_rate": 0.0002888888888888888, "train/epoch": 1.28, "_timestamp": 1746316751, "_runtime": 4907}, "step": 1700} {"train_info/time_between_train_steps": 13.528259038925171, "step": 1700} {"info/global_step": 1701, "train_info/time_within_train_step": 2.479515790939331, "step": 1701} {"train_info/time_between_train_steps": 0.0037527084350585938, "step": 1701} {"info/global_step": 1702, "train_info/time_within_train_step": 2.5114965438842773, "step": 1702} {"train_info/time_between_train_steps": 0.003787994384765625, "step": 1702} {"info/global_step": 1703, "train_info/time_within_train_step": 2.6824278831481934, "step": 1703} {"train_info/time_between_train_steps": 0.0038149356842041016, "step": 1703} {"info/global_step": 1704, "train_info/time_within_train_step": 2.682382345199585, "step": 1704} {"train_info/time_between_train_steps": 0.0038690567016601562, "step": 1704} {"info/global_step": 1705, "train_info/time_within_train_step": 2.684497117996216, "step": 1705} {"train_info/time_between_train_steps": 0.003657102584838867, "step": 1705} {"info/global_step": 1706, "train_info/time_within_train_step": 2.683256149291992, "step": 1706} {"train_info/time_between_train_steps": 0.004359245300292969, "step": 1706} {"train_info/time_between_train_steps": 3.3768248558044434, "step": 1706} {"info/global_step": 1707, "train_info/time_within_train_step": 2.6887423992156982, "step": 1707} {"train_info/time_between_train_steps": 0.0033881664276123047, "step": 1707} {"info/global_step": 1708, "train_info/time_within_train_step": 2.6811554431915283, "step": 1708} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 1708} {"info/global_step": 1709, "train_info/time_within_train_step": 2.682659387588501, "step": 1709} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 1709} {"info/global_step": 1710, "train_info/time_within_train_step": 2.682312250137329, "step": 1710} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 1710} {"info/global_step": 1711, "train_info/time_within_train_step": 2.6829991340637207, "step": 1711} {"train_info/time_between_train_steps": 0.0034027099609375, "step": 1711} {"info/global_step": 1712, "train_info/time_within_train_step": 2.6831345558166504, "step": 1712} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 1712} {"info/global_step": 1713, "train_info/time_within_train_step": 2.6828510761260986, "step": 1713} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 1713} {"info/global_step": 1714, "train_info/time_within_train_step": 2.6877059936523438, "step": 1714} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 1714} {"info/global_step": 1715, "train_info/time_within_train_step": 2.7729101181030273, "step": 1715} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 1715} {"info/global_step": 1716, "train_info/time_within_train_step": 2.8105688095092773, "step": 1716} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 1716} {"info/global_step": 1717, "train_info/time_within_train_step": 2.7472128868103027, "step": 1717} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 1717} {"info/global_step": 1718, "train_info/time_within_train_step": 2.722376823425293, "step": 1718} {"train_info/time_between_train_steps": 0.0032930374145507812, "step": 1718} {"info/global_step": 1719, "train_info/time_within_train_step": 2.712351083755493, "step": 1719} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 1719} {"info/global_step": 1720, "train_info/time_within_train_step": 2.719231605529785, "step": 1720} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 1720} {"info/global_step": 1721, "train_info/time_within_train_step": 2.7334117889404297, "step": 1721} {"train_info/time_between_train_steps": 0.0032799243927001953, "step": 1721} {"info/global_step": 1722, "train_info/time_within_train_step": 2.7006161212921143, "step": 1722} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 1722} {"info/global_step": 1723, "train_info/time_within_train_step": 2.7066009044647217, "step": 1723} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 1723} {"info/global_step": 1724, "train_info/time_within_train_step": 2.716747760772705, "step": 1724} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 1724} {"info/global_step": 1725, "train_info/time_within_train_step": 2.6990325450897217, "step": 1725} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1725} {"info/global_step": 1726, "train_info/time_within_train_step": 2.703544855117798, "step": 1726} {"train_info/time_between_train_steps": 0.0036013126373291016, "step": 1726} {"info/global_step": 1727, "train_info/time_within_train_step": 2.705648183822632, "step": 1727} {"train_info/time_between_train_steps": 0.003536224365234375, "step": 1727} {"info/global_step": 1728, "train_info/time_within_train_step": 2.694094181060791, "step": 1728} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 1728} {"info/global_step": 1729, "train_info/time_within_train_step": 2.7212460041046143, "step": 1729} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 1729} {"info/global_step": 1730, "train_info/time_within_train_step": 2.699643850326538, "step": 1730} {"train_info/time_between_train_steps": 0.003481626510620117, "step": 1730} {"info/global_step": 1731, "train_info/time_within_train_step": 2.706027030944824, "step": 1731} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 1731} {"info/global_step": 1732, "train_info/time_within_train_step": 2.739741802215576, "step": 1732} {"train_info/time_between_train_steps": 0.003455638885498047, "step": 1732} {"info/global_step": 1733, "train_info/time_within_train_step": 2.9171111583709717, "step": 1733} {"train_info/time_between_train_steps": 0.003379344940185547, "step": 1733} {"info/global_step": 1734, "train_info/time_within_train_step": 2.6849405765533447, "step": 1734} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 1734} {"info/global_step": 1735, "train_info/time_within_train_step": 2.683255910873413, "step": 1735} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 1735} {"info/global_step": 1736, "train_info/time_within_train_step": 2.6888062953948975, "step": 1736} {"train_info/time_between_train_steps": 0.003546476364135742, "step": 1736} {"info/global_step": 1737, "train_info/time_within_train_step": 2.707749128341675, "step": 1737} {"train_info/time_between_train_steps": 0.0035295486450195312, "step": 1737} {"info/global_step": 1738, "train_info/time_within_train_step": 2.720616579055786, "step": 1738} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 1738} {"info/global_step": 1739, "train_info/time_within_train_step": 2.701524019241333, "step": 1739} {"train_info/time_between_train_steps": 0.0035257339477539062, "step": 1739} {"info/global_step": 1740, "train_info/time_within_train_step": 2.6858131885528564, "step": 1740} {"train_info/time_between_train_steps": 0.0034856796264648438, "step": 1740} {"info/global_step": 1741, "train_info/time_within_train_step": 2.6849679946899414, "step": 1741} {"train_info/time_between_train_steps": 0.0035140514373779297, "step": 1741} {"info/global_step": 1742, "train_info/time_within_train_step": 2.6932554244995117, "step": 1742} {"train_info/time_between_train_steps": 0.003447294235229492, "step": 1742} {"info/global_step": 1743, "train_info/time_within_train_step": 2.710089683532715, "step": 1743} {"train_info/time_between_train_steps": 0.003541707992553711, "step": 1743} {"info/global_step": 1744, "train_info/time_within_train_step": 2.6944825649261475, "step": 1744} {"train_info/time_between_train_steps": 0.0034139156341552734, "step": 1744} {"info/global_step": 1745, "train_info/time_within_train_step": 2.6905922889709473, "step": 1745} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 1745} {"info/global_step": 1746, "train_info/time_within_train_step": 2.7041728496551514, "step": 1746} {"train_info/time_between_train_steps": 0.0034215450286865234, "step": 1746} {"info/global_step": 1747, "train_info/time_within_train_step": 2.687713146209717, "step": 1747} {"train_info/time_between_train_steps": 0.0034875869750976562, "step": 1747} {"info/global_step": 1748, "train_info/time_within_train_step": 2.686237096786499, "step": 1748} {"train_info/time_between_train_steps": 0.003328084945678711, "step": 1748} {"info/global_step": 1749, "train_info/time_within_train_step": 3.270892381668091, "step": 1749} {"train_info/time_between_train_steps": 0.003384113311767578, "step": 1749} {"info/global_step": 1750, "train_info/time_within_train_step": 2.684832811355591, "step": 1750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746316905, "_runtime": 5061}, "step": 1750} {"logs": {"train/loss": 4.4115, "train/learning_rate": 0.0002777777777777778, "train/epoch": 2.01, "_timestamp": 1746316905, "_runtime": 5061}, "step": 1750} {"train_info/time_between_train_steps": 0.02480626106262207, "step": 1750} {"info/global_step": 1751, "train_info/time_within_train_step": 2.6858959197998047, "step": 1751} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 1751} {"info/global_step": 1752, "train_info/time_within_train_step": 2.6854069232940674, "step": 1752} {"train_info/time_between_train_steps": 0.003503561019897461, "step": 1752} {"info/global_step": 1753, "train_info/time_within_train_step": 2.6861469745635986, "step": 1753} {"train_info/time_between_train_steps": 0.003591775894165039, "step": 1753} {"info/global_step": 1754, "train_info/time_within_train_step": 2.6868085861206055, "step": 1754} {"train_info/time_between_train_steps": 0.0033838748931884766, "step": 1754} {"info/global_step": 1755, "train_info/time_within_train_step": 2.68631649017334, "step": 1755} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1755} {"info/global_step": 1756, "train_info/time_within_train_step": 2.68540096282959, "step": 1756} {"train_info/time_between_train_steps": 0.0035614967346191406, "step": 1756} {"info/global_step": 1757, "train_info/time_within_train_step": 2.685448169708252, "step": 1757} {"train_info/time_between_train_steps": 0.0035262107849121094, "step": 1757} {"info/global_step": 1758, "train_info/time_within_train_step": 2.686174154281616, "step": 1758} {"train_info/time_between_train_steps": 0.0034406185150146484, "step": 1758} {"info/global_step": 1759, "train_info/time_within_train_step": 2.685417890548706, "step": 1759} {"train_info/time_between_train_steps": 0.003687620162963867, "step": 1759} {"info/global_step": 1760, "train_info/time_within_train_step": 2.684532880783081, "step": 1760} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 1760} {"info/global_step": 1761, "train_info/time_within_train_step": 2.684558868408203, "step": 1761} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 1761} {"info/global_step": 1762, "train_info/time_within_train_step": 2.683114528656006, "step": 1762} {"train_info/time_between_train_steps": 0.003523588180541992, "step": 1762} {"info/global_step": 1763, "train_info/time_within_train_step": 2.685380458831787, "step": 1763} {"train_info/time_between_train_steps": 0.0034444332122802734, "step": 1763} {"info/global_step": 1764, "train_info/time_within_train_step": 2.6845545768737793, "step": 1764} {"train_info/time_between_train_steps": 0.0035173892974853516, "step": 1764} {"info/global_step": 1765, "train_info/time_within_train_step": 2.684634208679199, "step": 1765} {"train_info/time_between_train_steps": 0.003629922866821289, "step": 1765} {"info/global_step": 1766, "train_info/time_within_train_step": 2.6834301948547363, "step": 1766} {"train_info/time_between_train_steps": 0.0034263134002685547, "step": 1766} {"info/global_step": 1767, "train_info/time_within_train_step": 2.6860718727111816, "step": 1767} {"train_info/time_between_train_steps": 0.003698587417602539, "step": 1767} {"info/global_step": 1768, "train_info/time_within_train_step": 2.6861538887023926, "step": 1768} {"train_info/time_between_train_steps": 0.003642559051513672, "step": 1768} {"info/global_step": 1769, "train_info/time_within_train_step": 2.8157942295074463, "step": 1769} {"train_info/time_between_train_steps": 0.0034384727478027344, "step": 1769} {"info/global_step": 1770, "train_info/time_within_train_step": 2.6854324340820312, "step": 1770} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 1770} {"info/global_step": 1771, "train_info/time_within_train_step": 2.6844828128814697, "step": 1771} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 1771} {"info/global_step": 1772, "train_info/time_within_train_step": 2.685344934463501, "step": 1772} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 1772} {"info/global_step": 1773, "train_info/time_within_train_step": 2.6842894554138184, "step": 1773} {"train_info/time_between_train_steps": 0.0034575462341308594, "step": 1773} {"info/global_step": 1774, "train_info/time_within_train_step": 2.6839542388916016, "step": 1774} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 1774} {"info/global_step": 1775, "train_info/time_within_train_step": 2.684288740158081, "step": 1775} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 1775} {"info/global_step": 1776, "train_info/time_within_train_step": 2.68517804145813, "step": 1776} {"train_info/time_between_train_steps": 0.0035948753356933594, "step": 1776} {"info/global_step": 1777, "train_info/time_within_train_step": 2.6836836338043213, "step": 1777} {"train_info/time_between_train_steps": 0.003486156463623047, "step": 1777} {"info/global_step": 1778, "train_info/time_within_train_step": 2.685420036315918, "step": 1778} {"train_info/time_between_train_steps": 0.0035924911499023438, "step": 1778} {"info/global_step": 1779, "train_info/time_within_train_step": 2.735707998275757, "step": 1779} {"train_info/time_between_train_steps": 0.0034940242767333984, "step": 1779} {"info/global_step": 1780, "train_info/time_within_train_step": 2.6847403049468994, "step": 1780} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 1780} {"info/global_step": 1781, "train_info/time_within_train_step": 2.6840810775756836, "step": 1781} {"train_info/time_between_train_steps": 0.0035545825958251953, "step": 1781} {"info/global_step": 1782, "train_info/time_within_train_step": 2.685412883758545, "step": 1782} {"train_info/time_between_train_steps": 0.0039675235748291016, "step": 1782} {"info/global_step": 1783, "train_info/time_within_train_step": 2.686100482940674, "step": 1783} {"train_info/time_between_train_steps": 0.0035219192504882812, "step": 1783} {"info/global_step": 1784, "train_info/time_within_train_step": 2.6857481002807617, "step": 1784} {"train_info/time_between_train_steps": 0.0034945011138916016, "step": 1784} {"info/global_step": 1785, "train_info/time_within_train_step": 2.6855621337890625, "step": 1785} {"train_info/time_between_train_steps": 0.0034775733947753906, "step": 1785} {"info/global_step": 1786, "train_info/time_within_train_step": 2.6860313415527344, "step": 1786} {"train_info/time_between_train_steps": 0.0035157203674316406, "step": 1786} {"info/global_step": 1787, "train_info/time_within_train_step": 2.6900904178619385, "step": 1787} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 1787} {"info/global_step": 1788, "train_info/time_within_train_step": 2.684591770172119, "step": 1788} {"train_info/time_between_train_steps": 0.0036306381225585938, "step": 1788} {"info/global_step": 1789, "train_info/time_within_train_step": 2.6840667724609375, "step": 1789} {"train_info/time_between_train_steps": 0.003340482711791992, "step": 1789} {"info/global_step": 1790, "train_info/time_within_train_step": 2.6850085258483887, "step": 1790} {"train_info/time_between_train_steps": 0.0034949779510498047, "step": 1790} {"info/global_step": 1791, "train_info/time_within_train_step": 2.6846156120300293, "step": 1791} {"train_info/time_between_train_steps": 0.0035181045532226562, "step": 1791} {"info/global_step": 1792, "train_info/time_within_train_step": 2.6848526000976562, "step": 1792} {"train_info/time_between_train_steps": 0.003930807113647461, "step": 1792} {"info/global_step": 1793, "train_info/time_within_train_step": 2.6846868991851807, "step": 1793} {"train_info/time_between_train_steps": 0.003352642059326172, "step": 1793} {"info/global_step": 1794, "train_info/time_within_train_step": 2.684812307357788, "step": 1794} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 1794} {"info/global_step": 1795, "train_info/time_within_train_step": 2.684800863265991, "step": 1795} {"train_info/time_between_train_steps": 0.003496408462524414, "step": 1795} {"info/global_step": 1796, "train_info/time_within_train_step": 2.68650484085083, "step": 1796} {"train_info/time_between_train_steps": 0.003419637680053711, "step": 1796} {"info/global_step": 1797, "train_info/time_within_train_step": 2.6859915256500244, "step": 1797} {"train_info/time_between_train_steps": 0.0035135746002197266, "step": 1797} {"info/global_step": 1798, "train_info/time_within_train_step": 2.686788320541382, "step": 1798} {"train_info/time_between_train_steps": 0.0033502578735351562, "step": 1798} {"info/global_step": 1799, "train_info/time_within_train_step": 2.6946442127227783, "step": 1799} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 1799} {"info/global_step": 1800, "train_info/time_within_train_step": 2.6850504875183105, "step": 1800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317040, "_runtime": 5196}, "step": 1800} {"logs": {"train/loss": 4.3362, "train/learning_rate": 0.0002666666666666666, "train/epoch": 2.03, "_timestamp": 1746317040, "_runtime": 5196}, "step": 1800} {"train_info/time_between_train_steps": 14.222656011581421, "step": 1800} {"info/global_step": 1801, "train_info/time_within_train_step": 2.4826161861419678, "step": 1801} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 1801} {"info/global_step": 1802, "train_info/time_within_train_step": 2.5064563751220703, "step": 1802} {"train_info/time_between_train_steps": 0.0034165382385253906, "step": 1802} {"info/global_step": 1803, "train_info/time_within_train_step": 2.68222975730896, "step": 1803} {"train_info/time_between_train_steps": 0.003624439239501953, "step": 1803} {"info/global_step": 1804, "train_info/time_within_train_step": 2.6817281246185303, "step": 1804} {"train_info/time_between_train_steps": 0.0035507678985595703, "step": 1804} {"info/global_step": 1805, "train_info/time_within_train_step": 2.682565927505493, "step": 1805} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 1805} {"info/global_step": 1806, "train_info/time_within_train_step": 2.6834261417388916, "step": 1806} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 1806} {"info/global_step": 1807, "train_info/time_within_train_step": 2.6833536624908447, "step": 1807} {"train_info/time_between_train_steps": 0.003610372543334961, "step": 1807} {"info/global_step": 1808, "train_info/time_within_train_step": 2.6842896938323975, "step": 1808} {"train_info/time_between_train_steps": 0.003613710403442383, "step": 1808} {"info/global_step": 1809, "train_info/time_within_train_step": 2.962552785873413, "step": 1809} {"train_info/time_between_train_steps": 0.0036792755126953125, "step": 1809} {"info/global_step": 1810, "train_info/time_within_train_step": 2.6848301887512207, "step": 1810} {"train_info/time_between_train_steps": 0.003295421600341797, "step": 1810} {"info/global_step": 1811, "train_info/time_within_train_step": 2.686152696609497, "step": 1811} {"train_info/time_between_train_steps": 0.003587007522583008, "step": 1811} {"info/global_step": 1812, "train_info/time_within_train_step": 2.6848771572113037, "step": 1812} {"train_info/time_between_train_steps": 0.003554821014404297, "step": 1812} {"info/global_step": 1813, "train_info/time_within_train_step": 2.685757637023926, "step": 1813} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 1813} {"info/global_step": 1814, "train_info/time_within_train_step": 2.6849775314331055, "step": 1814} {"train_info/time_between_train_steps": 0.003476858139038086, "step": 1814} {"info/global_step": 1815, "train_info/time_within_train_step": 2.772965908050537, "step": 1815} {"train_info/time_between_train_steps": 0.0035636425018310547, "step": 1815} {"info/global_step": 1816, "train_info/time_within_train_step": 2.797471523284912, "step": 1816} {"train_info/time_between_train_steps": 0.0036792755126953125, "step": 1816} {"info/global_step": 1817, "train_info/time_within_train_step": 2.7576191425323486, "step": 1817} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 1817} {"info/global_step": 1818, "train_info/time_within_train_step": 2.7148470878601074, "step": 1818} {"train_info/time_between_train_steps": 0.003464937210083008, "step": 1818} {"info/global_step": 1819, "train_info/time_within_train_step": 2.722609758377075, "step": 1819} {"train_info/time_between_train_steps": 0.0034101009368896484, "step": 1819} {"info/global_step": 1820, "train_info/time_within_train_step": 2.701298713684082, "step": 1820} {"train_info/time_between_train_steps": 0.0034401416778564453, "step": 1820} {"info/global_step": 1821, "train_info/time_within_train_step": 2.724086046218872, "step": 1821} {"train_info/time_between_train_steps": 0.0034296512603759766, "step": 1821} {"info/global_step": 1822, "train_info/time_within_train_step": 2.7256054878234863, "step": 1822} {"train_info/time_between_train_steps": 0.003677845001220703, "step": 1822} {"info/global_step": 1823, "train_info/time_within_train_step": 2.706378698348999, "step": 1823} {"train_info/time_between_train_steps": 0.0035507678985595703, "step": 1823} {"info/global_step": 1824, "train_info/time_within_train_step": 2.7025792598724365, "step": 1824} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 1824} {"info/global_step": 1825, "train_info/time_within_train_step": 2.706692934036255, "step": 1825} {"train_info/time_between_train_steps": 0.0036427974700927734, "step": 1825} {"info/global_step": 1826, "train_info/time_within_train_step": 2.7249133586883545, "step": 1826} {"train_info/time_between_train_steps": 0.0035505294799804688, "step": 1826} {"info/global_step": 1827, "train_info/time_within_train_step": 2.7193989753723145, "step": 1827} {"train_info/time_between_train_steps": 0.0033080577850341797, "step": 1827} {"info/global_step": 1828, "train_info/time_within_train_step": 2.687588930130005, "step": 1828} {"train_info/time_between_train_steps": 0.0033347606658935547, "step": 1828} {"info/global_step": 1829, "train_info/time_within_train_step": 2.7105295658111572, "step": 1829} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 1829} {"info/global_step": 1830, "train_info/time_within_train_step": 2.7006540298461914, "step": 1830} {"train_info/time_between_train_steps": 0.0035161972045898438, "step": 1830} {"info/global_step": 1831, "train_info/time_within_train_step": 2.689042568206787, "step": 1831} {"train_info/time_between_train_steps": 0.1435987949371338, "step": 1831} {"info/global_step": 1832, "train_info/time_within_train_step": 2.6855344772338867, "step": 1832} {"train_info/time_between_train_steps": 0.0034456253051757812, "step": 1832} {"info/global_step": 1833, "train_info/time_within_train_step": 2.698965072631836, "step": 1833} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 1833} {"info/global_step": 1834, "train_info/time_within_train_step": 2.7224812507629395, "step": 1834} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 1834} {"info/global_step": 1835, "train_info/time_within_train_step": 2.6840198040008545, "step": 1835} {"train_info/time_between_train_steps": 0.003522634506225586, "step": 1835} {"info/global_step": 1836, "train_info/time_within_train_step": 2.6840739250183105, "step": 1836} {"train_info/time_between_train_steps": 0.003559112548828125, "step": 1836} {"info/global_step": 1837, "train_info/time_within_train_step": 2.6862194538116455, "step": 1837} {"train_info/time_between_train_steps": 0.0034215450286865234, "step": 1837} {"info/global_step": 1838, "train_info/time_within_train_step": 2.715759515762329, "step": 1838} {"train_info/time_between_train_steps": 0.003460407257080078, "step": 1838} {"info/global_step": 1839, "train_info/time_within_train_step": 2.7175397872924805, "step": 1839} {"train_info/time_between_train_steps": 0.0035102367401123047, "step": 1839} {"info/global_step": 1840, "train_info/time_within_train_step": 2.70231032371521, "step": 1840} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 1840} {"info/global_step": 1841, "train_info/time_within_train_step": 2.6980414390563965, "step": 1841} {"train_info/time_between_train_steps": 0.0034630298614501953, "step": 1841} {"info/global_step": 1842, "train_info/time_within_train_step": 2.6859254837036133, "step": 1842} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 1842} {"info/global_step": 1843, "train_info/time_within_train_step": 2.69541335105896, "step": 1843} {"train_info/time_between_train_steps": 0.003479480743408203, "step": 1843} {"info/global_step": 1844, "train_info/time_within_train_step": 2.7092318534851074, "step": 1844} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 1844} {"info/global_step": 1845, "train_info/time_within_train_step": 2.685316801071167, "step": 1845} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 1845} {"info/global_step": 1846, "train_info/time_within_train_step": 2.6856017112731934, "step": 1846} {"train_info/time_between_train_steps": 0.003363370895385742, "step": 1846} {"info/global_step": 1847, "train_info/time_within_train_step": 2.702540874481201, "step": 1847} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 1847} {"info/global_step": 1848, "train_info/time_within_train_step": 2.704012870788574, "step": 1848} {"train_info/time_between_train_steps": 0.003509521484375, "step": 1848} {"info/global_step": 1849, "train_info/time_within_train_step": 2.684298515319824, "step": 1849} {"train_info/time_between_train_steps": 0.0036406517028808594, "step": 1849} {"info/global_step": 1850, "train_info/time_within_train_step": 2.685593605041504, "step": 1850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317191, "_runtime": 5347}, "step": 1850} {"logs": {"train/loss": 4.3169, "train/learning_rate": 0.00025555555555555553, "train/epoch": 2.05, "_timestamp": 1746317191, "_runtime": 5347}, "step": 1850} {"train_info/time_between_train_steps": 0.02561783790588379, "step": 1850} {"info/global_step": 1851, "train_info/time_within_train_step": 2.6846392154693604, "step": 1851} {"train_info/time_between_train_steps": 0.0033707618713378906, "step": 1851} {"info/global_step": 1852, "train_info/time_within_train_step": 2.684387445449829, "step": 1852} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 1852} {"info/global_step": 1853, "train_info/time_within_train_step": 2.684305429458618, "step": 1853} {"train_info/time_between_train_steps": 0.003503561019897461, "step": 1853} {"info/global_step": 1854, "train_info/time_within_train_step": 2.690308094024658, "step": 1854} {"train_info/time_between_train_steps": 0.0035653114318847656, "step": 1854} {"info/global_step": 1855, "train_info/time_within_train_step": 2.691513776779175, "step": 1855} {"train_info/time_between_train_steps": 0.003656148910522461, "step": 1855} {"info/global_step": 1856, "train_info/time_within_train_step": 2.6922268867492676, "step": 1856} {"train_info/time_between_train_steps": 0.0035941600799560547, "step": 1856} {"info/global_step": 1857, "train_info/time_within_train_step": 2.684765338897705, "step": 1857} {"train_info/time_between_train_steps": 0.0034515857696533203, "step": 1857} {"info/global_step": 1858, "train_info/time_within_train_step": 2.685438871383667, "step": 1858} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 1858} {"info/global_step": 1859, "train_info/time_within_train_step": 2.6932826042175293, "step": 1859} {"train_info/time_between_train_steps": 0.003668069839477539, "step": 1859} {"info/global_step": 1860, "train_info/time_within_train_step": 2.6854913234710693, "step": 1860} {"train_info/time_between_train_steps": 0.0034759044647216797, "step": 1860} {"info/global_step": 1861, "train_info/time_within_train_step": 2.687136173248291, "step": 1861} {"train_info/time_between_train_steps": 0.003526926040649414, "step": 1861} {"info/global_step": 1862, "train_info/time_within_train_step": 2.6852753162384033, "step": 1862} {"train_info/time_between_train_steps": 0.0036096572875976562, "step": 1862} {"info/global_step": 1863, "train_info/time_within_train_step": 2.7417356967926025, "step": 1863} {"train_info/time_between_train_steps": 0.0037636756896972656, "step": 1863} {"info/global_step": 1864, "train_info/time_within_train_step": 2.6852471828460693, "step": 1864} {"train_info/time_between_train_steps": 0.003421783447265625, "step": 1864} {"info/global_step": 1865, "train_info/time_within_train_step": 2.686588764190674, "step": 1865} {"train_info/time_between_train_steps": 0.0037343502044677734, "step": 1865} {"info/global_step": 1866, "train_info/time_within_train_step": 2.68750262260437, "step": 1866} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 1866} {"info/global_step": 1867, "train_info/time_within_train_step": 2.6872050762176514, "step": 1867} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 1867} {"info/global_step": 1868, "train_info/time_within_train_step": 2.685755968093872, "step": 1868} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 1868} {"info/global_step": 1869, "train_info/time_within_train_step": 2.6855051517486572, "step": 1869} {"train_info/time_between_train_steps": 0.0033721923828125, "step": 1869} {"info/global_step": 1870, "train_info/time_within_train_step": 2.6851649284362793, "step": 1870} {"train_info/time_between_train_steps": 0.003551006317138672, "step": 1870} {"info/global_step": 1871, "train_info/time_within_train_step": 2.6847426891326904, "step": 1871} {"train_info/time_between_train_steps": 0.0034830570220947266, "step": 1871} {"info/global_step": 1872, "train_info/time_within_train_step": 2.6838486194610596, "step": 1872} {"train_info/time_between_train_steps": 0.0036411285400390625, "step": 1872} {"info/global_step": 1873, "train_info/time_within_train_step": 2.684536933898926, "step": 1873} {"train_info/time_between_train_steps": 0.0033044815063476562, "step": 1873} {"info/global_step": 1874, "train_info/time_within_train_step": 2.6838645935058594, "step": 1874} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 1874} {"info/global_step": 1875, "train_info/time_within_train_step": 2.6843996047973633, "step": 1875} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 1875} {"info/global_step": 1876, "train_info/time_within_train_step": 2.6850132942199707, "step": 1876} {"train_info/time_between_train_steps": 0.0032639503479003906, "step": 1876} {"info/global_step": 1877, "train_info/time_within_train_step": 2.705997943878174, "step": 1877} {"train_info/time_between_train_steps": 0.0034072399139404297, "step": 1877} {"info/global_step": 1878, "train_info/time_within_train_step": 2.683379650115967, "step": 1878} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 1878} {"info/global_step": 1879, "train_info/time_within_train_step": 2.683929443359375, "step": 1879} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 1879} {"info/global_step": 1880, "train_info/time_within_train_step": 2.6842525005340576, "step": 1880} {"train_info/time_between_train_steps": 0.003404855728149414, "step": 1880} {"info/global_step": 1881, "train_info/time_within_train_step": 2.6836605072021484, "step": 1881} {"train_info/time_between_train_steps": 0.003373384475708008, "step": 1881} {"info/global_step": 1882, "train_info/time_within_train_step": 2.6833982467651367, "step": 1882} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 1882} {"info/global_step": 1883, "train_info/time_within_train_step": 2.684075355529785, "step": 1883} {"train_info/time_between_train_steps": 0.003447294235229492, "step": 1883} {"info/global_step": 1884, "train_info/time_within_train_step": 2.683598756790161, "step": 1884} {"train_info/time_between_train_steps": 0.0034198760986328125, "step": 1884} {"info/global_step": 1885, "train_info/time_within_train_step": 2.683426856994629, "step": 1885} {"train_info/time_between_train_steps": 0.0035037994384765625, "step": 1885} {"info/global_step": 1886, "train_info/time_within_train_step": 2.683016538619995, "step": 1886} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 1886} {"info/global_step": 1887, "train_info/time_within_train_step": 2.680969715118408, "step": 1887} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 1887} {"info/global_step": 1888, "train_info/time_within_train_step": 2.681004762649536, "step": 1888} {"train_info/time_between_train_steps": 0.0034852027893066406, "step": 1888} {"info/global_step": 1889, "train_info/time_within_train_step": 2.6819634437561035, "step": 1889} {"train_info/time_between_train_steps": 0.003322124481201172, "step": 1889} {"info/global_step": 1890, "train_info/time_within_train_step": 2.6823036670684814, "step": 1890} {"train_info/time_between_train_steps": 0.0035026073455810547, "step": 1890} {"info/global_step": 1891, "train_info/time_within_train_step": 2.6848666667938232, "step": 1891} {"train_info/time_between_train_steps": 0.003690481185913086, "step": 1891} {"info/global_step": 1892, "train_info/time_within_train_step": 2.685326337814331, "step": 1892} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 1892} {"info/global_step": 1893, "train_info/time_within_train_step": 2.683234214782715, "step": 1893} {"train_info/time_between_train_steps": 0.0035419464111328125, "step": 1893} {"info/global_step": 1894, "train_info/time_within_train_step": 2.8227484226226807, "step": 1894} {"train_info/time_between_train_steps": 0.003514528274536133, "step": 1894} {"info/global_step": 1895, "train_info/time_within_train_step": 2.9579930305480957, "step": 1895} {"train_info/time_between_train_steps": 0.0034792423248291016, "step": 1895} {"info/global_step": 1896, "train_info/time_within_train_step": 2.6852521896362305, "step": 1896} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 1896} {"info/global_step": 1897, "train_info/time_within_train_step": 2.684717893600464, "step": 1897} {"train_info/time_between_train_steps": 0.003557920455932617, "step": 1897} {"info/global_step": 1898, "train_info/time_within_train_step": 2.6850597858428955, "step": 1898} {"train_info/time_between_train_steps": 0.0034656524658203125, "step": 1898} {"info/global_step": 1899, "train_info/time_within_train_step": 2.7080118656158447, "step": 1899} {"train_info/time_between_train_steps": 0.0036382675170898438, "step": 1899} {"info/global_step": 1900, "train_info/time_within_train_step": 2.684600591659546, "step": 1900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317327, "_runtime": 5483}, "step": 1900} {"logs": {"train/loss": 4.2983, "train/learning_rate": 0.00024444444444444443, "train/epoch": 2.06, "_timestamp": 1746317327, "_runtime": 5483}, "step": 1900} {"train_info/time_between_train_steps": 13.234197854995728, "step": 1900} {"info/global_step": 1901, "train_info/time_within_train_step": 2.4869208335876465, "step": 1901} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 1901} {"info/global_step": 1902, "train_info/time_within_train_step": 2.50335431098938, "step": 1902} {"train_info/time_between_train_steps": 0.003281116485595703, "step": 1902} {"info/global_step": 1903, "train_info/time_within_train_step": 2.6806068420410156, "step": 1903} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 1903} {"info/global_step": 1904, "train_info/time_within_train_step": 2.6806480884552, "step": 1904} {"train_info/time_between_train_steps": 0.0033724308013916016, "step": 1904} {"info/global_step": 1905, "train_info/time_within_train_step": 2.6824088096618652, "step": 1905} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 1905} {"info/global_step": 1906, "train_info/time_within_train_step": 2.691675901412964, "step": 1906} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1906} {"info/global_step": 1907, "train_info/time_within_train_step": 2.6819167137145996, "step": 1907} {"train_info/time_between_train_steps": 0.003341197967529297, "step": 1907} {"info/global_step": 1908, "train_info/time_within_train_step": 2.681642532348633, "step": 1908} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 1908} {"info/global_step": 1909, "train_info/time_within_train_step": 2.6822617053985596, "step": 1909} {"train_info/time_between_train_steps": 0.00341033935546875, "step": 1909} {"info/global_step": 1910, "train_info/time_within_train_step": 2.6841955184936523, "step": 1910} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 1910} {"info/global_step": 1911, "train_info/time_within_train_step": 2.683440685272217, "step": 1911} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 1911} {"info/global_step": 1912, "train_info/time_within_train_step": 2.6828458309173584, "step": 1912} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 1912} {"info/global_step": 1913, "train_info/time_within_train_step": 2.683438539505005, "step": 1913} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 1913} {"info/global_step": 1914, "train_info/time_within_train_step": 2.737934112548828, "step": 1914} {"train_info/time_between_train_steps": 0.003259420394897461, "step": 1914} {"info/global_step": 1915, "train_info/time_within_train_step": 2.857356071472168, "step": 1915} {"train_info/time_between_train_steps": 0.0034646987915039062, "step": 1915} {"info/global_step": 1916, "train_info/time_within_train_step": 2.792332410812378, "step": 1916} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 1916} {"info/global_step": 1917, "train_info/time_within_train_step": 2.7366843223571777, "step": 1917} {"train_info/time_between_train_steps": 0.003386259078979492, "step": 1917} {"info/global_step": 1918, "train_info/time_within_train_step": 2.6954798698425293, "step": 1918} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 1918} {"info/global_step": 1919, "train_info/time_within_train_step": 2.7147843837738037, "step": 1919} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 1919} {"info/global_step": 1920, "train_info/time_within_train_step": 2.7156319618225098, "step": 1920} {"train_info/time_between_train_steps": 0.0034728050231933594, "step": 1920} {"info/global_step": 1921, "train_info/time_within_train_step": 2.6862714290618896, "step": 1921} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 1921} {"info/global_step": 1922, "train_info/time_within_train_step": 2.7158708572387695, "step": 1922} {"train_info/time_between_train_steps": 0.003896951675415039, "step": 1922} {"info/global_step": 1923, "train_info/time_within_train_step": 2.71631121635437, "step": 1923} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 1923} {"info/global_step": 1924, "train_info/time_within_train_step": 2.6943256855010986, "step": 1924} {"train_info/time_between_train_steps": 0.003344297409057617, "step": 1924} {"info/global_step": 1925, "train_info/time_within_train_step": 2.702528238296509, "step": 1925} {"train_info/time_between_train_steps": 0.003519773483276367, "step": 1925} {"info/global_step": 1926, "train_info/time_within_train_step": 2.7146005630493164, "step": 1926} {"train_info/time_between_train_steps": 0.003327608108520508, "step": 1926} {"info/global_step": 1927, "train_info/time_within_train_step": 2.692298173904419, "step": 1927} {"train_info/time_between_train_steps": 0.0035257339477539062, "step": 1927} {"info/global_step": 1928, "train_info/time_within_train_step": 2.6970858573913574, "step": 1928} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 1928} {"info/global_step": 1929, "train_info/time_within_train_step": 2.706026315689087, "step": 1929} {"train_info/time_between_train_steps": 0.0035581588745117188, "step": 1929} {"info/global_step": 1930, "train_info/time_within_train_step": 2.7107768058776855, "step": 1930} {"train_info/time_between_train_steps": 0.003389596939086914, "step": 1930} {"info/global_step": 1931, "train_info/time_within_train_step": 2.7151505947113037, "step": 1931} {"train_info/time_between_train_steps": 0.0034515857696533203, "step": 1931} {"info/global_step": 1932, "train_info/time_within_train_step": 2.7054402828216553, "step": 1932} {"train_info/time_between_train_steps": 0.0033173561096191406, "step": 1932} {"info/global_step": 1933, "train_info/time_within_train_step": 2.692338228225708, "step": 1933} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 1933} {"info/global_step": 1934, "train_info/time_within_train_step": 2.6908950805664062, "step": 1934} {"train_info/time_between_train_steps": 0.0032927989959716797, "step": 1934} {"info/global_step": 1935, "train_info/time_within_train_step": 2.6951804161071777, "step": 1935} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 1935} {"info/global_step": 1936, "train_info/time_within_train_step": 2.703995943069458, "step": 1936} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 1936} {"info/global_step": 1937, "train_info/time_within_train_step": 2.705829381942749, "step": 1937} {"train_info/time_between_train_steps": 0.0035774707794189453, "step": 1937} {"info/global_step": 1938, "train_info/time_within_train_step": 2.6949446201324463, "step": 1938} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 1938} {"info/global_step": 1939, "train_info/time_within_train_step": 2.7040021419525146, "step": 1939} {"train_info/time_between_train_steps": 0.003682374954223633, "step": 1939} {"info/global_step": 1940, "train_info/time_within_train_step": 2.6855382919311523, "step": 1940} {"train_info/time_between_train_steps": 0.003796100616455078, "step": 1940} {"info/global_step": 1941, "train_info/time_within_train_step": 2.710177183151245, "step": 1941} {"train_info/time_between_train_steps": 0.0038242340087890625, "step": 1941} {"info/global_step": 1942, "train_info/time_within_train_step": 2.6995558738708496, "step": 1942} {"train_info/time_between_train_steps": 0.0038461685180664062, "step": 1942} {"info/global_step": 1943, "train_info/time_within_train_step": 2.686410903930664, "step": 1943} {"train_info/time_between_train_steps": 0.00393986701965332, "step": 1943} {"info/global_step": 1944, "train_info/time_within_train_step": 2.6877570152282715, "step": 1944} {"train_info/time_between_train_steps": 0.003938436508178711, "step": 1944} {"info/global_step": 1945, "train_info/time_within_train_step": 2.6871559619903564, "step": 1945} {"train_info/time_between_train_steps": 0.003933906555175781, "step": 1945} {"info/global_step": 1946, "train_info/time_within_train_step": 2.6886816024780273, "step": 1946} {"train_info/time_between_train_steps": 0.0038802623748779297, "step": 1946} {"info/global_step": 1947, "train_info/time_within_train_step": 2.699428081512451, "step": 1947} {"train_info/time_between_train_steps": 0.0039031505584716797, "step": 1947} {"info/global_step": 1948, "train_info/time_within_train_step": 2.6953442096710205, "step": 1948} {"train_info/time_between_train_steps": 0.003934383392333984, "step": 1948} {"info/global_step": 1949, "train_info/time_within_train_step": 2.693758010864258, "step": 1949} {"train_info/time_between_train_steps": 0.003954887390136719, "step": 1949} {"info/global_step": 1950, "train_info/time_within_train_step": 2.6875343322753906, "step": 1950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317476, "_runtime": 5632}, "step": 1950} {"logs": {"train/loss": 4.2758, "train/learning_rate": 0.0002333333333333333, "train/epoch": 2.08, "_timestamp": 1746317476, "_runtime": 5632}, "step": 1950} {"train_info/time_between_train_steps": 0.025689125061035156, "step": 1950} {"info/global_step": 1951, "train_info/time_within_train_step": 2.6864395141601562, "step": 1951} {"train_info/time_between_train_steps": 0.00371551513671875, "step": 1951} {"info/global_step": 1952, "train_info/time_within_train_step": 2.693258285522461, "step": 1952} {"train_info/time_between_train_steps": 0.00400233268737793, "step": 1952} {"info/global_step": 1953, "train_info/time_within_train_step": 2.687340021133423, "step": 1953} {"train_info/time_between_train_steps": 0.0037784576416015625, "step": 1953} {"info/global_step": 1954, "train_info/time_within_train_step": 2.687222719192505, "step": 1954} {"train_info/time_between_train_steps": 0.0038154125213623047, "step": 1954} {"info/global_step": 1955, "train_info/time_within_train_step": 2.686678647994995, "step": 1955} {"train_info/time_between_train_steps": 0.003769397735595703, "step": 1955} {"info/global_step": 1956, "train_info/time_within_train_step": 2.6983630657196045, "step": 1956} {"train_info/time_between_train_steps": 0.19093871116638184, "step": 1956} {"info/global_step": 1957, "train_info/time_within_train_step": 2.6888082027435303, "step": 1957} {"train_info/time_between_train_steps": 0.003589153289794922, "step": 1957} {"info/global_step": 1958, "train_info/time_within_train_step": 2.6863620281219482, "step": 1958} {"train_info/time_between_train_steps": 0.0035789012908935547, "step": 1958} {"info/global_step": 1959, "train_info/time_within_train_step": 2.685786724090576, "step": 1959} {"train_info/time_between_train_steps": 0.003537893295288086, "step": 1959} {"info/global_step": 1960, "train_info/time_within_train_step": 2.687533140182495, "step": 1960} {"train_info/time_between_train_steps": 0.0035703182220458984, "step": 1960} {"info/global_step": 1961, "train_info/time_within_train_step": 2.685946226119995, "step": 1961} {"train_info/time_between_train_steps": 0.003600597381591797, "step": 1961} {"info/global_step": 1962, "train_info/time_within_train_step": 2.6874969005584717, "step": 1962} {"train_info/time_between_train_steps": 0.003701925277709961, "step": 1962} {"info/global_step": 1963, "train_info/time_within_train_step": 2.6868698596954346, "step": 1963} {"train_info/time_between_train_steps": 0.0036449432373046875, "step": 1963} {"info/global_step": 1964, "train_info/time_within_train_step": 2.6863114833831787, "step": 1964} {"train_info/time_between_train_steps": 0.0036215782165527344, "step": 1964} {"info/global_step": 1965, "train_info/time_within_train_step": 2.6857872009277344, "step": 1965} {"train_info/time_between_train_steps": 0.0034656524658203125, "step": 1965} {"info/global_step": 1966, "train_info/time_within_train_step": 2.6862926483154297, "step": 1966} {"train_info/time_between_train_steps": 0.0034918785095214844, "step": 1966} {"info/global_step": 1967, "train_info/time_within_train_step": 2.686908721923828, "step": 1967} {"train_info/time_between_train_steps": 0.0034003257751464844, "step": 1967} {"info/global_step": 1968, "train_info/time_within_train_step": 2.689852714538574, "step": 1968} {"train_info/time_between_train_steps": 0.0035271644592285156, "step": 1968} {"info/global_step": 1969, "train_info/time_within_train_step": 2.7363028526306152, "step": 1969} {"train_info/time_between_train_steps": 0.0034503936767578125, "step": 1969} {"info/global_step": 1970, "train_info/time_within_train_step": 2.6839635372161865, "step": 1970} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 1970} {"info/global_step": 1971, "train_info/time_within_train_step": 2.6851859092712402, "step": 1971} {"train_info/time_between_train_steps": 0.003570556640625, "step": 1971} {"info/global_step": 1972, "train_info/time_within_train_step": 2.685068368911743, "step": 1972} {"train_info/time_between_train_steps": 0.004171848297119141, "step": 1972} {"info/global_step": 1973, "train_info/time_within_train_step": 2.6859195232391357, "step": 1973} {"train_info/time_between_train_steps": 0.00330352783203125, "step": 1973} {"info/global_step": 1974, "train_info/time_within_train_step": 2.6847639083862305, "step": 1974} {"train_info/time_between_train_steps": 0.003551483154296875, "step": 1974} {"info/global_step": 1975, "train_info/time_within_train_step": 2.6851537227630615, "step": 1975} {"train_info/time_between_train_steps": 0.0035185813903808594, "step": 1975} {"info/global_step": 1976, "train_info/time_within_train_step": 2.690059185028076, "step": 1976} {"train_info/time_between_train_steps": 0.0035152435302734375, "step": 1976} {"info/global_step": 1977, "train_info/time_within_train_step": 2.6836602687835693, "step": 1977} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 1977} {"info/global_step": 1978, "train_info/time_within_train_step": 3.0078744888305664, "step": 1978} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 1978} {"info/global_step": 1979, "train_info/time_within_train_step": 2.685211181640625, "step": 1979} {"train_info/time_between_train_steps": 0.0036368370056152344, "step": 1979} {"info/global_step": 1980, "train_info/time_within_train_step": 2.6850991249084473, "step": 1980} {"train_info/time_between_train_steps": 0.003601551055908203, "step": 1980} {"info/global_step": 1981, "train_info/time_within_train_step": 2.685178518295288, "step": 1981} {"train_info/time_between_train_steps": 0.003603696823120117, "step": 1981} {"info/global_step": 1982, "train_info/time_within_train_step": 2.6859023571014404, "step": 1982} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 1982} {"info/global_step": 1983, "train_info/time_within_train_step": 2.684828281402588, "step": 1983} {"train_info/time_between_train_steps": 0.003652811050415039, "step": 1983} {"info/global_step": 1984, "train_info/time_within_train_step": 2.685087203979492, "step": 1984} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 1984} {"info/global_step": 1985, "train_info/time_within_train_step": 2.6845545768737793, "step": 1985} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 1985} {"info/global_step": 1986, "train_info/time_within_train_step": 2.6866800785064697, "step": 1986} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 1986} {"info/global_step": 1987, "train_info/time_within_train_step": 2.685990333557129, "step": 1987} {"train_info/time_between_train_steps": 0.003464221954345703, "step": 1987} {"info/global_step": 1988, "train_info/time_within_train_step": 2.684389114379883, "step": 1988} {"train_info/time_between_train_steps": 0.003542661666870117, "step": 1988} {"info/global_step": 1989, "train_info/time_within_train_step": 2.6860058307647705, "step": 1989} {"train_info/time_between_train_steps": 0.0036089420318603516, "step": 1989} {"info/global_step": 1990, "train_info/time_within_train_step": 2.6899547576904297, "step": 1990} {"train_info/time_between_train_steps": 0.0033850669860839844, "step": 1990} {"info/global_step": 1991, "train_info/time_within_train_step": 2.7363953590393066, "step": 1991} {"train_info/time_between_train_steps": 0.003468751907348633, "step": 1991} {"info/global_step": 1992, "train_info/time_within_train_step": 2.685154438018799, "step": 1992} {"train_info/time_between_train_steps": 0.003401517868041992, "step": 1992} {"info/global_step": 1993, "train_info/time_within_train_step": 2.6850507259368896, "step": 1993} {"train_info/time_between_train_steps": 0.003579854965209961, "step": 1993} {"info/global_step": 1994, "train_info/time_within_train_step": 2.6845574378967285, "step": 1994} {"train_info/time_between_train_steps": 0.003674030303955078, "step": 1994} {"info/global_step": 1995, "train_info/time_within_train_step": 2.6837880611419678, "step": 1995} {"train_info/time_between_train_steps": 0.003520965576171875, "step": 1995} {"info/global_step": 1996, "train_info/time_within_train_step": 2.6844048500061035, "step": 1996} {"train_info/time_between_train_steps": 0.0034236907958984375, "step": 1996} {"info/global_step": 1997, "train_info/time_within_train_step": 2.6861321926116943, "step": 1997} {"train_info/time_between_train_steps": 0.0033540725708007812, "step": 1997} {"info/global_step": 1998, "train_info/time_within_train_step": 2.6904375553131104, "step": 1998} {"train_info/time_between_train_steps": 0.0036993026733398438, "step": 1998} {"info/global_step": 1999, "train_info/time_within_train_step": 3.2745513916015625, "step": 1999} {"train_info/time_between_train_steps": 0.0034759044647216797, "step": 1999} {"info/global_step": 2000, "train_info/time_within_train_step": 2.684952735900879, "step": 2000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317613, "_runtime": 5769}, "step": 2000} {"logs": {"train/loss": 4.2496, "train/learning_rate": 0.00022222222222222218, "train/epoch": 2.1, "_timestamp": 1746317613, "_runtime": 5769}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317618, "_runtime": 5774}, "step": 2000} {"logs": {"eval/loss": 4.77055549621582, "eval/runtime": 5.2303, "eval/samples_per_second": 36.327, "eval/steps_per_second": 1.147, "train/epoch": 2.1, "_timestamp": 1746317618, "_runtime": 5774}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317618, "_runtime": 5774}, "step": 2000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.77055549621582, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 117.9847638502482, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.2303, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.327, "train/epoch": 2.1, "_timestamp": 1746317618, "_runtime": 5774}, "step": 2000} {"train_info/time_between_train_steps": 25.552340745925903, "step": 2000} {"info/global_step": 2001, "train_info/time_within_train_step": 2.479109764099121, "step": 2001} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 2001} {"info/global_step": 2002, "train_info/time_within_train_step": 2.471436023712158, "step": 2002} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 2002} {"info/global_step": 2003, "train_info/time_within_train_step": 2.6594529151916504, "step": 2003} {"train_info/time_between_train_steps": 0.0032951831817626953, "step": 2003} {"info/global_step": 2004, "train_info/time_within_train_step": 2.6798722743988037, "step": 2004} {"train_info/time_between_train_steps": 0.003269672393798828, "step": 2004} {"info/global_step": 2005, "train_info/time_within_train_step": 2.6806952953338623, "step": 2005} {"train_info/time_between_train_steps": 0.0034089088439941406, "step": 2005} {"info/global_step": 2006, "train_info/time_within_train_step": 2.683316707611084, "step": 2006} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 2006} {"info/global_step": 2007, "train_info/time_within_train_step": 2.683124542236328, "step": 2007} {"train_info/time_between_train_steps": 0.003922700881958008, "step": 2007} {"info/global_step": 2008, "train_info/time_within_train_step": 2.6825177669525146, "step": 2008} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 2008} {"info/global_step": 2009, "train_info/time_within_train_step": 2.683776378631592, "step": 2009} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 2009} {"info/global_step": 2010, "train_info/time_within_train_step": 2.684330463409424, "step": 2010} {"train_info/time_between_train_steps": 0.0032961368560791016, "step": 2010} {"info/global_step": 2011, "train_info/time_within_train_step": 2.6838014125823975, "step": 2011} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 2011} {"info/global_step": 2012, "train_info/time_within_train_step": 2.684365749359131, "step": 2012} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 2012} {"info/global_step": 2013, "train_info/time_within_train_step": 2.684755563735962, "step": 2013} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 2013} {"info/global_step": 2014, "train_info/time_within_train_step": 2.6845479011535645, "step": 2014} {"train_info/time_between_train_steps": 0.0034575462341308594, "step": 2014} {"info/global_step": 2015, "train_info/time_within_train_step": 2.7113234996795654, "step": 2015} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 2015} {"info/global_step": 2016, "train_info/time_within_train_step": 2.808821678161621, "step": 2016} {"train_info/time_between_train_steps": 0.0035774707794189453, "step": 2016} {"info/global_step": 2017, "train_info/time_within_train_step": 2.745055913925171, "step": 2017} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 2017} {"info/global_step": 2018, "train_info/time_within_train_step": 2.7037363052368164, "step": 2018} {"train_info/time_between_train_steps": 0.003636598587036133, "step": 2018} {"info/global_step": 2019, "train_info/time_within_train_step": 2.907536506652832, "step": 2019} {"train_info/time_between_train_steps": 0.003569364547729492, "step": 2019} {"info/global_step": 2020, "train_info/time_within_train_step": 2.6861560344696045, "step": 2020} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 2020} {"info/global_step": 2021, "train_info/time_within_train_step": 3.0034730434417725, "step": 2021} {"train_info/time_between_train_steps": 0.0036211013793945312, "step": 2021} {"info/global_step": 2022, "train_info/time_within_train_step": 2.6858012676239014, "step": 2022} {"train_info/time_between_train_steps": 0.0034313201904296875, "step": 2022} {"info/global_step": 2023, "train_info/time_within_train_step": 2.6841752529144287, "step": 2023} {"train_info/time_between_train_steps": 0.0035529136657714844, "step": 2023} {"info/global_step": 2024, "train_info/time_within_train_step": 2.6971776485443115, "step": 2024} {"train_info/time_between_train_steps": 0.0037698745727539062, "step": 2024} {"info/global_step": 2025, "train_info/time_within_train_step": 2.7092325687408447, "step": 2025} {"train_info/time_between_train_steps": 0.004261016845703125, "step": 2025} {"info/global_step": 2026, "train_info/time_within_train_step": 2.7111971378326416, "step": 2026} {"train_info/time_between_train_steps": 0.0034558773040771484, "step": 2026} {"info/global_step": 2027, "train_info/time_within_train_step": 2.706815719604492, "step": 2027} {"train_info/time_between_train_steps": 0.003584146499633789, "step": 2027} {"info/global_step": 2028, "train_info/time_within_train_step": 2.7050225734710693, "step": 2028} {"train_info/time_between_train_steps": 0.003499746322631836, "step": 2028} {"info/global_step": 2029, "train_info/time_within_train_step": 2.7162182331085205, "step": 2029} {"train_info/time_between_train_steps": 0.0036530494689941406, "step": 2029} {"info/global_step": 2030, "train_info/time_within_train_step": 2.704942464828491, "step": 2030} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 2030} {"info/global_step": 2031, "train_info/time_within_train_step": 2.7065999507904053, "step": 2031} {"train_info/time_between_train_steps": 0.003584623336791992, "step": 2031} {"info/global_step": 2032, "train_info/time_within_train_step": 2.6858718395233154, "step": 2032} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 2032} {"info/global_step": 2033, "train_info/time_within_train_step": 2.696031332015991, "step": 2033} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 2033} {"info/global_step": 2034, "train_info/time_within_train_step": 2.7244367599487305, "step": 2034} {"train_info/time_between_train_steps": 0.0035238265991210938, "step": 2034} {"info/global_step": 2035, "train_info/time_within_train_step": 2.687504529953003, "step": 2035} {"train_info/time_between_train_steps": 0.0035986900329589844, "step": 2035} {"info/global_step": 2036, "train_info/time_within_train_step": 2.6868863105773926, "step": 2036} {"train_info/time_between_train_steps": 0.0036373138427734375, "step": 2036} {"info/global_step": 2037, "train_info/time_within_train_step": 2.715867519378662, "step": 2037} {"train_info/time_between_train_steps": 0.0035500526428222656, "step": 2037} {"info/global_step": 2038, "train_info/time_within_train_step": 2.685149669647217, "step": 2038} {"train_info/time_between_train_steps": 0.0035774707794189453, "step": 2038} {"info/global_step": 2039, "train_info/time_within_train_step": 2.685541868209839, "step": 2039} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 2039} {"info/global_step": 2040, "train_info/time_within_train_step": 2.6975765228271484, "step": 2040} {"train_info/time_between_train_steps": 0.0036437511444091797, "step": 2040} {"info/global_step": 2041, "train_info/time_within_train_step": 2.696431875228882, "step": 2041} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 2041} {"info/global_step": 2042, "train_info/time_within_train_step": 2.6921823024749756, "step": 2042} {"train_info/time_between_train_steps": 0.003595113754272461, "step": 2042} {"info/global_step": 2043, "train_info/time_within_train_step": 2.6977531909942627, "step": 2043} {"train_info/time_between_train_steps": 0.003472566604614258, "step": 2043} {"info/global_step": 2044, "train_info/time_within_train_step": 2.6998448371887207, "step": 2044} {"train_info/time_between_train_steps": 0.0034186840057373047, "step": 2044} {"info/global_step": 2045, "train_info/time_within_train_step": 2.701693058013916, "step": 2045} {"train_info/time_between_train_steps": 0.003387928009033203, "step": 2045} {"info/global_step": 2046, "train_info/time_within_train_step": 2.7018041610717773, "step": 2046} {"train_info/time_between_train_steps": 0.0036325454711914062, "step": 2046} {"info/global_step": 2047, "train_info/time_within_train_step": 2.707521915435791, "step": 2047} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 2047} {"info/global_step": 2048, "train_info/time_within_train_step": 2.736515998840332, "step": 2048} {"train_info/time_between_train_steps": 0.0034945011138916016, "step": 2048} {"info/global_step": 2049, "train_info/time_within_train_step": 2.685239315032959, "step": 2049} {"train_info/time_between_train_steps": 0.003442525863647461, "step": 2049} {"info/global_step": 2050, "train_info/time_within_train_step": 2.683926582336426, "step": 2050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317775, "_runtime": 5931}, "step": 2050} {"logs": {"train/loss": 4.2365, "train/learning_rate": 0.0002111111111111111, "train/epoch": 2.11, "_timestamp": 1746317775, "_runtime": 5931}, "step": 2050} {"train_info/time_between_train_steps": 0.024306774139404297, "step": 2050} {"info/global_step": 2051, "train_info/time_within_train_step": 2.6841232776641846, "step": 2051} {"train_info/time_between_train_steps": 0.0033888816833496094, "step": 2051} {"info/global_step": 2052, "train_info/time_within_train_step": 2.68422532081604, "step": 2052} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 2052} {"info/global_step": 2053, "train_info/time_within_train_step": 2.6838839054107666, "step": 2053} {"train_info/time_between_train_steps": 0.0035037994384765625, "step": 2053} {"info/global_step": 2054, "train_info/time_within_train_step": 2.6841113567352295, "step": 2054} {"train_info/time_between_train_steps": 0.0034935474395751953, "step": 2054} {"info/global_step": 2055, "train_info/time_within_train_step": 2.6848931312561035, "step": 2055} {"train_info/time_between_train_steps": 0.003587484359741211, "step": 2055} {"info/global_step": 2056, "train_info/time_within_train_step": 2.684143543243408, "step": 2056} {"train_info/time_between_train_steps": 0.003521442413330078, "step": 2056} {"info/global_step": 2057, "train_info/time_within_train_step": 2.6849796772003174, "step": 2057} {"train_info/time_between_train_steps": 0.003516674041748047, "step": 2057} {"info/global_step": 2058, "train_info/time_within_train_step": 2.685389757156372, "step": 2058} {"train_info/time_between_train_steps": 0.0036835670471191406, "step": 2058} {"info/global_step": 2059, "train_info/time_within_train_step": 2.6844375133514404, "step": 2059} {"train_info/time_between_train_steps": 0.0036284923553466797, "step": 2059} {"info/global_step": 2060, "train_info/time_within_train_step": 2.6845779418945312, "step": 2060} {"train_info/time_between_train_steps": 0.0035047531127929688, "step": 2060} {"info/global_step": 2061, "train_info/time_within_train_step": 2.6846704483032227, "step": 2061} {"train_info/time_between_train_steps": 0.0034151077270507812, "step": 2061} {"info/global_step": 2062, "train_info/time_within_train_step": 2.68462872505188, "step": 2062} {"train_info/time_between_train_steps": 0.003500223159790039, "step": 2062} {"info/global_step": 2063, "train_info/time_within_train_step": 2.6858973503112793, "step": 2063} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 2063} {"info/global_step": 2064, "train_info/time_within_train_step": 2.6841304302215576, "step": 2064} {"train_info/time_between_train_steps": 0.003573179244995117, "step": 2064} {"info/global_step": 2065, "train_info/time_within_train_step": 2.6845459938049316, "step": 2065} {"train_info/time_between_train_steps": 0.003402233123779297, "step": 2065} {"info/global_step": 2066, "train_info/time_within_train_step": 2.6840782165527344, "step": 2066} {"train_info/time_between_train_steps": 0.0036530494689941406, "step": 2066} {"info/global_step": 2067, "train_info/time_within_train_step": 2.6838955879211426, "step": 2067} {"train_info/time_between_train_steps": 0.0036690235137939453, "step": 2067} {"info/global_step": 2068, "train_info/time_within_train_step": 2.683945894241333, "step": 2068} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 2068} {"info/global_step": 2069, "train_info/time_within_train_step": 2.6840288639068604, "step": 2069} {"train_info/time_between_train_steps": 0.003628253936767578, "step": 2069} {"info/global_step": 2070, "train_info/time_within_train_step": 2.684523344039917, "step": 2070} {"train_info/time_between_train_steps": 0.003778219223022461, "step": 2070} {"info/global_step": 2071, "train_info/time_within_train_step": 2.68459415435791, "step": 2071} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 2071} {"info/global_step": 2072, "train_info/time_within_train_step": 2.684232711791992, "step": 2072} {"train_info/time_between_train_steps": 0.003607034683227539, "step": 2072} {"info/global_step": 2073, "train_info/time_within_train_step": 2.684595823287964, "step": 2073} {"train_info/time_between_train_steps": 0.0036225318908691406, "step": 2073} {"info/global_step": 2074, "train_info/time_within_train_step": 2.684258460998535, "step": 2074} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 2074} {"info/global_step": 2075, "train_info/time_within_train_step": 2.684598922729492, "step": 2075} {"train_info/time_between_train_steps": 0.00347900390625, "step": 2075} {"info/global_step": 2076, "train_info/time_within_train_step": 2.6835780143737793, "step": 2076} {"train_info/time_between_train_steps": 0.003593921661376953, "step": 2076} {"info/global_step": 2077, "train_info/time_within_train_step": 2.683201313018799, "step": 2077} {"train_info/time_between_train_steps": 0.0034945011138916016, "step": 2077} {"info/global_step": 2078, "train_info/time_within_train_step": 2.68463397026062, "step": 2078} {"train_info/time_between_train_steps": 0.0035123825073242188, "step": 2078} {"info/global_step": 2079, "train_info/time_within_train_step": 2.6858129501342773, "step": 2079} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 2079} {"info/global_step": 2080, "train_info/time_within_train_step": 2.684525728225708, "step": 2080} {"train_info/time_between_train_steps": 0.003435850143432617, "step": 2080} {"info/global_step": 2081, "train_info/time_within_train_step": 2.6852288246154785, "step": 2081} {"train_info/time_between_train_steps": 0.13659214973449707, "step": 2081} {"info/global_step": 2082, "train_info/time_within_train_step": 2.683340072631836, "step": 2082} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 2082} {"info/global_step": 2083, "train_info/time_within_train_step": 2.6844136714935303, "step": 2083} {"train_info/time_between_train_steps": 0.003530263900756836, "step": 2083} {"info/global_step": 2084, "train_info/time_within_train_step": 2.7074906826019287, "step": 2084} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 2084} {"info/global_step": 2085, "train_info/time_within_train_step": 2.6838126182556152, "step": 2085} {"train_info/time_between_train_steps": 0.0034427642822265625, "step": 2085} {"info/global_step": 2086, "train_info/time_within_train_step": 2.684197425842285, "step": 2086} {"train_info/time_between_train_steps": 0.0034847259521484375, "step": 2086} {"info/global_step": 2087, "train_info/time_within_train_step": 2.684274196624756, "step": 2087} {"train_info/time_between_train_steps": 0.0034079551696777344, "step": 2087} {"info/global_step": 2088, "train_info/time_within_train_step": 2.683767795562744, "step": 2088} {"train_info/time_between_train_steps": 0.0035288333892822266, "step": 2088} {"info/global_step": 2089, "train_info/time_within_train_step": 2.6844513416290283, "step": 2089} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 2089} {"info/global_step": 2090, "train_info/time_within_train_step": 2.692868709564209, "step": 2090} {"train_info/time_between_train_steps": 0.0036034584045410156, "step": 2090} {"info/global_step": 2091, "train_info/time_within_train_step": 2.6842451095581055, "step": 2091} {"train_info/time_between_train_steps": 0.003526449203491211, "step": 2091} {"info/global_step": 2092, "train_info/time_within_train_step": 2.6842308044433594, "step": 2092} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 2092} {"info/global_step": 2093, "train_info/time_within_train_step": 2.683316946029663, "step": 2093} {"train_info/time_between_train_steps": 0.0035393238067626953, "step": 2093} {"info/global_step": 2094, "train_info/time_within_train_step": 2.6842384338378906, "step": 2094} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 2094} {"info/global_step": 2095, "train_info/time_within_train_step": 2.6847386360168457, "step": 2095} {"train_info/time_between_train_steps": 0.0032868385314941406, "step": 2095} {"info/global_step": 2096, "train_info/time_within_train_step": 2.6843442916870117, "step": 2096} {"train_info/time_between_train_steps": 0.0033631324768066406, "step": 2096} {"info/global_step": 2097, "train_info/time_within_train_step": 2.685162305831909, "step": 2097} {"train_info/time_between_train_steps": 0.003553152084350586, "step": 2097} {"info/global_step": 2098, "train_info/time_within_train_step": 2.684403657913208, "step": 2098} {"train_info/time_between_train_steps": 0.0034122467041015625, "step": 2098} {"info/global_step": 2099, "train_info/time_within_train_step": 2.684471607208252, "step": 2099} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 2099} {"info/global_step": 2100, "train_info/time_within_train_step": 2.6825075149536133, "step": 2100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746317910, "_runtime": 6066}, "step": 2100} {"logs": {"train/loss": 4.2228, "train/learning_rate": 0.00019999999999999998, "train/epoch": 2.13, "_timestamp": 1746317910, "_runtime": 6066}, "step": 2100} {"train_info/time_between_train_steps": 21.865195989608765, "step": 2100} {"info/global_step": 2101, "train_info/time_within_train_step": 2.4849705696105957, "step": 2101} {"train_info/time_between_train_steps": 0.0033216476440429688, "step": 2101} {"info/global_step": 2102, "train_info/time_within_train_step": 2.477308988571167, "step": 2102} {"train_info/time_between_train_steps": 0.003393411636352539, "step": 2102} {"info/global_step": 2103, "train_info/time_within_train_step": 2.667750120162964, "step": 2103} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 2103} {"info/global_step": 2104, "train_info/time_within_train_step": 2.6814842224121094, "step": 2104} {"train_info/time_between_train_steps": 0.0034961700439453125, "step": 2104} {"info/global_step": 2105, "train_info/time_within_train_step": 2.9809534549713135, "step": 2105} {"train_info/time_between_train_steps": 0.0035026073455810547, "step": 2105} {"info/global_step": 2106, "train_info/time_within_train_step": 2.681382656097412, "step": 2106} {"train_info/time_between_train_steps": 0.003499269485473633, "step": 2106} {"info/global_step": 2107, "train_info/time_within_train_step": 2.682119369506836, "step": 2107} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 2107} {"info/global_step": 2108, "train_info/time_within_train_step": 2.6839144229888916, "step": 2108} {"train_info/time_between_train_steps": 0.0032820701599121094, "step": 2108} {"info/global_step": 2109, "train_info/time_within_train_step": 2.68345046043396, "step": 2109} {"train_info/time_between_train_steps": 0.0034422874450683594, "step": 2109} {"info/global_step": 2110, "train_info/time_within_train_step": 2.6827282905578613, "step": 2110} {"train_info/time_between_train_steps": 0.003912687301635742, "step": 2110} {"info/global_step": 2111, "train_info/time_within_train_step": 2.6837503910064697, "step": 2111} {"train_info/time_between_train_steps": 0.0033457279205322266, "step": 2111} {"info/global_step": 2112, "train_info/time_within_train_step": 2.683866500854492, "step": 2112} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 2112} {"info/global_step": 2113, "train_info/time_within_train_step": 2.6840226650238037, "step": 2113} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 2113} {"info/global_step": 2114, "train_info/time_within_train_step": 2.686079978942871, "step": 2114} {"train_info/time_between_train_steps": 0.003359079360961914, "step": 2114} {"info/global_step": 2115, "train_info/time_within_train_step": 2.770988941192627, "step": 2115} {"train_info/time_between_train_steps": 0.003483295440673828, "step": 2115} {"info/global_step": 2116, "train_info/time_within_train_step": 2.7449002265930176, "step": 2116} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 2116} {"info/global_step": 2117, "train_info/time_within_train_step": 2.7167234420776367, "step": 2117} {"train_info/time_between_train_steps": 0.0032660961151123047, "step": 2117} {"info/global_step": 2118, "train_info/time_within_train_step": 2.718550443649292, "step": 2118} {"train_info/time_between_train_steps": 0.0034492015838623047, "step": 2118} {"info/global_step": 2119, "train_info/time_within_train_step": 2.7251601219177246, "step": 2119} {"train_info/time_between_train_steps": 0.003419160842895508, "step": 2119} {"info/global_step": 2120, "train_info/time_within_train_step": 2.7350494861602783, "step": 2120} {"train_info/time_between_train_steps": 0.00327301025390625, "step": 2120} {"info/global_step": 2121, "train_info/time_within_train_step": 2.691168785095215, "step": 2121} {"train_info/time_between_train_steps": 0.0032668113708496094, "step": 2121} {"info/global_step": 2122, "train_info/time_within_train_step": 2.698796272277832, "step": 2122} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 2122} {"info/global_step": 2123, "train_info/time_within_train_step": 2.7192320823669434, "step": 2123} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 2123} {"info/global_step": 2124, "train_info/time_within_train_step": 2.7032241821289062, "step": 2124} {"train_info/time_between_train_steps": 0.0033402442932128906, "step": 2124} {"info/global_step": 2125, "train_info/time_within_train_step": 2.6897614002227783, "step": 2125} {"train_info/time_between_train_steps": 0.0034749507904052734, "step": 2125} {"info/global_step": 2126, "train_info/time_within_train_step": 2.707059621810913, "step": 2126} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 2126} {"info/global_step": 2127, "train_info/time_within_train_step": 2.691033363342285, "step": 2127} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 2127} {"info/global_step": 2128, "train_info/time_within_train_step": 2.7032454013824463, "step": 2128} {"train_info/time_between_train_steps": 0.003476858139038086, "step": 2128} {"info/global_step": 2129, "train_info/time_within_train_step": 2.707249879837036, "step": 2129} {"train_info/time_between_train_steps": 0.0034508705139160156, "step": 2129} {"info/global_step": 2130, "train_info/time_within_train_step": 2.713404417037964, "step": 2130} {"train_info/time_between_train_steps": 0.0034928321838378906, "step": 2130} {"info/global_step": 2131, "train_info/time_within_train_step": 2.7067220211029053, "step": 2131} {"train_info/time_between_train_steps": 0.003411531448364258, "step": 2131} {"info/global_step": 2132, "train_info/time_within_train_step": 2.7022106647491455, "step": 2132} {"train_info/time_between_train_steps": 0.003433704376220703, "step": 2132} {"info/global_step": 2133, "train_info/time_within_train_step": 2.6858487129211426, "step": 2133} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 2133} {"info/global_step": 2134, "train_info/time_within_train_step": 2.6867966651916504, "step": 2134} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 2134} {"info/global_step": 2135, "train_info/time_within_train_step": 2.723679304122925, "step": 2135} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 2135} {"info/global_step": 2136, "train_info/time_within_train_step": 2.704543352127075, "step": 2136} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 2136} {"info/global_step": 2137, "train_info/time_within_train_step": 2.685523748397827, "step": 2137} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 2137} {"info/global_step": 2138, "train_info/time_within_train_step": 2.699374198913574, "step": 2138} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 2138} {"info/global_step": 2139, "train_info/time_within_train_step": 2.7023723125457764, "step": 2139} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 2139} {"info/global_step": 2140, "train_info/time_within_train_step": 2.6836555004119873, "step": 2140} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 2140} {"info/global_step": 2141, "train_info/time_within_train_step": 2.683168888092041, "step": 2141} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 2141} {"info/global_step": 2142, "train_info/time_within_train_step": 2.7032430171966553, "step": 2142} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 2142} {"info/global_step": 2143, "train_info/time_within_train_step": 2.71366024017334, "step": 2143} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 2143} {"info/global_step": 2144, "train_info/time_within_train_step": 3.091583251953125, "step": 2144} {"train_info/time_between_train_steps": 0.003354787826538086, "step": 2144} {"info/global_step": 2145, "train_info/time_within_train_step": 2.682769775390625, "step": 2145} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 2145} {"info/global_step": 2146, "train_info/time_within_train_step": 2.6828112602233887, "step": 2146} {"train_info/time_between_train_steps": 0.0034775733947753906, "step": 2146} {"info/global_step": 2147, "train_info/time_within_train_step": 2.683878183364868, "step": 2147} {"train_info/time_between_train_steps": 0.0033736228942871094, "step": 2147} {"info/global_step": 2148, "train_info/time_within_train_step": 2.684943675994873, "step": 2148} {"train_info/time_between_train_steps": 0.0035355091094970703, "step": 2148} {"info/global_step": 2149, "train_info/time_within_train_step": 2.6840126514434814, "step": 2149} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 2149} {"info/global_step": 2150, "train_info/time_within_train_step": 2.6840460300445557, "step": 2150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746318069, "_runtime": 6225}, "step": 2150} {"logs": {"train/loss": 4.188, "train/learning_rate": 0.00018888888888888888, "train/epoch": 2.15, "_timestamp": 1746318069, "_runtime": 6225}, "step": 2150} {"train_info/time_between_train_steps": 0.024424076080322266, "step": 2150} {"info/global_step": 2151, "train_info/time_within_train_step": 2.684032917022705, "step": 2151} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 2151} {"info/global_step": 2152, "train_info/time_within_train_step": 2.684624433517456, "step": 2152} {"train_info/time_between_train_steps": 0.0034110546112060547, "step": 2152} {"info/global_step": 2153, "train_info/time_within_train_step": 2.684394598007202, "step": 2153} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 2153} {"info/global_step": 2154, "train_info/time_within_train_step": 2.6840157508850098, "step": 2154} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 2154} {"info/global_step": 2155, "train_info/time_within_train_step": 2.684948205947876, "step": 2155} {"train_info/time_between_train_steps": 0.0035228729248046875, "step": 2155} {"info/global_step": 2156, "train_info/time_within_train_step": 2.6836154460906982, "step": 2156} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 2156} {"info/global_step": 2157, "train_info/time_within_train_step": 2.6835286617279053, "step": 2157} {"train_info/time_between_train_steps": 0.003247976303100586, "step": 2157} {"info/global_step": 2158, "train_info/time_within_train_step": 2.6845788955688477, "step": 2158} {"train_info/time_between_train_steps": 0.003488779067993164, "step": 2158} {"info/global_step": 2159, "train_info/time_within_train_step": 2.683725595474243, "step": 2159} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 2159} {"info/global_step": 2160, "train_info/time_within_train_step": 2.683661937713623, "step": 2160} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 2160} {"info/global_step": 2161, "train_info/time_within_train_step": 2.6836671829223633, "step": 2161} {"train_info/time_between_train_steps": 0.00331878662109375, "step": 2161} {"info/global_step": 2162, "train_info/time_within_train_step": 2.6840226650238037, "step": 2162} {"train_info/time_between_train_steps": 0.0032553672790527344, "step": 2162} {"info/global_step": 2163, "train_info/time_within_train_step": 2.6837148666381836, "step": 2163} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 2163} {"info/global_step": 2164, "train_info/time_within_train_step": 2.68418550491333, "step": 2164} {"train_info/time_between_train_steps": 0.0034987926483154297, "step": 2164} {"info/global_step": 2165, "train_info/time_within_train_step": 2.684380054473877, "step": 2165} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 2165} {"info/global_step": 2166, "train_info/time_within_train_step": 2.6839029788970947, "step": 2166} {"train_info/time_between_train_steps": 0.003507852554321289, "step": 2166} {"info/global_step": 2167, "train_info/time_within_train_step": 2.6842336654663086, "step": 2167} {"train_info/time_between_train_steps": 0.0033347606658935547, "step": 2167} {"info/global_step": 2168, "train_info/time_within_train_step": 2.684624433517456, "step": 2168} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 2168} {"info/global_step": 2169, "train_info/time_within_train_step": 2.685060501098633, "step": 2169} {"train_info/time_between_train_steps": 0.003431558609008789, "step": 2169} {"info/global_step": 2170, "train_info/time_within_train_step": 2.684107780456543, "step": 2170} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 2170} {"info/global_step": 2171, "train_info/time_within_train_step": 2.6846392154693604, "step": 2171} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 2171} {"info/global_step": 2172, "train_info/time_within_train_step": 2.684385061264038, "step": 2172} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 2172} {"info/global_step": 2173, "train_info/time_within_train_step": 2.6845386028289795, "step": 2173} {"train_info/time_between_train_steps": 0.003338336944580078, "step": 2173} {"info/global_step": 2174, "train_info/time_within_train_step": 2.6837074756622314, "step": 2174} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 2174} {"info/global_step": 2175, "train_info/time_within_train_step": 2.683487892150879, "step": 2175} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 2175} {"info/global_step": 2176, "train_info/time_within_train_step": 2.6932168006896973, "step": 2176} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 2176} {"info/global_step": 2177, "train_info/time_within_train_step": 2.683082342147827, "step": 2177} {"train_info/time_between_train_steps": 0.003439664840698242, "step": 2177} {"info/global_step": 2178, "train_info/time_within_train_step": 2.6838791370391846, "step": 2178} {"train_info/time_between_train_steps": 0.0032553672790527344, "step": 2178} {"info/global_step": 2179, "train_info/time_within_train_step": 2.683361053466797, "step": 2179} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 2179} {"info/global_step": 2180, "train_info/time_within_train_step": 2.6831836700439453, "step": 2180} {"train_info/time_between_train_steps": 0.003357410430908203, "step": 2180} {"info/global_step": 2181, "train_info/time_within_train_step": 2.6833770275115967, "step": 2181} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 2181} {"info/global_step": 2182, "train_info/time_within_train_step": 2.6842522621154785, "step": 2182} {"train_info/time_between_train_steps": 0.0033712387084960938, "step": 2182} {"info/global_step": 2183, "train_info/time_within_train_step": 2.6832387447357178, "step": 2183} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 2183} {"info/global_step": 2184, "train_info/time_within_train_step": 2.6827244758605957, "step": 2184} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 2184} {"info/global_step": 2185, "train_info/time_within_train_step": 2.682473659515381, "step": 2185} {"train_info/time_between_train_steps": 0.0033440589904785156, "step": 2185} {"info/global_step": 2186, "train_info/time_within_train_step": 2.6830270290374756, "step": 2186} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 2186} {"info/global_step": 2187, "train_info/time_within_train_step": 2.68341326713562, "step": 2187} {"train_info/time_between_train_steps": 0.0032854080200195312, "step": 2187} {"info/global_step": 2188, "train_info/time_within_train_step": 2.684459924697876, "step": 2188} {"train_info/time_between_train_steps": 0.003397226333618164, "step": 2188} {"info/global_step": 2189, "train_info/time_within_train_step": 2.683905839920044, "step": 2189} {"train_info/time_between_train_steps": 0.0034422874450683594, "step": 2189} {"info/global_step": 2190, "train_info/time_within_train_step": 2.6835780143737793, "step": 2190} {"train_info/time_between_train_steps": 0.0033521652221679688, "step": 2190} {"info/global_step": 2191, "train_info/time_within_train_step": 2.684087038040161, "step": 2191} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 2191} {"info/global_step": 2192, "train_info/time_within_train_step": 2.684464454650879, "step": 2192} {"train_info/time_between_train_steps": 0.003439664840698242, "step": 2192} {"info/global_step": 2193, "train_info/time_within_train_step": 2.693986415863037, "step": 2193} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 2193} {"info/global_step": 2194, "train_info/time_within_train_step": 2.6880478858947754, "step": 2194} {"train_info/time_between_train_steps": 0.003458738327026367, "step": 2194} {"info/global_step": 2195, "train_info/time_within_train_step": 2.7346551418304443, "step": 2195} {"train_info/time_between_train_steps": 0.0032806396484375, "step": 2195} {"info/global_step": 2196, "train_info/time_within_train_step": 2.6824791431427, "step": 2196} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 2196} {"info/global_step": 2197, "train_info/time_within_train_step": 2.683566093444824, "step": 2197} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 2197} {"info/global_step": 2198, "train_info/time_within_train_step": 2.683044910430908, "step": 2198} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 2198} {"info/global_step": 2199, "train_info/time_within_train_step": 2.6824934482574463, "step": 2199} {"train_info/time_between_train_steps": 0.0035059452056884766, "step": 2199} {"info/global_step": 2200, "train_info/time_within_train_step": 2.6822965145111084, "step": 2200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746318204, "_runtime": 6360}, "step": 2200} {"logs": {"train/loss": 4.1803, "train/learning_rate": 0.00017777777777777776, "train/epoch": 2.16, "_timestamp": 1746318204, "_runtime": 6360}, "step": 2200} {"train_info/time_between_train_steps": 15.658699989318848, "step": 2200} {"info/global_step": 2201, "train_info/time_within_train_step": 2.4758172035217285, "step": 2201} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 2201} {"info/global_step": 2202, "train_info/time_within_train_step": 2.5124971866607666, "step": 2202} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 2202} {"info/global_step": 2203, "train_info/time_within_train_step": 2.680103063583374, "step": 2203} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 2203} {"info/global_step": 2204, "train_info/time_within_train_step": 2.6807377338409424, "step": 2204} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 2204} {"info/global_step": 2205, "train_info/time_within_train_step": 2.681417465209961, "step": 2205} {"train_info/time_between_train_steps": 0.0034966468811035156, "step": 2205} {"info/global_step": 2206, "train_info/time_within_train_step": 2.682093620300293, "step": 2206} {"train_info/time_between_train_steps": 0.09971499443054199, "step": 2206} {"info/global_step": 2207, "train_info/time_within_train_step": 2.694445848464966, "step": 2207} {"train_info/time_between_train_steps": 0.003300905227661133, "step": 2207} {"info/global_step": 2208, "train_info/time_within_train_step": 2.6829748153686523, "step": 2208} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 2208} {"info/global_step": 2209, "train_info/time_within_train_step": 2.6829209327697754, "step": 2209} {"train_info/time_between_train_steps": 0.0032973289489746094, "step": 2209} {"info/global_step": 2210, "train_info/time_within_train_step": 2.68467116355896, "step": 2210} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 2210} {"info/global_step": 2211, "train_info/time_within_train_step": 2.683023691177368, "step": 2211} {"train_info/time_between_train_steps": 0.003270864486694336, "step": 2211} {"info/global_step": 2212, "train_info/time_within_train_step": 2.684209108352661, "step": 2212} {"train_info/time_between_train_steps": 0.0033240318298339844, "step": 2212} {"info/global_step": 2213, "train_info/time_within_train_step": 2.6830644607543945, "step": 2213} {"train_info/time_between_train_steps": 0.0034804344177246094, "step": 2213} {"info/global_step": 2214, "train_info/time_within_train_step": 2.6993677616119385, "step": 2214} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 2214} {"info/global_step": 2215, "train_info/time_within_train_step": 2.7775826454162598, "step": 2215} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 2215} {"info/global_step": 2216, "train_info/time_within_train_step": 2.745448112487793, "step": 2216} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 2216} {"info/global_step": 2217, "train_info/time_within_train_step": 2.715315818786621, "step": 2217} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 2217} {"info/global_step": 2218, "train_info/time_within_train_step": 2.721893310546875, "step": 2218} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 2218} {"info/global_step": 2219, "train_info/time_within_train_step": 2.9595932960510254, "step": 2219} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 2219} {"info/global_step": 2220, "train_info/time_within_train_step": 2.684291124343872, "step": 2220} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 2220} {"info/global_step": 2221, "train_info/time_within_train_step": 2.683880567550659, "step": 2221} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 2221} {"info/global_step": 2222, "train_info/time_within_train_step": 2.6858022212982178, "step": 2222} {"train_info/time_between_train_steps": 0.0033431053161621094, "step": 2222} {"info/global_step": 2223, "train_info/time_within_train_step": 2.6861493587493896, "step": 2223} {"train_info/time_between_train_steps": 0.00339508056640625, "step": 2223} {"info/global_step": 2224, "train_info/time_within_train_step": 2.7073781490325928, "step": 2224} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 2224} {"info/global_step": 2225, "train_info/time_within_train_step": 2.6911795139312744, "step": 2225} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 2225} {"info/global_step": 2226, "train_info/time_within_train_step": 2.692298412322998, "step": 2226} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 2226} {"info/global_step": 2227, "train_info/time_within_train_step": 2.69008207321167, "step": 2227} {"train_info/time_between_train_steps": 0.003247976303100586, "step": 2227} {"info/global_step": 2228, "train_info/time_within_train_step": 2.694014549255371, "step": 2228} {"train_info/time_between_train_steps": 0.0036773681640625, "step": 2228} {"info/global_step": 2229, "train_info/time_within_train_step": 2.690828561782837, "step": 2229} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 2229} {"info/global_step": 2230, "train_info/time_within_train_step": 2.686952829360962, "step": 2230} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 2230} {"info/global_step": 2231, "train_info/time_within_train_step": 2.703278064727783, "step": 2231} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 2231} {"info/global_step": 2232, "train_info/time_within_train_step": 2.694638252258301, "step": 2232} {"train_info/time_between_train_steps": 0.0034172534942626953, "step": 2232} {"info/global_step": 2233, "train_info/time_within_train_step": 2.69819712638855, "step": 2233} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 2233} {"info/global_step": 2234, "train_info/time_within_train_step": 2.7040135860443115, "step": 2234} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 2234} {"info/global_step": 2235, "train_info/time_within_train_step": 2.7077152729034424, "step": 2235} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 2235} {"info/global_step": 2236, "train_info/time_within_train_step": 2.6920104026794434, "step": 2236} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 2236} {"info/global_step": 2237, "train_info/time_within_train_step": 2.6841630935668945, "step": 2237} {"train_info/time_between_train_steps": 0.0034019947052001953, "step": 2237} {"info/global_step": 2238, "train_info/time_within_train_step": 2.6845052242279053, "step": 2238} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 2238} {"info/global_step": 2239, "train_info/time_within_train_step": 2.685742139816284, "step": 2239} {"train_info/time_between_train_steps": 0.0034027099609375, "step": 2239} {"info/global_step": 2240, "train_info/time_within_train_step": 2.7042386531829834, "step": 2240} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 2240} {"info/global_step": 2241, "train_info/time_within_train_step": 2.6839096546173096, "step": 2241} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 2241} {"info/global_step": 2242, "train_info/time_within_train_step": 2.6847474575042725, "step": 2242} {"train_info/time_between_train_steps": 0.003464937210083008, "step": 2242} {"info/global_step": 2243, "train_info/time_within_train_step": 2.6838066577911377, "step": 2243} {"train_info/time_between_train_steps": 0.0034644603729248047, "step": 2243} {"info/global_step": 2244, "train_info/time_within_train_step": 2.687896966934204, "step": 2244} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 2244} {"info/global_step": 2245, "train_info/time_within_train_step": 2.707165241241455, "step": 2245} {"train_info/time_between_train_steps": 0.003484487533569336, "step": 2245} {"info/global_step": 2246, "train_info/time_within_train_step": 2.684603452682495, "step": 2246} {"train_info/time_between_train_steps": 0.0034656524658203125, "step": 2246} {"info/global_step": 2247, "train_info/time_within_train_step": 2.699733018875122, "step": 2247} {"train_info/time_between_train_steps": 0.021984577178955078, "step": 2247} {"info/global_step": 2248, "train_info/time_within_train_step": 2.684030771255493, "step": 2248} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 2248} {"info/global_step": 2249, "train_info/time_within_train_step": 3.265406370162964, "step": 2249} {"train_info/time_between_train_steps": 0.0030264854431152344, "step": 2249} {"info/global_step": 2250, "train_info/time_within_train_step": 2.681361436843872, "step": 2250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746318356, "_runtime": 6512}, "step": 2250} {"logs": {"train/loss": 4.1717, "train/learning_rate": 0.00016666666666666666, "train/epoch": 2.18, "_timestamp": 1746318356, "_runtime": 6512}, "step": 2250} {"train_info/time_between_train_steps": 0.024479150772094727, "step": 2250} {"info/global_step": 2251, "train_info/time_within_train_step": 2.6826062202453613, "step": 2251} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 2251} {"info/global_step": 2252, "train_info/time_within_train_step": 2.6821677684783936, "step": 2252} {"train_info/time_between_train_steps": 0.0029528141021728516, "step": 2252} {"info/global_step": 2253, "train_info/time_within_train_step": 2.682016372680664, "step": 2253} {"train_info/time_between_train_steps": 0.0029687881469726562, "step": 2253} {"info/global_step": 2254, "train_info/time_within_train_step": 2.6819815635681152, "step": 2254} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 2254} {"info/global_step": 2255, "train_info/time_within_train_step": 2.6822988986968994, "step": 2255} {"train_info/time_between_train_steps": 0.002960205078125, "step": 2255} {"info/global_step": 2256, "train_info/time_within_train_step": 2.6824543476104736, "step": 2256} {"train_info/time_between_train_steps": 0.003026723861694336, "step": 2256} {"info/global_step": 2257, "train_info/time_within_train_step": 2.681962013244629, "step": 2257} {"train_info/time_between_train_steps": 0.0029897689819335938, "step": 2257} {"info/global_step": 2258, "train_info/time_within_train_step": 2.683356523513794, "step": 2258} {"train_info/time_between_train_steps": 0.0030171871185302734, "step": 2258} {"info/global_step": 2259, "train_info/time_within_train_step": 2.683483600616455, "step": 2259} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 2259} {"info/global_step": 2260, "train_info/time_within_train_step": 2.682710647583008, "step": 2260} {"train_info/time_between_train_steps": 0.0029828548431396484, "step": 2260} {"info/global_step": 2261, "train_info/time_within_train_step": 2.682568311691284, "step": 2261} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 2261} {"info/global_step": 2262, "train_info/time_within_train_step": 2.6830501556396484, "step": 2262} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 2262} {"info/global_step": 2263, "train_info/time_within_train_step": 2.6838347911834717, "step": 2263} {"train_info/time_between_train_steps": 0.003000974655151367, "step": 2263} {"info/global_step": 2264, "train_info/time_within_train_step": 2.68426251411438, "step": 2264} {"train_info/time_between_train_steps": 0.0030274391174316406, "step": 2264} {"info/global_step": 2265, "train_info/time_within_train_step": 2.683271884918213, "step": 2265} {"train_info/time_between_train_steps": 0.002963542938232422, "step": 2265} {"info/global_step": 2266, "train_info/time_within_train_step": 2.6837141513824463, "step": 2266} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 2266} {"info/global_step": 2267, "train_info/time_within_train_step": 2.6824886798858643, "step": 2267} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 2267} {"info/global_step": 2268, "train_info/time_within_train_step": 2.683215856552124, "step": 2268} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 2268} {"info/global_step": 2269, "train_info/time_within_train_step": 2.6840460300445557, "step": 2269} {"train_info/time_between_train_steps": 0.002979755401611328, "step": 2269} {"info/global_step": 2270, "train_info/time_within_train_step": 2.6828420162200928, "step": 2270} {"train_info/time_between_train_steps": 0.002992391586303711, "step": 2270} {"info/global_step": 2271, "train_info/time_within_train_step": 2.6827585697174072, "step": 2271} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 2271} {"info/global_step": 2272, "train_info/time_within_train_step": 2.681917905807495, "step": 2272} {"train_info/time_between_train_steps": 0.002999544143676758, "step": 2272} {"info/global_step": 2273, "train_info/time_within_train_step": 2.6827404499053955, "step": 2273} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 2273} {"info/global_step": 2274, "train_info/time_within_train_step": 2.682419776916504, "step": 2274} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 2274} {"info/global_step": 2275, "train_info/time_within_train_step": 2.6828622817993164, "step": 2275} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 2275} {"info/global_step": 2276, "train_info/time_within_train_step": 2.919079542160034, "step": 2276} {"train_info/time_between_train_steps": 0.0030019283294677734, "step": 2276} {"info/global_step": 2277, "train_info/time_within_train_step": 2.6815195083618164, "step": 2277} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 2277} {"info/global_step": 2278, "train_info/time_within_train_step": 2.6820318698883057, "step": 2278} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 2278} {"info/global_step": 2279, "train_info/time_within_train_step": 2.6836531162261963, "step": 2279} {"train_info/time_between_train_steps": 0.0029897689819335938, "step": 2279} {"info/global_step": 2280, "train_info/time_within_train_step": 2.6843342781066895, "step": 2280} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 2280} {"info/global_step": 2281, "train_info/time_within_train_step": 2.6925466060638428, "step": 2281} {"train_info/time_between_train_steps": 0.0030264854431152344, "step": 2281} {"info/global_step": 2282, "train_info/time_within_train_step": 2.683121919631958, "step": 2282} {"train_info/time_between_train_steps": 0.0029616355895996094, "step": 2282} {"info/global_step": 2283, "train_info/time_within_train_step": 2.682664632797241, "step": 2283} {"train_info/time_between_train_steps": 0.002987384796142578, "step": 2283} {"info/global_step": 2284, "train_info/time_within_train_step": 2.682114362716675, "step": 2284} {"train_info/time_between_train_steps": 0.0029790401458740234, "step": 2284} {"info/global_step": 2285, "train_info/time_within_train_step": 2.681162118911743, "step": 2285} {"train_info/time_between_train_steps": 0.002976655960083008, "step": 2285} {"info/global_step": 2286, "train_info/time_within_train_step": 2.6827142238616943, "step": 2286} {"train_info/time_between_train_steps": 0.003015756607055664, "step": 2286} {"info/global_step": 2287, "train_info/time_within_train_step": 2.683014392852783, "step": 2287} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 2287} {"info/global_step": 2288, "train_info/time_within_train_step": 2.682206392288208, "step": 2288} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 2288} {"info/global_step": 2289, "train_info/time_within_train_step": 2.6822454929351807, "step": 2289} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 2289} {"info/global_step": 2290, "train_info/time_within_train_step": 2.6832399368286133, "step": 2290} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 2290} {"info/global_step": 2291, "train_info/time_within_train_step": 2.683607578277588, "step": 2291} {"train_info/time_between_train_steps": 0.003036022186279297, "step": 2291} {"info/global_step": 2292, "train_info/time_within_train_step": 2.6825737953186035, "step": 2292} {"train_info/time_between_train_steps": 0.0030281543731689453, "step": 2292} {"info/global_step": 2293, "train_info/time_within_train_step": 2.681990385055542, "step": 2293} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 2293} {"info/global_step": 2294, "train_info/time_within_train_step": 2.6811883449554443, "step": 2294} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 2294} {"info/global_step": 2295, "train_info/time_within_train_step": 2.6820223331451416, "step": 2295} {"train_info/time_between_train_steps": 0.0029914379119873047, "step": 2295} {"info/global_step": 2296, "train_info/time_within_train_step": 2.681060314178467, "step": 2296} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 2296} {"info/global_step": 2297, "train_info/time_within_train_step": 2.682023048400879, "step": 2297} {"train_info/time_between_train_steps": 0.002934694290161133, "step": 2297} {"info/global_step": 2298, "train_info/time_within_train_step": 2.6816766262054443, "step": 2298} {"train_info/time_between_train_steps": 0.002939939498901367, "step": 2298} {"info/global_step": 2299, "train_info/time_within_train_step": 2.6817591190338135, "step": 2299} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 2299} {"info/global_step": 2300, "train_info/time_within_train_step": 2.681626319885254, "step": 2300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746318492, "_runtime": 6648}, "step": 2300} {"logs": {"train/loss": 4.1548, "train/learning_rate": 0.00015555555555555554, "train/epoch": 2.2, "_timestamp": 1746318492, "_runtime": 6648}, "step": 2300} {"train_info/time_between_train_steps": 13.38616943359375, "step": 2300} {"info/global_step": 2301, "train_info/time_within_train_step": 2.4765872955322266, "step": 2301} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 2301} {"info/global_step": 2302, "train_info/time_within_train_step": 2.524573802947998, "step": 2302} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 2302} {"info/global_step": 2303, "train_info/time_within_train_step": 2.6770315170288086, "step": 2303} {"train_info/time_between_train_steps": 0.0029866695404052734, "step": 2303} {"info/global_step": 2304, "train_info/time_within_train_step": 2.6778178215026855, "step": 2304} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 2304} {"info/global_step": 2305, "train_info/time_within_train_step": 2.6797449588775635, "step": 2305} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 2305} {"info/global_step": 2306, "train_info/time_within_train_step": 2.6819756031036377, "step": 2306} {"train_info/time_between_train_steps": 0.003053903579711914, "step": 2306} {"info/global_step": 2307, "train_info/time_within_train_step": 2.6834676265716553, "step": 2307} {"train_info/time_between_train_steps": 0.003032207489013672, "step": 2307} {"info/global_step": 2308, "train_info/time_within_train_step": 2.68161678314209, "step": 2308} {"train_info/time_between_train_steps": 0.003000497817993164, "step": 2308} {"info/global_step": 2309, "train_info/time_within_train_step": 2.6830055713653564, "step": 2309} {"train_info/time_between_train_steps": 0.0029931068420410156, "step": 2309} {"info/global_step": 2310, "train_info/time_within_train_step": 2.6832337379455566, "step": 2310} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 2310} {"info/global_step": 2311, "train_info/time_within_train_step": 2.7051022052764893, "step": 2311} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 2311} {"info/global_step": 2312, "train_info/time_within_train_step": 2.6823415756225586, "step": 2312} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 2312} {"info/global_step": 2313, "train_info/time_within_train_step": 2.682316780090332, "step": 2313} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 2313} {"info/global_step": 2314, "train_info/time_within_train_step": 2.7083258628845215, "step": 2314} {"train_info/time_between_train_steps": 0.003094196319580078, "step": 2314} {"info/global_step": 2315, "train_info/time_within_train_step": 2.7692341804504395, "step": 2315} {"train_info/time_between_train_steps": 0.003075838088989258, "step": 2315} {"info/global_step": 2316, "train_info/time_within_train_step": 2.7357141971588135, "step": 2316} {"train_info/time_between_train_steps": 0.003110647201538086, "step": 2316} {"info/global_step": 2317, "train_info/time_within_train_step": 2.7356667518615723, "step": 2317} {"train_info/time_between_train_steps": 0.0030891895294189453, "step": 2317} {"info/global_step": 2318, "train_info/time_within_train_step": 2.71500563621521, "step": 2318} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 2318} {"info/global_step": 2319, "train_info/time_within_train_step": 2.71429181098938, "step": 2319} {"train_info/time_between_train_steps": 0.003419637680053711, "step": 2319} {"info/global_step": 2320, "train_info/time_within_train_step": 2.7042787075042725, "step": 2320} {"train_info/time_between_train_steps": 0.0029764175415039062, "step": 2320} {"info/global_step": 2321, "train_info/time_within_train_step": 2.686131238937378, "step": 2321} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 2321} {"info/global_step": 2322, "train_info/time_within_train_step": 2.7188186645507812, "step": 2322} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 2322} {"info/global_step": 2323, "train_info/time_within_train_step": 2.722583055496216, "step": 2323} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 2323} {"info/global_step": 2324, "train_info/time_within_train_step": 2.691396713256836, "step": 2324} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 2324} {"info/global_step": 2325, "train_info/time_within_train_step": 2.7080819606781006, "step": 2325} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 2325} {"info/global_step": 2326, "train_info/time_within_train_step": 2.714895725250244, "step": 2326} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 2326} {"info/global_step": 2327, "train_info/time_within_train_step": 2.6856157779693604, "step": 2327} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 2327} {"info/global_step": 2328, "train_info/time_within_train_step": 2.6978609561920166, "step": 2328} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 2328} {"info/global_step": 2329, "train_info/time_within_train_step": 2.701460838317871, "step": 2329} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 2329} {"info/global_step": 2330, "train_info/time_within_train_step": 2.6916263103485107, "step": 2330} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 2330} {"info/global_step": 2331, "train_info/time_within_train_step": 2.699995517730713, "step": 2331} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 2331} {"info/global_step": 2332, "train_info/time_within_train_step": 2.709345817565918, "step": 2332} {"train_info/time_between_train_steps": 0.003258943557739258, "step": 2332} {"info/global_step": 2333, "train_info/time_within_train_step": 2.7326085567474365, "step": 2333} {"train_info/time_between_train_steps": 0.0030298233032226562, "step": 2333} {"info/global_step": 2334, "train_info/time_within_train_step": 2.6849188804626465, "step": 2334} {"train_info/time_between_train_steps": 0.0030548572540283203, "step": 2334} {"info/global_step": 2335, "train_info/time_within_train_step": 2.6896274089813232, "step": 2335} {"train_info/time_between_train_steps": 0.0030159950256347656, "step": 2335} {"info/global_step": 2336, "train_info/time_within_train_step": 2.703699827194214, "step": 2336} {"train_info/time_between_train_steps": 0.003030061721801758, "step": 2336} {"info/global_step": 2337, "train_info/time_within_train_step": 2.693765878677368, "step": 2337} {"train_info/time_between_train_steps": 0.0030143260955810547, "step": 2337} {"info/global_step": 2338, "train_info/time_within_train_step": 2.7066991329193115, "step": 2338} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 2338} {"info/global_step": 2339, "train_info/time_within_train_step": 2.700202703475952, "step": 2339} {"train_info/time_between_train_steps": 0.002962827682495117, "step": 2339} {"info/global_step": 2340, "train_info/time_within_train_step": 2.6832821369171143, "step": 2340} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 2340} {"info/global_step": 2341, "train_info/time_within_train_step": 2.704242467880249, "step": 2341} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 2341} {"info/global_step": 2342, "train_info/time_within_train_step": 2.686109781265259, "step": 2342} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 2342} {"info/global_step": 2343, "train_info/time_within_train_step": 2.692112922668457, "step": 2343} {"train_info/time_between_train_steps": 0.003002166748046875, "step": 2343} {"info/global_step": 2344, "train_info/time_within_train_step": 2.6841890811920166, "step": 2344} {"train_info/time_between_train_steps": 0.0030128955841064453, "step": 2344} {"info/global_step": 2345, "train_info/time_within_train_step": 2.684007167816162, "step": 2345} {"train_info/time_between_train_steps": 0.0030367374420166016, "step": 2345} {"info/global_step": 2346, "train_info/time_within_train_step": 2.6937191486358643, "step": 2346} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 2346} {"info/global_step": 2347, "train_info/time_within_train_step": 2.697927951812744, "step": 2347} {"train_info/time_between_train_steps": 0.003000020980834961, "step": 2347} {"info/global_step": 2348, "train_info/time_within_train_step": 2.6841065883636475, "step": 2348} {"train_info/time_between_train_steps": 0.0030303001403808594, "step": 2348} {"info/global_step": 2349, "train_info/time_within_train_step": 2.685999631881714, "step": 2349} {"train_info/time_between_train_steps": 0.003041982650756836, "step": 2349} {"info/global_step": 2350, "train_info/time_within_train_step": 2.696680784225464, "step": 2350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746318641, "_runtime": 6797}, "step": 2350} {"logs": {"train/loss": 4.1353, "train/learning_rate": 0.0001444444444444444, "train/epoch": 2.21, "_timestamp": 1746318641, "_runtime": 6797}, "step": 2350} {"train_info/time_between_train_steps": 0.029832124710083008, "step": 2350} {"info/global_step": 2351, "train_info/time_within_train_step": 2.684636354446411, "step": 2351} {"train_info/time_between_train_steps": 0.002986907958984375, "step": 2351} {"info/global_step": 2352, "train_info/time_within_train_step": 2.6840169429779053, "step": 2352} {"train_info/time_between_train_steps": 0.0030167102813720703, "step": 2352} {"info/global_step": 2353, "train_info/time_within_train_step": 2.6833302974700928, "step": 2353} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 2353} {"info/global_step": 2354, "train_info/time_within_train_step": 2.683243751525879, "step": 2354} {"train_info/time_between_train_steps": 0.0030074119567871094, "step": 2354} {"info/global_step": 2355, "train_info/time_within_train_step": 2.6831891536712646, "step": 2355} {"train_info/time_between_train_steps": 0.0030710697174072266, "step": 2355} {"info/global_step": 2356, "train_info/time_within_train_step": 2.6835436820983887, "step": 2356} {"train_info/time_between_train_steps": 0.0030341148376464844, "step": 2356} {"info/global_step": 2357, "train_info/time_within_train_step": 2.683253049850464, "step": 2357} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 2357} {"info/global_step": 2358, "train_info/time_within_train_step": 2.6837680339813232, "step": 2358} {"train_info/time_between_train_steps": 0.003069639205932617, "step": 2358} {"info/global_step": 2359, "train_info/time_within_train_step": 2.8739683628082275, "step": 2359} {"train_info/time_between_train_steps": 0.003078460693359375, "step": 2359} {"info/global_step": 2360, "train_info/time_within_train_step": 2.682858943939209, "step": 2360} {"train_info/time_between_train_steps": 0.003017902374267578, "step": 2360} {"info/global_step": 2361, "train_info/time_within_train_step": 2.683537721633911, "step": 2361} {"train_info/time_between_train_steps": 0.003045797348022461, "step": 2361} {"info/global_step": 2362, "train_info/time_within_train_step": 2.683506488800049, "step": 2362} {"train_info/time_between_train_steps": 0.0030965805053710938, "step": 2362} {"info/global_step": 2363, "train_info/time_within_train_step": 2.683701992034912, "step": 2363} {"train_info/time_between_train_steps": 0.003025531768798828, "step": 2363} {"info/global_step": 2364, "train_info/time_within_train_step": 2.6841938495635986, "step": 2364} {"train_info/time_between_train_steps": 0.0030553340911865234, "step": 2364} {"info/global_step": 2365, "train_info/time_within_train_step": 2.683539628982544, "step": 2365} {"train_info/time_between_train_steps": 0.003017425537109375, "step": 2365} {"info/global_step": 2366, "train_info/time_within_train_step": 2.68375301361084, "step": 2366} {"train_info/time_between_train_steps": 0.003048419952392578, "step": 2366} {"info/global_step": 2367, "train_info/time_within_train_step": 2.683980703353882, "step": 2367} {"train_info/time_between_train_steps": 0.0030241012573242188, "step": 2367} {"info/global_step": 2368, "train_info/time_within_train_step": 2.6844894886016846, "step": 2368} {"train_info/time_between_train_steps": 0.003009319305419922, "step": 2368} {"info/global_step": 2369, "train_info/time_within_train_step": 2.6847238540649414, "step": 2369} {"train_info/time_between_train_steps": 0.0030210018157958984, "step": 2369} {"info/global_step": 2370, "train_info/time_within_train_step": 2.683136463165283, "step": 2370} {"train_info/time_between_train_steps": 0.0030176639556884766, "step": 2370} {"info/global_step": 2371, "train_info/time_within_train_step": 2.68392276763916, "step": 2371} {"train_info/time_between_train_steps": 0.0030410289764404297, "step": 2371} {"info/global_step": 2372, "train_info/time_within_train_step": 2.682955741882324, "step": 2372} {"train_info/time_between_train_steps": 0.003000020980834961, "step": 2372} {"info/global_step": 2373, "train_info/time_within_train_step": 2.68329119682312, "step": 2373} {"train_info/time_between_train_steps": 0.003014087677001953, "step": 2373} {"info/global_step": 2374, "train_info/time_within_train_step": 2.6834053993225098, "step": 2374} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 2374} {"info/global_step": 2375, "train_info/time_within_train_step": 2.682732343673706, "step": 2375} {"train_info/time_between_train_steps": 0.0030112266540527344, "step": 2375} {"info/global_step": 2376, "train_info/time_within_train_step": 2.683356761932373, "step": 2376} {"train_info/time_between_train_steps": 0.0030159950256347656, "step": 2376} {"info/global_step": 2377, "train_info/time_within_train_step": 2.683727741241455, "step": 2377} {"train_info/time_between_train_steps": 0.0030517578125, "step": 2377} {"info/global_step": 2378, "train_info/time_within_train_step": 2.6826696395874023, "step": 2378} {"train_info/time_between_train_steps": 0.0030188560485839844, "step": 2378} {"info/global_step": 2379, "train_info/time_within_train_step": 2.683688163757324, "step": 2379} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 2379} {"info/global_step": 2380, "train_info/time_within_train_step": 2.6820409297943115, "step": 2380} {"train_info/time_between_train_steps": 0.002987384796142578, "step": 2380} {"info/global_step": 2381, "train_info/time_within_train_step": 2.684433937072754, "step": 2381} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 2381} {"info/global_step": 2382, "train_info/time_within_train_step": 2.6836254596710205, "step": 2382} {"train_info/time_between_train_steps": 0.003035306930541992, "step": 2382} {"info/global_step": 2383, "train_info/time_within_train_step": 2.6839535236358643, "step": 2383} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 2383} {"info/global_step": 2384, "train_info/time_within_train_step": 2.6822621822357178, "step": 2384} {"train_info/time_between_train_steps": 0.0029909610748291016, "step": 2384} {"info/global_step": 2385, "train_info/time_within_train_step": 2.681919574737549, "step": 2385} {"train_info/time_between_train_steps": 0.0030176639556884766, "step": 2385} {"info/global_step": 2386, "train_info/time_within_train_step": 2.6826348304748535, "step": 2386} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 2386} {"info/global_step": 2387, "train_info/time_within_train_step": 2.681657314300537, "step": 2387} {"train_info/time_between_train_steps": 0.003027677536010742, "step": 2387} {"info/global_step": 2388, "train_info/time_within_train_step": 2.6827311515808105, "step": 2388} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 2388} {"info/global_step": 2389, "train_info/time_within_train_step": 2.68247389793396, "step": 2389} {"train_info/time_between_train_steps": 0.003006458282470703, "step": 2389} {"info/global_step": 2390, "train_info/time_within_train_step": 2.681663751602173, "step": 2390} {"train_info/time_between_train_steps": 0.003016233444213867, "step": 2390} {"info/global_step": 2391, "train_info/time_within_train_step": 2.6821329593658447, "step": 2391} {"train_info/time_between_train_steps": 0.003035306930541992, "step": 2391} {"info/global_step": 2392, "train_info/time_within_train_step": 2.6830105781555176, "step": 2392} {"train_info/time_between_train_steps": 0.003026247024536133, "step": 2392} {"info/global_step": 2393, "train_info/time_within_train_step": 2.6825318336486816, "step": 2393} {"train_info/time_between_train_steps": 0.0029768943786621094, "step": 2393} {"info/global_step": 2394, "train_info/time_within_train_step": 2.683208465576172, "step": 2394} {"train_info/time_between_train_steps": 0.0030384063720703125, "step": 2394} {"info/global_step": 2395, "train_info/time_within_train_step": 2.6825175285339355, "step": 2395} {"train_info/time_between_train_steps": 0.002992391586303711, "step": 2395} {"info/global_step": 2396, "train_info/time_within_train_step": 2.682811975479126, "step": 2396} {"train_info/time_between_train_steps": 0.0030066967010498047, "step": 2396} {"info/global_step": 2397, "train_info/time_within_train_step": 2.6834826469421387, "step": 2397} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 2397} {"info/global_step": 2398, "train_info/time_within_train_step": 2.6835644245147705, "step": 2398} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 2398} {"info/global_step": 2399, "train_info/time_within_train_step": 2.684903860092163, "step": 2399} {"train_info/time_between_train_steps": 0.003032207489013672, "step": 2399} {"info/global_step": 2400, "train_info/time_within_train_step": 2.6845030784606934, "step": 2400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746318777, "_runtime": 6933}, "step": 2400} {"logs": {"train/loss": 4.1184, "train/learning_rate": 0.0001333333333333333, "train/epoch": 2.23, "_timestamp": 1746318777, "_runtime": 6933}, "step": 2400} {"train_info/time_between_train_steps": 12.874290943145752, "step": 2400} {"info/global_step": 2401, "train_info/time_within_train_step": 2.4827661514282227, "step": 2401} {"train_info/time_between_train_steps": 0.003098726272583008, "step": 2401} {"info/global_step": 2402, "train_info/time_within_train_step": 2.537382125854492, "step": 2402} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 2402} {"info/global_step": 2403, "train_info/time_within_train_step": 2.6807048320770264, "step": 2403} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 2403} {"info/global_step": 2404, "train_info/time_within_train_step": 2.679960012435913, "step": 2404} {"train_info/time_between_train_steps": 0.003026723861694336, "step": 2404} {"info/global_step": 2405, "train_info/time_within_train_step": 2.6828999519348145, "step": 2405} {"train_info/time_between_train_steps": 0.0029914379119873047, "step": 2405} {"info/global_step": 2406, "train_info/time_within_train_step": 2.6831188201904297, "step": 2406} {"train_info/time_between_train_steps": 0.003023862838745117, "step": 2406} {"info/global_step": 2407, "train_info/time_within_train_step": 2.6839096546173096, "step": 2407} {"train_info/time_between_train_steps": 0.0030584335327148438, "step": 2407} {"info/global_step": 2408, "train_info/time_within_train_step": 2.684086799621582, "step": 2408} {"train_info/time_between_train_steps": 0.0030753612518310547, "step": 2408} {"info/global_step": 2409, "train_info/time_within_train_step": 2.682818651199341, "step": 2409} {"train_info/time_between_train_steps": 0.0030405521392822266, "step": 2409} {"info/global_step": 2410, "train_info/time_within_train_step": 2.682720184326172, "step": 2410} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 2410} {"info/global_step": 2411, "train_info/time_within_train_step": 2.683176040649414, "step": 2411} {"train_info/time_between_train_steps": 0.0030984878540039062, "step": 2411} {"info/global_step": 2412, "train_info/time_within_train_step": 2.682709217071533, "step": 2412} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 2412} {"info/global_step": 2413, "train_info/time_within_train_step": 2.683626413345337, "step": 2413} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 2413} {"info/global_step": 2414, "train_info/time_within_train_step": 2.6875407695770264, "step": 2414} {"train_info/time_between_train_steps": 0.0030896663665771484, "step": 2414} {"info/global_step": 2415, "train_info/time_within_train_step": 2.8806467056274414, "step": 2415} {"train_info/time_between_train_steps": 0.0032689571380615234, "step": 2415} {"info/global_step": 2416, "train_info/time_within_train_step": 2.7097644805908203, "step": 2416} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 2416} {"info/global_step": 2417, "train_info/time_within_train_step": 2.722540855407715, "step": 2417} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 2417} {"info/global_step": 2418, "train_info/time_within_train_step": 2.7061173915863037, "step": 2418} {"train_info/time_between_train_steps": 0.002994537353515625, "step": 2418} {"info/global_step": 2419, "train_info/time_within_train_step": 2.7349908351898193, "step": 2419} {"train_info/time_between_train_steps": 0.0030307769775390625, "step": 2419} {"info/global_step": 2420, "train_info/time_within_train_step": 2.7041256427764893, "step": 2420} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 2420} {"info/global_step": 2421, "train_info/time_within_train_step": 2.714266300201416, "step": 2421} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 2421} {"info/global_step": 2422, "train_info/time_within_train_step": 2.7101962566375732, "step": 2422} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 2422} {"info/global_step": 2423, "train_info/time_within_train_step": 2.7011847496032715, "step": 2423} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 2423} {"info/global_step": 2424, "train_info/time_within_train_step": 2.7473926544189453, "step": 2424} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 2424} {"info/global_step": 2425, "train_info/time_within_train_step": 2.68904447555542, "step": 2425} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 2425} {"info/global_step": 2426, "train_info/time_within_train_step": 2.6870529651641846, "step": 2426} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 2426} {"info/global_step": 2427, "train_info/time_within_train_step": 2.689061403274536, "step": 2427} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 2427} {"info/global_step": 2428, "train_info/time_within_train_step": 2.702578067779541, "step": 2428} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 2428} {"info/global_step": 2429, "train_info/time_within_train_step": 2.691103935241699, "step": 2429} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 2429} {"info/global_step": 2430, "train_info/time_within_train_step": 2.7008278369903564, "step": 2430} {"train_info/time_between_train_steps": 0.002991199493408203, "step": 2430} {"info/global_step": 2431, "train_info/time_within_train_step": 2.697089910507202, "step": 2431} {"train_info/time_between_train_steps": 0.002962350845336914, "step": 2431} {"info/global_step": 2432, "train_info/time_within_train_step": 2.6854608058929443, "step": 2432} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 2432} {"info/global_step": 2433, "train_info/time_within_train_step": 2.69138765335083, "step": 2433} {"train_info/time_between_train_steps": 0.003040313720703125, "step": 2433} {"info/global_step": 2434, "train_info/time_within_train_step": 2.7070260047912598, "step": 2434} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 2434} {"info/global_step": 2435, "train_info/time_within_train_step": 2.691082000732422, "step": 2435} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 2435} {"info/global_step": 2436, "train_info/time_within_train_step": 2.681830883026123, "step": 2436} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 2436} {"info/global_step": 2437, "train_info/time_within_train_step": 2.682807683944702, "step": 2437} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 2437} {"info/global_step": 2438, "train_info/time_within_train_step": 2.699077606201172, "step": 2438} {"train_info/time_between_train_steps": 0.0030486583709716797, "step": 2438} {"info/global_step": 2439, "train_info/time_within_train_step": 2.701456308364868, "step": 2439} {"train_info/time_between_train_steps": 0.0028841495513916016, "step": 2439} {"info/global_step": 2440, "train_info/time_within_train_step": 2.699364423751831, "step": 2440} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 2440} {"info/global_step": 2441, "train_info/time_within_train_step": 2.684067964553833, "step": 2441} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 2441} {"info/global_step": 2442, "train_info/time_within_train_step": 2.6827683448791504, "step": 2442} {"train_info/time_between_train_steps": 0.003057718276977539, "step": 2442} {"info/global_step": 2443, "train_info/time_within_train_step": 2.683732271194458, "step": 2443} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 2443} {"info/global_step": 2444, "train_info/time_within_train_step": 2.686436176300049, "step": 2444} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 2444} {"info/global_step": 2445, "train_info/time_within_train_step": 2.682734489440918, "step": 2445} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 2445} {"info/global_step": 2446, "train_info/time_within_train_step": 2.6878907680511475, "step": 2446} {"train_info/time_between_train_steps": 0.0030231475830078125, "step": 2446} {"info/global_step": 2447, "train_info/time_within_train_step": 2.6820387840270996, "step": 2447} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 2447} {"info/global_step": 2448, "train_info/time_within_train_step": 2.708589792251587, "step": 2448} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2448} {"info/global_step": 2449, "train_info/time_within_train_step": 2.682685613632202, "step": 2449} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 2449} {"info/global_step": 2450, "train_info/time_within_train_step": 2.683708906173706, "step": 2450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746318925, "_runtime": 7081}, "step": 2450} {"logs": {"train/loss": 4.1014, "train/learning_rate": 0.00012222222222222221, "train/epoch": 2.25, "_timestamp": 1746318925, "_runtime": 7081}, "step": 2450} {"train_info/time_between_train_steps": 0.024895429611206055, "step": 2450} {"info/global_step": 2451, "train_info/time_within_train_step": 2.6928536891937256, "step": 2451} {"train_info/time_between_train_steps": 0.0037682056427001953, "step": 2451} {"info/global_step": 2452, "train_info/time_within_train_step": 2.6839001178741455, "step": 2452} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 2452} {"info/global_step": 2453, "train_info/time_within_train_step": 2.6835312843322754, "step": 2453} {"train_info/time_between_train_steps": 0.003004312515258789, "step": 2453} {"info/global_step": 2454, "train_info/time_within_train_step": 2.797898054122925, "step": 2454} {"train_info/time_between_train_steps": 0.003045797348022461, "step": 2454} {"info/global_step": 2455, "train_info/time_within_train_step": 2.6830146312713623, "step": 2455} {"train_info/time_between_train_steps": 0.003023386001586914, "step": 2455} {"info/global_step": 2456, "train_info/time_within_train_step": 2.6832692623138428, "step": 2456} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 2456} {"info/global_step": 2457, "train_info/time_within_train_step": 2.6839587688446045, "step": 2457} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 2457} {"info/global_step": 2458, "train_info/time_within_train_step": 2.6827566623687744, "step": 2458} {"train_info/time_between_train_steps": 0.0031058788299560547, "step": 2458} {"info/global_step": 2459, "train_info/time_within_train_step": 2.6838715076446533, "step": 2459} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 2459} {"info/global_step": 2460, "train_info/time_within_train_step": 2.6832292079925537, "step": 2460} {"train_info/time_between_train_steps": 0.0030393600463867188, "step": 2460} {"info/global_step": 2461, "train_info/time_within_train_step": 2.6832540035247803, "step": 2461} {"train_info/time_between_train_steps": 0.003091573715209961, "step": 2461} {"info/global_step": 2462, "train_info/time_within_train_step": 2.683239459991455, "step": 2462} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 2462} {"info/global_step": 2463, "train_info/time_within_train_step": 2.682425022125244, "step": 2463} {"train_info/time_between_train_steps": 0.0030028820037841797, "step": 2463} {"info/global_step": 2464, "train_info/time_within_train_step": 2.6828293800354004, "step": 2464} {"train_info/time_between_train_steps": 0.0030236244201660156, "step": 2464} {"info/global_step": 2465, "train_info/time_within_train_step": 2.683161735534668, "step": 2465} {"train_info/time_between_train_steps": 0.0030090808868408203, "step": 2465} {"info/global_step": 2466, "train_info/time_within_train_step": 2.683483362197876, "step": 2466} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 2466} {"info/global_step": 2467, "train_info/time_within_train_step": 2.6884899139404297, "step": 2467} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 2467} {"info/global_step": 2468, "train_info/time_within_train_step": 2.683150053024292, "step": 2468} {"train_info/time_between_train_steps": 0.0030355453491210938, "step": 2468} {"info/global_step": 2469, "train_info/time_within_train_step": 2.683060646057129, "step": 2469} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 2469} {"info/global_step": 2470, "train_info/time_within_train_step": 2.683419704437256, "step": 2470} {"train_info/time_between_train_steps": 0.0030488967895507812, "step": 2470} {"info/global_step": 2471, "train_info/time_within_train_step": 2.682478666305542, "step": 2471} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 2471} {"info/global_step": 2472, "train_info/time_within_train_step": 2.682805061340332, "step": 2472} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 2472} {"info/global_step": 2473, "train_info/time_within_train_step": 2.683298110961914, "step": 2473} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 2473} {"info/global_step": 2474, "train_info/time_within_train_step": 2.6831271648406982, "step": 2474} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 2474} {"info/global_step": 2475, "train_info/time_within_train_step": 2.683204412460327, "step": 2475} {"train_info/time_between_train_steps": 0.0030307769775390625, "step": 2475} {"info/global_step": 2476, "train_info/time_within_train_step": 2.68302059173584, "step": 2476} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 2476} {"info/global_step": 2477, "train_info/time_within_train_step": 2.68385910987854, "step": 2477} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 2477} {"info/global_step": 2478, "train_info/time_within_train_step": 2.682263135910034, "step": 2478} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 2478} {"info/global_step": 2479, "train_info/time_within_train_step": 2.6827449798583984, "step": 2479} {"train_info/time_between_train_steps": 0.0030078887939453125, "step": 2479} {"info/global_step": 2480, "train_info/time_within_train_step": 2.6832785606384277, "step": 2480} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 2480} {"info/global_step": 2481, "train_info/time_within_train_step": 2.6833910942077637, "step": 2481} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 2481} {"info/global_step": 2482, "train_info/time_within_train_step": 2.6833698749542236, "step": 2482} {"train_info/time_between_train_steps": 0.0029799938201904297, "step": 2482} {"info/global_step": 2483, "train_info/time_within_train_step": 2.6835572719573975, "step": 2483} {"train_info/time_between_train_steps": 0.002966165542602539, "step": 2483} {"info/global_step": 2484, "train_info/time_within_train_step": 2.6839215755462646, "step": 2484} {"train_info/time_between_train_steps": 0.0029985904693603516, "step": 2484} {"info/global_step": 2485, "train_info/time_within_train_step": 2.6840243339538574, "step": 2485} {"train_info/time_between_train_steps": 0.002995014190673828, "step": 2485} {"info/global_step": 2486, "train_info/time_within_train_step": 2.6848926544189453, "step": 2486} {"train_info/time_between_train_steps": 0.0030357837677001953, "step": 2486} {"info/global_step": 2487, "train_info/time_within_train_step": 2.6847176551818848, "step": 2487} {"train_info/time_between_train_steps": 0.003010988235473633, "step": 2487} {"info/global_step": 2488, "train_info/time_within_train_step": 2.6840569972991943, "step": 2488} {"train_info/time_between_train_steps": 0.003022909164428711, "step": 2488} {"info/global_step": 2489, "train_info/time_within_train_step": 2.683288812637329, "step": 2489} {"train_info/time_between_train_steps": 0.0029921531677246094, "step": 2489} {"info/global_step": 2490, "train_info/time_within_train_step": 2.684290647506714, "step": 2490} {"train_info/time_between_train_steps": 0.0035429000854492188, "step": 2490} {"info/global_step": 2491, "train_info/time_within_train_step": 2.683276414871216, "step": 2491} {"train_info/time_between_train_steps": 0.002984762191772461, "step": 2491} {"info/global_step": 2492, "train_info/time_within_train_step": 2.6825292110443115, "step": 2492} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 2492} {"info/global_step": 2493, "train_info/time_within_train_step": 2.682345151901245, "step": 2493} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 2493} {"info/global_step": 2494, "train_info/time_within_train_step": 2.6833484172821045, "step": 2494} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 2494} {"info/global_step": 2495, "train_info/time_within_train_step": 2.683034658432007, "step": 2495} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 2495} {"info/global_step": 2496, "train_info/time_within_train_step": 2.6824913024902344, "step": 2496} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 2496} {"info/global_step": 2497, "train_info/time_within_train_step": 2.6830432415008545, "step": 2497} {"train_info/time_between_train_steps": 0.0031082630157470703, "step": 2497} {"info/global_step": 2498, "train_info/time_within_train_step": 2.682931423187256, "step": 2498} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 2498} {"info/global_step": 2499, "train_info/time_within_train_step": 3.243320941925049, "step": 2499} {"train_info/time_between_train_steps": 0.0030040740966796875, "step": 2499} {"info/global_step": 2500, "train_info/time_within_train_step": 2.6828675270080566, "step": 2500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746319061, "_runtime": 7217}, "step": 2500} {"logs": {"train/loss": 4.0865, "train/learning_rate": 0.00011111111111111109, "train/epoch": 2.26, "_timestamp": 1746319061, "_runtime": 7217}, "step": 2500} {"train_info/time_between_train_steps": 13.740568399429321, "step": 2500} {"info/global_step": 2501, "train_info/time_within_train_step": 2.4817492961883545, "step": 2501} {"train_info/time_between_train_steps": 0.003021717071533203, "step": 2501} {"info/global_step": 2502, "train_info/time_within_train_step": 2.514397144317627, "step": 2502} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 2502} {"info/global_step": 2503, "train_info/time_within_train_step": 2.6811046600341797, "step": 2503} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 2503} {"info/global_step": 2504, "train_info/time_within_train_step": 2.6814889907836914, "step": 2504} {"train_info/time_between_train_steps": 0.003034353256225586, "step": 2504} {"info/global_step": 2505, "train_info/time_within_train_step": 2.681118965148926, "step": 2505} {"train_info/time_between_train_steps": 0.003038644790649414, "step": 2505} {"info/global_step": 2506, "train_info/time_within_train_step": 2.681673288345337, "step": 2506} {"train_info/time_between_train_steps": 0.003031492233276367, "step": 2506} {"info/global_step": 2507, "train_info/time_within_train_step": 2.6840391159057617, "step": 2507} {"train_info/time_between_train_steps": 0.00299072265625, "step": 2507} {"info/global_step": 2508, "train_info/time_within_train_step": 2.6810784339904785, "step": 2508} {"train_info/time_between_train_steps": 0.0030798912048339844, "step": 2508} {"info/global_step": 2509, "train_info/time_within_train_step": 2.6817586421966553, "step": 2509} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 2509} {"info/global_step": 2510, "train_info/time_within_train_step": 2.683974504470825, "step": 2510} {"train_info/time_between_train_steps": 0.003000974655151367, "step": 2510} {"info/global_step": 2511, "train_info/time_within_train_step": 2.6837637424468994, "step": 2511} {"train_info/time_between_train_steps": 0.00302886962890625, "step": 2511} {"info/global_step": 2512, "train_info/time_within_train_step": 2.6841044425964355, "step": 2512} {"train_info/time_between_train_steps": 0.0031137466430664062, "step": 2512} {"info/global_step": 2513, "train_info/time_within_train_step": 2.6849193572998047, "step": 2513} {"train_info/time_between_train_steps": 0.003078460693359375, "step": 2513} {"info/global_step": 2514, "train_info/time_within_train_step": 2.736076831817627, "step": 2514} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 2514} {"info/global_step": 2515, "train_info/time_within_train_step": 2.779383420944214, "step": 2515} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 2515} {"info/global_step": 2516, "train_info/time_within_train_step": 2.7198431491851807, "step": 2516} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 2516} {"info/global_step": 2517, "train_info/time_within_train_step": 2.7286899089813232, "step": 2517} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 2517} {"info/global_step": 2518, "train_info/time_within_train_step": 2.7083616256713867, "step": 2518} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 2518} {"info/global_step": 2519, "train_info/time_within_train_step": 2.689380407333374, "step": 2519} {"train_info/time_between_train_steps": 0.0030345916748046875, "step": 2519} {"info/global_step": 2520, "train_info/time_within_train_step": 2.7109854221343994, "step": 2520} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 2520} {"info/global_step": 2521, "train_info/time_within_train_step": 2.698137044906616, "step": 2521} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 2521} {"info/global_step": 2522, "train_info/time_within_train_step": 2.6970784664154053, "step": 2522} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 2522} {"info/global_step": 2523, "train_info/time_within_train_step": 2.725684642791748, "step": 2523} {"train_info/time_between_train_steps": 0.0045626163482666016, "step": 2523} {"info/global_step": 2524, "train_info/time_within_train_step": 2.7383718490600586, "step": 2524} {"train_info/time_between_train_steps": 0.005017995834350586, "step": 2524} {"info/global_step": 2525, "train_info/time_within_train_step": 2.691345691680908, "step": 2525} {"train_info/time_between_train_steps": 0.0034036636352539062, "step": 2525} {"info/global_step": 2526, "train_info/time_within_train_step": 2.695884943008423, "step": 2526} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2526} {"info/global_step": 2527, "train_info/time_within_train_step": 2.751569986343384, "step": 2527} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 2527} {"info/global_step": 2528, "train_info/time_within_train_step": 2.684610605239868, "step": 2528} {"train_info/time_between_train_steps": 0.003063678741455078, "step": 2528} {"info/global_step": 2529, "train_info/time_within_train_step": 2.703376054763794, "step": 2529} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 2529} {"info/global_step": 2530, "train_info/time_within_train_step": 2.700975179672241, "step": 2530} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 2530} {"info/global_step": 2531, "train_info/time_within_train_step": 2.685795307159424, "step": 2531} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 2531} {"info/global_step": 2532, "train_info/time_within_train_step": 2.6982312202453613, "step": 2532} {"train_info/time_between_train_steps": 0.003106355667114258, "step": 2532} {"info/global_step": 2533, "train_info/time_within_train_step": 2.7114384174346924, "step": 2533} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 2533} {"info/global_step": 2534, "train_info/time_within_train_step": 2.681894540786743, "step": 2534} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 2534} {"info/global_step": 2535, "train_info/time_within_train_step": 2.6849446296691895, "step": 2535} {"train_info/time_between_train_steps": 0.0030488967895507812, "step": 2535} {"info/global_step": 2536, "train_info/time_within_train_step": 2.6859772205352783, "step": 2536} {"train_info/time_between_train_steps": 0.0030596256256103516, "step": 2536} {"info/global_step": 2537, "train_info/time_within_train_step": 2.6962168216705322, "step": 2537} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 2537} {"info/global_step": 2538, "train_info/time_within_train_step": 2.6837427616119385, "step": 2538} {"train_info/time_between_train_steps": 0.0031044483184814453, "step": 2538} {"info/global_step": 2539, "train_info/time_within_train_step": 2.6951615810394287, "step": 2539} {"train_info/time_between_train_steps": 0.0030515193939208984, "step": 2539} {"info/global_step": 2540, "train_info/time_within_train_step": 2.697742223739624, "step": 2540} {"train_info/time_between_train_steps": 0.002979278564453125, "step": 2540} {"info/global_step": 2541, "train_info/time_within_train_step": 2.6839492321014404, "step": 2541} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 2541} {"info/global_step": 2542, "train_info/time_within_train_step": 2.6841893196105957, "step": 2542} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 2542} {"info/global_step": 2543, "train_info/time_within_train_step": 2.683778762817383, "step": 2543} {"train_info/time_between_train_steps": 0.0033991336822509766, "step": 2543} {"info/global_step": 2544, "train_info/time_within_train_step": 2.684577703475952, "step": 2544} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 2544} {"info/global_step": 2545, "train_info/time_within_train_step": 2.69301438331604, "step": 2545} {"train_info/time_between_train_steps": 0.0033330917358398438, "step": 2545} {"info/global_step": 2546, "train_info/time_within_train_step": 2.720264196395874, "step": 2546} {"train_info/time_between_train_steps": 0.003291606903076172, "step": 2546} {"info/global_step": 2547, "train_info/time_within_train_step": 2.694504976272583, "step": 2547} {"train_info/time_between_train_steps": 0.0033757686614990234, "step": 2547} {"info/global_step": 2548, "train_info/time_within_train_step": 2.697349786758423, "step": 2548} {"train_info/time_between_train_steps": 0.003544330596923828, "step": 2548} {"info/global_step": 2549, "train_info/time_within_train_step": 2.685666561126709, "step": 2549} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 2549} {"info/global_step": 2550, "train_info/time_within_train_step": 2.6855263710021973, "step": 2550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746319211, "_runtime": 7367}, "step": 2550} {"logs": {"train/loss": 4.0704, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 2.28, "_timestamp": 1746319211, "_runtime": 7367}, "step": 2550} {"train_info/time_between_train_steps": 0.024190664291381836, "step": 2550} {"info/global_step": 2551, "train_info/time_within_train_step": 2.685075521469116, "step": 2551} {"train_info/time_between_train_steps": 0.002933502197265625, "step": 2551} {"info/global_step": 2552, "train_info/time_within_train_step": 2.7307136058807373, "step": 2552} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 2552} {"info/global_step": 2553, "train_info/time_within_train_step": 2.684004783630371, "step": 2553} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 2553} {"info/global_step": 2554, "train_info/time_within_train_step": 2.6839163303375244, "step": 2554} {"train_info/time_between_train_steps": 0.0033545494079589844, "step": 2554} {"info/global_step": 2555, "train_info/time_within_train_step": 2.6842401027679443, "step": 2555} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 2555} {"info/global_step": 2556, "train_info/time_within_train_step": 2.6842873096466064, "step": 2556} {"train_info/time_between_train_steps": 0.003425121307373047, "step": 2556} {"info/global_step": 2557, "train_info/time_within_train_step": 2.685873508453369, "step": 2557} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 2557} {"info/global_step": 2558, "train_info/time_within_train_step": 2.6850454807281494, "step": 2558} {"train_info/time_between_train_steps": 0.0035181045532226562, "step": 2558} {"info/global_step": 2559, "train_info/time_within_train_step": 2.6858832836151123, "step": 2559} {"train_info/time_between_train_steps": 0.0036487579345703125, "step": 2559} {"train_info/time_between_train_steps": 3.279370069503784, "step": 2559} {"info/global_step": 2560, "train_info/time_within_train_step": 2.6844773292541504, "step": 2560} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 2560} {"info/global_step": 2561, "train_info/time_within_train_step": 2.682734489440918, "step": 2561} {"train_info/time_between_train_steps": 0.003356456756591797, "step": 2561} {"info/global_step": 2562, "train_info/time_within_train_step": 2.6840498447418213, "step": 2562} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 2562} {"info/global_step": 2563, "train_info/time_within_train_step": 2.6845829486846924, "step": 2563} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 2563} {"info/global_step": 2564, "train_info/time_within_train_step": 2.683387041091919, "step": 2564} {"train_info/time_between_train_steps": 0.003331899642944336, "step": 2564} {"info/global_step": 2565, "train_info/time_within_train_step": 2.6823198795318604, "step": 2565} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 2565} {"info/global_step": 2566, "train_info/time_within_train_step": 2.682645320892334, "step": 2566} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 2566} {"info/global_step": 2567, "train_info/time_within_train_step": 2.682239532470703, "step": 2567} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 2567} {"info/global_step": 2568, "train_info/time_within_train_step": 2.682403326034546, "step": 2568} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 2568} {"info/global_step": 2569, "train_info/time_within_train_step": 2.682389974594116, "step": 2569} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 2569} {"info/global_step": 2570, "train_info/time_within_train_step": 2.6816115379333496, "step": 2570} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 2570} {"info/global_step": 2571, "train_info/time_within_train_step": 2.682649612426758, "step": 2571} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 2571} {"info/global_step": 2572, "train_info/time_within_train_step": 2.6822547912597656, "step": 2572} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 2572} {"info/global_step": 2573, "train_info/time_within_train_step": 2.7301557064056396, "step": 2573} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 2573} {"info/global_step": 2574, "train_info/time_within_train_step": 2.6835200786590576, "step": 2574} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 2574} {"info/global_step": 2575, "train_info/time_within_train_step": 2.68357515335083, "step": 2575} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 2575} {"info/global_step": 2576, "train_info/time_within_train_step": 2.6842918395996094, "step": 2576} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 2576} {"info/global_step": 2577, "train_info/time_within_train_step": 2.6838343143463135, "step": 2577} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 2577} {"info/global_step": 2578, "train_info/time_within_train_step": 2.9064249992370605, "step": 2578} {"train_info/time_between_train_steps": 0.0034782886505126953, "step": 2578} {"info/global_step": 2579, "train_info/time_within_train_step": 2.6843650341033936, "step": 2579} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 2579} {"info/global_step": 2580, "train_info/time_within_train_step": 2.6839499473571777, "step": 2580} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 2580} {"info/global_step": 2581, "train_info/time_within_train_step": 2.6846048831939697, "step": 2581} {"train_info/time_between_train_steps": 0.0032720565795898438, "step": 2581} {"info/global_step": 2582, "train_info/time_within_train_step": 2.6831324100494385, "step": 2582} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 2582} {"info/global_step": 2583, "train_info/time_within_train_step": 2.683953046798706, "step": 2583} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 2583} {"info/global_step": 2584, "train_info/time_within_train_step": 2.683443307876587, "step": 2584} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 2584} {"info/global_step": 2585, "train_info/time_within_train_step": 2.6837124824523926, "step": 2585} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 2585} {"info/global_step": 2586, "train_info/time_within_train_step": 2.6835737228393555, "step": 2586} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 2586} {"info/global_step": 2587, "train_info/time_within_train_step": 2.6811327934265137, "step": 2587} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 2587} {"info/global_step": 2588, "train_info/time_within_train_step": 2.683391809463501, "step": 2588} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 2588} {"info/global_step": 2589, "train_info/time_within_train_step": 2.682321786880493, "step": 2589} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 2589} {"info/global_step": 2590, "train_info/time_within_train_step": 2.6837170124053955, "step": 2590} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 2590} {"info/global_step": 2591, "train_info/time_within_train_step": 2.684227228164673, "step": 2591} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 2591} {"info/global_step": 2592, "train_info/time_within_train_step": 2.6830406188964844, "step": 2592} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 2592} {"info/global_step": 2593, "train_info/time_within_train_step": 2.6841962337493896, "step": 2593} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 2593} {"info/global_step": 2594, "train_info/time_within_train_step": 2.688784599304199, "step": 2594} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 2594} {"info/global_step": 2595, "train_info/time_within_train_step": 2.6890676021575928, "step": 2595} {"train_info/time_between_train_steps": 0.0032896995544433594, "step": 2595} {"info/global_step": 2596, "train_info/time_within_train_step": 2.6844546794891357, "step": 2596} {"train_info/time_between_train_steps": 0.0033855438232421875, "step": 2596} {"info/global_step": 2597, "train_info/time_within_train_step": 2.684023141860962, "step": 2597} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 2597} {"info/global_step": 2598, "train_info/time_within_train_step": 2.6827826499938965, "step": 2598} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 2598} {"info/global_step": 2599, "train_info/time_within_train_step": 2.6825249195098877, "step": 2599} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 2599} {"info/global_step": 2600, "train_info/time_within_train_step": 2.6827540397644043, "step": 2600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746319350, "_runtime": 7506}, "step": 2600} {"logs": {"train/loss": 4.1083, "train/learning_rate": 8.888888888888888e-05, "train/epoch": 3.01, "_timestamp": 1746319350, "_runtime": 7506}, "step": 2600} {"train_info/time_between_train_steps": 13.401677370071411, "step": 2600} {"info/global_step": 2601, "train_info/time_within_train_step": 2.472170352935791, "step": 2601} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 2601} {"info/global_step": 2602, "train_info/time_within_train_step": 2.491713762283325, "step": 2602} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 2602} {"info/global_step": 2603, "train_info/time_within_train_step": 2.6793413162231445, "step": 2603} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 2603} {"info/global_step": 2604, "train_info/time_within_train_step": 2.682011127471924, "step": 2604} {"train_info/time_between_train_steps": 0.003362417221069336, "step": 2604} {"info/global_step": 2605, "train_info/time_within_train_step": 2.6813411712646484, "step": 2605} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 2605} {"info/global_step": 2606, "train_info/time_within_train_step": 2.6829144954681396, "step": 2606} {"train_info/time_between_train_steps": 0.0033330917358398438, "step": 2606} {"info/global_step": 2607, "train_info/time_within_train_step": 2.6818456649780273, "step": 2607} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 2607} {"info/global_step": 2608, "train_info/time_within_train_step": 2.6831648349761963, "step": 2608} {"train_info/time_between_train_steps": 0.0033655166625976562, "step": 2608} {"info/global_step": 2609, "train_info/time_within_train_step": 2.683934450149536, "step": 2609} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 2609} {"info/global_step": 2610, "train_info/time_within_train_step": 2.6822261810302734, "step": 2610} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 2610} {"info/global_step": 2611, "train_info/time_within_train_step": 2.6827638149261475, "step": 2611} {"train_info/time_between_train_steps": 0.0033636093139648438, "step": 2611} {"info/global_step": 2612, "train_info/time_within_train_step": 2.6840343475341797, "step": 2612} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 2612} {"info/global_step": 2613, "train_info/time_within_train_step": 2.683056354522705, "step": 2613} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 2613} {"info/global_step": 2614, "train_info/time_within_train_step": 2.683878183364868, "step": 2614} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 2614} {"info/global_step": 2615, "train_info/time_within_train_step": 2.7032995223999023, "step": 2615} {"train_info/time_between_train_steps": 0.0033440589904785156, "step": 2615} {"info/global_step": 2616, "train_info/time_within_train_step": 2.7403252124786377, "step": 2616} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 2616} {"info/global_step": 2617, "train_info/time_within_train_step": 2.9701926708221436, "step": 2617} {"train_info/time_between_train_steps": 0.003491640090942383, "step": 2617} {"info/global_step": 2618, "train_info/time_within_train_step": 2.683864116668701, "step": 2618} {"train_info/time_between_train_steps": 0.003316640853881836, "step": 2618} {"info/global_step": 2619, "train_info/time_within_train_step": 2.6890552043914795, "step": 2619} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 2619} {"info/global_step": 2620, "train_info/time_within_train_step": 2.7235286235809326, "step": 2620} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 2620} {"info/global_step": 2621, "train_info/time_within_train_step": 2.7014849185943604, "step": 2621} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 2621} {"info/global_step": 2622, "train_info/time_within_train_step": 2.805401086807251, "step": 2622} {"train_info/time_between_train_steps": 0.003447294235229492, "step": 2622} {"info/global_step": 2623, "train_info/time_within_train_step": 2.683964252471924, "step": 2623} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 2623} {"info/global_step": 2624, "train_info/time_within_train_step": 2.6836016178131104, "step": 2624} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 2624} {"info/global_step": 2625, "train_info/time_within_train_step": 2.6843814849853516, "step": 2625} {"train_info/time_between_train_steps": 0.0032927989959716797, "step": 2625} {"info/global_step": 2626, "train_info/time_within_train_step": 2.690678358078003, "step": 2626} {"train_info/time_between_train_steps": 0.0033953189849853516, "step": 2626} {"info/global_step": 2627, "train_info/time_within_train_step": 2.6879045963287354, "step": 2627} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 2627} {"info/global_step": 2628, "train_info/time_within_train_step": 2.689545154571533, "step": 2628} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 2628} {"info/global_step": 2629, "train_info/time_within_train_step": 2.7133266925811768, "step": 2629} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 2629} {"info/global_step": 2630, "train_info/time_within_train_step": 2.710304021835327, "step": 2630} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 2630} {"info/global_step": 2631, "train_info/time_within_train_step": 2.6856110095977783, "step": 2631} {"train_info/time_between_train_steps": 0.0035643577575683594, "step": 2631} {"info/global_step": 2632, "train_info/time_within_train_step": 2.684422492980957, "step": 2632} {"train_info/time_between_train_steps": 0.003521442413330078, "step": 2632} {"info/global_step": 2633, "train_info/time_within_train_step": 2.684570074081421, "step": 2633} {"train_info/time_between_train_steps": 0.0035581588745117188, "step": 2633} {"info/global_step": 2634, "train_info/time_within_train_step": 2.68342924118042, "step": 2634} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 2634} {"info/global_step": 2635, "train_info/time_within_train_step": 2.685042142868042, "step": 2635} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 2635} {"info/global_step": 2636, "train_info/time_within_train_step": 2.6843228340148926, "step": 2636} {"train_info/time_between_train_steps": 0.0034580230712890625, "step": 2636} {"info/global_step": 2637, "train_info/time_within_train_step": 2.684687376022339, "step": 2637} {"train_info/time_between_train_steps": 0.003621339797973633, "step": 2637} {"info/global_step": 2638, "train_info/time_within_train_step": 2.69299578666687, "step": 2638} {"train_info/time_between_train_steps": 0.0036859512329101562, "step": 2638} {"info/global_step": 2639, "train_info/time_within_train_step": 2.6911089420318604, "step": 2639} {"train_info/time_between_train_steps": 0.0033864974975585938, "step": 2639} {"info/global_step": 2640, "train_info/time_within_train_step": 2.6866533756256104, "step": 2640} {"train_info/time_between_train_steps": 0.003636598587036133, "step": 2640} {"info/global_step": 2641, "train_info/time_within_train_step": 2.697129726409912, "step": 2641} {"train_info/time_between_train_steps": 0.0032749176025390625, "step": 2641} {"info/global_step": 2642, "train_info/time_within_train_step": 2.69893217086792, "step": 2642} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 2642} {"info/global_step": 2643, "train_info/time_within_train_step": 2.6837055683135986, "step": 2643} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 2643} {"info/global_step": 2644, "train_info/time_within_train_step": 2.686199188232422, "step": 2644} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 2644} {"info/global_step": 2645, "train_info/time_within_train_step": 2.7021806240081787, "step": 2645} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 2645} {"info/global_step": 2646, "train_info/time_within_train_step": 2.686154842376709, "step": 2646} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 2646} {"info/global_step": 2647, "train_info/time_within_train_step": 2.6849632263183594, "step": 2647} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 2647} {"info/global_step": 2648, "train_info/time_within_train_step": 2.685314893722534, "step": 2648} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 2648} {"info/global_step": 2649, "train_info/time_within_train_step": 2.6848433017730713, "step": 2649} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 2649} {"info/global_step": 2650, "train_info/time_within_train_step": 2.7081544399261475, "step": 2650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746319499, "_runtime": 7655}, "step": 2650} {"logs": {"train/loss": 4.0428, "train/learning_rate": 7.777777777777777e-05, "train/epoch": 3.03, "_timestamp": 1746319499, "_runtime": 7655}, "step": 2650} {"train_info/time_between_train_steps": 0.02483224868774414, "step": 2650} {"info/global_step": 2651, "train_info/time_within_train_step": 2.6849677562713623, "step": 2651} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 2651} {"info/global_step": 2652, "train_info/time_within_train_step": 2.6845176219940186, "step": 2652} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 2652} {"info/global_step": 2653, "train_info/time_within_train_step": 2.6848294734954834, "step": 2653} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 2653} {"info/global_step": 2654, "train_info/time_within_train_step": 2.6841866970062256, "step": 2654} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 2654} {"info/global_step": 2655, "train_info/time_within_train_step": 2.684192180633545, "step": 2655} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 2655} {"info/global_step": 2656, "train_info/time_within_train_step": 2.6847715377807617, "step": 2656} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 2656} {"info/global_step": 2657, "train_info/time_within_train_step": 2.6849663257598877, "step": 2657} {"train_info/time_between_train_steps": 0.0032813549041748047, "step": 2657} {"info/global_step": 2658, "train_info/time_within_train_step": 2.68426251411438, "step": 2658} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 2658} {"info/global_step": 2659, "train_info/time_within_train_step": 2.6847009658813477, "step": 2659} {"train_info/time_between_train_steps": 0.003320932388305664, "step": 2659} {"info/global_step": 2660, "train_info/time_within_train_step": 2.6854755878448486, "step": 2660} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 2660} {"info/global_step": 2661, "train_info/time_within_train_step": 2.684581995010376, "step": 2661} {"train_info/time_between_train_steps": 0.0032274723052978516, "step": 2661} {"info/global_step": 2662, "train_info/time_within_train_step": 2.6841492652893066, "step": 2662} {"train_info/time_between_train_steps": 0.0032606124877929688, "step": 2662} {"info/global_step": 2663, "train_info/time_within_train_step": 2.6844942569732666, "step": 2663} {"train_info/time_between_train_steps": 0.0032646656036376953, "step": 2663} {"info/global_step": 2664, "train_info/time_within_train_step": 2.6857266426086426, "step": 2664} {"train_info/time_between_train_steps": 0.0032799243927001953, "step": 2664} {"info/global_step": 2665, "train_info/time_within_train_step": 2.6845510005950928, "step": 2665} {"train_info/time_between_train_steps": 0.0033156871795654297, "step": 2665} {"info/global_step": 2666, "train_info/time_within_train_step": 2.6850361824035645, "step": 2666} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 2666} {"info/global_step": 2667, "train_info/time_within_train_step": 2.685166597366333, "step": 2667} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 2667} {"info/global_step": 2668, "train_info/time_within_train_step": 2.6849892139434814, "step": 2668} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 2668} {"info/global_step": 2669, "train_info/time_within_train_step": 2.68393874168396, "step": 2669} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 2669} {"info/global_step": 2670, "train_info/time_within_train_step": 2.684257745742798, "step": 2670} {"train_info/time_between_train_steps": 0.003428936004638672, "step": 2670} {"info/global_step": 2671, "train_info/time_within_train_step": 2.6857352256774902, "step": 2671} {"train_info/time_between_train_steps": 0.0033435821533203125, "step": 2671} {"info/global_step": 2672, "train_info/time_within_train_step": 2.684025287628174, "step": 2672} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 2672} {"info/global_step": 2673, "train_info/time_within_train_step": 2.6840007305145264, "step": 2673} {"train_info/time_between_train_steps": 0.0033197402954101562, "step": 2673} {"info/global_step": 2674, "train_info/time_within_train_step": 2.683825969696045, "step": 2674} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 2674} {"info/global_step": 2675, "train_info/time_within_train_step": 2.683288812637329, "step": 2675} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 2675} {"info/global_step": 2676, "train_info/time_within_train_step": 2.684023141860962, "step": 2676} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 2676} {"info/global_step": 2677, "train_info/time_within_train_step": 2.683931827545166, "step": 2677} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 2677} {"info/global_step": 2678, "train_info/time_within_train_step": 2.684394121170044, "step": 2678} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 2678} {"info/global_step": 2679, "train_info/time_within_train_step": 2.682453155517578, "step": 2679} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 2679} {"info/global_step": 2680, "train_info/time_within_train_step": 2.684177875518799, "step": 2680} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 2680} {"info/global_step": 2681, "train_info/time_within_train_step": 2.6830801963806152, "step": 2681} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 2681} {"info/global_step": 2682, "train_info/time_within_train_step": 2.684286594390869, "step": 2682} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 2682} {"info/global_step": 2683, "train_info/time_within_train_step": 2.684102773666382, "step": 2683} {"train_info/time_between_train_steps": 0.003272533416748047, "step": 2683} {"info/global_step": 2684, "train_info/time_within_train_step": 2.6839599609375, "step": 2684} {"train_info/time_between_train_steps": 0.13668441772460938, "step": 2684} {"info/global_step": 2685, "train_info/time_within_train_step": 2.689434289932251, "step": 2685} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 2685} {"info/global_step": 2686, "train_info/time_within_train_step": 2.6850197315216064, "step": 2686} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 2686} {"info/global_step": 2687, "train_info/time_within_train_step": 2.684875011444092, "step": 2687} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 2687} {"info/global_step": 2688, "train_info/time_within_train_step": 2.684027910232544, "step": 2688} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 2688} {"info/global_step": 2689, "train_info/time_within_train_step": 2.6841983795166016, "step": 2689} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 2689} {"info/global_step": 2690, "train_info/time_within_train_step": 2.6845314502716064, "step": 2690} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2690} {"info/global_step": 2691, "train_info/time_within_train_step": 2.685281991958618, "step": 2691} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 2691} {"info/global_step": 2692, "train_info/time_within_train_step": 2.6847424507141113, "step": 2692} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 2692} {"info/global_step": 2693, "train_info/time_within_train_step": 2.6849024295806885, "step": 2693} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 2693} {"info/global_step": 2694, "train_info/time_within_train_step": 2.683817148208618, "step": 2694} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 2694} {"info/global_step": 2695, "train_info/time_within_train_step": 2.684992551803589, "step": 2695} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 2695} {"info/global_step": 2696, "train_info/time_within_train_step": 2.684030532836914, "step": 2696} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 2696} {"info/global_step": 2697, "train_info/time_within_train_step": 2.6847877502441406, "step": 2697} {"train_info/time_between_train_steps": 0.003253459930419922, "step": 2697} {"info/global_step": 2698, "train_info/time_within_train_step": 2.684281587600708, "step": 2698} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 2698} {"info/global_step": 2699, "train_info/time_within_train_step": 2.6849920749664307, "step": 2699} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 2699} {"info/global_step": 2700, "train_info/time_within_train_step": 2.698761224746704, "step": 2700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746319634, "_runtime": 7790}, "step": 2700} {"logs": {"train/loss": 4.032, "train/learning_rate": 6.666666666666666e-05, "train/epoch": 3.05, "_timestamp": 1746319634, "_runtime": 7790}, "step": 2700} {"train_info/time_between_train_steps": 13.711633920669556, "step": 2700} {"info/global_step": 2701, "train_info/time_within_train_step": 2.4869883060455322, "step": 2701} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 2701} {"info/global_step": 2702, "train_info/time_within_train_step": 2.774827480316162, "step": 2702} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 2702} {"info/global_step": 2703, "train_info/time_within_train_step": 2.6826281547546387, "step": 2703} {"train_info/time_between_train_steps": 0.003400087356567383, "step": 2703} {"info/global_step": 2704, "train_info/time_within_train_step": 2.6824393272399902, "step": 2704} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 2704} {"info/global_step": 2705, "train_info/time_within_train_step": 2.6829071044921875, "step": 2705} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 2705} {"info/global_step": 2706, "train_info/time_within_train_step": 2.6823458671569824, "step": 2706} {"train_info/time_between_train_steps": 0.003378629684448242, "step": 2706} {"info/global_step": 2707, "train_info/time_within_train_step": 2.6829919815063477, "step": 2707} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 2707} {"info/global_step": 2708, "train_info/time_within_train_step": 2.682659149169922, "step": 2708} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 2708} {"info/global_step": 2709, "train_info/time_within_train_step": 2.684114933013916, "step": 2709} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 2709} {"info/global_step": 2710, "train_info/time_within_train_step": 2.684046506881714, "step": 2710} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 2710} {"info/global_step": 2711, "train_info/time_within_train_step": 2.682929039001465, "step": 2711} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 2711} {"info/global_step": 2712, "train_info/time_within_train_step": 2.682082414627075, "step": 2712} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 2712} {"info/global_step": 2713, "train_info/time_within_train_step": 2.6839938163757324, "step": 2713} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 2713} {"info/global_step": 2714, "train_info/time_within_train_step": 2.6848902702331543, "step": 2714} {"train_info/time_between_train_steps": 0.0033926963806152344, "step": 2714} {"info/global_step": 2715, "train_info/time_within_train_step": 2.7285356521606445, "step": 2715} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 2715} {"info/global_step": 2716, "train_info/time_within_train_step": 2.7241787910461426, "step": 2716} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 2716} {"info/global_step": 2717, "train_info/time_within_train_step": 2.7294986248016357, "step": 2717} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 2717} {"info/global_step": 2718, "train_info/time_within_train_step": 2.718580961227417, "step": 2718} {"train_info/time_between_train_steps": 0.0032625198364257812, "step": 2718} {"info/global_step": 2719, "train_info/time_within_train_step": 2.757000684738159, "step": 2719} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 2719} {"info/global_step": 2720, "train_info/time_within_train_step": 2.717543840408325, "step": 2720} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 2720} {"info/global_step": 2721, "train_info/time_within_train_step": 2.7001681327819824, "step": 2721} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 2721} {"info/global_step": 2722, "train_info/time_within_train_step": 2.7152369022369385, "step": 2722} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 2722} {"info/global_step": 2723, "train_info/time_within_train_step": 2.6925606727600098, "step": 2723} {"train_info/time_between_train_steps": 0.003457784652709961, "step": 2723} {"info/global_step": 2724, "train_info/time_within_train_step": 2.70225191116333, "step": 2724} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 2724} {"info/global_step": 2725, "train_info/time_within_train_step": 2.6958489418029785, "step": 2725} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 2725} {"info/global_step": 2726, "train_info/time_within_train_step": 2.703974962234497, "step": 2726} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 2726} {"info/global_step": 2727, "train_info/time_within_train_step": 2.684603214263916, "step": 2727} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 2727} {"info/global_step": 2728, "train_info/time_within_train_step": 2.6854515075683594, "step": 2728} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 2728} {"info/global_step": 2729, "train_info/time_within_train_step": 2.6857714653015137, "step": 2729} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 2729} {"info/global_step": 2730, "train_info/time_within_train_step": 2.6839568614959717, "step": 2730} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 2730} {"info/global_step": 2731, "train_info/time_within_train_step": 2.6938695907592773, "step": 2731} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 2731} {"info/global_step": 2732, "train_info/time_within_train_step": 2.7111029624938965, "step": 2732} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 2732} {"info/global_step": 2733, "train_info/time_within_train_step": 2.7028777599334717, "step": 2733} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 2733} {"info/global_step": 2734, "train_info/time_within_train_step": 2.684843063354492, "step": 2734} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 2734} {"info/global_step": 2735, "train_info/time_within_train_step": 2.685299873352051, "step": 2735} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 2735} {"info/global_step": 2736, "train_info/time_within_train_step": 2.6960840225219727, "step": 2736} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 2736} {"info/global_step": 2737, "train_info/time_within_train_step": 2.692753553390503, "step": 2737} {"train_info/time_between_train_steps": 0.003249645233154297, "step": 2737} {"info/global_step": 2738, "train_info/time_within_train_step": 2.6857471466064453, "step": 2738} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 2738} {"info/global_step": 2739, "train_info/time_within_train_step": 2.685239791870117, "step": 2739} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 2739} {"info/global_step": 2740, "train_info/time_within_train_step": 2.69624924659729, "step": 2740} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 2740} {"info/global_step": 2741, "train_info/time_within_train_step": 2.696194648742676, "step": 2741} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 2741} {"info/global_step": 2742, "train_info/time_within_train_step": 2.6945080757141113, "step": 2742} {"train_info/time_between_train_steps": 0.003283977508544922, "step": 2742} {"info/global_step": 2743, "train_info/time_within_train_step": 2.6992928981781006, "step": 2743} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2743} {"info/global_step": 2744, "train_info/time_within_train_step": 2.6861181259155273, "step": 2744} {"train_info/time_between_train_steps": 0.0032677650451660156, "step": 2744} {"info/global_step": 2745, "train_info/time_within_train_step": 2.6850855350494385, "step": 2745} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 2745} {"info/global_step": 2746, "train_info/time_within_train_step": 2.6841273307800293, "step": 2746} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 2746} {"info/global_step": 2747, "train_info/time_within_train_step": 2.811011552810669, "step": 2747} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 2747} {"info/global_step": 2748, "train_info/time_within_train_step": 2.6846611499786377, "step": 2748} {"train_info/time_between_train_steps": 0.0032634735107421875, "step": 2748} {"info/global_step": 2749, "train_info/time_within_train_step": 3.2300267219543457, "step": 2749} {"train_info/time_between_train_steps": 0.003269195556640625, "step": 2749} {"info/global_step": 2750, "train_info/time_within_train_step": 2.684565782546997, "step": 2750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746319785, "_runtime": 7941}, "step": 2750} {"logs": {"train/loss": 4.0141, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 3.06, "_timestamp": 1746319785, "_runtime": 7941}, "step": 2750} {"train_info/time_between_train_steps": 0.02523064613342285, "step": 2750} {"info/global_step": 2751, "train_info/time_within_train_step": 2.684368848800659, "step": 2751} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 2751} {"info/global_step": 2752, "train_info/time_within_train_step": 2.6846282482147217, "step": 2752} {"train_info/time_between_train_steps": 0.0033948421478271484, "step": 2752} {"info/global_step": 2753, "train_info/time_within_train_step": 2.6851978302001953, "step": 2753} {"train_info/time_between_train_steps": 0.0032973289489746094, "step": 2753} {"info/global_step": 2754, "train_info/time_within_train_step": 2.6838560104370117, "step": 2754} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 2754} {"info/global_step": 2755, "train_info/time_within_train_step": 2.6840786933898926, "step": 2755} {"train_info/time_between_train_steps": 0.0034019947052001953, "step": 2755} {"info/global_step": 2756, "train_info/time_within_train_step": 2.684718370437622, "step": 2756} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2756} {"info/global_step": 2757, "train_info/time_within_train_step": 2.6846818923950195, "step": 2757} {"train_info/time_between_train_steps": 0.003479480743408203, "step": 2757} {"info/global_step": 2758, "train_info/time_within_train_step": 2.6846401691436768, "step": 2758} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 2758} {"info/global_step": 2759, "train_info/time_within_train_step": 2.6838274002075195, "step": 2759} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 2759} {"info/global_step": 2760, "train_info/time_within_train_step": 2.6842148303985596, "step": 2760} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 2760} {"info/global_step": 2761, "train_info/time_within_train_step": 2.6847877502441406, "step": 2761} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 2761} {"info/global_step": 2762, "train_info/time_within_train_step": 2.6847493648529053, "step": 2762} {"train_info/time_between_train_steps": 0.0033540725708007812, "step": 2762} {"info/global_step": 2763, "train_info/time_within_train_step": 2.6843068599700928, "step": 2763} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 2763} {"info/global_step": 2764, "train_info/time_within_train_step": 2.6843855381011963, "step": 2764} {"train_info/time_between_train_steps": 0.0033102035522460938, "step": 2764} {"info/global_step": 2765, "train_info/time_within_train_step": 2.685289144515991, "step": 2765} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 2765} {"info/global_step": 2766, "train_info/time_within_train_step": 2.6853742599487305, "step": 2766} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 2766} {"info/global_step": 2767, "train_info/time_within_train_step": 2.685408353805542, "step": 2767} {"train_info/time_between_train_steps": 0.003438711166381836, "step": 2767} {"info/global_step": 2768, "train_info/time_within_train_step": 2.6847620010375977, "step": 2768} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 2768} {"info/global_step": 2769, "train_info/time_within_train_step": 2.685971260070801, "step": 2769} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 2769} {"info/global_step": 2770, "train_info/time_within_train_step": 2.6852612495422363, "step": 2770} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 2770} {"info/global_step": 2771, "train_info/time_within_train_step": 2.6841490268707275, "step": 2771} {"train_info/time_between_train_steps": 0.0032532215118408203, "step": 2771} {"info/global_step": 2772, "train_info/time_within_train_step": 2.684380531311035, "step": 2772} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 2772} {"info/global_step": 2773, "train_info/time_within_train_step": 2.6838645935058594, "step": 2773} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 2773} {"info/global_step": 2774, "train_info/time_within_train_step": 2.685112714767456, "step": 2774} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 2774} {"info/global_step": 2775, "train_info/time_within_train_step": 2.684629201889038, "step": 2775} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 2775} {"info/global_step": 2776, "train_info/time_within_train_step": 2.6842241287231445, "step": 2776} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 2776} {"info/global_step": 2777, "train_info/time_within_train_step": 2.6845579147338867, "step": 2777} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 2777} {"info/global_step": 2778, "train_info/time_within_train_step": 2.684237241744995, "step": 2778} {"train_info/time_between_train_steps": 0.0032978057861328125, "step": 2778} {"info/global_step": 2779, "train_info/time_within_train_step": 2.6847171783447266, "step": 2779} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 2779} {"info/global_step": 2780, "train_info/time_within_train_step": 2.684638261795044, "step": 2780} {"train_info/time_between_train_steps": 0.003239870071411133, "step": 2780} {"info/global_step": 2781, "train_info/time_within_train_step": 2.6851797103881836, "step": 2781} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 2781} {"info/global_step": 2782, "train_info/time_within_train_step": 2.6851022243499756, "step": 2782} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 2782} {"info/global_step": 2783, "train_info/time_within_train_step": 2.684450149536133, "step": 2783} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 2783} {"info/global_step": 2784, "train_info/time_within_train_step": 2.684638500213623, "step": 2784} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 2784} {"info/global_step": 2785, "train_info/time_within_train_step": 2.6852262020111084, "step": 2785} {"train_info/time_between_train_steps": 0.003272533416748047, "step": 2785} {"info/global_step": 2786, "train_info/time_within_train_step": 2.684134006500244, "step": 2786} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 2786} {"info/global_step": 2787, "train_info/time_within_train_step": 2.685818910598755, "step": 2787} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 2787} {"info/global_step": 2788, "train_info/time_within_train_step": 2.684500217437744, "step": 2788} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 2788} {"info/global_step": 2789, "train_info/time_within_train_step": 2.94045090675354, "step": 2789} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 2789} {"info/global_step": 2790, "train_info/time_within_train_step": 2.6853089332580566, "step": 2790} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 2790} {"info/global_step": 2791, "train_info/time_within_train_step": 2.6856091022491455, "step": 2791} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 2791} {"info/global_step": 2792, "train_info/time_within_train_step": 2.6846227645874023, "step": 2792} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 2792} {"info/global_step": 2793, "train_info/time_within_train_step": 2.6830973625183105, "step": 2793} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 2793} {"info/global_step": 2794, "train_info/time_within_train_step": 2.683227062225342, "step": 2794} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 2794} {"info/global_step": 2795, "train_info/time_within_train_step": 2.683398962020874, "step": 2795} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 2795} {"info/global_step": 2796, "train_info/time_within_train_step": 2.684373617172241, "step": 2796} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 2796} {"info/global_step": 2797, "train_info/time_within_train_step": 2.683741331100464, "step": 2797} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 2797} {"info/global_step": 2798, "train_info/time_within_train_step": 2.6838958263397217, "step": 2798} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 2798} {"info/global_step": 2799, "train_info/time_within_train_step": 2.68379545211792, "step": 2799} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 2799} {"info/global_step": 2800, "train_info/time_within_train_step": 2.684826135635376, "step": 2800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746319920, "_runtime": 8076}, "step": 2800} {"logs": {"train/loss": 4.0043, "train/learning_rate": 4.444444444444444e-05, "train/epoch": 3.08, "_timestamp": 1746319920, "_runtime": 8076}, "step": 2800} {"train_info/time_between_train_steps": 16.802806854248047, "step": 2800} {"info/global_step": 2801, "train_info/time_within_train_step": 2.4932050704956055, "step": 2801} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 2801} {"info/global_step": 2802, "train_info/time_within_train_step": 2.483766794204712, "step": 2802} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 2802} {"info/global_step": 2803, "train_info/time_within_train_step": 2.6715519428253174, "step": 2803} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 2803} {"info/global_step": 2804, "train_info/time_within_train_step": 2.681492805480957, "step": 2804} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 2804} {"info/global_step": 2805, "train_info/time_within_train_step": 2.6824591159820557, "step": 2805} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 2805} {"info/global_step": 2806, "train_info/time_within_train_step": 2.6929128170013428, "step": 2806} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 2806} {"info/global_step": 2807, "train_info/time_within_train_step": 2.6873624324798584, "step": 2807} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 2807} {"info/global_step": 2808, "train_info/time_within_train_step": 2.6837213039398193, "step": 2808} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 2808} {"info/global_step": 2809, "train_info/time_within_train_step": 2.6843225955963135, "step": 2809} {"train_info/time_between_train_steps": 0.13193011283874512, "step": 2809} {"info/global_step": 2810, "train_info/time_within_train_step": 2.6843135356903076, "step": 2810} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 2810} {"info/global_step": 2811, "train_info/time_within_train_step": 2.6841979026794434, "step": 2811} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 2811} {"info/global_step": 2812, "train_info/time_within_train_step": 2.685453414916992, "step": 2812} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 2812} {"info/global_step": 2813, "train_info/time_within_train_step": 2.685202121734619, "step": 2813} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 2813} {"info/global_step": 2814, "train_info/time_within_train_step": 2.684952735900879, "step": 2814} {"train_info/time_between_train_steps": 0.003356456756591797, "step": 2814} {"info/global_step": 2815, "train_info/time_within_train_step": 2.741821527481079, "step": 2815} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 2815} {"info/global_step": 2816, "train_info/time_within_train_step": 2.759152412414551, "step": 2816} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 2816} {"info/global_step": 2817, "train_info/time_within_train_step": 2.7219998836517334, "step": 2817} {"train_info/time_between_train_steps": 0.003246784210205078, "step": 2817} {"info/global_step": 2818, "train_info/time_within_train_step": 2.7195355892181396, "step": 2818} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 2818} {"info/global_step": 2819, "train_info/time_within_train_step": 2.7227742671966553, "step": 2819} {"train_info/time_between_train_steps": 0.0032532215118408203, "step": 2819} {"info/global_step": 2820, "train_info/time_within_train_step": 2.6893508434295654, "step": 2820} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 2820} {"info/global_step": 2821, "train_info/time_within_train_step": 2.7065656185150146, "step": 2821} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 2821} {"info/global_step": 2822, "train_info/time_within_train_step": 2.6963508129119873, "step": 2822} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 2822} {"info/global_step": 2823, "train_info/time_within_train_step": 2.7048356533050537, "step": 2823} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 2823} {"info/global_step": 2824, "train_info/time_within_train_step": 2.6930832862854004, "step": 2824} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 2824} {"info/global_step": 2825, "train_info/time_within_train_step": 2.706369161605835, "step": 2825} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 2825} {"info/global_step": 2826, "train_info/time_within_train_step": 2.7069895267486572, "step": 2826} {"train_info/time_between_train_steps": 0.00330352783203125, "step": 2826} {"info/global_step": 2827, "train_info/time_within_train_step": 2.694509744644165, "step": 2827} {"train_info/time_between_train_steps": 0.0038878917694091797, "step": 2827} {"info/global_step": 2828, "train_info/time_within_train_step": 2.714933395385742, "step": 2828} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 2828} {"info/global_step": 2829, "train_info/time_within_train_step": 2.693876266479492, "step": 2829} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 2829} {"info/global_step": 2830, "train_info/time_within_train_step": 2.6965854167938232, "step": 2830} {"train_info/time_between_train_steps": 0.003265380859375, "step": 2830} {"info/global_step": 2831, "train_info/time_within_train_step": 2.705982208251953, "step": 2831} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 2831} {"info/global_step": 2832, "train_info/time_within_train_step": 2.6851069927215576, "step": 2832} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 2832} {"info/global_step": 2833, "train_info/time_within_train_step": 2.6847803592681885, "step": 2833} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 2833} {"info/global_step": 2834, "train_info/time_within_train_step": 2.6893832683563232, "step": 2834} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 2834} {"info/global_step": 2835, "train_info/time_within_train_step": 2.6935482025146484, "step": 2835} {"train_info/time_between_train_steps": 0.0032958984375, "step": 2835} {"info/global_step": 2836, "train_info/time_within_train_step": 2.7066938877105713, "step": 2836} {"train_info/time_between_train_steps": 0.0032813549041748047, "step": 2836} {"info/global_step": 2837, "train_info/time_within_train_step": 2.6991727352142334, "step": 2837} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 2837} {"info/global_step": 2838, "train_info/time_within_train_step": 2.7063565254211426, "step": 2838} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 2838} {"info/global_step": 2839, "train_info/time_within_train_step": 2.6976211071014404, "step": 2839} {"train_info/time_between_train_steps": 0.003299236297607422, "step": 2839} {"info/global_step": 2840, "train_info/time_within_train_step": 2.6850779056549072, "step": 2840} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 2840} {"info/global_step": 2841, "train_info/time_within_train_step": 2.687629222869873, "step": 2841} {"train_info/time_between_train_steps": 0.0033402442932128906, "step": 2841} {"info/global_step": 2842, "train_info/time_within_train_step": 2.703531503677368, "step": 2842} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 2842} {"info/global_step": 2843, "train_info/time_within_train_step": 2.6841421127319336, "step": 2843} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 2843} {"info/global_step": 2844, "train_info/time_within_train_step": 2.6845548152923584, "step": 2844} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 2844} {"info/global_step": 2845, "train_info/time_within_train_step": 2.6858103275299072, "step": 2845} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 2845} {"info/global_step": 2846, "train_info/time_within_train_step": 2.7019946575164795, "step": 2846} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 2846} {"info/global_step": 2847, "train_info/time_within_train_step": 2.685791492462158, "step": 2847} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 2847} {"info/global_step": 2848, "train_info/time_within_train_step": 2.68288254737854, "step": 2848} {"train_info/time_between_train_steps": 0.004613399505615234, "step": 2848} {"info/global_step": 2849, "train_info/time_within_train_step": 2.6918911933898926, "step": 2849} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 2849} {"info/global_step": 2850, "train_info/time_within_train_step": 2.6861846446990967, "step": 2850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320073, "_runtime": 8229}, "step": 2850} {"logs": {"train/loss": 3.9803, "train/learning_rate": 3.333333333333333e-05, "train/epoch": 3.1, "_timestamp": 1746320073, "_runtime": 8229}, "step": 2850} {"train_info/time_between_train_steps": 0.023908376693725586, "step": 2850} {"info/global_step": 2851, "train_info/time_within_train_step": 2.684126377105713, "step": 2851} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 2851} {"info/global_step": 2852, "train_info/time_within_train_step": 2.6848392486572266, "step": 2852} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 2852} {"info/global_step": 2853, "train_info/time_within_train_step": 2.684788227081299, "step": 2853} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 2853} {"info/global_step": 2854, "train_info/time_within_train_step": 2.68997859954834, "step": 2854} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 2854} {"info/global_step": 2855, "train_info/time_within_train_step": 2.684037685394287, "step": 2855} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 2855} {"info/global_step": 2856, "train_info/time_within_train_step": 2.6848437786102295, "step": 2856} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 2856} {"info/global_step": 2857, "train_info/time_within_train_step": 2.6830122470855713, "step": 2857} {"train_info/time_between_train_steps": 0.0032973289489746094, "step": 2857} {"info/global_step": 2858, "train_info/time_within_train_step": 2.6835744380950928, "step": 2858} {"train_info/time_between_train_steps": 0.003446817398071289, "step": 2858} {"info/global_step": 2859, "train_info/time_within_train_step": 2.6836066246032715, "step": 2859} {"train_info/time_between_train_steps": 0.00347137451171875, "step": 2859} {"info/global_step": 2860, "train_info/time_within_train_step": 2.6847386360168457, "step": 2860} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 2860} {"info/global_step": 2861, "train_info/time_within_train_step": 2.6839029788970947, "step": 2861} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 2861} {"info/global_step": 2862, "train_info/time_within_train_step": 2.685041904449463, "step": 2862} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 2862} {"info/global_step": 2863, "train_info/time_within_train_step": 2.6836600303649902, "step": 2863} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 2863} {"info/global_step": 2864, "train_info/time_within_train_step": 2.684621572494507, "step": 2864} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 2864} {"info/global_step": 2865, "train_info/time_within_train_step": 2.6840641498565674, "step": 2865} {"train_info/time_between_train_steps": 0.003428936004638672, "step": 2865} {"info/global_step": 2866, "train_info/time_within_train_step": 2.6846678256988525, "step": 2866} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 2866} {"info/global_step": 2867, "train_info/time_within_train_step": 2.6837754249572754, "step": 2867} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 2867} {"info/global_step": 2868, "train_info/time_within_train_step": 2.736147880554199, "step": 2868} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 2868} {"info/global_step": 2869, "train_info/time_within_train_step": 2.6839611530303955, "step": 2869} {"train_info/time_between_train_steps": 0.0034956932067871094, "step": 2869} {"info/global_step": 2870, "train_info/time_within_train_step": 2.960514783859253, "step": 2870} {"train_info/time_between_train_steps": 0.003365755081176758, "step": 2870} {"info/global_step": 2871, "train_info/time_within_train_step": 2.683790922164917, "step": 2871} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 2871} {"info/global_step": 2872, "train_info/time_within_train_step": 2.8185744285583496, "step": 2872} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 2872} {"info/global_step": 2873, "train_info/time_within_train_step": 2.683745861053467, "step": 2873} {"train_info/time_between_train_steps": 0.0034029483795166016, "step": 2873} {"info/global_step": 2874, "train_info/time_within_train_step": 2.683868885040283, "step": 2874} {"train_info/time_between_train_steps": 0.0032444000244140625, "step": 2874} {"info/global_step": 2875, "train_info/time_within_train_step": 2.6834447383880615, "step": 2875} {"train_info/time_between_train_steps": 0.0033495426177978516, "step": 2875} {"info/global_step": 2876, "train_info/time_within_train_step": 2.68328857421875, "step": 2876} {"train_info/time_between_train_steps": 0.0032787322998046875, "step": 2876} {"info/global_step": 2877, "train_info/time_within_train_step": 2.683326005935669, "step": 2877} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 2877} {"info/global_step": 2878, "train_info/time_within_train_step": 2.6830217838287354, "step": 2878} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 2878} {"info/global_step": 2879, "train_info/time_within_train_step": 2.684370756149292, "step": 2879} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 2879} {"info/global_step": 2880, "train_info/time_within_train_step": 2.685321569442749, "step": 2880} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 2880} {"info/global_step": 2881, "train_info/time_within_train_step": 2.684849500656128, "step": 2881} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 2881} {"info/global_step": 2882, "train_info/time_within_train_step": 2.6835625171661377, "step": 2882} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 2882} {"info/global_step": 2883, "train_info/time_within_train_step": 2.683943510055542, "step": 2883} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 2883} {"info/global_step": 2884, "train_info/time_within_train_step": 2.684128761291504, "step": 2884} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 2884} {"info/global_step": 2885, "train_info/time_within_train_step": 2.6834969520568848, "step": 2885} {"train_info/time_between_train_steps": 0.003265380859375, "step": 2885} {"info/global_step": 2886, "train_info/time_within_train_step": 2.6836953163146973, "step": 2886} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 2886} {"info/global_step": 2887, "train_info/time_within_train_step": 2.683633804321289, "step": 2887} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 2887} {"info/global_step": 2888, "train_info/time_within_train_step": 2.6839427947998047, "step": 2888} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 2888} {"info/global_step": 2889, "train_info/time_within_train_step": 2.683303117752075, "step": 2889} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 2889} {"info/global_step": 2890, "train_info/time_within_train_step": 2.7344284057617188, "step": 2890} {"train_info/time_between_train_steps": 0.0032994747161865234, "step": 2890} {"info/global_step": 2891, "train_info/time_within_train_step": 2.6835925579071045, "step": 2891} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 2891} {"info/global_step": 2892, "train_info/time_within_train_step": 2.6827805042266846, "step": 2892} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 2892} {"info/global_step": 2893, "train_info/time_within_train_step": 2.6841416358947754, "step": 2893} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 2893} {"info/global_step": 2894, "train_info/time_within_train_step": 2.6839215755462646, "step": 2894} {"train_info/time_between_train_steps": 0.003283977508544922, "step": 2894} {"info/global_step": 2895, "train_info/time_within_train_step": 2.6835873126983643, "step": 2895} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 2895} {"info/global_step": 2896, "train_info/time_within_train_step": 2.6829307079315186, "step": 2896} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 2896} {"info/global_step": 2897, "train_info/time_within_train_step": 2.684117078781128, "step": 2897} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 2897} {"info/global_step": 2898, "train_info/time_within_train_step": 2.6832597255706787, "step": 2898} {"train_info/time_between_train_steps": 0.0032274723052978516, "step": 2898} {"info/global_step": 2899, "train_info/time_within_train_step": 2.6843085289001465, "step": 2899} {"train_info/time_between_train_steps": 0.003278970718383789, "step": 2899} {"info/global_step": 2900, "train_info/time_within_train_step": 2.6839263439178467, "step": 2900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320209, "_runtime": 8365}, "step": 2900} {"logs": {"train/loss": 3.9802, "train/learning_rate": 2.222222222222222e-05, "train/epoch": 3.11, "_timestamp": 1746320209, "_runtime": 8365}, "step": 2900} {"train_info/time_between_train_steps": 13.02354645729065, "step": 2900} {"info/global_step": 2901, "train_info/time_within_train_step": 2.4898881912231445, "step": 2901} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 2901} {"info/global_step": 2902, "train_info/time_within_train_step": 2.498708724975586, "step": 2902} {"train_info/time_between_train_steps": 0.003746509552001953, "step": 2902} {"info/global_step": 2903, "train_info/time_within_train_step": 2.6782424449920654, "step": 2903} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 2903} {"info/global_step": 2904, "train_info/time_within_train_step": 2.6793479919433594, "step": 2904} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 2904} {"info/global_step": 2905, "train_info/time_within_train_step": 2.680718421936035, "step": 2905} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 2905} {"info/global_step": 2906, "train_info/time_within_train_step": 2.6800901889801025, "step": 2906} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 2906} {"info/global_step": 2907, "train_info/time_within_train_step": 2.6815085411071777, "step": 2907} {"train_info/time_between_train_steps": 0.0033059120178222656, "step": 2907} {"info/global_step": 2908, "train_info/time_within_train_step": 2.6822757720947266, "step": 2908} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 2908} {"info/global_step": 2909, "train_info/time_within_train_step": 2.6832423210144043, "step": 2909} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 2909} {"info/global_step": 2910, "train_info/time_within_train_step": 2.6836678981781006, "step": 2910} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 2910} {"info/global_step": 2911, "train_info/time_within_train_step": 2.682960033416748, "step": 2911} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 2911} {"info/global_step": 2912, "train_info/time_within_train_step": 2.693720817565918, "step": 2912} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 2912} {"info/global_step": 2913, "train_info/time_within_train_step": 2.689425230026245, "step": 2913} {"train_info/time_between_train_steps": 0.003271341323852539, "step": 2913} {"info/global_step": 2914, "train_info/time_within_train_step": 2.6842117309570312, "step": 2914} {"train_info/time_between_train_steps": 0.0034890174865722656, "step": 2914} {"info/global_step": 2915, "train_info/time_within_train_step": 2.685508966445923, "step": 2915} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 2915} {"info/global_step": 2916, "train_info/time_within_train_step": 2.791796922683716, "step": 2916} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 2916} {"info/global_step": 2917, "train_info/time_within_train_step": 2.778681993484497, "step": 2917} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 2917} {"info/global_step": 2918, "train_info/time_within_train_step": 2.9646050930023193, "step": 2918} {"train_info/time_between_train_steps": 0.0034911632537841797, "step": 2918} {"info/global_step": 2919, "train_info/time_within_train_step": 2.694193124771118, "step": 2919} {"train_info/time_between_train_steps": 0.0033321380615234375, "step": 2919} {"info/global_step": 2920, "train_info/time_within_train_step": 2.7005538940429688, "step": 2920} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 2920} {"info/global_step": 2921, "train_info/time_within_train_step": 2.683399200439453, "step": 2921} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 2921} {"info/global_step": 2922, "train_info/time_within_train_step": 2.6854045391082764, "step": 2922} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 2922} {"info/global_step": 2923, "train_info/time_within_train_step": 2.704617977142334, "step": 2923} {"train_info/time_between_train_steps": 0.0034220218658447266, "step": 2923} {"info/global_step": 2924, "train_info/time_within_train_step": 2.6931896209716797, "step": 2924} {"train_info/time_between_train_steps": 0.003406524658203125, "step": 2924} {"info/global_step": 2925, "train_info/time_within_train_step": 2.6939187049865723, "step": 2925} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 2925} {"info/global_step": 2926, "train_info/time_within_train_step": 2.7042078971862793, "step": 2926} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2926} {"info/global_step": 2927, "train_info/time_within_train_step": 2.708972930908203, "step": 2927} {"train_info/time_between_train_steps": 0.0032951831817626953, "step": 2927} {"info/global_step": 2928, "train_info/time_within_train_step": 2.6849305629730225, "step": 2928} {"train_info/time_between_train_steps": 0.0032558441162109375, "step": 2928} {"info/global_step": 2929, "train_info/time_within_train_step": 2.6953935623168945, "step": 2929} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 2929} {"info/global_step": 2930, "train_info/time_within_train_step": 2.6968231201171875, "step": 2930} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 2930} {"info/global_step": 2931, "train_info/time_within_train_step": 2.6835663318634033, "step": 2931} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 2931} {"info/global_step": 2932, "train_info/time_within_train_step": 2.6843717098236084, "step": 2932} {"train_info/time_between_train_steps": 0.003637552261352539, "step": 2932} {"info/global_step": 2933, "train_info/time_within_train_step": 2.684401512145996, "step": 2933} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 2933} {"info/global_step": 2934, "train_info/time_within_train_step": 2.6939897537231445, "step": 2934} {"train_info/time_between_train_steps": 0.14198899269104004, "step": 2934} {"info/global_step": 2935, "train_info/time_within_train_step": 2.6885104179382324, "step": 2935} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 2935} {"info/global_step": 2936, "train_info/time_within_train_step": 2.684002161026001, "step": 2936} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 2936} {"info/global_step": 2937, "train_info/time_within_train_step": 2.68475604057312, "step": 2937} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 2937} {"info/global_step": 2938, "train_info/time_within_train_step": 2.6861143112182617, "step": 2938} {"train_info/time_between_train_steps": 0.0032389163970947266, "step": 2938} {"info/global_step": 2939, "train_info/time_within_train_step": 2.6857247352600098, "step": 2939} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 2939} {"info/global_step": 2940, "train_info/time_within_train_step": 2.6879703998565674, "step": 2940} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 2940} {"info/global_step": 2941, "train_info/time_within_train_step": 2.687052011489868, "step": 2941} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 2941} {"info/global_step": 2942, "train_info/time_within_train_step": 2.686429977416992, "step": 2942} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 2942} {"info/global_step": 2943, "train_info/time_within_train_step": 2.685465097427368, "step": 2943} {"train_info/time_between_train_steps": 0.0033080577850341797, "step": 2943} {"info/global_step": 2944, "train_info/time_within_train_step": 2.6851840019226074, "step": 2944} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 2944} {"info/global_step": 2945, "train_info/time_within_train_step": 2.6861462593078613, "step": 2945} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 2945} {"info/global_step": 2946, "train_info/time_within_train_step": 2.683528423309326, "step": 2946} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 2946} {"info/global_step": 2947, "train_info/time_within_train_step": 2.707430601119995, "step": 2947} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 2947} {"info/global_step": 2948, "train_info/time_within_train_step": 2.6838924884796143, "step": 2948} {"train_info/time_between_train_steps": 0.0032625198364257812, "step": 2948} {"info/global_step": 2949, "train_info/time_within_train_step": 2.6828155517578125, "step": 2949} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 2949} {"info/global_step": 2950, "train_info/time_within_train_step": 2.685730457305908, "step": 2950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320358, "_runtime": 8514}, "step": 2950} {"logs": {"train/loss": 3.9708, "train/learning_rate": 1.111111111111111e-05, "train/epoch": 3.13, "_timestamp": 1746320358, "_runtime": 8514}, "step": 2950} {"train_info/time_between_train_steps": 0.024283647537231445, "step": 2950} {"info/global_step": 2951, "train_info/time_within_train_step": 2.682370185852051, "step": 2951} {"train_info/time_between_train_steps": 0.0032896995544433594, "step": 2951} {"info/global_step": 2952, "train_info/time_within_train_step": 2.683681011199951, "step": 2952} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 2952} {"info/global_step": 2953, "train_info/time_within_train_step": 2.6851117610931396, "step": 2953} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 2953} {"info/global_step": 2954, "train_info/time_within_train_step": 2.684597969055176, "step": 2954} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 2954} {"info/global_step": 2955, "train_info/time_within_train_step": 2.6847219467163086, "step": 2955} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 2955} {"info/global_step": 2956, "train_info/time_within_train_step": 2.6848666667938232, "step": 2956} {"train_info/time_between_train_steps": 0.0032982826232910156, "step": 2956} {"info/global_step": 2957, "train_info/time_within_train_step": 2.9599452018737793, "step": 2957} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 2957} {"info/global_step": 2958, "train_info/time_within_train_step": 2.6857492923736572, "step": 2958} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 2958} {"info/global_step": 2959, "train_info/time_within_train_step": 2.685772180557251, "step": 2959} {"train_info/time_between_train_steps": 0.003612518310546875, "step": 2959} {"info/global_step": 2960, "train_info/time_within_train_step": 2.6850404739379883, "step": 2960} {"train_info/time_between_train_steps": 0.003613710403442383, "step": 2960} {"info/global_step": 2961, "train_info/time_within_train_step": 2.684196949005127, "step": 2961} {"train_info/time_between_train_steps": 0.003594636917114258, "step": 2961} {"info/global_step": 2962, "train_info/time_within_train_step": 2.685285806655884, "step": 2962} {"train_info/time_between_train_steps": 0.0035796165466308594, "step": 2962} {"info/global_step": 2963, "train_info/time_within_train_step": 2.6852269172668457, "step": 2963} {"train_info/time_between_train_steps": 0.003968000411987305, "step": 2963} {"info/global_step": 2964, "train_info/time_within_train_step": 2.684610605239868, "step": 2964} {"train_info/time_between_train_steps": 0.004054546356201172, "step": 2964} {"info/global_step": 2965, "train_info/time_within_train_step": 2.683964967727661, "step": 2965} {"train_info/time_between_train_steps": 0.003841876983642578, "step": 2965} {"info/global_step": 2966, "train_info/time_within_train_step": 2.684868097305298, "step": 2966} {"train_info/time_between_train_steps": 0.0045166015625, "step": 2966} {"info/global_step": 2967, "train_info/time_within_train_step": 2.6840150356292725, "step": 2967} {"train_info/time_between_train_steps": 0.004051923751831055, "step": 2967} {"info/global_step": 2968, "train_info/time_within_train_step": 2.684727668762207, "step": 2968} {"train_info/time_between_train_steps": 0.0039615631103515625, "step": 2968} {"info/global_step": 2969, "train_info/time_within_train_step": 2.6853702068328857, "step": 2969} {"train_info/time_between_train_steps": 0.00389862060546875, "step": 2969} {"info/global_step": 2970, "train_info/time_within_train_step": 2.685060739517212, "step": 2970} {"train_info/time_between_train_steps": 0.003804922103881836, "step": 2970} {"info/global_step": 2971, "train_info/time_within_train_step": 2.6860623359680176, "step": 2971} {"train_info/time_between_train_steps": 0.0038890838623046875, "step": 2971} {"info/global_step": 2972, "train_info/time_within_train_step": 2.6861684322357178, "step": 2972} {"train_info/time_between_train_steps": 0.004182338714599609, "step": 2972} {"info/global_step": 2973, "train_info/time_within_train_step": 2.685607433319092, "step": 2973} {"train_info/time_between_train_steps": 0.0038917064666748047, "step": 2973} {"info/global_step": 2974, "train_info/time_within_train_step": 2.735957145690918, "step": 2974} {"train_info/time_between_train_steps": 0.003814220428466797, "step": 2974} {"info/global_step": 2975, "train_info/time_within_train_step": 2.685288190841675, "step": 2975} {"train_info/time_between_train_steps": 0.003972530364990234, "step": 2975} {"info/global_step": 2976, "train_info/time_within_train_step": 2.6863346099853516, "step": 2976} {"train_info/time_between_train_steps": 0.003857135772705078, "step": 2976} {"info/global_step": 2977, "train_info/time_within_train_step": 2.6860833168029785, "step": 2977} {"train_info/time_between_train_steps": 0.0038521289825439453, "step": 2977} {"info/global_step": 2978, "train_info/time_within_train_step": 2.684955358505249, "step": 2978} {"train_info/time_between_train_steps": 0.003803253173828125, "step": 2978} {"info/global_step": 2979, "train_info/time_within_train_step": 2.685380220413208, "step": 2979} {"train_info/time_between_train_steps": 0.004019737243652344, "step": 2979} {"info/global_step": 2980, "train_info/time_within_train_step": 2.6841683387756348, "step": 2980} {"train_info/time_between_train_steps": 0.003998994827270508, "step": 2980} {"info/global_step": 2981, "train_info/time_within_train_step": 2.683926582336426, "step": 2981} {"train_info/time_between_train_steps": 0.0038788318634033203, "step": 2981} {"info/global_step": 2982, "train_info/time_within_train_step": 2.6851887702941895, "step": 2982} {"train_info/time_between_train_steps": 0.0038716793060302734, "step": 2982} {"info/global_step": 2983, "train_info/time_within_train_step": 2.683793306350708, "step": 2983} {"train_info/time_between_train_steps": 0.0035524368286132812, "step": 2983} {"info/global_step": 2984, "train_info/time_within_train_step": 2.6838290691375732, "step": 2984} {"train_info/time_between_train_steps": 0.003525257110595703, "step": 2984} {"info/global_step": 2985, "train_info/time_within_train_step": 2.6840670108795166, "step": 2985} {"train_info/time_between_train_steps": 0.003939628601074219, "step": 2985} {"info/global_step": 2986, "train_info/time_within_train_step": 2.6844382286071777, "step": 2986} {"train_info/time_between_train_steps": 0.0038084983825683594, "step": 2986} {"info/global_step": 2987, "train_info/time_within_train_step": 2.6848926544189453, "step": 2987} {"train_info/time_between_train_steps": 0.003910064697265625, "step": 2987} {"info/global_step": 2988, "train_info/time_within_train_step": 2.6848573684692383, "step": 2988} {"train_info/time_between_train_steps": 0.0039653778076171875, "step": 2988} {"info/global_step": 2989, "train_info/time_within_train_step": 2.6847846508026123, "step": 2989} {"train_info/time_between_train_steps": 0.003808736801147461, "step": 2989} {"info/global_step": 2990, "train_info/time_within_train_step": 2.6859922409057617, "step": 2990} {"train_info/time_between_train_steps": 0.0038356781005859375, "step": 2990} {"info/global_step": 2991, "train_info/time_within_train_step": 2.6853251457214355, "step": 2991} {"train_info/time_between_train_steps": 0.0036995410919189453, "step": 2991} {"info/global_step": 2992, "train_info/time_within_train_step": 2.684784412384033, "step": 2992} {"train_info/time_between_train_steps": 0.00399470329284668, "step": 2992} {"info/global_step": 2993, "train_info/time_within_train_step": 2.685807704925537, "step": 2993} {"train_info/time_between_train_steps": 0.0036721229553222656, "step": 2993} {"info/global_step": 2994, "train_info/time_within_train_step": 2.688661813735962, "step": 2994} {"train_info/time_between_train_steps": 0.0036935806274414062, "step": 2994} {"info/global_step": 2995, "train_info/time_within_train_step": 2.6932976245880127, "step": 2995} {"train_info/time_between_train_steps": 0.0038306713104248047, "step": 2995} {"info/global_step": 2996, "train_info/time_within_train_step": 3.160161256790161, "step": 2996} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 2996} {"info/global_step": 2997, "train_info/time_within_train_step": 2.8422813415527344, "step": 2997} {"train_info/time_between_train_steps": 0.003269195556640625, "step": 2997} {"info/global_step": 2998, "train_info/time_within_train_step": 2.681943893432617, "step": 2998} {"train_info/time_between_train_steps": 0.003565073013305664, "step": 2998} {"info/global_step": 2999, "train_info/time_within_train_step": 3.2265400886535645, "step": 2999} {"train_info/time_between_train_steps": 0.0032699108123779297, "step": 2999} {"info/global_step": 3000, "train_info/time_within_train_step": 2.6819920539855957, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320495, "_runtime": 8651}, "step": 3000} {"logs": {"train/loss": 3.9496, "train/learning_rate": 0.0, "train/epoch": 3.15, "_timestamp": 1746320495, "_runtime": 8651}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320500, "_runtime": 8656}, "step": 3000} {"logs": {"eval/loss": 4.614820957183838, "eval/runtime": 5.2275, "eval/samples_per_second": 36.346, "eval/steps_per_second": 1.148, "train/epoch": 3.15, "_timestamp": 1746320500, "_runtime": 8656}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320500, "_runtime": 8656}, "step": 3000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.614820957183838, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 100.96974900581537, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.2275, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.346, "train/epoch": 3.15, "_timestamp": 1746320500, "_runtime": 8656}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320521, "_runtime": 8677}, "step": 3000} {"logs": {"train/train_runtime": 8677.884, "train/train_samples_per_second": 22.125, "train/train_steps_per_second": 0.346, "train/total_flos": 2.5096577089536e+16, "train/train_loss": 4.75397075843811, "train/epoch": 3.15, "_timestamp": 1746320521, "_runtime": 8677}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.771484375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320533, "_runtime": 8689}, "step": 3000} {"logs": {"eval/loss": 4.614820957183838, "eval/runtime": 4.7995, "eval/samples_per_second": 39.588, "eval/steps_per_second": 1.25, "train/epoch": 3.15, "_timestamp": 1746320533, "_runtime": 8689}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.771484375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746320533, "_runtime": 8689}, "step": 3000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.614820957183838, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 100.96974900581537, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.7995, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 39.588, "train/epoch": 3.15, "_timestamp": 1746320533, "_runtime": 8689}, "step": 3000}