{"num_parameters": 106511616, "trainable_parameters": 106511616, "step": 0} {"train_info/time_between_train_steps": 2.2734591960906982, "step": 0} {"info/global_step": 1, "train_info/time_within_train_step": 4.585665225982666, "step": 1} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 4317.87890625, "train_info/memory_reserved": 4498.0, "train_info/memory_max_reserved": 4498.0, "_timestamp": 1746897429, "_runtime": 27}, "step": 1} {"logs": {"train/loss": 10.23, "train/learning_rate": 6e-07, "train/epoch": 0.0, "_timestamp": 1746897429, "_runtime": 27}, "step": 1} {"train_info/time_between_train_steps": 0.02540731430053711, "step": 1} {"info/global_step": 2, "train_info/time_within_train_step": 2.4225106239318848, "step": 2} {"train_info/time_between_train_steps": 0.003737211227416992, "step": 2} {"info/global_step": 3, "train_info/time_within_train_step": 2.4717442989349365, "step": 3} {"train_info/time_between_train_steps": 0.0035915374755859375, "step": 3} {"info/global_step": 4, "train_info/time_within_train_step": 2.5777573585510254, "step": 4} {"train_info/time_between_train_steps": 0.003740072250366211, "step": 4} {"info/global_step": 5, "train_info/time_within_train_step": 2.6288928985595703, "step": 5} {"train_info/time_between_train_steps": 0.0038993358612060547, "step": 5} {"info/global_step": 6, "train_info/time_within_train_step": 2.6258678436279297, "step": 6} {"train_info/time_between_train_steps": 0.0035507678985595703, "step": 6} {"info/global_step": 7, "train_info/time_within_train_step": 2.6537091732025146, "step": 7} {"train_info/time_between_train_steps": 0.003614187240600586, "step": 7} {"info/global_step": 8, "train_info/time_within_train_step": 2.6412007808685303, "step": 8} {"train_info/time_between_train_steps": 0.003690004348754883, "step": 8} {"info/global_step": 9, "train_info/time_within_train_step": 2.635479688644409, "step": 9} {"train_info/time_between_train_steps": 0.003678560256958008, "step": 9} {"info/global_step": 10, "train_info/time_within_train_step": 2.9624342918395996, "step": 10} {"train_info/time_between_train_steps": 0.003587961196899414, "step": 10} {"info/global_step": 11, "train_info/time_within_train_step": 2.647695302963257, "step": 11} {"train_info/time_between_train_steps": 0.004015922546386719, "step": 11} {"info/global_step": 12, "train_info/time_within_train_step": 2.6384732723236084, "step": 12} {"train_info/time_between_train_steps": 0.003813505172729492, "step": 12} {"info/global_step": 13, "train_info/time_within_train_step": 2.6428089141845703, "step": 13} {"train_info/time_between_train_steps": 0.0038852691650390625, "step": 13} {"info/global_step": 14, "train_info/time_within_train_step": 2.655980110168457, "step": 14} {"train_info/time_between_train_steps": 0.0037157535552978516, "step": 14} {"info/global_step": 15, "train_info/time_within_train_step": 2.664846181869507, "step": 15} {"train_info/time_between_train_steps": 0.003726482391357422, "step": 15} {"info/global_step": 16, "train_info/time_within_train_step": 2.7072300910949707, "step": 16} {"train_info/time_between_train_steps": 0.003999471664428711, "step": 16} {"info/global_step": 17, "train_info/time_within_train_step": 2.645969867706299, "step": 17} {"train_info/time_between_train_steps": 0.0036182403564453125, "step": 17} {"info/global_step": 18, "train_info/time_within_train_step": 2.6573195457458496, "step": 18} {"train_info/time_between_train_steps": 0.003885984420776367, "step": 18} {"info/global_step": 19, "train_info/time_within_train_step": 2.6416070461273193, "step": 19} {"train_info/time_between_train_steps": 0.0037887096405029297, "step": 19} {"info/global_step": 20, "train_info/time_within_train_step": 2.647225856781006, "step": 20} {"train_info/time_between_train_steps": 0.0038673877716064453, "step": 20} {"info/global_step": 21, "train_info/time_within_train_step": 2.6581997871398926, "step": 21} {"train_info/time_between_train_steps": 0.003765583038330078, "step": 21} {"info/global_step": 22, "train_info/time_within_train_step": 2.6518635749816895, "step": 22} {"train_info/time_between_train_steps": 0.0038046836853027344, "step": 22} {"info/global_step": 23, "train_info/time_within_train_step": 2.642136335372925, "step": 23} {"train_info/time_between_train_steps": 0.0041332244873046875, "step": 23} {"info/global_step": 24, "train_info/time_within_train_step": 2.660740852355957, "step": 24} {"train_info/time_between_train_steps": 0.0037109851837158203, "step": 24} {"info/global_step": 25, "train_info/time_within_train_step": 2.6667697429656982, "step": 25} {"train_info/time_between_train_steps": 0.003950595855712891, "step": 25} {"info/global_step": 26, "train_info/time_within_train_step": 2.684709310531616, "step": 26} {"train_info/time_between_train_steps": 0.003942012786865234, "step": 26} {"info/global_step": 27, "train_info/time_within_train_step": 2.648357629776001, "step": 27} {"train_info/time_between_train_steps": 0.0038695335388183594, "step": 27} {"info/global_step": 28, "train_info/time_within_train_step": 2.6942086219787598, "step": 28} {"train_info/time_between_train_steps": 0.003911495208740234, "step": 28} {"info/global_step": 29, "train_info/time_within_train_step": 2.641881227493286, "step": 29} {"train_info/time_between_train_steps": 0.0039005279541015625, "step": 29} {"info/global_step": 30, "train_info/time_within_train_step": 2.6496925354003906, "step": 30} {"train_info/time_between_train_steps": 0.003684520721435547, "step": 30} {"info/global_step": 31, "train_info/time_within_train_step": 2.64616060256958, "step": 31} {"train_info/time_between_train_steps": 0.0038542747497558594, "step": 31} {"info/global_step": 32, "train_info/time_within_train_step": 2.6605215072631836, "step": 32} {"train_info/time_between_train_steps": 0.00371551513671875, "step": 32} {"info/global_step": 33, "train_info/time_within_train_step": 2.662987470626831, "step": 33} {"train_info/time_between_train_steps": 0.0037207603454589844, "step": 33} {"info/global_step": 34, "train_info/time_within_train_step": 2.657768726348877, "step": 34} {"train_info/time_between_train_steps": 0.0037622451782226562, "step": 34} {"info/global_step": 35, "train_info/time_within_train_step": 2.708662748336792, "step": 35} {"train_info/time_between_train_steps": 0.003873109817504883, "step": 35} {"info/global_step": 36, "train_info/time_within_train_step": 2.6446986198425293, "step": 36} {"train_info/time_between_train_steps": 0.0036270618438720703, "step": 36} {"info/global_step": 37, "train_info/time_within_train_step": 2.6399056911468506, "step": 37} {"train_info/time_between_train_steps": 0.004118442535400391, "step": 37} {"info/global_step": 38, "train_info/time_within_train_step": 2.6564254760742188, "step": 38} {"train_info/time_between_train_steps": 0.0036962032318115234, "step": 38} {"info/global_step": 39, "train_info/time_within_train_step": 2.653698205947876, "step": 39} {"train_info/time_between_train_steps": 0.0036618709564208984, "step": 39} {"info/global_step": 40, "train_info/time_within_train_step": 2.656532049179077, "step": 40} {"train_info/time_between_train_steps": 0.00391697883605957, "step": 40} {"info/global_step": 41, "train_info/time_within_train_step": 2.6569597721099854, "step": 41} {"train_info/time_between_train_steps": 0.003673553466796875, "step": 41} {"info/global_step": 42, "train_info/time_within_train_step": 2.652373790740967, "step": 42} {"train_info/time_between_train_steps": 0.0040493011474609375, "step": 42} {"info/global_step": 43, "train_info/time_within_train_step": 2.659292697906494, "step": 43} {"train_info/time_between_train_steps": 0.003926515579223633, "step": 43} {"info/global_step": 44, "train_info/time_within_train_step": 2.690234422683716, "step": 44} {"train_info/time_between_train_steps": 0.003915071487426758, "step": 44} {"info/global_step": 45, "train_info/time_within_train_step": 2.7272934913635254, "step": 45} {"train_info/time_between_train_steps": 0.003835439682006836, "step": 45} {"info/global_step": 46, "train_info/time_within_train_step": 2.648540735244751, "step": 46} {"train_info/time_between_train_steps": 0.003897428512573242, "step": 46} {"info/global_step": 47, "train_info/time_within_train_step": 2.6405911445617676, "step": 47} {"train_info/time_between_train_steps": 0.003656148910522461, "step": 47} {"info/global_step": 48, "train_info/time_within_train_step": 2.6590890884399414, "step": 48} {"train_info/time_between_train_steps": 0.0037429332733154297, "step": 48} {"info/global_step": 49, "train_info/time_within_train_step": 2.6482393741607666, "step": 49} {"train_info/time_between_train_steps": 0.0037784576416015625, "step": 49} {"info/global_step": 50, "train_info/time_within_train_step": 2.6488633155822754, "step": 50} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746897560, "_runtime": 158}, "step": 50} {"logs": {"train/loss": 8.7317, "train/learning_rate": 2.9999999999999997e-05, "train/epoch": 0.01, "_timestamp": 1746897560, "_runtime": 158}, "step": 50} {"train_info/time_between_train_steps": 0.024823427200317383, "step": 50} {"info/global_step": 51, "train_info/time_within_train_step": 2.6437253952026367, "step": 51} {"train_info/time_between_train_steps": 0.0036902427673339844, "step": 51} {"info/global_step": 52, "train_info/time_within_train_step": 2.6499502658843994, "step": 52} {"train_info/time_between_train_steps": 0.0038330554962158203, "step": 52} {"info/global_step": 53, "train_info/time_within_train_step": 2.655608892440796, "step": 53} {"train_info/time_between_train_steps": 0.0039250850677490234, "step": 53} {"info/global_step": 54, "train_info/time_within_train_step": 2.667764902114868, "step": 54} {"train_info/time_between_train_steps": 0.003918886184692383, "step": 54} {"info/global_step": 55, "train_info/time_within_train_step": 2.7183306217193604, "step": 55} {"train_info/time_between_train_steps": 0.0036394596099853516, "step": 55} {"info/global_step": 56, "train_info/time_within_train_step": 2.687405586242676, "step": 56} {"train_info/time_between_train_steps": 0.003753662109375, "step": 56} {"info/global_step": 57, "train_info/time_within_train_step": 2.651784896850586, "step": 57} {"train_info/time_between_train_steps": 0.003644227981567383, "step": 57} {"info/global_step": 58, "train_info/time_within_train_step": 2.6425299644470215, "step": 58} {"train_info/time_between_train_steps": 0.0039048194885253906, "step": 58} {"info/global_step": 59, "train_info/time_within_train_step": 2.6539340019226074, "step": 59} {"train_info/time_between_train_steps": 0.0038759708404541016, "step": 59} {"info/global_step": 60, "train_info/time_within_train_step": 2.6652708053588867, "step": 60} {"train_info/time_between_train_steps": 0.003772735595703125, "step": 60} {"info/global_step": 61, "train_info/time_within_train_step": 2.6586616039276123, "step": 61} {"train_info/time_between_train_steps": 0.0038917064666748047, "step": 61} {"info/global_step": 62, "train_info/time_within_train_step": 2.643420934677124, "step": 62} {"train_info/time_between_train_steps": 0.0037598609924316406, "step": 62} {"info/global_step": 63, "train_info/time_within_train_step": 2.8149406909942627, "step": 63} {"train_info/time_between_train_steps": 0.0036916732788085938, "step": 63} {"info/global_step": 64, "train_info/time_within_train_step": 2.643911123275757, "step": 64} {"train_info/time_between_train_steps": 0.0034897327423095703, "step": 64} {"info/global_step": 65, "train_info/time_within_train_step": 2.643320322036743, "step": 65} {"train_info/time_between_train_steps": 0.0036079883575439453, "step": 65} {"info/global_step": 66, "train_info/time_within_train_step": 2.654489755630493, "step": 66} {"train_info/time_between_train_steps": 0.0035750865936279297, "step": 66} {"info/global_step": 67, "train_info/time_within_train_step": 2.668888568878174, "step": 67} {"train_info/time_between_train_steps": 0.0034627914428710938, "step": 67} {"info/global_step": 68, "train_info/time_within_train_step": 2.676070213317871, "step": 68} {"train_info/time_between_train_steps": 0.003411531448364258, "step": 68} {"info/global_step": 69, "train_info/time_within_train_step": 2.6503217220306396, "step": 69} {"train_info/time_between_train_steps": 0.003551483154296875, "step": 69} {"info/global_step": 70, "train_info/time_within_train_step": 2.6623432636260986, "step": 70} {"train_info/time_between_train_steps": 0.003484964370727539, "step": 70} {"info/global_step": 71, "train_info/time_within_train_step": 2.644557237625122, "step": 71} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 71} {"info/global_step": 72, "train_info/time_within_train_step": 2.643465518951416, "step": 72} {"train_info/time_between_train_steps": 0.0037279129028320312, "step": 72} {"info/global_step": 73, "train_info/time_within_train_step": 2.6641578674316406, "step": 73} {"train_info/time_between_train_steps": 0.003650188446044922, "step": 73} {"info/global_step": 74, "train_info/time_within_train_step": 2.6652722358703613, "step": 74} {"train_info/time_between_train_steps": 0.0034224987030029297, "step": 74} {"info/global_step": 75, "train_info/time_within_train_step": 2.7066025733947754, "step": 75} {"train_info/time_between_train_steps": 0.003530740737915039, "step": 75} {"info/global_step": 76, "train_info/time_within_train_step": 2.6407859325408936, "step": 76} {"train_info/time_between_train_steps": 0.0035605430603027344, "step": 76} {"info/global_step": 77, "train_info/time_within_train_step": 2.64726185798645, "step": 77} {"train_info/time_between_train_steps": 0.003660917282104492, "step": 77} {"info/global_step": 78, "train_info/time_within_train_step": 2.66076397895813, "step": 78} {"train_info/time_between_train_steps": 0.0037462711334228516, "step": 78} {"info/global_step": 79, "train_info/time_within_train_step": 2.6423442363739014, "step": 79} {"train_info/time_between_train_steps": 0.003734588623046875, "step": 79} {"info/global_step": 80, "train_info/time_within_train_step": 2.6477696895599365, "step": 80} {"train_info/time_between_train_steps": 0.003754854202270508, "step": 80} {"info/global_step": 81, "train_info/time_within_train_step": 2.648333787918091, "step": 81} {"train_info/time_between_train_steps": 0.00379180908203125, "step": 81} {"info/global_step": 82, "train_info/time_within_train_step": 2.654003143310547, "step": 82} {"train_info/time_between_train_steps": 0.0037174224853515625, "step": 82} {"info/global_step": 83, "train_info/time_within_train_step": 2.6575427055358887, "step": 83} {"train_info/time_between_train_steps": 0.003648042678833008, "step": 83} {"info/global_step": 84, "train_info/time_within_train_step": 2.6763248443603516, "step": 84} {"train_info/time_between_train_steps": 0.003846883773803711, "step": 84} {"info/global_step": 85, "train_info/time_within_train_step": 2.7341136932373047, "step": 85} {"train_info/time_between_train_steps": 0.0036211013793945312, "step": 85} {"info/global_step": 86, "train_info/time_within_train_step": 2.664943218231201, "step": 86} {"train_info/time_between_train_steps": 0.0037903785705566406, "step": 86} {"info/global_step": 87, "train_info/time_within_train_step": 2.641519069671631, "step": 87} {"train_info/time_between_train_steps": 0.0036280155181884766, "step": 87} {"info/global_step": 88, "train_info/time_within_train_step": 2.644519329071045, "step": 88} {"train_info/time_between_train_steps": 0.003625154495239258, "step": 88} {"info/global_step": 89, "train_info/time_within_train_step": 2.643639326095581, "step": 89} {"train_info/time_between_train_steps": 0.003729581832885742, "step": 89} {"info/global_step": 90, "train_info/time_within_train_step": 2.6435885429382324, "step": 90} {"train_info/time_between_train_steps": 0.003795146942138672, "step": 90} {"info/global_step": 91, "train_info/time_within_train_step": 2.6916747093200684, "step": 91} {"train_info/time_between_train_steps": 0.00398707389831543, "step": 91} {"info/global_step": 92, "train_info/time_within_train_step": 2.6470911502838135, "step": 92} {"train_info/time_between_train_steps": 0.0038607120513916016, "step": 92} {"info/global_step": 93, "train_info/time_within_train_step": 2.6465795040130615, "step": 93} {"train_info/time_between_train_steps": 0.00410008430480957, "step": 93} {"info/global_step": 94, "train_info/time_within_train_step": 2.646484851837158, "step": 94} {"train_info/time_between_train_steps": 0.0039768218994140625, "step": 94} {"info/global_step": 95, "train_info/time_within_train_step": 2.6452558040618896, "step": 95} {"train_info/time_between_train_steps": 0.00360870361328125, "step": 95} {"info/global_step": 96, "train_info/time_within_train_step": 2.6784424781799316, "step": 96} {"train_info/time_between_train_steps": 0.003630399703979492, "step": 96} {"info/global_step": 97, "train_info/time_within_train_step": 2.6463778018951416, "step": 97} {"train_info/time_between_train_steps": 0.0037522315979003906, "step": 97} {"info/global_step": 98, "train_info/time_within_train_step": 2.6519577503204346, "step": 98} {"train_info/time_between_train_steps": 0.003850221633911133, "step": 98} {"info/global_step": 99, "train_info/time_within_train_step": 2.6468183994293213, "step": 99} {"train_info/time_between_train_steps": 0.003731966018676758, "step": 99} {"info/global_step": 100, "train_info/time_within_train_step": 2.660555601119995, "step": 100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746897695, "_runtime": 293}, "step": 100} {"logs": {"train/loss": 7.5156, "train/learning_rate": 5.9999999999999995e-05, "train/epoch": 0.01, "_timestamp": 1746897695, "_runtime": 293}, "step": 100} {"train_info/time_between_train_steps": 0.02456045150756836, "step": 100} {"info/global_step": 101, "train_info/time_within_train_step": 2.6466431617736816, "step": 101} {"train_info/time_between_train_steps": 0.0037004947662353516, "step": 101} {"info/global_step": 102, "train_info/time_within_train_step": 2.649376392364502, "step": 102} {"train_info/time_between_train_steps": 0.0036525726318359375, "step": 102} {"info/global_step": 103, "train_info/time_within_train_step": 3.0276777744293213, "step": 103} {"train_info/time_between_train_steps": 0.003601551055908203, "step": 103} {"info/global_step": 104, "train_info/time_within_train_step": 2.6377460956573486, "step": 104} {"train_info/time_between_train_steps": 0.003618478775024414, "step": 104} {"info/global_step": 105, "train_info/time_within_train_step": 2.6396491527557373, "step": 105} {"train_info/time_between_train_steps": 0.0034296512603759766, "step": 105} {"info/global_step": 106, "train_info/time_within_train_step": 2.657653331756592, "step": 106} {"train_info/time_between_train_steps": 0.0034694671630859375, "step": 106} {"info/global_step": 107, "train_info/time_within_train_step": 2.651566743850708, "step": 107} {"train_info/time_between_train_steps": 0.0035753250122070312, "step": 107} {"info/global_step": 108, "train_info/time_within_train_step": 2.6482341289520264, "step": 108} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 108} {"info/global_step": 109, "train_info/time_within_train_step": 2.6487700939178467, "step": 109} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 109} {"info/global_step": 110, "train_info/time_within_train_step": 2.6519577503204346, "step": 110} {"train_info/time_between_train_steps": 0.003590822219848633, "step": 110} {"info/global_step": 111, "train_info/time_within_train_step": 2.665163278579712, "step": 111} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 111} {"info/global_step": 112, "train_info/time_within_train_step": 2.706273078918457, "step": 112} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 112} {"info/global_step": 113, "train_info/time_within_train_step": 2.6508994102478027, "step": 113} {"train_info/time_between_train_steps": 0.003504037857055664, "step": 113} {"info/global_step": 114, "train_info/time_within_train_step": 2.661959409713745, "step": 114} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 114} {"info/global_step": 115, "train_info/time_within_train_step": 2.6391806602478027, "step": 115} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 115} {"info/global_step": 116, "train_info/time_within_train_step": 2.6454997062683105, "step": 116} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 116} {"info/global_step": 117, "train_info/time_within_train_step": 2.659065008163452, "step": 117} {"train_info/time_between_train_steps": 0.0032958984375, "step": 117} {"info/global_step": 118, "train_info/time_within_train_step": 2.6403920650482178, "step": 118} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 118} {"info/global_step": 119, "train_info/time_within_train_step": 2.6433804035186768, "step": 119} {"train_info/time_between_train_steps": 0.0033571720123291016, "step": 119} {"info/global_step": 120, "train_info/time_within_train_step": 2.669602155685425, "step": 120} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 120} {"info/global_step": 121, "train_info/time_within_train_step": 2.6643483638763428, "step": 121} {"train_info/time_between_train_steps": 0.003412008285522461, "step": 121} {"info/global_step": 122, "train_info/time_within_train_step": 2.6682868003845215, "step": 122} {"train_info/time_between_train_steps": 0.003294706344604492, "step": 122} {"info/global_step": 123, "train_info/time_within_train_step": 2.6733179092407227, "step": 123} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 123} {"info/global_step": 124, "train_info/time_within_train_step": 2.641814947128296, "step": 124} {"train_info/time_between_train_steps": 0.003661632537841797, "step": 124} {"info/global_step": 125, "train_info/time_within_train_step": 2.65226149559021, "step": 125} {"train_info/time_between_train_steps": 0.14663338661193848, "step": 125} {"info/global_step": 126, "train_info/time_within_train_step": 2.6397342681884766, "step": 126} {"train_info/time_between_train_steps": 0.0035965442657470703, "step": 126} {"info/global_step": 127, "train_info/time_within_train_step": 2.6595511436462402, "step": 127} {"train_info/time_between_train_steps": 0.003479480743408203, "step": 127} {"info/global_step": 128, "train_info/time_within_train_step": 2.6650583744049072, "step": 128} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 128} {"info/global_step": 129, "train_info/time_within_train_step": 2.65911865234375, "step": 129} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 129} {"info/global_step": 130, "train_info/time_within_train_step": 2.701756715774536, "step": 130} {"train_info/time_between_train_steps": 0.0034432411193847656, "step": 130} {"info/global_step": 131, "train_info/time_within_train_step": 2.639336347579956, "step": 131} {"train_info/time_between_train_steps": 0.0034835338592529297, "step": 131} {"info/global_step": 132, "train_info/time_within_train_step": 2.6396939754486084, "step": 132} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 132} {"info/global_step": 133, "train_info/time_within_train_step": 2.659458637237549, "step": 133} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 133} {"info/global_step": 134, "train_info/time_within_train_step": 2.6454031467437744, "step": 134} {"train_info/time_between_train_steps": 0.0034830570220947266, "step": 134} {"info/global_step": 135, "train_info/time_within_train_step": 2.6413002014160156, "step": 135} {"train_info/time_between_train_steps": 0.0034303665161132812, "step": 135} {"info/global_step": 136, "train_info/time_within_train_step": 2.6575539112091064, "step": 136} {"train_info/time_between_train_steps": 0.0034339427947998047, "step": 136} {"info/global_step": 137, "train_info/time_within_train_step": 2.649918556213379, "step": 137} {"train_info/time_between_train_steps": 0.003414630889892578, "step": 137} {"info/global_step": 138, "train_info/time_within_train_step": 2.6589949131011963, "step": 138} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 138} {"info/global_step": 139, "train_info/time_within_train_step": 2.710859537124634, "step": 139} {"train_info/time_between_train_steps": 0.003432035446166992, "step": 139} {"info/global_step": 140, "train_info/time_within_train_step": 2.68731689453125, "step": 140} {"train_info/time_between_train_steps": 0.0032854080200195312, "step": 140} {"info/global_step": 141, "train_info/time_within_train_step": 2.638458490371704, "step": 141} {"train_info/time_between_train_steps": 0.0033757686614990234, "step": 141} {"info/global_step": 142, "train_info/time_within_train_step": 2.6397011280059814, "step": 142} {"train_info/time_between_train_steps": 0.0033316612243652344, "step": 142} {"info/global_step": 143, "train_info/time_within_train_step": 2.6546289920806885, "step": 143} {"train_info/time_between_train_steps": 0.0033473968505859375, "step": 143} {"info/global_step": 144, "train_info/time_within_train_step": 2.6466116905212402, "step": 144} {"train_info/time_between_train_steps": 0.0035636425018310547, "step": 144} {"info/global_step": 145, "train_info/time_within_train_step": 2.6680684089660645, "step": 145} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 145} {"info/global_step": 146, "train_info/time_within_train_step": 2.6694514751434326, "step": 146} {"train_info/time_between_train_steps": 0.0033571720123291016, "step": 146} {"info/global_step": 147, "train_info/time_within_train_step": 2.6395201683044434, "step": 147} {"train_info/time_between_train_steps": 0.0034704208374023438, "step": 147} {"info/global_step": 148, "train_info/time_within_train_step": 2.644116163253784, "step": 148} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 148} {"info/global_step": 149, "train_info/time_within_train_step": 2.6527059078216553, "step": 149} {"train_info/time_between_train_steps": 0.0034346580505371094, "step": 149} {"info/global_step": 150, "train_info/time_within_train_step": 2.652418613433838, "step": 150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746897830, "_runtime": 428}, "step": 150} {"logs": {"train/loss": 6.8763, "train/learning_rate": 8.999999999999999e-05, "train/epoch": 0.01, "_timestamp": 1746897830, "_runtime": 428}, "step": 150} {"train_info/time_between_train_steps": 0.024761676788330078, "step": 150} {"info/global_step": 151, "train_info/time_within_train_step": 2.6460070610046387, "step": 151} {"train_info/time_between_train_steps": 0.0033385753631591797, "step": 151} {"info/global_step": 152, "train_info/time_within_train_step": 2.641812801361084, "step": 152} {"train_info/time_between_train_steps": 0.0033750534057617188, "step": 152} {"info/global_step": 153, "train_info/time_within_train_step": 2.650261878967285, "step": 153} {"train_info/time_between_train_steps": 0.003384113311767578, "step": 153} {"info/global_step": 154, "train_info/time_within_train_step": 2.6673407554626465, "step": 154} {"train_info/time_between_train_steps": 0.003437042236328125, "step": 154} {"info/global_step": 155, "train_info/time_within_train_step": 2.6754724979400635, "step": 155} {"train_info/time_between_train_steps": 0.003418445587158203, "step": 155} {"info/global_step": 156, "train_info/time_within_train_step": 2.6482505798339844, "step": 156} {"train_info/time_between_train_steps": 0.003439664840698242, "step": 156} {"info/global_step": 157, "train_info/time_within_train_step": 2.682321786880493, "step": 157} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 157} {"info/global_step": 158, "train_info/time_within_train_step": 2.639063596725464, "step": 158} {"train_info/time_between_train_steps": 0.003286600112915039, "step": 158} {"info/global_step": 159, "train_info/time_within_train_step": 2.6396734714508057, "step": 159} {"train_info/time_between_train_steps": 0.003339052200317383, "step": 159} {"info/global_step": 160, "train_info/time_within_train_step": 2.8971755504608154, "step": 160} {"train_info/time_between_train_steps": 0.0033864974975585938, "step": 160} {"info/global_step": 161, "train_info/time_within_train_step": 2.639782190322876, "step": 161} {"train_info/time_between_train_steps": 0.00347137451171875, "step": 161} {"info/global_step": 162, "train_info/time_within_train_step": 2.6466338634490967, "step": 162} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 162} {"info/global_step": 163, "train_info/time_within_train_step": 2.6640877723693848, "step": 163} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 163} {"info/global_step": 164, "train_info/time_within_train_step": 2.646538019180298, "step": 164} {"train_info/time_between_train_steps": 0.003493785858154297, "step": 164} {"info/global_step": 165, "train_info/time_within_train_step": 2.644573926925659, "step": 165} {"train_info/time_between_train_steps": 0.0032968521118164062, "step": 165} {"info/global_step": 166, "train_info/time_within_train_step": 2.6624906063079834, "step": 166} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 166} {"info/global_step": 167, "train_info/time_within_train_step": 2.655451774597168, "step": 167} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 167} {"info/global_step": 168, "train_info/time_within_train_step": 2.662532091140747, "step": 168} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 168} {"info/global_step": 169, "train_info/time_within_train_step": 2.6878015995025635, "step": 169} {"train_info/time_between_train_steps": 0.003448486328125, "step": 169} {"info/global_step": 170, "train_info/time_within_train_step": 2.6591858863830566, "step": 170} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 170} {"info/global_step": 171, "train_info/time_within_train_step": 2.645409345626831, "step": 171} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 171} {"info/global_step": 172, "train_info/time_within_train_step": 2.6503384113311768, "step": 172} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 172} {"info/global_step": 173, "train_info/time_within_train_step": 2.642711639404297, "step": 173} {"train_info/time_between_train_steps": 0.0034530162811279297, "step": 173} {"info/global_step": 174, "train_info/time_within_train_step": 2.6413326263427734, "step": 174} {"train_info/time_between_train_steps": 0.003457307815551758, "step": 174} {"info/global_step": 175, "train_info/time_within_train_step": 2.653594732284546, "step": 175} {"train_info/time_between_train_steps": 0.0034470558166503906, "step": 175} {"info/global_step": 176, "train_info/time_within_train_step": 2.6497390270233154, "step": 176} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 176} {"info/global_step": 177, "train_info/time_within_train_step": 2.657959461212158, "step": 177} {"train_info/time_between_train_steps": 0.0033550262451171875, "step": 177} {"info/global_step": 178, "train_info/time_within_train_step": 2.6976065635681152, "step": 178} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 178} {"info/global_step": 179, "train_info/time_within_train_step": 2.69093656539917, "step": 179} {"train_info/time_between_train_steps": 0.0034818649291992188, "step": 179} {"info/global_step": 180, "train_info/time_within_train_step": 2.641803503036499, "step": 180} {"train_info/time_between_train_steps": 0.003354787826538086, "step": 180} {"info/global_step": 181, "train_info/time_within_train_step": 2.647122621536255, "step": 181} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 181} {"info/global_step": 182, "train_info/time_within_train_step": 2.6599698066711426, "step": 182} {"train_info/time_between_train_steps": 0.0032570362091064453, "step": 182} {"info/global_step": 183, "train_info/time_within_train_step": 2.6641921997070312, "step": 183} {"train_info/time_between_train_steps": 0.0034911632537841797, "step": 183} {"info/global_step": 184, "train_info/time_within_train_step": 2.7064316272735596, "step": 184} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 184} {"info/global_step": 185, "train_info/time_within_train_step": 2.643062114715576, "step": 185} {"train_info/time_between_train_steps": 0.0032944679260253906, "step": 185} {"info/global_step": 186, "train_info/time_within_train_step": 2.6538679599761963, "step": 186} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 186} {"info/global_step": 187, "train_info/time_within_train_step": 2.646528720855713, "step": 187} {"train_info/time_between_train_steps": 0.0034253597259521484, "step": 187} {"info/global_step": 188, "train_info/time_within_train_step": 2.759873390197754, "step": 188} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 188} {"info/global_step": 189, "train_info/time_within_train_step": 2.6548449993133545, "step": 189} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 189} {"info/global_step": 190, "train_info/time_within_train_step": 2.653165578842163, "step": 190} {"train_info/time_between_train_steps": 0.0033330917358398438, "step": 190} {"info/global_step": 191, "train_info/time_within_train_step": 2.6412606239318848, "step": 191} {"train_info/time_between_train_steps": 0.0033473968505859375, "step": 191} {"info/global_step": 192, "train_info/time_within_train_step": 2.641767740249634, "step": 192} {"train_info/time_between_train_steps": 0.003290414810180664, "step": 192} {"info/global_step": 193, "train_info/time_within_train_step": 2.660536050796509, "step": 193} {"train_info/time_between_train_steps": 0.003536224365234375, "step": 193} {"info/global_step": 194, "train_info/time_within_train_step": 2.6907029151916504, "step": 194} {"train_info/time_between_train_steps": 0.0033838748931884766, "step": 194} {"info/global_step": 195, "train_info/time_within_train_step": 2.6826372146606445, "step": 195} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 195} {"info/global_step": 196, "train_info/time_within_train_step": 2.6508305072784424, "step": 196} {"train_info/time_between_train_steps": 0.00333404541015625, "step": 196} {"info/global_step": 197, "train_info/time_within_train_step": 2.686938762664795, "step": 197} {"train_info/time_between_train_steps": 0.0033719539642333984, "step": 197} {"info/global_step": 198, "train_info/time_within_train_step": 2.6458702087402344, "step": 198} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 198} {"info/global_step": 199, "train_info/time_within_train_step": 2.64485764503479, "step": 199} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 199} {"info/global_step": 200, "train_info/time_within_train_step": 2.6477746963500977, "step": 200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746897964, "_runtime": 562}, "step": 200} {"logs": {"train/loss": 6.6054, "train/learning_rate": 0.00011999999999999999, "train/epoch": 0.02, "_timestamp": 1746897964, "_runtime": 562}, "step": 200} {"train_info/time_between_train_steps": 13.29012393951416, "step": 200} {"info/global_step": 201, "train_info/time_within_train_step": 2.6847658157348633, "step": 201} {"train_info/time_between_train_steps": 0.003493070602416992, "step": 201} {"info/global_step": 202, "train_info/time_within_train_step": 2.431180477142334, "step": 202} {"train_info/time_between_train_steps": 0.003509521484375, "step": 202} {"info/global_step": 203, "train_info/time_within_train_step": 2.5905022621154785, "step": 203} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 203} {"info/global_step": 204, "train_info/time_within_train_step": 2.6494133472442627, "step": 204} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 204} {"info/global_step": 205, "train_info/time_within_train_step": 2.6398255825042725, "step": 205} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 205} {"info/global_step": 206, "train_info/time_within_train_step": 2.6401190757751465, "step": 206} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 206} {"info/global_step": 207, "train_info/time_within_train_step": 2.65266752243042, "step": 207} {"train_info/time_between_train_steps": 0.00324249267578125, "step": 207} {"info/global_step": 208, "train_info/time_within_train_step": 2.6652731895446777, "step": 208} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 208} {"info/global_step": 209, "train_info/time_within_train_step": 2.681661367416382, "step": 209} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 209} {"info/global_step": 210, "train_info/time_within_train_step": 2.6477415561676025, "step": 210} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 210} {"info/global_step": 211, "train_info/time_within_train_step": 2.6749815940856934, "step": 211} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 211} {"info/global_step": 212, "train_info/time_within_train_step": 2.6427459716796875, "step": 212} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 212} {"info/global_step": 213, "train_info/time_within_train_step": 2.6404216289520264, "step": 213} {"train_info/time_between_train_steps": 0.0034308433532714844, "step": 213} {"info/global_step": 214, "train_info/time_within_train_step": 2.682677745819092, "step": 214} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 214} {"info/global_step": 215, "train_info/time_within_train_step": 2.644158363342285, "step": 215} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 215} {"info/global_step": 216, "train_info/time_within_train_step": 2.6435978412628174, "step": 216} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 216} {"info/global_step": 217, "train_info/time_within_train_step": 2.657773733139038, "step": 217} {"train_info/time_between_train_steps": 0.003368377685546875, "step": 217} {"info/global_step": 218, "train_info/time_within_train_step": 2.6603379249572754, "step": 218} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 218} {"info/global_step": 219, "train_info/time_within_train_step": 2.673186779022217, "step": 219} {"train_info/time_between_train_steps": 0.003348827362060547, "step": 219} {"info/global_step": 220, "train_info/time_within_train_step": 2.670628547668457, "step": 220} {"train_info/time_between_train_steps": 0.003427267074584961, "step": 220} {"info/global_step": 221, "train_info/time_within_train_step": 2.6840507984161377, "step": 221} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 221} {"info/global_step": 222, "train_info/time_within_train_step": 2.641887664794922, "step": 222} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 222} {"info/global_step": 223, "train_info/time_within_train_step": 2.642439603805542, "step": 223} {"train_info/time_between_train_steps": 0.0032978057861328125, "step": 223} {"info/global_step": 224, "train_info/time_within_train_step": 2.6591317653656006, "step": 224} {"train_info/time_between_train_steps": 0.003694295883178711, "step": 224} {"info/global_step": 225, "train_info/time_within_train_step": 2.6533589363098145, "step": 225} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 225} {"info/global_step": 226, "train_info/time_within_train_step": 2.6441752910614014, "step": 226} {"train_info/time_between_train_steps": 0.003561258316040039, "step": 226} {"info/global_step": 227, "train_info/time_within_train_step": 2.6597251892089844, "step": 227} {"train_info/time_between_train_steps": 0.003330707550048828, "step": 227} {"info/global_step": 228, "train_info/time_within_train_step": 2.651663303375244, "step": 228} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 228} {"info/global_step": 229, "train_info/time_within_train_step": 2.664445161819458, "step": 229} {"train_info/time_between_train_steps": 0.0034754276275634766, "step": 229} {"info/global_step": 230, "train_info/time_within_train_step": 2.7224762439727783, "step": 230} {"train_info/time_between_train_steps": 0.0032634735107421875, "step": 230} {"info/global_step": 231, "train_info/time_within_train_step": 2.663816452026367, "step": 231} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 231} {"info/global_step": 232, "train_info/time_within_train_step": 2.640148162841797, "step": 232} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 232} {"info/global_step": 233, "train_info/time_within_train_step": 2.6531496047973633, "step": 233} {"train_info/time_between_train_steps": 0.0033218860626220703, "step": 233} {"info/global_step": 234, "train_info/time_within_train_step": 2.671975612640381, "step": 234} {"train_info/time_between_train_steps": 0.0034942626953125, "step": 234} {"info/global_step": 235, "train_info/time_within_train_step": 2.65763521194458, "step": 235} {"train_info/time_between_train_steps": 0.003597259521484375, "step": 235} {"info/global_step": 236, "train_info/time_within_train_step": 2.644638776779175, "step": 236} {"train_info/time_between_train_steps": 0.0033609867095947266, "step": 236} {"info/global_step": 237, "train_info/time_within_train_step": 2.6492562294006348, "step": 237} {"train_info/time_between_train_steps": 0.0032951831817626953, "step": 237} {"info/global_step": 238, "train_info/time_within_train_step": 2.6539714336395264, "step": 238} {"train_info/time_between_train_steps": 0.0034008026123046875, "step": 238} {"info/global_step": 239, "train_info/time_within_train_step": 2.675788402557373, "step": 239} {"train_info/time_between_train_steps": 0.0035414695739746094, "step": 239} {"info/global_step": 240, "train_info/time_within_train_step": 2.6941707134246826, "step": 240} {"train_info/time_between_train_steps": 0.003496408462524414, "step": 240} {"info/global_step": 241, "train_info/time_within_train_step": 2.659843683242798, "step": 241} {"train_info/time_between_train_steps": 0.0035164356231689453, "step": 241} {"info/global_step": 242, "train_info/time_within_train_step": 2.961336374282837, "step": 242} {"train_info/time_between_train_steps": 0.0035631656646728516, "step": 242} {"info/global_step": 243, "train_info/time_within_train_step": 2.6607160568237305, "step": 243} {"train_info/time_between_train_steps": 0.003401517868041992, "step": 243} {"info/global_step": 244, "train_info/time_within_train_step": 2.6653366088867188, "step": 244} {"train_info/time_between_train_steps": 0.0034716129302978516, "step": 244} {"info/global_step": 245, "train_info/time_within_train_step": 2.654963493347168, "step": 245} {"train_info/time_between_train_steps": 0.003496408462524414, "step": 245} {"info/global_step": 246, "train_info/time_within_train_step": 2.6626129150390625, "step": 246} {"train_info/time_between_train_steps": 0.003474712371826172, "step": 246} {"info/global_step": 247, "train_info/time_within_train_step": 2.6411991119384766, "step": 247} {"train_info/time_between_train_steps": 0.0038993358612060547, "step": 247} {"info/global_step": 248, "train_info/time_within_train_step": 2.6477267742156982, "step": 248} {"train_info/time_between_train_steps": 0.003885507583618164, "step": 248} {"info/global_step": 249, "train_info/time_within_train_step": 2.661491632461548, "step": 249} {"train_info/time_between_train_steps": 0.004037380218505859, "step": 249} {"info/global_step": 250, "train_info/time_within_train_step": 3.3656067848205566, "step": 250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746898112, "_runtime": 710}, "step": 250} {"logs": {"train/loss": 6.3636, "train/learning_rate": 0.00015, "train/epoch": 0.03, "_timestamp": 1746898112, "_runtime": 710}, "step": 250} {"train_info/time_between_train_steps": 0.23537921905517578, "step": 250} {"info/global_step": 251, "train_info/time_within_train_step": 2.642838954925537, "step": 251} {"train_info/time_between_train_steps": 0.0035142898559570312, "step": 251} {"info/global_step": 252, "train_info/time_within_train_step": 2.6545865535736084, "step": 252} {"train_info/time_between_train_steps": 0.003511667251586914, "step": 252} {"info/global_step": 253, "train_info/time_within_train_step": 2.652324914932251, "step": 253} {"train_info/time_between_train_steps": 0.003928661346435547, "step": 253} {"info/global_step": 254, "train_info/time_within_train_step": 2.6437880992889404, "step": 254} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 254} {"info/global_step": 255, "train_info/time_within_train_step": 2.6477890014648438, "step": 255} {"train_info/time_between_train_steps": 0.0034351348876953125, "step": 255} {"info/global_step": 256, "train_info/time_within_train_step": 2.6580231189727783, "step": 256} {"train_info/time_between_train_steps": 0.003462076187133789, "step": 256} {"info/global_step": 257, "train_info/time_within_train_step": 2.6727044582366943, "step": 257} {"train_info/time_between_train_steps": 0.003326416015625, "step": 257} {"info/global_step": 258, "train_info/time_within_train_step": 2.6754584312438965, "step": 258} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 258} {"info/global_step": 259, "train_info/time_within_train_step": 2.655522346496582, "step": 259} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 259} {"info/global_step": 260, "train_info/time_within_train_step": 2.639159917831421, "step": 260} {"train_info/time_between_train_steps": 0.003453493118286133, "step": 260} {"info/global_step": 261, "train_info/time_within_train_step": 2.6526551246643066, "step": 261} {"train_info/time_between_train_steps": 0.0033845901489257812, "step": 261} {"info/global_step": 262, "train_info/time_within_train_step": 2.6562681198120117, "step": 262} {"train_info/time_between_train_steps": 0.003446817398071289, "step": 262} {"info/global_step": 263, "train_info/time_within_train_step": 2.6418087482452393, "step": 263} {"train_info/time_between_train_steps": 0.003426074981689453, "step": 263} {"info/global_step": 264, "train_info/time_within_train_step": 2.6431503295898438, "step": 264} {"train_info/time_between_train_steps": 0.0035610198974609375, "step": 264} {"info/global_step": 265, "train_info/time_within_train_step": 2.6543915271759033, "step": 265} {"train_info/time_between_train_steps": 0.003432750701904297, "step": 265} {"info/global_step": 266, "train_info/time_within_train_step": 2.6531970500946045, "step": 266} {"train_info/time_between_train_steps": 0.003446817398071289, "step": 266} {"info/global_step": 267, "train_info/time_within_train_step": 2.647303819656372, "step": 267} {"train_info/time_between_train_steps": 0.0033707618713378906, "step": 267} {"info/global_step": 268, "train_info/time_within_train_step": 2.6516072750091553, "step": 268} {"train_info/time_between_train_steps": 0.0035271644592285156, "step": 268} {"info/global_step": 269, "train_info/time_within_train_step": 2.65763521194458, "step": 269} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 269} {"info/global_step": 270, "train_info/time_within_train_step": 2.6722099781036377, "step": 270} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 270} {"info/global_step": 271, "train_info/time_within_train_step": 2.6684224605560303, "step": 271} {"train_info/time_between_train_steps": 0.003415346145629883, "step": 271} {"info/global_step": 272, "train_info/time_within_train_step": 2.686908483505249, "step": 272} {"train_info/time_between_train_steps": 0.0033712387084960938, "step": 272} {"info/global_step": 273, "train_info/time_within_train_step": 2.6401541233062744, "step": 273} {"train_info/time_between_train_steps": 0.0035376548767089844, "step": 273} {"info/global_step": 274, "train_info/time_within_train_step": 2.6390135288238525, "step": 274} {"train_info/time_between_train_steps": 0.0033981800079345703, "step": 274} {"info/global_step": 275, "train_info/time_within_train_step": 2.661837100982666, "step": 275} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 275} {"info/global_step": 276, "train_info/time_within_train_step": 2.6506083011627197, "step": 276} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 276} {"info/global_step": 277, "train_info/time_within_train_step": 2.642930030822754, "step": 277} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 277} {"info/global_step": 278, "train_info/time_within_train_step": 2.663853168487549, "step": 278} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 278} {"info/global_step": 279, "train_info/time_within_train_step": 2.651324987411499, "step": 279} {"train_info/time_between_train_steps": 0.0032787322998046875, "step": 279} {"info/global_step": 280, "train_info/time_within_train_step": 2.659487009048462, "step": 280} {"train_info/time_between_train_steps": 0.0034983158111572266, "step": 280} {"info/global_step": 281, "train_info/time_within_train_step": 2.712308645248413, "step": 281} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 281} {"info/global_step": 282, "train_info/time_within_train_step": 2.641803026199341, "step": 282} {"train_info/time_between_train_steps": 0.0033347606658935547, "step": 282} {"info/global_step": 283, "train_info/time_within_train_step": 2.640456438064575, "step": 283} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 283} {"info/global_step": 284, "train_info/time_within_train_step": 2.660980224609375, "step": 284} {"train_info/time_between_train_steps": 0.003394603729248047, "step": 284} {"info/global_step": 285, "train_info/time_within_train_step": 2.6467299461364746, "step": 285} {"train_info/time_between_train_steps": 0.0034384727478027344, "step": 285} {"info/global_step": 286, "train_info/time_within_train_step": 2.6443207263946533, "step": 286} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 286} {"info/global_step": 287, "train_info/time_within_train_step": 2.649625062942505, "step": 287} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 287} {"info/global_step": 288, "train_info/time_within_train_step": 2.6439414024353027, "step": 288} {"train_info/time_between_train_steps": 0.0034961700439453125, "step": 288} {"info/global_step": 289, "train_info/time_within_train_step": 2.6680006980895996, "step": 289} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 289} {"info/global_step": 290, "train_info/time_within_train_step": 2.6914613246917725, "step": 290} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 290} {"info/global_step": 291, "train_info/time_within_train_step": 2.66312837600708, "step": 291} {"train_info/time_between_train_steps": 0.003319263458251953, "step": 291} {"info/global_step": 292, "train_info/time_within_train_step": 2.662323236465454, "step": 292} {"train_info/time_between_train_steps": 0.003484010696411133, "step": 292} {"info/global_step": 293, "train_info/time_within_train_step": 2.640401601791382, "step": 293} {"train_info/time_between_train_steps": 0.003480195999145508, "step": 293} {"info/global_step": 294, "train_info/time_within_train_step": 2.654266834259033, "step": 294} {"train_info/time_between_train_steps": 0.0034637451171875, "step": 294} {"info/global_step": 295, "train_info/time_within_train_step": 2.652944564819336, "step": 295} {"train_info/time_between_train_steps": 0.003350973129272461, "step": 295} {"info/global_step": 296, "train_info/time_within_train_step": 2.6439590454101562, "step": 296} {"train_info/time_between_train_steps": 0.0034830570220947266, "step": 296} {"info/global_step": 297, "train_info/time_within_train_step": 2.6432478427886963, "step": 297} {"train_info/time_between_train_steps": 0.003518342971801758, "step": 297} {"info/global_step": 298, "train_info/time_within_train_step": 2.641974925994873, "step": 298} {"train_info/time_between_train_steps": 0.0035381317138671875, "step": 298} {"info/global_step": 299, "train_info/time_within_train_step": 2.642889976501465, "step": 299} {"train_info/time_between_train_steps": 0.0038831233978271484, "step": 299} {"info/global_step": 300, "train_info/time_within_train_step": 2.68730092048645, "step": 300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746898248, "_runtime": 846}, "step": 300} {"logs": {"train/loss": 6.1763, "train/learning_rate": 0.00017999999999999998, "train/epoch": 0.03, "_timestamp": 1746898248, "_runtime": 846}, "step": 300} {"train_info/time_between_train_steps": 0.4317798614501953, "step": 300} {"info/global_step": 301, "train_info/time_within_train_step": 2.641355514526367, "step": 301} {"train_info/time_between_train_steps": 0.0035903453826904297, "step": 301} {"info/global_step": 302, "train_info/time_within_train_step": 2.648319721221924, "step": 302} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 302} {"info/global_step": 303, "train_info/time_within_train_step": 2.6524903774261475, "step": 303} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 303} {"info/global_step": 304, "train_info/time_within_train_step": 2.6381092071533203, "step": 304} {"train_info/time_between_train_steps": 0.0032961368560791016, "step": 304} {"info/global_step": 305, "train_info/time_within_train_step": 2.6734299659729004, "step": 305} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 305} {"info/global_step": 306, "train_info/time_within_train_step": 2.665019989013672, "step": 306} {"train_info/time_between_train_steps": 0.0034079551696777344, "step": 306} {"info/global_step": 307, "train_info/time_within_train_step": 2.6627585887908936, "step": 307} {"train_info/time_between_train_steps": 0.003323078155517578, "step": 307} {"info/global_step": 308, "train_info/time_within_train_step": 2.6900157928466797, "step": 308} {"train_info/time_between_train_steps": 0.0032987594604492188, "step": 308} {"info/global_step": 309, "train_info/time_within_train_step": 2.645944833755493, "step": 309} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 309} {"info/global_step": 310, "train_info/time_within_train_step": 2.6389310359954834, "step": 310} {"train_info/time_between_train_steps": 0.003415822982788086, "step": 310} {"info/global_step": 311, "train_info/time_within_train_step": 2.654109239578247, "step": 311} {"train_info/time_between_train_steps": 0.0034034252166748047, "step": 311} {"info/global_step": 312, "train_info/time_within_train_step": 2.655189275741577, "step": 312} {"train_info/time_between_train_steps": 0.0033752918243408203, "step": 312} {"info/global_step": 313, "train_info/time_within_train_step": 2.7606863975524902, "step": 313} {"train_info/time_between_train_steps": 0.003464221954345703, "step": 313} {"info/global_step": 314, "train_info/time_within_train_step": 2.658051013946533, "step": 314} {"train_info/time_between_train_steps": 0.0034453868865966797, "step": 314} {"info/global_step": 315, "train_info/time_within_train_step": 2.6416566371917725, "step": 315} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 315} {"info/global_step": 316, "train_info/time_within_train_step": 2.6416094303131104, "step": 316} {"train_info/time_between_train_steps": 0.003366708755493164, "step": 316} {"info/global_step": 317, "train_info/time_within_train_step": 2.668596029281616, "step": 317} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 317} {"info/global_step": 318, "train_info/time_within_train_step": 2.6700997352600098, "step": 318} {"train_info/time_between_train_steps": 0.0033686161041259766, "step": 318} {"info/global_step": 319, "train_info/time_within_train_step": 2.670217990875244, "step": 319} {"train_info/time_between_train_steps": 0.0034990310668945312, "step": 319} {"info/global_step": 320, "train_info/time_within_train_step": 2.665632724761963, "step": 320} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 320} {"info/global_step": 321, "train_info/time_within_train_step": 2.6427159309387207, "step": 321} {"train_info/time_between_train_steps": 0.0033729076385498047, "step": 321} {"info/global_step": 322, "train_info/time_within_train_step": 2.652207851409912, "step": 322} {"train_info/time_between_train_steps": 0.003383159637451172, "step": 322} {"info/global_step": 323, "train_info/time_within_train_step": 2.6515798568725586, "step": 323} {"train_info/time_between_train_steps": 0.003500699996948242, "step": 323} {"info/global_step": 324, "train_info/time_within_train_step": 2.6409294605255127, "step": 324} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 324} {"info/global_step": 325, "train_info/time_within_train_step": 2.6420648097991943, "step": 325} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 325} {"info/global_step": 326, "train_info/time_within_train_step": 2.658655881881714, "step": 326} {"train_info/time_between_train_steps": 0.0034182071685791016, "step": 326} {"info/global_step": 327, "train_info/time_within_train_step": 2.6554763317108154, "step": 327} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 327} {"info/global_step": 328, "train_info/time_within_train_step": 2.6671459674835205, "step": 328} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 328} {"info/global_step": 329, "train_info/time_within_train_step": 2.6753249168395996, "step": 329} {"train_info/time_between_train_steps": 0.003542661666870117, "step": 329} {"info/global_step": 330, "train_info/time_within_train_step": 2.6859371662139893, "step": 330} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 330} {"info/global_step": 331, "train_info/time_within_train_step": 2.6405673027038574, "step": 331} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 331} {"info/global_step": 332, "train_info/time_within_train_step": 2.6394214630126953, "step": 332} {"train_info/time_between_train_steps": 0.003448486328125, "step": 332} {"info/global_step": 333, "train_info/time_within_train_step": 2.6561648845672607, "step": 333} {"train_info/time_between_train_steps": 0.0033826828002929688, "step": 333} {"info/global_step": 334, "train_info/time_within_train_step": 2.651607036590576, "step": 334} {"train_info/time_between_train_steps": 0.003379344940185547, "step": 334} {"info/global_step": 335, "train_info/time_within_train_step": 2.6429202556610107, "step": 335} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 335} {"info/global_step": 336, "train_info/time_within_train_step": 2.9781265258789062, "step": 336} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 336} {"info/global_step": 337, "train_info/time_within_train_step": 2.647036552429199, "step": 337} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 337} {"info/global_step": 338, "train_info/time_within_train_step": 2.6418044567108154, "step": 338} {"train_info/time_between_train_steps": 0.0035872459411621094, "step": 338} {"info/global_step": 339, "train_info/time_within_train_step": 2.654615640640259, "step": 339} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 339} {"info/global_step": 340, "train_info/time_within_train_step": 2.6523807048797607, "step": 340} {"train_info/time_between_train_steps": 0.003311634063720703, "step": 340} {"info/global_step": 341, "train_info/time_within_train_step": 2.6665267944335938, "step": 341} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 341} {"info/global_step": 342, "train_info/time_within_train_step": 2.723949670791626, "step": 342} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 342} {"info/global_step": 343, "train_info/time_within_train_step": 2.66725492477417, "step": 343} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 343} {"info/global_step": 344, "train_info/time_within_train_step": 2.649503707885742, "step": 344} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 344} {"info/global_step": 345, "train_info/time_within_train_step": 2.6503725051879883, "step": 345} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 345} {"info/global_step": 346, "train_info/time_within_train_step": 2.6641685962677, "step": 346} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 346} {"info/global_step": 347, "train_info/time_within_train_step": 2.7037718296051025, "step": 347} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 347} {"info/global_step": 348, "train_info/time_within_train_step": 2.639089584350586, "step": 348} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 348} {"info/global_step": 349, "train_info/time_within_train_step": 2.6463236808776855, "step": 349} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 349} {"info/global_step": 350, "train_info/time_within_train_step": 2.652575969696045, "step": 350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746898383, "_runtime": 981}, "step": 350} {"logs": {"train/loss": 6.0096, "train/learning_rate": 0.00020999999999999998, "train/epoch": 0.04, "_timestamp": 1746898383, "_runtime": 981}, "step": 350} {"train_info/time_between_train_steps": 0.0244905948638916, "step": 350} {"info/global_step": 351, "train_info/time_within_train_step": 2.6511082649230957, "step": 351} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 351} {"info/global_step": 352, "train_info/time_within_train_step": 2.6613047122955322, "step": 352} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 352} {"info/global_step": 353, "train_info/time_within_train_step": 2.650545358657837, "step": 353} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 353} {"info/global_step": 354, "train_info/time_within_train_step": 2.646143913269043, "step": 354} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 354} {"info/global_step": 355, "train_info/time_within_train_step": 2.6437249183654785, "step": 355} {"train_info/time_between_train_steps": 0.0034258365631103516, "step": 355} {"info/global_step": 356, "train_info/time_within_train_step": 2.6624679565429688, "step": 356} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 356} {"info/global_step": 357, "train_info/time_within_train_step": 2.6572110652923584, "step": 357} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 357} {"info/global_step": 358, "train_info/time_within_train_step": 2.6668801307678223, "step": 358} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 358} {"info/global_step": 359, "train_info/time_within_train_step": 2.677140474319458, "step": 359} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 359} {"info/global_step": 360, "train_info/time_within_train_step": 2.661465644836426, "step": 360} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 360} {"info/global_step": 361, "train_info/time_within_train_step": 2.644413948059082, "step": 361} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 361} {"info/global_step": 362, "train_info/time_within_train_step": 2.6430885791778564, "step": 362} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 362} {"info/global_step": 363, "train_info/time_within_train_step": 2.649362087249756, "step": 363} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 363} {"info/global_step": 364, "train_info/time_within_train_step": 2.651484251022339, "step": 364} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 364} {"info/global_step": 365, "train_info/time_within_train_step": 2.644721031188965, "step": 365} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 365} {"info/global_step": 366, "train_info/time_within_train_step": 2.6581907272338867, "step": 366} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 366} {"info/global_step": 367, "train_info/time_within_train_step": 2.649252414703369, "step": 367} {"train_info/time_between_train_steps": 0.003319263458251953, "step": 367} {"info/global_step": 368, "train_info/time_within_train_step": 2.665539503097534, "step": 368} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 368} {"info/global_step": 369, "train_info/time_within_train_step": 2.7250595092773438, "step": 369} {"train_info/time_between_train_steps": 0.003246784210205078, "step": 369} {"info/global_step": 370, "train_info/time_within_train_step": 2.654968023300171, "step": 370} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 370} {"info/global_step": 371, "train_info/time_within_train_step": 2.6386337280273438, "step": 371} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 371} {"info/global_step": 372, "train_info/time_within_train_step": 2.6519343852996826, "step": 372} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 372} {"info/global_step": 373, "train_info/time_within_train_step": 2.6479289531707764, "step": 373} {"train_info/time_between_train_steps": 0.003248929977416992, "step": 373} {"info/global_step": 374, "train_info/time_within_train_step": 2.6470329761505127, "step": 374} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 374} {"info/global_step": 375, "train_info/time_within_train_step": 2.6442065238952637, "step": 375} {"train_info/time_between_train_steps": 0.12288141250610352, "step": 375} {"info/global_step": 376, "train_info/time_within_train_step": 2.6478121280670166, "step": 376} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 376} {"info/global_step": 377, "train_info/time_within_train_step": 2.6467127799987793, "step": 377} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 377} {"info/global_step": 378, "train_info/time_within_train_step": 2.6424245834350586, "step": 378} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 378} {"info/global_step": 379, "train_info/time_within_train_step": 2.6669209003448486, "step": 379} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 379} {"info/global_step": 380, "train_info/time_within_train_step": 2.669600486755371, "step": 380} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 380} {"info/global_step": 381, "train_info/time_within_train_step": 2.694715738296509, "step": 381} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 381} {"info/global_step": 382, "train_info/time_within_train_step": 2.6453685760498047, "step": 382} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 382} {"info/global_step": 383, "train_info/time_within_train_step": 2.639620304107666, "step": 383} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 383} {"info/global_step": 384, "train_info/time_within_train_step": 2.655820846557617, "step": 384} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 384} {"info/global_step": 385, "train_info/time_within_train_step": 2.653447389602661, "step": 385} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 385} {"info/global_step": 386, "train_info/time_within_train_step": 2.6415417194366455, "step": 386} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 386} {"info/global_step": 387, "train_info/time_within_train_step": 2.6430118083953857, "step": 387} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 387} {"info/global_step": 388, "train_info/time_within_train_step": 2.6551408767700195, "step": 388} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 388} {"info/global_step": 389, "train_info/time_within_train_step": 2.667480707168579, "step": 389} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 389} {"info/global_step": 390, "train_info/time_within_train_step": 2.6817452907562256, "step": 390} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 390} {"info/global_step": 391, "train_info/time_within_train_step": 2.648383378982544, "step": 391} {"train_info/time_between_train_steps": 0.0033316612243652344, "step": 391} {"info/global_step": 392, "train_info/time_within_train_step": 2.7006070613861084, "step": 392} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 392} {"info/global_step": 393, "train_info/time_within_train_step": 2.889165163040161, "step": 393} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 393} {"info/global_step": 394, "train_info/time_within_train_step": 2.681649684906006, "step": 394} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 394} {"info/global_step": 395, "train_info/time_within_train_step": 2.6471009254455566, "step": 395} {"train_info/time_between_train_steps": 0.0032558441162109375, "step": 395} {"info/global_step": 396, "train_info/time_within_train_step": 2.667224168777466, "step": 396} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 396} {"info/global_step": 397, "train_info/time_within_train_step": 2.640286445617676, "step": 397} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 397} {"info/global_step": 398, "train_info/time_within_train_step": 2.640925645828247, "step": 398} {"train_info/time_between_train_steps": 0.003259420394897461, "step": 398} {"info/global_step": 399, "train_info/time_within_train_step": 2.6626639366149902, "step": 399} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 399} {"info/global_step": 400, "train_info/time_within_train_step": 2.6466355323791504, "step": 400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746898518, "_runtime": 1116}, "step": 400} {"logs": {"train/loss": 5.8883, "train/learning_rate": 0.00023999999999999998, "train/epoch": 0.04, "_timestamp": 1746898518, "_runtime": 1116}, "step": 400} {"train_info/time_between_train_steps": 23.277161598205566, "step": 400} {"info/global_step": 401, "train_info/time_within_train_step": 2.4428606033325195, "step": 401} {"train_info/time_between_train_steps": 0.00324249267578125, "step": 401} {"info/global_step": 402, "train_info/time_within_train_step": 2.4280056953430176, "step": 402} {"train_info/time_between_train_steps": 0.006666421890258789, "step": 402} {"info/global_step": 403, "train_info/time_within_train_step": 2.586916923522949, "step": 403} {"train_info/time_between_train_steps": 0.0066585540771484375, "step": 403} {"info/global_step": 404, "train_info/time_within_train_step": 2.6614632606506348, "step": 404} {"train_info/time_between_train_steps": 0.006680965423583984, "step": 404} {"info/global_step": 405, "train_info/time_within_train_step": 2.6756858825683594, "step": 405} {"train_info/time_between_train_steps": 0.006651401519775391, "step": 405} {"info/global_step": 406, "train_info/time_within_train_step": 2.653247356414795, "step": 406} {"train_info/time_between_train_steps": 0.006736278533935547, "step": 406} {"info/global_step": 407, "train_info/time_within_train_step": 2.680964469909668, "step": 407} {"train_info/time_between_train_steps": 0.006635904312133789, "step": 407} {"info/global_step": 408, "train_info/time_within_train_step": 2.641063928604126, "step": 408} {"train_info/time_between_train_steps": 0.006669282913208008, "step": 408} {"info/global_step": 409, "train_info/time_within_train_step": 2.6531496047973633, "step": 409} {"train_info/time_between_train_steps": 0.006608009338378906, "step": 409} {"info/global_step": 410, "train_info/time_within_train_step": 2.6507585048675537, "step": 410} {"train_info/time_between_train_steps": 0.0066339969635009766, "step": 410} {"info/global_step": 411, "train_info/time_within_train_step": 2.6445627212524414, "step": 411} {"train_info/time_between_train_steps": 0.0066831111907958984, "step": 411} {"info/global_step": 412, "train_info/time_within_train_step": 2.648495674133301, "step": 412} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 412} {"info/global_step": 413, "train_info/time_within_train_step": 2.647688627243042, "step": 413} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 413} {"info/global_step": 414, "train_info/time_within_train_step": 2.6644418239593506, "step": 414} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 414} {"info/global_step": 415, "train_info/time_within_train_step": 2.6610963344573975, "step": 415} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 415} {"info/global_step": 416, "train_info/time_within_train_step": 2.655494451522827, "step": 416} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 416} {"info/global_step": 417, "train_info/time_within_train_step": 2.707129955291748, "step": 417} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 417} {"info/global_step": 418, "train_info/time_within_train_step": 2.6485164165496826, "step": 418} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 418} {"info/global_step": 419, "train_info/time_within_train_step": 2.648350954055786, "step": 419} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 419} {"info/global_step": 420, "train_info/time_within_train_step": 2.655254602432251, "step": 420} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 420} {"info/global_step": 421, "train_info/time_within_train_step": 2.6500155925750732, "step": 421} {"train_info/time_between_train_steps": 0.0032913684844970703, "step": 421} {"info/global_step": 422, "train_info/time_within_train_step": 2.6503348350524902, "step": 422} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 422} {"info/global_step": 423, "train_info/time_within_train_step": 2.645833969116211, "step": 423} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 423} {"info/global_step": 424, "train_info/time_within_train_step": 2.6553359031677246, "step": 424} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 424} {"info/global_step": 425, "train_info/time_within_train_step": 2.6576836109161377, "step": 425} {"train_info/time_between_train_steps": 0.003353595733642578, "step": 425} {"info/global_step": 426, "train_info/time_within_train_step": 2.672011613845825, "step": 426} {"train_info/time_between_train_steps": 0.0032982826232910156, "step": 426} {"info/global_step": 427, "train_info/time_within_train_step": 2.7273294925689697, "step": 427} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 427} {"info/global_step": 428, "train_info/time_within_train_step": 2.6572165489196777, "step": 428} {"train_info/time_between_train_steps": 0.0033118724822998047, "step": 428} {"info/global_step": 429, "train_info/time_within_train_step": 2.6409103870391846, "step": 429} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 429} {"info/global_step": 430, "train_info/time_within_train_step": 2.6528055667877197, "step": 430} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 430} {"info/global_step": 431, "train_info/time_within_train_step": 2.648449659347534, "step": 431} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 431} {"info/global_step": 432, "train_info/time_within_train_step": 2.652918815612793, "step": 432} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 432} {"info/global_step": 433, "train_info/time_within_train_step": 2.6460888385772705, "step": 433} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 433} {"info/global_step": 434, "train_info/time_within_train_step": 2.646932363510132, "step": 434} {"train_info/time_between_train_steps": 0.003316640853881836, "step": 434} {"info/global_step": 435, "train_info/time_within_train_step": 2.656297445297241, "step": 435} {"train_info/time_between_train_steps": 0.003309965133666992, "step": 435} {"info/global_step": 436, "train_info/time_within_train_step": 2.6482467651367188, "step": 436} {"train_info/time_between_train_steps": 0.003454446792602539, "step": 436} {"info/global_step": 437, "train_info/time_within_train_step": 2.648402214050293, "step": 437} {"train_info/time_between_train_steps": 0.003399372100830078, "step": 437} {"info/global_step": 438, "train_info/time_within_train_step": 2.8073534965515137, "step": 438} {"train_info/time_between_train_steps": 0.0033445358276367188, "step": 438} {"info/global_step": 439, "train_info/time_within_train_step": 2.646778106689453, "step": 439} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 439} {"info/global_step": 440, "train_info/time_within_train_step": 2.6586220264434814, "step": 440} {"train_info/time_between_train_steps": 0.0035834312438964844, "step": 440} {"info/global_step": 441, "train_info/time_within_train_step": 2.6441903114318848, "step": 441} {"train_info/time_between_train_steps": 0.0035257339477539062, "step": 441} {"info/global_step": 442, "train_info/time_within_train_step": 2.6450657844543457, "step": 442} {"train_info/time_between_train_steps": 0.003519296646118164, "step": 442} {"info/global_step": 443, "train_info/time_within_train_step": 2.6688804626464844, "step": 443} {"train_info/time_between_train_steps": 0.003515958786010742, "step": 443} {"info/global_step": 444, "train_info/time_within_train_step": 2.6665022373199463, "step": 444} {"train_info/time_between_train_steps": 0.0036649703979492188, "step": 444} {"info/global_step": 445, "train_info/time_within_train_step": 2.686189889907837, "step": 445} {"train_info/time_between_train_steps": 0.0036051273345947266, "step": 445} {"info/global_step": 446, "train_info/time_within_train_step": 2.6570959091186523, "step": 446} {"train_info/time_between_train_steps": 0.003551959991455078, "step": 446} {"info/global_step": 447, "train_info/time_within_train_step": 2.6598846912384033, "step": 447} {"train_info/time_between_train_steps": 0.0035173892974853516, "step": 447} {"info/global_step": 448, "train_info/time_within_train_step": 2.6478655338287354, "step": 448} {"train_info/time_between_train_steps": 0.0035414695739746094, "step": 448} {"info/global_step": 449, "train_info/time_within_train_step": 2.6558170318603516, "step": 449} {"train_info/time_between_train_steps": 0.003854036331176758, "step": 449} {"info/global_step": 450, "train_info/time_within_train_step": 2.642653703689575, "step": 450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746898675, "_runtime": 1273}, "step": 450} {"logs": {"train/loss": 5.7833, "train/learning_rate": 0.00027, "train/epoch": 0.04, "_timestamp": 1746898675, "_runtime": 1273}, "step": 450} {"train_info/time_between_train_steps": 0.02535700798034668, "step": 450} {"info/global_step": 451, "train_info/time_within_train_step": 2.6477558612823486, "step": 451} {"train_info/time_between_train_steps": 0.003509521484375, "step": 451} {"info/global_step": 452, "train_info/time_within_train_step": 2.6437690258026123, "step": 452} {"train_info/time_between_train_steps": 0.0035932064056396484, "step": 452} {"info/global_step": 453, "train_info/time_within_train_step": 2.6718637943267822, "step": 453} {"train_info/time_between_train_steps": 0.0034720897674560547, "step": 453} {"info/global_step": 454, "train_info/time_within_train_step": 2.655902862548828, "step": 454} {"train_info/time_between_train_steps": 0.0035715103149414062, "step": 454} {"info/global_step": 455, "train_info/time_within_train_step": 2.6656558513641357, "step": 455} {"train_info/time_between_train_steps": 0.003467082977294922, "step": 455} {"info/global_step": 456, "train_info/time_within_train_step": 2.685746669769287, "step": 456} {"train_info/time_between_train_steps": 0.0034797191619873047, "step": 456} {"info/global_step": 457, "train_info/time_within_train_step": 2.669886827468872, "step": 457} {"train_info/time_between_train_steps": 0.0034668445587158203, "step": 457} {"info/global_step": 458, "train_info/time_within_train_step": 2.6410603523254395, "step": 458} {"train_info/time_between_train_steps": 0.0034902095794677734, "step": 458} {"info/global_step": 459, "train_info/time_within_train_step": 2.642305612564087, "step": 459} {"train_info/time_between_train_steps": 0.0034253597259521484, "step": 459} {"info/global_step": 460, "train_info/time_within_train_step": 2.649883985519409, "step": 460} {"train_info/time_between_train_steps": 0.003457307815551758, "step": 460} {"info/global_step": 461, "train_info/time_within_train_step": 2.643348217010498, "step": 461} {"train_info/time_between_train_steps": 0.0035774707794189453, "step": 461} {"info/global_step": 462, "train_info/time_within_train_step": 2.6552958488464355, "step": 462} {"train_info/time_between_train_steps": 0.003438234329223633, "step": 462} {"info/global_step": 463, "train_info/time_within_train_step": 2.655367374420166, "step": 463} {"train_info/time_between_train_steps": 0.003561258316040039, "step": 463} {"info/global_step": 464, "train_info/time_within_train_step": 2.668375015258789, "step": 464} {"train_info/time_between_train_steps": 0.003701925277709961, "step": 464} {"info/global_step": 465, "train_info/time_within_train_step": 2.7259645462036133, "step": 465} {"train_info/time_between_train_steps": 0.003465890884399414, "step": 465} {"info/global_step": 466, "train_info/time_within_train_step": 2.6942501068115234, "step": 466} {"train_info/time_between_train_steps": 0.00345611572265625, "step": 466} {"info/global_step": 467, "train_info/time_within_train_step": 2.6413519382476807, "step": 467} {"train_info/time_between_train_steps": 0.0034873485565185547, "step": 467} {"info/global_step": 468, "train_info/time_within_train_step": 2.6412408351898193, "step": 468} {"train_info/time_between_train_steps": 0.0035600662231445312, "step": 468} {"info/global_step": 469, "train_info/time_within_train_step": 2.6565346717834473, "step": 469} {"train_info/time_between_train_steps": 0.003478527069091797, "step": 469} {"info/global_step": 470, "train_info/time_within_train_step": 2.652705192565918, "step": 470} {"train_info/time_between_train_steps": 0.003568410873413086, "step": 470} {"info/global_step": 471, "train_info/time_within_train_step": 2.644984006881714, "step": 471} {"train_info/time_between_train_steps": 0.0035789012908935547, "step": 471} {"info/global_step": 472, "train_info/time_within_train_step": 2.651419162750244, "step": 472} {"train_info/time_between_train_steps": 0.0036673545837402344, "step": 472} {"info/global_step": 473, "train_info/time_within_train_step": 2.6459298133850098, "step": 473} {"train_info/time_between_train_steps": 0.003609180450439453, "step": 473} {"info/global_step": 474, "train_info/time_within_train_step": 2.668912172317505, "step": 474} {"train_info/time_between_train_steps": 0.0037479400634765625, "step": 474} {"info/global_step": 475, "train_info/time_within_train_step": 2.681692361831665, "step": 475} {"train_info/time_between_train_steps": 0.0035719871520996094, "step": 475} {"info/global_step": 476, "train_info/time_within_train_step": 2.686739683151245, "step": 476} {"train_info/time_between_train_steps": 0.003640890121459961, "step": 476} {"info/global_step": 477, "train_info/time_within_train_step": 3.0492141246795654, "step": 477} {"train_info/time_between_train_steps": 0.003343343734741211, "step": 477} {"info/global_step": 478, "train_info/time_within_train_step": 2.6435704231262207, "step": 478} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 478} {"info/global_step": 479, "train_info/time_within_train_step": 2.644770860671997, "step": 479} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 479} {"info/global_step": 480, "train_info/time_within_train_step": 2.664139747619629, "step": 480} {"train_info/time_between_train_steps": 0.003549814224243164, "step": 480} {"info/global_step": 481, "train_info/time_within_train_step": 2.6657378673553467, "step": 481} {"train_info/time_between_train_steps": 0.0033216476440429688, "step": 481} {"info/global_step": 482, "train_info/time_within_train_step": 2.709972381591797, "step": 482} {"train_info/time_between_train_steps": 0.0033216476440429688, "step": 482} {"info/global_step": 483, "train_info/time_within_train_step": 2.6431074142456055, "step": 483} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 483} {"info/global_step": 484, "train_info/time_within_train_step": 2.6570675373077393, "step": 484} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 484} {"info/global_step": 485, "train_info/time_within_train_step": 2.645399808883667, "step": 485} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 485} {"info/global_step": 486, "train_info/time_within_train_step": 2.6468706130981445, "step": 486} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 486} {"info/global_step": 487, "train_info/time_within_train_step": 2.6576550006866455, "step": 487} {"train_info/time_between_train_steps": 0.0034406185150146484, "step": 487} {"info/global_step": 488, "train_info/time_within_train_step": 2.641484498977661, "step": 488} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 488} {"info/global_step": 489, "train_info/time_within_train_step": 2.642073631286621, "step": 489} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 489} {"info/global_step": 490, "train_info/time_within_train_step": 2.6704256534576416, "step": 490} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 490} {"info/global_step": 491, "train_info/time_within_train_step": 2.664651393890381, "step": 491} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 491} {"info/global_step": 492, "train_info/time_within_train_step": 2.6814615726470947, "step": 492} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 492} {"info/global_step": 493, "train_info/time_within_train_step": 2.657773733139038, "step": 493} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 493} {"info/global_step": 494, "train_info/time_within_train_step": 2.6521804332733154, "step": 494} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 494} {"info/global_step": 495, "train_info/time_within_train_step": 2.6545732021331787, "step": 495} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 495} {"info/global_step": 496, "train_info/time_within_train_step": 2.646543502807617, "step": 496} {"train_info/time_between_train_steps": 0.0032896995544433594, "step": 496} {"info/global_step": 497, "train_info/time_within_train_step": 2.6482350826263428, "step": 497} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 497} {"info/global_step": 498, "train_info/time_within_train_step": 2.6479954719543457, "step": 498} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 498} {"info/global_step": 499, "train_info/time_within_train_step": 2.6454808712005615, "step": 499} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 499} {"info/global_step": 500, "train_info/time_within_train_step": 3.13529109954834, "step": 500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746898810, "_runtime": 1408}, "step": 500} {"logs": {"train/loss": 5.7015, "train/learning_rate": 0.0003, "train/epoch": 0.05, "_timestamp": 1746898810, "_runtime": 1408}, "step": 500} {"train_info/time_between_train_steps": 0.34790658950805664, "step": 500} {"info/global_step": 501, "train_info/time_within_train_step": 2.641674518585205, "step": 501} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 501} {"info/global_step": 502, "train_info/time_within_train_step": 2.6417500972747803, "step": 502} {"train_info/time_between_train_steps": 0.003446817398071289, "step": 502} {"info/global_step": 503, "train_info/time_within_train_step": 2.6428892612457275, "step": 503} {"train_info/time_between_train_steps": 0.0033724308013916016, "step": 503} {"info/global_step": 504, "train_info/time_within_train_step": 2.6431725025177, "step": 504} {"train_info/time_between_train_steps": 0.0033981800079345703, "step": 504} {"info/global_step": 505, "train_info/time_within_train_step": 2.6726183891296387, "step": 505} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 505} {"info/global_step": 506, "train_info/time_within_train_step": 2.6642959117889404, "step": 506} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 506} {"info/global_step": 507, "train_info/time_within_train_step": 2.642504930496216, "step": 507} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 507} {"info/global_step": 508, "train_info/time_within_train_step": 2.6607632637023926, "step": 508} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 508} {"info/global_step": 509, "train_info/time_within_train_step": 2.6483561992645264, "step": 509} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 509} {"info/global_step": 510, "train_info/time_within_train_step": 2.6513500213623047, "step": 510} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 510} {"info/global_step": 511, "train_info/time_within_train_step": 2.641477108001709, "step": 511} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 511} {"info/global_step": 512, "train_info/time_within_train_step": 2.6416172981262207, "step": 512} {"train_info/time_between_train_steps": 0.0033011436462402344, "step": 512} {"info/global_step": 513, "train_info/time_within_train_step": 2.66597843170166, "step": 513} {"train_info/time_between_train_steps": 0.0035250186920166016, "step": 513} {"info/global_step": 514, "train_info/time_within_train_step": 2.665766716003418, "step": 514} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 514} {"info/global_step": 515, "train_info/time_within_train_step": 2.7115371227264404, "step": 515} {"train_info/time_between_train_steps": 0.0033850669860839844, "step": 515} {"info/global_step": 516, "train_info/time_within_train_step": 2.6490986347198486, "step": 516} {"train_info/time_between_train_steps": 0.003452777862548828, "step": 516} {"info/global_step": 517, "train_info/time_within_train_step": 2.656416893005371, "step": 517} {"train_info/time_between_train_steps": 0.003414630889892578, "step": 517} {"info/global_step": 518, "train_info/time_within_train_step": 2.642019510269165, "step": 518} {"train_info/time_between_train_steps": 0.0037593841552734375, "step": 518} {"info/global_step": 519, "train_info/time_within_train_step": 2.6452558040618896, "step": 519} {"train_info/time_between_train_steps": 0.003779172897338867, "step": 519} {"info/global_step": 520, "train_info/time_within_train_step": 2.671919107437134, "step": 520} {"train_info/time_between_train_steps": 0.0035543441772460938, "step": 520} {"info/global_step": 521, "train_info/time_within_train_step": 2.6634628772735596, "step": 521} {"train_info/time_between_train_steps": 0.0036530494689941406, "step": 521} {"info/global_step": 522, "train_info/time_within_train_step": 2.6882739067077637, "step": 522} {"train_info/time_between_train_steps": 0.0035719871520996094, "step": 522} {"info/global_step": 523, "train_info/time_within_train_step": 2.6544086933135986, "step": 523} {"train_info/time_between_train_steps": 0.0035817623138427734, "step": 523} {"info/global_step": 524, "train_info/time_within_train_step": 2.66209077835083, "step": 524} {"train_info/time_between_train_steps": 0.003609180450439453, "step": 524} {"info/global_step": 525, "train_info/time_within_train_step": 2.645219564437866, "step": 525} {"train_info/time_between_train_steps": 0.0035419464111328125, "step": 525} {"info/global_step": 526, "train_info/time_within_train_step": 2.6407957077026367, "step": 526} {"train_info/time_between_train_steps": 0.0035800933837890625, "step": 526} {"info/global_step": 527, "train_info/time_within_train_step": 2.66284441947937, "step": 527} {"train_info/time_between_train_steps": 0.0035119056701660156, "step": 527} {"info/global_step": 528, "train_info/time_within_train_step": 2.648308753967285, "step": 528} {"train_info/time_between_train_steps": 0.003568410873413086, "step": 528} {"info/global_step": 529, "train_info/time_within_train_step": 2.643596887588501, "step": 529} {"train_info/time_between_train_steps": 0.003525257110595703, "step": 529} {"info/global_step": 530, "train_info/time_within_train_step": 2.6641476154327393, "step": 530} {"train_info/time_between_train_steps": 0.0034933090209960938, "step": 530} {"info/global_step": 531, "train_info/time_within_train_step": 2.6608359813690186, "step": 531} {"train_info/time_between_train_steps": 0.0036067962646484375, "step": 531} {"info/global_step": 532, "train_info/time_within_train_step": 2.6749980449676514, "step": 532} {"train_info/time_between_train_steps": 0.00356292724609375, "step": 532} {"info/global_step": 533, "train_info/time_within_train_step": 2.6714510917663574, "step": 533} {"train_info/time_between_train_steps": 0.0035567283630371094, "step": 533} {"info/global_step": 534, "train_info/time_within_train_step": 3.0694122314453125, "step": 534} {"train_info/time_between_train_steps": 0.003328084945678711, "step": 534} {"info/global_step": 535, "train_info/time_within_train_step": 2.6428253650665283, "step": 535} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 535} {"info/global_step": 536, "train_info/time_within_train_step": 2.656153917312622, "step": 536} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 536} {"info/global_step": 537, "train_info/time_within_train_step": 2.658386707305908, "step": 537} {"train_info/time_between_train_steps": 0.003248929977416992, "step": 537} {"info/global_step": 538, "train_info/time_within_train_step": 2.671485662460327, "step": 538} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 538} {"info/global_step": 539, "train_info/time_within_train_step": 2.670042037963867, "step": 539} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 539} {"info/global_step": 540, "train_info/time_within_train_step": 2.6640920639038086, "step": 540} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 540} {"info/global_step": 541, "train_info/time_within_train_step": 2.6434481143951416, "step": 541} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 541} {"info/global_step": 542, "train_info/time_within_train_step": 2.640275716781616, "step": 542} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 542} {"info/global_step": 543, "train_info/time_within_train_step": 2.6558613777160645, "step": 543} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 543} {"info/global_step": 544, "train_info/time_within_train_step": 2.6529719829559326, "step": 544} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 544} {"info/global_step": 545, "train_info/time_within_train_step": 2.6419312953948975, "step": 545} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 545} {"info/global_step": 546, "train_info/time_within_train_step": 2.6584770679473877, "step": 546} {"train_info/time_between_train_steps": 0.0034151077270507812, "step": 546} {"info/global_step": 547, "train_info/time_within_train_step": 2.650008201599121, "step": 547} {"train_info/time_between_train_steps": 0.003383636474609375, "step": 547} {"info/global_step": 548, "train_info/time_within_train_step": 2.65946364402771, "step": 548} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 548} {"info/global_step": 549, "train_info/time_within_train_step": 2.7101526260375977, "step": 549} {"train_info/time_between_train_steps": 0.0036339759826660156, "step": 549} {"info/global_step": 550, "train_info/time_within_train_step": 2.694715976715088, "step": 550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746898945, "_runtime": 1543}, "step": 550} {"logs": {"train/loss": 5.6075, "train/learning_rate": 0.00033, "train/epoch": 0.06, "_timestamp": 1746898945, "_runtime": 1543}, "step": 550} {"train_info/time_between_train_steps": 0.024761438369750977, "step": 550} {"info/global_step": 551, "train_info/time_within_train_step": 2.68143892288208, "step": 551} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 551} {"info/global_step": 552, "train_info/time_within_train_step": 2.6390609741210938, "step": 552} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 552} {"info/global_step": 553, "train_info/time_within_train_step": 2.639582395553589, "step": 553} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 553} {"info/global_step": 554, "train_info/time_within_train_step": 2.655822515487671, "step": 554} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 554} {"info/global_step": 555, "train_info/time_within_train_step": 2.650876522064209, "step": 555} {"train_info/time_between_train_steps": 0.0030808448791503906, "step": 555} {"info/global_step": 556, "train_info/time_within_train_step": 2.645559310913086, "step": 556} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 556} {"info/global_step": 557, "train_info/time_within_train_step": 2.6419289112091064, "step": 557} {"train_info/time_between_train_steps": 0.002944469451904297, "step": 557} {"info/global_step": 558, "train_info/time_within_train_step": 2.6651082038879395, "step": 558} {"train_info/time_between_train_steps": 0.002996683120727539, "step": 558} {"info/global_step": 559, "train_info/time_within_train_step": 2.668093681335449, "step": 559} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 559} {"info/global_step": 560, "train_info/time_within_train_step": 2.7181859016418457, "step": 560} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 560} {"info/global_step": 561, "train_info/time_within_train_step": 2.647193670272827, "step": 561} {"train_info/time_between_train_steps": 0.0029213428497314453, "step": 561} {"info/global_step": 562, "train_info/time_within_train_step": 2.662161111831665, "step": 562} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 562} {"info/global_step": 563, "train_info/time_within_train_step": 2.6382503509521484, "step": 563} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 563} {"info/global_step": 564, "train_info/time_within_train_step": 2.6466445922851562, "step": 564} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 564} {"info/global_step": 565, "train_info/time_within_train_step": 2.6594932079315186, "step": 565} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 565} {"info/global_step": 566, "train_info/time_within_train_step": 2.6427814960479736, "step": 566} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 566} {"info/global_step": 567, "train_info/time_within_train_step": 2.642662286758423, "step": 567} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 567} {"info/global_step": 568, "train_info/time_within_train_step": 2.6669607162475586, "step": 568} {"train_info/time_between_train_steps": 0.0029892921447753906, "step": 568} {"info/global_step": 569, "train_info/time_within_train_step": 2.6634933948516846, "step": 569} {"train_info/time_between_train_steps": 0.003014087677001953, "step": 569} {"info/global_step": 570, "train_info/time_within_train_step": 2.6853485107421875, "step": 570} {"train_info/time_between_train_steps": 0.0030624866485595703, "step": 570} {"info/global_step": 571, "train_info/time_within_train_step": 2.6538243293762207, "step": 571} {"train_info/time_between_train_steps": 0.003002643585205078, "step": 571} {"info/global_step": 572, "train_info/time_within_train_step": 2.6675961017608643, "step": 572} {"train_info/time_between_train_steps": 0.0030012130737304688, "step": 572} {"info/global_step": 573, "train_info/time_within_train_step": 2.64160418510437, "step": 573} {"train_info/time_between_train_steps": 0.0030107498168945312, "step": 573} {"info/global_step": 574, "train_info/time_within_train_step": 2.639951467514038, "step": 574} {"train_info/time_between_train_steps": 0.002984762191772461, "step": 574} {"info/global_step": 575, "train_info/time_within_train_step": 2.6634981632232666, "step": 575} {"train_info/time_between_train_steps": 0.003060579299926758, "step": 575} {"info/global_step": 576, "train_info/time_within_train_step": 2.646723985671997, "step": 576} {"train_info/time_between_train_steps": 0.003105640411376953, "step": 576} {"info/global_step": 577, "train_info/time_within_train_step": 2.9736461639404297, "step": 577} {"train_info/time_between_train_steps": 0.0030066967010498047, "step": 577} {"info/global_step": 578, "train_info/time_within_train_step": 2.6478235721588135, "step": 578} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 578} {"info/global_step": 579, "train_info/time_within_train_step": 2.6449177265167236, "step": 579} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 579} {"info/global_step": 580, "train_info/time_within_train_step": 2.650841474533081, "step": 580} {"train_info/time_between_train_steps": 0.003021717071533203, "step": 580} {"info/global_step": 581, "train_info/time_within_train_step": 2.647263288497925, "step": 581} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 581} {"info/global_step": 582, "train_info/time_within_train_step": 2.6430599689483643, "step": 582} {"train_info/time_between_train_steps": 0.002948760986328125, "step": 582} {"info/global_step": 583, "train_info/time_within_train_step": 2.6636877059936523, "step": 583} {"train_info/time_between_train_steps": 0.002979278564453125, "step": 583} {"info/global_step": 584, "train_info/time_within_train_step": 2.6562044620513916, "step": 584} {"train_info/time_between_train_steps": 0.003089427947998047, "step": 584} {"info/global_step": 585, "train_info/time_within_train_step": 2.6530961990356445, "step": 585} {"train_info/time_between_train_steps": 0.0029833316802978516, "step": 585} {"info/global_step": 586, "train_info/time_within_train_step": 2.700371742248535, "step": 586} {"train_info/time_between_train_steps": 0.0030040740966796875, "step": 586} {"info/global_step": 587, "train_info/time_within_train_step": 2.639791965484619, "step": 587} {"train_info/time_between_train_steps": 0.0030317306518554688, "step": 587} {"info/global_step": 588, "train_info/time_within_train_step": 2.6388511657714844, "step": 588} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 588} {"info/global_step": 589, "train_info/time_within_train_step": 2.6599061489105225, "step": 589} {"train_info/time_between_train_steps": 0.003020763397216797, "step": 589} {"info/global_step": 590, "train_info/time_within_train_step": 2.646872043609619, "step": 590} {"train_info/time_between_train_steps": 0.003092050552368164, "step": 590} {"info/global_step": 591, "train_info/time_within_train_step": 2.642847776412964, "step": 591} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 591} {"info/global_step": 592, "train_info/time_within_train_step": 2.6543643474578857, "step": 592} {"train_info/time_between_train_steps": 0.0029768943786621094, "step": 592} {"info/global_step": 593, "train_info/time_within_train_step": 2.650789737701416, "step": 593} {"train_info/time_between_train_steps": 0.003056049346923828, "step": 593} {"info/global_step": 594, "train_info/time_within_train_step": 2.6590397357940674, "step": 594} {"train_info/time_between_train_steps": 0.0030107498168945312, "step": 594} {"info/global_step": 595, "train_info/time_within_train_step": 2.6795847415924072, "step": 595} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 595} {"info/global_step": 596, "train_info/time_within_train_step": 2.7280006408691406, "step": 596} {"train_info/time_between_train_steps": 0.002997875213623047, "step": 596} {"info/global_step": 597, "train_info/time_within_train_step": 2.6527633666992188, "step": 597} {"train_info/time_between_train_steps": 0.003006458282470703, "step": 597} {"info/global_step": 598, "train_info/time_within_train_step": 2.6403603553771973, "step": 598} {"train_info/time_between_train_steps": 0.0030176639556884766, "step": 598} {"info/global_step": 599, "train_info/time_within_train_step": 2.654088258743286, "step": 599} {"train_info/time_between_train_steps": 0.0029783248901367188, "step": 599} {"info/global_step": 600, "train_info/time_within_train_step": 2.6473171710968018, "step": 600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746899080, "_runtime": 1678}, "step": 600} {"logs": {"train/loss": 5.5341, "train/learning_rate": 0.00035999999999999997, "train/epoch": 0.06, "_timestamp": 1746899080, "_runtime": 1678}, "step": 600} {"train_info/time_between_train_steps": 13.449480295181274, "step": 600} {"info/global_step": 601, "train_info/time_within_train_step": 2.446119785308838, "step": 601} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 601} {"info/global_step": 602, "train_info/time_within_train_step": 2.4367668628692627, "step": 602} {"train_info/time_between_train_steps": 0.003034830093383789, "step": 602} {"info/global_step": 603, "train_info/time_within_train_step": 2.599266767501831, "step": 603} {"train_info/time_between_train_steps": 0.003004789352416992, "step": 603} {"info/global_step": 604, "train_info/time_within_train_step": 2.6491916179656982, "step": 604} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 604} {"info/global_step": 605, "train_info/time_within_train_step": 2.6406326293945312, "step": 605} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 605} {"info/global_step": 606, "train_info/time_within_train_step": 2.6560845375061035, "step": 606} {"train_info/time_between_train_steps": 0.002986431121826172, "step": 606} {"info/global_step": 607, "train_info/time_within_train_step": 2.650498151779175, "step": 607} {"train_info/time_between_train_steps": 0.003033161163330078, "step": 607} {"info/global_step": 608, "train_info/time_within_train_step": 2.6685171127319336, "step": 608} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 608} {"info/global_step": 609, "train_info/time_within_train_step": 2.7287635803222656, "step": 609} {"train_info/time_between_train_steps": 0.002995729446411133, "step": 609} {"info/global_step": 610, "train_info/time_within_train_step": 2.666384220123291, "step": 610} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 610} {"info/global_step": 611, "train_info/time_within_train_step": 2.6435890197753906, "step": 611} {"train_info/time_between_train_steps": 0.0030028820037841797, "step": 611} {"info/global_step": 612, "train_info/time_within_train_step": 2.6429636478424072, "step": 612} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 612} {"info/global_step": 613, "train_info/time_within_train_step": 2.6561248302459717, "step": 613} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 613} {"info/global_step": 614, "train_info/time_within_train_step": 2.657792091369629, "step": 614} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 614} {"info/global_step": 615, "train_info/time_within_train_step": 2.646193742752075, "step": 615} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 615} {"info/global_step": 616, "train_info/time_within_train_step": 2.655726194381714, "step": 616} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 616} {"info/global_step": 617, "train_info/time_within_train_step": 2.6504299640655518, "step": 617} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 617} {"info/global_step": 618, "train_info/time_within_train_step": 2.67116641998291, "step": 618} {"train_info/time_between_train_steps": 0.0030066967010498047, "step": 618} {"info/global_step": 619, "train_info/time_within_train_step": 2.6926090717315674, "step": 619} {"train_info/time_between_train_steps": 0.0029764175415039062, "step": 619} {"info/global_step": 620, "train_info/time_within_train_step": 2.6761295795440674, "step": 620} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 620} {"info/global_step": 621, "train_info/time_within_train_step": 2.670807361602783, "step": 621} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 621} {"info/global_step": 622, "train_info/time_within_train_step": 2.6457531452178955, "step": 622} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 622} {"info/global_step": 623, "train_info/time_within_train_step": 2.644843578338623, "step": 623} {"train_info/time_between_train_steps": 0.0030422210693359375, "step": 623} {"info/global_step": 624, "train_info/time_within_train_step": 2.6502652168273926, "step": 624} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 624} {"info/global_step": 625, "train_info/time_within_train_step": 2.6740033626556396, "step": 625} {"train_info/time_between_train_steps": 0.003045320510864258, "step": 625} {"info/global_step": 626, "train_info/time_within_train_step": 2.6695778369903564, "step": 626} {"train_info/time_between_train_steps": 0.003038644790649414, "step": 626} {"info/global_step": 627, "train_info/time_within_train_step": 2.662616491317749, "step": 627} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 627} {"info/global_step": 628, "train_info/time_within_train_step": 2.6807973384857178, "step": 628} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 628} {"info/global_step": 629, "train_info/time_within_train_step": 2.645744800567627, "step": 629} {"train_info/time_between_train_steps": 0.002994060516357422, "step": 629} {"info/global_step": 630, "train_info/time_within_train_step": 2.6551620960235596, "step": 630} {"train_info/time_between_train_steps": 0.002956867218017578, "step": 630} {"info/global_step": 631, "train_info/time_within_train_step": 2.6473238468170166, "step": 631} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 631} {"info/global_step": 632, "train_info/time_within_train_step": 2.6509811878204346, "step": 632} {"train_info/time_between_train_steps": 0.002986431121826172, "step": 632} {"info/global_step": 633, "train_info/time_within_train_step": 2.648916006088257, "step": 633} {"train_info/time_between_train_steps": 0.002992391586303711, "step": 633} {"info/global_step": 634, "train_info/time_within_train_step": 2.645662784576416, "step": 634} {"train_info/time_between_train_steps": 0.0029120445251464844, "step": 634} {"info/global_step": 635, "train_info/time_within_train_step": 2.668259620666504, "step": 635} {"train_info/time_between_train_steps": 0.003024578094482422, "step": 635} {"info/global_step": 636, "train_info/time_within_train_step": 2.6580605506896973, "step": 636} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 636} {"info/global_step": 637, "train_info/time_within_train_step": 2.663935899734497, "step": 637} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 637} {"info/global_step": 638, "train_info/time_within_train_step": 2.6946465969085693, "step": 638} {"train_info/time_between_train_steps": 0.0030503273010253906, "step": 638} {"info/global_step": 639, "train_info/time_within_train_step": 2.6664838790893555, "step": 639} {"train_info/time_between_train_steps": 0.0030875205993652344, "step": 639} {"info/global_step": 640, "train_info/time_within_train_step": 2.6427807807922363, "step": 640} {"train_info/time_between_train_steps": 0.003004789352416992, "step": 640} {"info/global_step": 641, "train_info/time_within_train_step": 2.6418285369873047, "step": 641} {"train_info/time_between_train_steps": 0.0030448436737060547, "step": 641} {"info/global_step": 642, "train_info/time_within_train_step": 2.6582837104797363, "step": 642} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 642} {"info/global_step": 643, "train_info/time_within_train_step": 2.6532514095306396, "step": 643} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 643} {"info/global_step": 644, "train_info/time_within_train_step": 2.644638776779175, "step": 644} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 644} {"info/global_step": 645, "train_info/time_within_train_step": 2.661571502685547, "step": 645} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 645} {"info/global_step": 646, "train_info/time_within_train_step": 2.652374029159546, "step": 646} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 646} {"info/global_step": 647, "train_info/time_within_train_step": 2.683725357055664, "step": 647} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 647} {"info/global_step": 648, "train_info/time_within_train_step": 2.6886112689971924, "step": 648} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 648} {"info/global_step": 649, "train_info/time_within_train_step": 2.7295472621917725, "step": 649} {"train_info/time_between_train_steps": 0.003086090087890625, "step": 649} {"info/global_step": 650, "train_info/time_within_train_step": 2.659642219543457, "step": 650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746899227, "_runtime": 1825}, "step": 650} {"logs": {"train/loss": 5.4575, "train/learning_rate": 0.00039, "train/epoch": 0.07, "_timestamp": 1746899227, "_runtime": 1825}, "step": 650} {"train_info/time_between_train_steps": 0.024867534637451172, "step": 650} {"info/global_step": 651, "train_info/time_within_train_step": 2.641127347946167, "step": 651} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 651} {"info/global_step": 652, "train_info/time_within_train_step": 2.640690803527832, "step": 652} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 652} {"info/global_step": 653, "train_info/time_within_train_step": 2.6547482013702393, "step": 653} {"train_info/time_between_train_steps": 0.0030655860900878906, "step": 653} {"info/global_step": 654, "train_info/time_within_train_step": 2.6501364707946777, "step": 654} {"train_info/time_between_train_steps": 0.0030975341796875, "step": 654} {"info/global_step": 655, "train_info/time_within_train_step": 2.6482656002044678, "step": 655} {"train_info/time_between_train_steps": 0.0030879974365234375, "step": 655} {"info/global_step": 656, "train_info/time_within_train_step": 2.6443135738372803, "step": 656} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 656} {"info/global_step": 657, "train_info/time_within_train_step": 2.6669840812683105, "step": 657} {"train_info/time_between_train_steps": 0.0031044483184814453, "step": 657} {"info/global_step": 658, "train_info/time_within_train_step": 2.670243740081787, "step": 658} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 658} {"info/global_step": 659, "train_info/time_within_train_step": 2.684199810028076, "step": 659} {"train_info/time_between_train_steps": 0.00307464599609375, "step": 659} {"info/global_step": 660, "train_info/time_within_train_step": 2.6536872386932373, "step": 660} {"train_info/time_between_train_steps": 0.003075838088989258, "step": 660} {"info/global_step": 661, "train_info/time_within_train_step": 2.641094923019409, "step": 661} {"train_info/time_between_train_steps": 0.0030510425567626953, "step": 661} {"info/global_step": 662, "train_info/time_within_train_step": 2.6550445556640625, "step": 662} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 662} {"info/global_step": 663, "train_info/time_within_train_step": 2.6489527225494385, "step": 663} {"train_info/time_between_train_steps": 0.003093242645263672, "step": 663} {"info/global_step": 664, "train_info/time_within_train_step": 2.6530449390411377, "step": 664} {"train_info/time_between_train_steps": 0.003057241439819336, "step": 664} {"info/global_step": 665, "train_info/time_within_train_step": 2.6427996158599854, "step": 665} {"train_info/time_between_train_steps": 0.0032699108123779297, "step": 665} {"info/global_step": 666, "train_info/time_within_train_step": 2.6510634422302246, "step": 666} {"train_info/time_between_train_steps": 0.003066539764404297, "step": 666} {"info/global_step": 667, "train_info/time_within_train_step": 2.6710073947906494, "step": 667} {"train_info/time_between_train_steps": 0.003095865249633789, "step": 667} {"info/global_step": 668, "train_info/time_within_train_step": 2.672772169113159, "step": 668} {"train_info/time_between_train_steps": 0.0030944347381591797, "step": 668} {"info/global_step": 669, "train_info/time_within_train_step": 2.651724338531494, "step": 669} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 669} {"info/global_step": 670, "train_info/time_within_train_step": 2.6884214878082275, "step": 670} {"train_info/time_between_train_steps": 0.0030448436737060547, "step": 670} {"info/global_step": 671, "train_info/time_within_train_step": 2.6413755416870117, "step": 671} {"train_info/time_between_train_steps": 0.0030748844146728516, "step": 671} {"info/global_step": 672, "train_info/time_within_train_step": 2.6549441814422607, "step": 672} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 672} {"info/global_step": 673, "train_info/time_within_train_step": 2.653057098388672, "step": 673} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 673} {"info/global_step": 674, "train_info/time_within_train_step": 2.646911144256592, "step": 674} {"train_info/time_between_train_steps": 0.003055572509765625, "step": 674} {"info/global_step": 675, "train_info/time_within_train_step": 2.648585081100464, "step": 675} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 675} {"info/global_step": 676, "train_info/time_within_train_step": 2.6457326412200928, "step": 676} {"train_info/time_between_train_steps": 0.003329753875732422, "step": 676} {"info/global_step": 677, "train_info/time_within_train_step": 2.665217638015747, "step": 677} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 677} {"info/global_step": 678, "train_info/time_within_train_step": 2.663591146469116, "step": 678} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 678} {"info/global_step": 679, "train_info/time_within_train_step": 2.6605095863342285, "step": 679} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 679} {"info/global_step": 680, "train_info/time_within_train_step": 2.7105770111083984, "step": 680} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 680} {"info/global_step": 681, "train_info/time_within_train_step": 2.6471974849700928, "step": 681} {"train_info/time_between_train_steps": 0.0031120777130126953, "step": 681} {"info/global_step": 682, "train_info/time_within_train_step": 2.6541285514831543, "step": 682} {"train_info/time_between_train_steps": 0.0031158924102783203, "step": 682} {"info/global_step": 683, "train_info/time_within_train_step": 2.6537740230560303, "step": 683} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 683} {"info/global_step": 684, "train_info/time_within_train_step": 2.643378257751465, "step": 684} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 684} {"info/global_step": 685, "train_info/time_within_train_step": 2.65912127494812, "step": 685} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 685} {"info/global_step": 686, "train_info/time_within_train_step": 2.6525352001190186, "step": 686} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 686} {"info/global_step": 687, "train_info/time_within_train_step": 2.660400867462158, "step": 687} {"train_info/time_between_train_steps": 0.003118753433227539, "step": 687} {"info/global_step": 688, "train_info/time_within_train_step": 2.7086329460144043, "step": 688} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 688} {"info/global_step": 689, "train_info/time_within_train_step": 2.909670352935791, "step": 689} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 689} {"info/global_step": 690, "train_info/time_within_train_step": 2.654317855834961, "step": 690} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 690} {"info/global_step": 691, "train_info/time_within_train_step": 2.6676666736602783, "step": 691} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 691} {"info/global_step": 692, "train_info/time_within_train_step": 2.728644847869873, "step": 692} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 692} {"info/global_step": 693, "train_info/time_within_train_step": 2.6685330867767334, "step": 693} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 693} {"info/global_step": 694, "train_info/time_within_train_step": 2.6404271125793457, "step": 694} {"train_info/time_between_train_steps": 0.0030002593994140625, "step": 694} {"info/global_step": 695, "train_info/time_within_train_step": 2.642240524291992, "step": 695} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 695} {"info/global_step": 696, "train_info/time_within_train_step": 2.6544957160949707, "step": 696} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 696} {"info/global_step": 697, "train_info/time_within_train_step": 2.6557867527008057, "step": 697} {"train_info/time_between_train_steps": 0.002949237823486328, "step": 697} {"info/global_step": 698, "train_info/time_within_train_step": 2.642570734024048, "step": 698} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 698} {"info/global_step": 699, "train_info/time_within_train_step": 2.6500823497772217, "step": 699} {"train_info/time_between_train_steps": 0.002962350845336914, "step": 699} {"info/global_step": 700, "train_info/time_within_train_step": 2.650362968444824, "step": 700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746899361, "_runtime": 1959}, "step": 700} {"logs": {"train/loss": 5.3985, "train/learning_rate": 0.00041999999999999996, "train/epoch": 0.07, "_timestamp": 1746899361, "_runtime": 1959}, "step": 700} {"train_info/time_between_train_steps": 0.024608135223388672, "step": 700} {"info/global_step": 701, "train_info/time_within_train_step": 2.6646311283111572, "step": 701} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 701} {"info/global_step": 702, "train_info/time_within_train_step": 2.6861050128936768, "step": 702} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 702} {"info/global_step": 703, "train_info/time_within_train_step": 2.6500918865203857, "step": 703} {"train_info/time_between_train_steps": 0.002984285354614258, "step": 703} {"info/global_step": 704, "train_info/time_within_train_step": 2.640735626220703, "step": 704} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 704} {"info/global_step": 705, "train_info/time_within_train_step": 2.643037796020508, "step": 705} {"train_info/time_between_train_steps": 0.003103017807006836, "step": 705} {"info/global_step": 706, "train_info/time_within_train_step": 2.64615797996521, "step": 706} {"train_info/time_between_train_steps": 0.003246784210205078, "step": 706} {"info/global_step": 707, "train_info/time_within_train_step": 2.811845302581787, "step": 707} {"train_info/time_between_train_steps": 0.003099203109741211, "step": 707} {"info/global_step": 708, "train_info/time_within_train_step": 2.6462016105651855, "step": 708} {"train_info/time_between_train_steps": 0.0030994415283203125, "step": 708} {"info/global_step": 709, "train_info/time_within_train_step": 2.6443426609039307, "step": 709} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 709} {"info/global_step": 710, "train_info/time_within_train_step": 2.6796998977661133, "step": 710} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 710} {"info/global_step": 711, "train_info/time_within_train_step": 2.6477925777435303, "step": 711} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 711} {"info/global_step": 712, "train_info/time_within_train_step": 2.655332326889038, "step": 712} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 712} {"info/global_step": 713, "train_info/time_within_train_step": 2.65139102935791, "step": 713} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 713} {"info/global_step": 714, "train_info/time_within_train_step": 2.659432888031006, "step": 714} {"train_info/time_between_train_steps": 0.0029730796813964844, "step": 714} {"info/global_step": 715, "train_info/time_within_train_step": 2.6459567546844482, "step": 715} {"train_info/time_between_train_steps": 0.002940654754638672, "step": 715} {"info/global_step": 716, "train_info/time_within_train_step": 2.6466050148010254, "step": 716} {"train_info/time_between_train_steps": 0.003047943115234375, "step": 716} {"info/global_step": 717, "train_info/time_within_train_step": 2.6460111141204834, "step": 717} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 717} {"info/global_step": 718, "train_info/time_within_train_step": 2.6418397426605225, "step": 718} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 718} {"info/global_step": 719, "train_info/time_within_train_step": 2.6664981842041016, "step": 719} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 719} {"info/global_step": 720, "train_info/time_within_train_step": 2.668179512023926, "step": 720} {"train_info/time_between_train_steps": 0.0029449462890625, "step": 720} {"info/global_step": 721, "train_info/time_within_train_step": 2.676527976989746, "step": 721} {"train_info/time_between_train_steps": 0.0029969215393066406, "step": 721} {"info/global_step": 722, "train_info/time_within_train_step": 2.6547982692718506, "step": 722} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 722} {"info/global_step": 723, "train_info/time_within_train_step": 2.6387393474578857, "step": 723} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 723} {"info/global_step": 724, "train_info/time_within_train_step": 2.647721290588379, "step": 724} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 724} {"info/global_step": 725, "train_info/time_within_train_step": 2.6629438400268555, "step": 725} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 725} {"info/global_step": 726, "train_info/time_within_train_step": 2.642317533493042, "step": 726} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 726} {"info/global_step": 727, "train_info/time_within_train_step": 2.652984142303467, "step": 727} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 727} {"info/global_step": 728, "train_info/time_within_train_step": 2.6822354793548584, "step": 728} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 728} {"info/global_step": 729, "train_info/time_within_train_step": 2.6493356227874756, "step": 729} {"train_info/time_between_train_steps": 0.002991199493408203, "step": 729} {"info/global_step": 730, "train_info/time_within_train_step": 2.6825833320617676, "step": 730} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 730} {"info/global_step": 731, "train_info/time_within_train_step": 2.6399335861206055, "step": 731} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 731} {"info/global_step": 732, "train_info/time_within_train_step": 2.647247314453125, "step": 732} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 732} {"info/global_step": 733, "train_info/time_within_train_step": 2.6674485206604004, "step": 733} {"train_info/time_between_train_steps": 0.003062725067138672, "step": 733} {"info/global_step": 734, "train_info/time_within_train_step": 2.6411356925964355, "step": 734} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 734} {"info/global_step": 735, "train_info/time_within_train_step": 2.643470525741577, "step": 735} {"train_info/time_between_train_steps": 0.003011941909790039, "step": 735} {"info/global_step": 736, "train_info/time_within_train_step": 2.655705213546753, "step": 736} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 736} {"info/global_step": 737, "train_info/time_within_train_step": 2.659209966659546, "step": 737} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 737} {"info/global_step": 738, "train_info/time_within_train_step": 2.675166606903076, "step": 738} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 738} {"info/global_step": 739, "train_info/time_within_train_step": 2.664766311645508, "step": 739} {"train_info/time_between_train_steps": 0.0032606124877929688, "step": 739} {"info/global_step": 740, "train_info/time_within_train_step": 2.7063796520233154, "step": 740} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 740} {"info/global_step": 741, "train_info/time_within_train_step": 2.641148567199707, "step": 741} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 741} {"info/global_step": 742, "train_info/time_within_train_step": 2.652043342590332, "step": 742} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 742} {"info/global_step": 743, "train_info/time_within_train_step": 2.656002998352051, "step": 743} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 743} {"info/global_step": 744, "train_info/time_within_train_step": 2.6448564529418945, "step": 744} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 744} {"info/global_step": 745, "train_info/time_within_train_step": 2.6487863063812256, "step": 745} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 745} {"info/global_step": 746, "train_info/time_within_train_step": 2.6500425338745117, "step": 746} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 746} {"info/global_step": 747, "train_info/time_within_train_step": 2.6509993076324463, "step": 747} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 747} {"info/global_step": 748, "train_info/time_within_train_step": 2.659418821334839, "step": 748} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 748} {"info/global_step": 749, "train_info/time_within_train_step": 2.8256514072418213, "step": 749} {"train_info/time_between_train_steps": 0.0030138492584228516, "step": 749} {"info/global_step": 750, "train_info/time_within_train_step": 3.112307071685791, "step": 750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746899497, "_runtime": 2095}, "step": 750} {"logs": {"train/loss": 5.3167, "train/learning_rate": 0.00045, "train/epoch": 0.07, "_timestamp": 1746899497, "_runtime": 2095}, "step": 750} {"train_info/time_between_train_steps": 0.02406454086303711, "step": 750} {"info/global_step": 751, "train_info/time_within_train_step": 2.6468400955200195, "step": 751} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 751} {"info/global_step": 752, "train_info/time_within_train_step": 2.649817705154419, "step": 752} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 752} {"info/global_step": 753, "train_info/time_within_train_step": 2.6481003761291504, "step": 753} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 753} {"info/global_step": 754, "train_info/time_within_train_step": 2.648069381713867, "step": 754} {"train_info/time_between_train_steps": 0.0029616355895996094, "step": 754} {"info/global_step": 755, "train_info/time_within_train_step": 2.649366617202759, "step": 755} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 755} {"info/global_step": 756, "train_info/time_within_train_step": 2.6569437980651855, "step": 756} {"train_info/time_between_train_steps": 0.002955913543701172, "step": 756} {"info/global_step": 757, "train_info/time_within_train_step": 2.6537275314331055, "step": 757} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 757} {"info/global_step": 758, "train_info/time_within_train_step": 2.665113687515259, "step": 758} {"train_info/time_between_train_steps": 0.003021240234375, "step": 758} {"info/global_step": 759, "train_info/time_within_train_step": 2.721750259399414, "step": 759} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 759} {"info/global_step": 760, "train_info/time_within_train_step": 2.6765642166137695, "step": 760} {"train_info/time_between_train_steps": 0.0029604434967041016, "step": 760} {"info/global_step": 761, "train_info/time_within_train_step": 2.6410117149353027, "step": 761} {"train_info/time_between_train_steps": 0.0030248165130615234, "step": 761} {"info/global_step": 762, "train_info/time_within_train_step": 2.6591460704803467, "step": 762} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 762} {"info/global_step": 763, "train_info/time_within_train_step": 2.6467456817626953, "step": 763} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 763} {"info/global_step": 764, "train_info/time_within_train_step": 2.6465678215026855, "step": 764} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 764} {"info/global_step": 765, "train_info/time_within_train_step": 2.6464648246765137, "step": 765} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 765} {"info/global_step": 766, "train_info/time_within_train_step": 2.643930673599243, "step": 766} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 766} {"info/global_step": 767, "train_info/time_within_train_step": 2.6665844917297363, "step": 767} {"train_info/time_between_train_steps": 0.0030519962310791016, "step": 767} {"info/global_step": 768, "train_info/time_within_train_step": 2.669703483581543, "step": 768} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 768} {"info/global_step": 769, "train_info/time_within_train_step": 2.6846680641174316, "step": 769} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 769} {"info/global_step": 770, "train_info/time_within_train_step": 2.65112042427063, "step": 770} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 770} {"info/global_step": 771, "train_info/time_within_train_step": 2.642259359359741, "step": 771} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 771} {"info/global_step": 772, "train_info/time_within_train_step": 2.653475284576416, "step": 772} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 772} {"info/global_step": 773, "train_info/time_within_train_step": 2.6509647369384766, "step": 773} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 773} {"info/global_step": 774, "train_info/time_within_train_step": 2.6482009887695312, "step": 774} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 774} {"info/global_step": 775, "train_info/time_within_train_step": 2.6430869102478027, "step": 775} {"train_info/time_between_train_steps": 0.002966642379760742, "step": 775} {"info/global_step": 776, "train_info/time_within_train_step": 2.646301507949829, "step": 776} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 776} {"info/global_step": 777, "train_info/time_within_train_step": 2.670403242111206, "step": 777} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 777} {"info/global_step": 778, "train_info/time_within_train_step": 2.6656875610351562, "step": 778} {"train_info/time_between_train_steps": 0.00299072265625, "step": 778} {"info/global_step": 779, "train_info/time_within_train_step": 2.6651129722595215, "step": 779} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 779} {"info/global_step": 780, "train_info/time_within_train_step": 2.6743900775909424, "step": 780} {"train_info/time_between_train_steps": 0.0030553340911865234, "step": 780} {"info/global_step": 781, "train_info/time_within_train_step": 2.6454107761383057, "step": 781} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 781} {"info/global_step": 782, "train_info/time_within_train_step": 2.652766466140747, "step": 782} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 782} {"info/global_step": 783, "train_info/time_within_train_step": 2.648064136505127, "step": 783} {"train_info/time_between_train_steps": 0.0029296875, "step": 783} {"info/global_step": 784, "train_info/time_within_train_step": 2.6462509632110596, "step": 784} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 784} {"info/global_step": 785, "train_info/time_within_train_step": 2.649887800216675, "step": 785} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 785} {"info/global_step": 786, "train_info/time_within_train_step": 2.6459298133850098, "step": 786} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 786} {"info/global_step": 787, "train_info/time_within_train_step": 2.6632373332977295, "step": 787} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 787} {"info/global_step": 788, "train_info/time_within_train_step": 2.6617350578308105, "step": 788} {"train_info/time_between_train_steps": 0.0030088424682617188, "step": 788} {"info/global_step": 789, "train_info/time_within_train_step": 2.7435476779937744, "step": 789} {"train_info/time_between_train_steps": 0.0030858516693115234, "step": 789} {"info/global_step": 790, "train_info/time_within_train_step": 2.6541993618011475, "step": 790} {"train_info/time_between_train_steps": 0.0030274391174316406, "step": 790} {"info/global_step": 791, "train_info/time_within_train_step": 2.708177328109741, "step": 791} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 791} {"info/global_step": 792, "train_info/time_within_train_step": 2.6507530212402344, "step": 792} {"train_info/time_between_train_steps": 0.003071308135986328, "step": 792} {"info/global_step": 793, "train_info/time_within_train_step": 2.6481170654296875, "step": 793} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 793} {"info/global_step": 794, "train_info/time_within_train_step": 2.646700143814087, "step": 794} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 794} {"info/global_step": 795, "train_info/time_within_train_step": 2.6492197513580322, "step": 795} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 795} {"info/global_step": 796, "train_info/time_within_train_step": 2.650947332382202, "step": 796} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 796} {"info/global_step": 797, "train_info/time_within_train_step": 2.643808364868164, "step": 797} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 797} {"info/global_step": 798, "train_info/time_within_train_step": 2.6579535007476807, "step": 798} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 798} {"info/global_step": 799, "train_info/time_within_train_step": 2.65403413772583, "step": 799} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 799} {"info/global_step": 800, "train_info/time_within_train_step": 2.6646549701690674, "step": 800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746899631, "_runtime": 2229}, "step": 800} {"logs": {"train/loss": 5.2486, "train/learning_rate": 0.00047999999999999996, "train/epoch": 0.08, "_timestamp": 1746899631, "_runtime": 2229}, "step": 800} {"train_info/time_between_train_steps": 14.149431228637695, "step": 800} {"info/global_step": 801, "train_info/time_within_train_step": 2.442532539367676, "step": 801} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 801} {"info/global_step": 802, "train_info/time_within_train_step": 2.437061309814453, "step": 802} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 802} {"info/global_step": 803, "train_info/time_within_train_step": 2.615659236907959, "step": 803} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 803} {"info/global_step": 804, "train_info/time_within_train_step": 2.653043508529663, "step": 804} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 804} {"info/global_step": 805, "train_info/time_within_train_step": 2.6398165225982666, "step": 805} {"train_info/time_between_train_steps": 0.003062009811401367, "step": 805} {"info/global_step": 806, "train_info/time_within_train_step": 2.6413118839263916, "step": 806} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 806} {"info/global_step": 807, "train_info/time_within_train_step": 2.668761730194092, "step": 807} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 807} {"info/global_step": 808, "train_info/time_within_train_step": 2.6641342639923096, "step": 808} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 808} {"info/global_step": 809, "train_info/time_within_train_step": 2.6582770347595215, "step": 809} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 809} {"info/global_step": 810, "train_info/time_within_train_step": 2.680832624435425, "step": 810} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 810} {"info/global_step": 811, "train_info/time_within_train_step": 2.639357089996338, "step": 811} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 811} {"info/global_step": 812, "train_info/time_within_train_step": 2.653968572616577, "step": 812} {"train_info/time_between_train_steps": 0.0031042098999023438, "step": 812} {"info/global_step": 813, "train_info/time_within_train_step": 2.6566505432128906, "step": 813} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 813} {"info/global_step": 814, "train_info/time_within_train_step": 2.6428472995758057, "step": 814} {"train_info/time_between_train_steps": 0.003090381622314453, "step": 814} {"info/global_step": 815, "train_info/time_within_train_step": 2.644009590148926, "step": 815} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 815} {"info/global_step": 816, "train_info/time_within_train_step": 2.651111602783203, "step": 816} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 816} {"info/global_step": 817, "train_info/time_within_train_step": 2.659716844558716, "step": 817} {"train_info/time_between_train_steps": 0.0030961036682128906, "step": 817} {"info/global_step": 818, "train_info/time_within_train_step": 2.6710641384124756, "step": 818} {"train_info/time_between_train_steps": 0.003100872039794922, "step": 818} {"info/global_step": 819, "train_info/time_within_train_step": 2.66292405128479, "step": 819} {"train_info/time_between_train_steps": 0.0031120777130126953, "step": 819} {"info/global_step": 820, "train_info/time_within_train_step": 2.70029354095459, "step": 820} {"train_info/time_between_train_steps": 0.0030813217163085938, "step": 820} {"info/global_step": 821, "train_info/time_within_train_step": 2.6413984298706055, "step": 821} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 821} {"info/global_step": 822, "train_info/time_within_train_step": 2.646665334701538, "step": 822} {"train_info/time_between_train_steps": 0.003077268600463867, "step": 822} {"info/global_step": 823, "train_info/time_within_train_step": 2.648973226547241, "step": 823} {"train_info/time_between_train_steps": 0.0030939579010009766, "step": 823} {"info/global_step": 824, "train_info/time_within_train_step": 2.6514365673065186, "step": 824} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 824} {"info/global_step": 825, "train_info/time_within_train_step": 2.64481782913208, "step": 825} {"train_info/time_between_train_steps": 0.0030663013458251953, "step": 825} {"info/global_step": 826, "train_info/time_within_train_step": 2.6546471118927, "step": 826} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 826} {"info/global_step": 827, "train_info/time_within_train_step": 2.6558501720428467, "step": 827} {"train_info/time_between_train_steps": 0.003075838088989258, "step": 827} {"info/global_step": 828, "train_info/time_within_train_step": 2.6418538093566895, "step": 828} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 828} {"info/global_step": 829, "train_info/time_within_train_step": 2.6404545307159424, "step": 829} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 829} {"info/global_step": 830, "train_info/time_within_train_step": 2.6465823650360107, "step": 830} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 830} {"info/global_step": 831, "train_info/time_within_train_step": 2.663250684738159, "step": 831} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 831} {"info/global_step": 832, "train_info/time_within_train_step": 2.6424601078033447, "step": 832} {"train_info/time_between_train_steps": 0.003118753433227539, "step": 832} {"info/global_step": 833, "train_info/time_within_train_step": 2.6435532569885254, "step": 833} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 833} {"info/global_step": 834, "train_info/time_within_train_step": 2.6457414627075195, "step": 834} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 834} {"info/global_step": 835, "train_info/time_within_train_step": 2.749870777130127, "step": 835} {"train_info/time_between_train_steps": 0.0030307769775390625, "step": 835} {"info/global_step": 836, "train_info/time_within_train_step": 2.720933675765991, "step": 836} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 836} {"info/global_step": 837, "train_info/time_within_train_step": 2.651317596435547, "step": 837} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 837} {"info/global_step": 838, "train_info/time_within_train_step": 2.645678758621216, "step": 838} {"train_info/time_between_train_steps": 0.0030188560485839844, "step": 838} {"info/global_step": 839, "train_info/time_within_train_step": 2.649510383605957, "step": 839} {"train_info/time_between_train_steps": 0.0030732154846191406, "step": 839} {"info/global_step": 840, "train_info/time_within_train_step": 2.6474099159240723, "step": 840} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 840} {"info/global_step": 841, "train_info/time_within_train_step": 2.6712989807128906, "step": 841} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 841} {"info/global_step": 842, "train_info/time_within_train_step": 2.652209520339966, "step": 842} {"train_info/time_between_train_steps": 0.003030538558959961, "step": 842} {"info/global_step": 843, "train_info/time_within_train_step": 2.6565587520599365, "step": 843} {"train_info/time_between_train_steps": 0.003106355667114258, "step": 843} {"info/global_step": 844, "train_info/time_within_train_step": 2.6490468978881836, "step": 844} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 844} {"info/global_step": 845, "train_info/time_within_train_step": 2.6581859588623047, "step": 845} {"train_info/time_between_train_steps": 0.003532886505126953, "step": 845} {"info/global_step": 846, "train_info/time_within_train_step": 2.6941452026367188, "step": 846} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 846} {"info/global_step": 847, "train_info/time_within_train_step": 2.713484525680542, "step": 847} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 847} {"info/global_step": 848, "train_info/time_within_train_step": 2.6398227214813232, "step": 848} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 848} {"info/global_step": 849, "train_info/time_within_train_step": 2.6397812366485596, "step": 849} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 849} {"info/global_step": 850, "train_info/time_within_train_step": 2.663503646850586, "step": 850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746899779, "_runtime": 2377}, "step": 850} {"logs": {"train/loss": 5.1809, "train/learning_rate": 0.0005099999999999999, "train/epoch": 0.09, "_timestamp": 1746899779, "_runtime": 2377}, "step": 850} {"train_info/time_between_train_steps": 0.024248600006103516, "step": 850} {"info/global_step": 851, "train_info/time_within_train_step": 2.6486566066741943, "step": 851} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 851} {"info/global_step": 852, "train_info/time_within_train_step": 2.64927339553833, "step": 852} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 852} {"info/global_step": 853, "train_info/time_within_train_step": 2.651338577270508, "step": 853} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 853} {"info/global_step": 854, "train_info/time_within_train_step": 2.6465654373168945, "step": 854} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 854} {"info/global_step": 855, "train_info/time_within_train_step": 2.669807195663452, "step": 855} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 855} {"info/global_step": 856, "train_info/time_within_train_step": 2.6921236515045166, "step": 856} {"train_info/time_between_train_steps": 0.003459930419921875, "step": 856} {"info/global_step": 857, "train_info/time_within_train_step": 2.6600241661071777, "step": 857} {"train_info/time_between_train_steps": 0.003741741180419922, "step": 857} {"info/global_step": 858, "train_info/time_within_train_step": 2.664186954498291, "step": 858} {"train_info/time_between_train_steps": 0.0036232471466064453, "step": 858} {"info/global_step": 859, "train_info/time_within_train_step": 2.6411330699920654, "step": 859} {"train_info/time_between_train_steps": 0.003818035125732422, "step": 859} {"info/global_step": 860, "train_info/time_within_train_step": 2.641756534576416, "step": 860} {"train_info/time_between_train_steps": 0.0038242340087890625, "step": 860} {"info/global_step": 861, "train_info/time_within_train_step": 2.6473548412323, "step": 861} {"train_info/time_between_train_steps": 0.0039560794830322266, "step": 861} {"info/global_step": 862, "train_info/time_within_train_step": 2.6666836738586426, "step": 862} {"train_info/time_between_train_steps": 0.004300594329833984, "step": 862} {"info/global_step": 863, "train_info/time_within_train_step": 2.644737720489502, "step": 863} {"train_info/time_between_train_steps": 0.0034143924713134766, "step": 863} {"train_info/time_between_train_steps": 2.328549861907959, "step": 863} {"info/global_step": 864, "train_info/time_within_train_step": 2.9111690521240234, "step": 864} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 864} {"info/global_step": 865, "train_info/time_within_train_step": 2.6709723472595215, "step": 865} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 865} {"info/global_step": 866, "train_info/time_within_train_step": 2.6482322216033936, "step": 866} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 866} {"info/global_step": 867, "train_info/time_within_train_step": 2.6435985565185547, "step": 867} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 867} {"info/global_step": 868, "train_info/time_within_train_step": 2.6526434421539307, "step": 868} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 868} {"info/global_step": 869, "train_info/time_within_train_step": 2.6404716968536377, "step": 869} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 869} {"info/global_step": 870, "train_info/time_within_train_step": 2.643588066101074, "step": 870} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 870} {"info/global_step": 871, "train_info/time_within_train_step": 2.6482582092285156, "step": 871} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 871} {"info/global_step": 872, "train_info/time_within_train_step": 2.65073299407959, "step": 872} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 872} {"info/global_step": 873, "train_info/time_within_train_step": 2.6572704315185547, "step": 873} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 873} {"info/global_step": 874, "train_info/time_within_train_step": 2.679365873336792, "step": 874} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 874} {"info/global_step": 875, "train_info/time_within_train_step": 2.7208900451660156, "step": 875} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 875} {"info/global_step": 876, "train_info/time_within_train_step": 2.645660400390625, "step": 876} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 876} {"info/global_step": 877, "train_info/time_within_train_step": 2.637734889984131, "step": 877} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 877} {"info/global_step": 878, "train_info/time_within_train_step": 2.658482074737549, "step": 878} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 878} {"info/global_step": 879, "train_info/time_within_train_step": 2.646017074584961, "step": 879} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 879} {"info/global_step": 880, "train_info/time_within_train_step": 2.6446616649627686, "step": 880} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 880} {"info/global_step": 881, "train_info/time_within_train_step": 2.6464054584503174, "step": 881} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 881} {"info/global_step": 882, "train_info/time_within_train_step": 2.6421802043914795, "step": 882} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 882} {"info/global_step": 883, "train_info/time_within_train_step": 2.666660785675049, "step": 883} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 883} {"info/global_step": 884, "train_info/time_within_train_step": 2.6790897846221924, "step": 884} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 884} {"info/global_step": 885, "train_info/time_within_train_step": 2.688955783843994, "step": 885} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 885} {"info/global_step": 886, "train_info/time_within_train_step": 2.6460938453674316, "step": 886} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 886} {"info/global_step": 887, "train_info/time_within_train_step": 2.6395466327667236, "step": 887} {"train_info/time_between_train_steps": 0.003477334976196289, "step": 887} {"info/global_step": 888, "train_info/time_within_train_step": 2.6544086933135986, "step": 888} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 888} {"info/global_step": 889, "train_info/time_within_train_step": 2.649505615234375, "step": 889} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 889} {"info/global_step": 890, "train_info/time_within_train_step": 2.6416268348693848, "step": 890} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 890} {"info/global_step": 891, "train_info/time_within_train_step": 2.6523590087890625, "step": 891} {"train_info/time_between_train_steps": 0.0031158924102783203, "step": 891} {"info/global_step": 892, "train_info/time_within_train_step": 2.6685681343078613, "step": 892} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 892} {"info/global_step": 893, "train_info/time_within_train_step": 2.65854811668396, "step": 893} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 893} {"info/global_step": 894, "train_info/time_within_train_step": 2.683223247528076, "step": 894} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 894} {"info/global_step": 895, "train_info/time_within_train_step": 2.63981032371521, "step": 895} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 895} {"info/global_step": 896, "train_info/time_within_train_step": 2.65297532081604, "step": 896} {"train_info/time_between_train_steps": 0.0031054019927978516, "step": 896} {"info/global_step": 897, "train_info/time_within_train_step": 2.6583871841430664, "step": 897} {"train_info/time_between_train_steps": 0.0031082630157470703, "step": 897} {"info/global_step": 898, "train_info/time_within_train_step": 2.641115665435791, "step": 898} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 898} {"info/global_step": 899, "train_info/time_within_train_step": 2.6424942016601562, "step": 899} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 899} {"info/global_step": 900, "train_info/time_within_train_step": 2.652820348739624, "step": 900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746899915, "_runtime": 2513}, "step": 900} {"logs": {"train/loss": 5.1464, "train/learning_rate": 0.00054, "train/epoch": 1.0, "_timestamp": 1746899915, "_runtime": 2513}, "step": 900} {"train_info/time_between_train_steps": 0.025001049041748047, "step": 900} {"info/global_step": 901, "train_info/time_within_train_step": 2.6633732318878174, "step": 901} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 901} {"info/global_step": 902, "train_info/time_within_train_step": 2.6527037620544434, "step": 902} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 902} {"info/global_step": 903, "train_info/time_within_train_step": 2.6596999168395996, "step": 903} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 903} {"info/global_step": 904, "train_info/time_within_train_step": 2.6936659812927246, "step": 904} {"train_info/time_between_train_steps": 0.0030951499938964844, "step": 904} {"info/global_step": 905, "train_info/time_within_train_step": 2.891166925430298, "step": 905} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 905} {"info/global_step": 906, "train_info/time_within_train_step": 2.6736361980438232, "step": 906} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 906} {"info/global_step": 907, "train_info/time_within_train_step": 2.6622979640960693, "step": 907} {"train_info/time_between_train_steps": 0.0031042098999023438, "step": 907} {"info/global_step": 908, "train_info/time_within_train_step": 2.6977033615112305, "step": 908} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 908} {"info/global_step": 909, "train_info/time_within_train_step": 2.640040874481201, "step": 909} {"train_info/time_between_train_steps": 0.0034847259521484375, "step": 909} {"info/global_step": 910, "train_info/time_within_train_step": 2.6435229778289795, "step": 910} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 910} {"info/global_step": 911, "train_info/time_within_train_step": 2.6433324813842773, "step": 911} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 911} {"info/global_step": 912, "train_info/time_within_train_step": 2.6436896324157715, "step": 912} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 912} {"info/global_step": 913, "train_info/time_within_train_step": 2.645251512527466, "step": 913} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 913} {"info/global_step": 914, "train_info/time_within_train_step": 2.64839506149292, "step": 914} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 914} {"info/global_step": 915, "train_info/time_within_train_step": 2.643202304840088, "step": 915} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 915} {"info/global_step": 916, "train_info/time_within_train_step": 2.6783833503723145, "step": 916} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 916} {"info/global_step": 917, "train_info/time_within_train_step": 2.6404201984405518, "step": 917} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 917} {"info/global_step": 918, "train_info/time_within_train_step": 2.6465067863464355, "step": 918} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 918} {"info/global_step": 919, "train_info/time_within_train_step": 2.6398978233337402, "step": 919} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 919} {"info/global_step": 920, "train_info/time_within_train_step": 2.66106915473938, "step": 920} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 920} {"info/global_step": 921, "train_info/time_within_train_step": 2.655482769012451, "step": 921} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 921} {"info/global_step": 922, "train_info/time_within_train_step": 2.662999391555786, "step": 922} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 922} {"info/global_step": 923, "train_info/time_within_train_step": 2.6806447505950928, "step": 923} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 923} {"info/global_step": 924, "train_info/time_within_train_step": 2.641045570373535, "step": 924} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 924} {"info/global_step": 925, "train_info/time_within_train_step": 2.6426870822906494, "step": 925} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 925} {"info/global_step": 926, "train_info/time_within_train_step": 2.7578253746032715, "step": 926} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 926} {"info/global_step": 927, "train_info/time_within_train_step": 2.6422741413116455, "step": 927} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 927} {"info/global_step": 928, "train_info/time_within_train_step": 2.65826153755188, "step": 928} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 928} {"info/global_step": 929, "train_info/time_within_train_step": 2.6473307609558105, "step": 929} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 929} {"info/global_step": 930, "train_info/time_within_train_step": 2.661201238632202, "step": 930} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 930} {"info/global_step": 931, "train_info/time_within_train_step": 2.7184197902679443, "step": 931} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 931} {"info/global_step": 932, "train_info/time_within_train_step": 2.6612281799316406, "step": 932} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 932} {"info/global_step": 933, "train_info/time_within_train_step": 2.639673948287964, "step": 933} {"train_info/time_between_train_steps": 0.0032520294189453125, "step": 933} {"info/global_step": 934, "train_info/time_within_train_step": 2.6588706970214844, "step": 934} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 934} {"info/global_step": 935, "train_info/time_within_train_step": 2.6464591026306152, "step": 935} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 935} {"info/global_step": 936, "train_info/time_within_train_step": 2.648923873901367, "step": 936} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 936} {"info/global_step": 937, "train_info/time_within_train_step": 2.6447465419769287, "step": 937} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 937} {"info/global_step": 938, "train_info/time_within_train_step": 2.6405656337738037, "step": 938} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 938} {"info/global_step": 939, "train_info/time_within_train_step": 2.6668245792388916, "step": 939} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 939} {"info/global_step": 940, "train_info/time_within_train_step": 2.6818981170654297, "step": 940} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 940} {"info/global_step": 941, "train_info/time_within_train_step": 2.6752138137817383, "step": 941} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 941} {"info/global_step": 942, "train_info/time_within_train_step": 2.6541078090667725, "step": 942} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 942} {"info/global_step": 943, "train_info/time_within_train_step": 2.6395719051361084, "step": 943} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 943} {"info/global_step": 944, "train_info/time_within_train_step": 2.654737949371338, "step": 944} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 944} {"info/global_step": 945, "train_info/time_within_train_step": 2.658289909362793, "step": 945} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 945} {"info/global_step": 946, "train_info/time_within_train_step": 2.6428685188293457, "step": 946} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 946} {"info/global_step": 947, "train_info/time_within_train_step": 2.6428492069244385, "step": 947} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 947} {"info/global_step": 948, "train_info/time_within_train_step": 2.6518537998199463, "step": 948} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 948} {"info/global_step": 949, "train_info/time_within_train_step": 2.667356252670288, "step": 949} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 949} {"info/global_step": 950, "train_info/time_within_train_step": 2.67561674118042, "step": 950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746900051, "_runtime": 2649}, "step": 950} {"logs": {"train/loss": 5.0426, "train/learning_rate": 0.00057, "train/epoch": 1.01, "_timestamp": 1746900051, "_runtime": 2649}, "step": 950} {"train_info/time_between_train_steps": 0.024219274520874023, "step": 950} {"info/global_step": 951, "train_info/time_within_train_step": 2.686081647872925, "step": 951} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 951} {"info/global_step": 952, "train_info/time_within_train_step": 2.6540629863739014, "step": 952} {"train_info/time_between_train_steps": 0.003126382827758789, "step": 952} {"info/global_step": 953, "train_info/time_within_train_step": 2.665045976638794, "step": 953} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 953} {"info/global_step": 954, "train_info/time_within_train_step": 2.6458182334899902, "step": 954} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 954} {"info/global_step": 955, "train_info/time_within_train_step": 2.641676187515259, "step": 955} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 955} {"info/global_step": 956, "train_info/time_within_train_step": 2.6667726039886475, "step": 956} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 956} {"info/global_step": 957, "train_info/time_within_train_step": 2.6480605602264404, "step": 957} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 957} {"info/global_step": 958, "train_info/time_within_train_step": 2.643324136734009, "step": 958} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 958} {"info/global_step": 959, "train_info/time_within_train_step": 2.6642892360687256, "step": 959} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 959} {"info/global_step": 960, "train_info/time_within_train_step": 2.641793966293335, "step": 960} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 960} {"info/global_step": 961, "train_info/time_within_train_step": 2.6663763523101807, "step": 961} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 961} {"info/global_step": 962, "train_info/time_within_train_step": 2.6422016620635986, "step": 962} {"train_info/time_between_train_steps": 0.003119945526123047, "step": 962} {"info/global_step": 963, "train_info/time_within_train_step": 2.643097400665283, "step": 963} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 963} {"info/global_step": 964, "train_info/time_within_train_step": 2.6553685665130615, "step": 964} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 964} {"info/global_step": 965, "train_info/time_within_train_step": 2.654785633087158, "step": 965} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 965} {"info/global_step": 966, "train_info/time_within_train_step": 2.6952452659606934, "step": 966} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 966} {"info/global_step": 967, "train_info/time_within_train_step": 2.717677593231201, "step": 967} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 967} {"info/global_step": 968, "train_info/time_within_train_step": 2.64208722114563, "step": 968} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 968} {"info/global_step": 969, "train_info/time_within_train_step": 2.640211343765259, "step": 969} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 969} {"info/global_step": 970, "train_info/time_within_train_step": 2.658278226852417, "step": 970} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 970} {"info/global_step": 971, "train_info/time_within_train_step": 2.6485490798950195, "step": 971} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 971} {"info/global_step": 972, "train_info/time_within_train_step": 2.648127794265747, "step": 972} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 972} {"info/global_step": 973, "train_info/time_within_train_step": 2.645427703857422, "step": 973} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 973} {"info/global_step": 974, "train_info/time_within_train_step": 2.645017623901367, "step": 974} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 974} {"info/global_step": 975, "train_info/time_within_train_step": 2.6645894050598145, "step": 975} {"train_info/time_between_train_steps": 0.003470182418823242, "step": 975} {"info/global_step": 976, "train_info/time_within_train_step": 2.6653237342834473, "step": 976} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 976} {"info/global_step": 977, "train_info/time_within_train_step": 2.7086374759674072, "step": 977} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 977} {"info/global_step": 978, "train_info/time_within_train_step": 2.6413004398345947, "step": 978} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 978} {"info/global_step": 979, "train_info/time_within_train_step": 2.654973030090332, "step": 979} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 979} {"info/global_step": 980, "train_info/time_within_train_step": 2.64638352394104, "step": 980} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 980} {"info/global_step": 981, "train_info/time_within_train_step": 2.6445651054382324, "step": 981} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 981} {"info/global_step": 982, "train_info/time_within_train_step": 2.6556475162506104, "step": 982} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 982} {"info/global_step": 983, "train_info/time_within_train_step": 2.6421971321105957, "step": 983} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 983} {"info/global_step": 984, "train_info/time_within_train_step": 2.6439146995544434, "step": 984} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 984} {"info/global_step": 985, "train_info/time_within_train_step": 2.670372247695923, "step": 985} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 985} {"info/global_step": 986, "train_info/time_within_train_step": 2.6619927883148193, "step": 986} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 986} {"info/global_step": 987, "train_info/time_within_train_step": 2.6746444702148438, "step": 987} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 987} {"info/global_step": 988, "train_info/time_within_train_step": 2.6633095741271973, "step": 988} {"train_info/time_between_train_steps": 0.1229546070098877, "step": 988} {"info/global_step": 989, "train_info/time_within_train_step": 2.6729307174682617, "step": 989} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 989} {"info/global_step": 990, "train_info/time_within_train_step": 2.668018102645874, "step": 990} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 990} {"info/global_step": 991, "train_info/time_within_train_step": 2.6483185291290283, "step": 991} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 991} {"info/global_step": 992, "train_info/time_within_train_step": 2.650257110595703, "step": 992} {"train_info/time_between_train_steps": 0.003134012222290039, "step": 992} {"info/global_step": 993, "train_info/time_within_train_step": 2.6486129760742188, "step": 993} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 993} {"info/global_step": 994, "train_info/time_within_train_step": 2.646172285079956, "step": 994} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 994} {"info/global_step": 995, "train_info/time_within_train_step": 2.6478936672210693, "step": 995} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 995} {"info/global_step": 996, "train_info/time_within_train_step": 2.65161395072937, "step": 996} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 996} {"info/global_step": 997, "train_info/time_within_train_step": 2.6648879051208496, "step": 997} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 997} {"info/global_step": 998, "train_info/time_within_train_step": 2.6602587699890137, "step": 998} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 998} {"info/global_step": 999, "train_info/time_within_train_step": 2.8957581520080566, "step": 999} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 999} {"info/global_step": 1000, "train_info/time_within_train_step": 3.0930933952331543, "step": 1000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 5350.0, "train_info/memory_max_reserved": 5350.0, "_timestamp": 1746900186, "_runtime": 2784}, "step": 1000} {"logs": {"train/loss": 4.9904, "train/learning_rate": 0.0006, "train/epoch": 1.01, "_timestamp": 1746900186, "_runtime": 2784}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746900191, "_runtime": 2789}, "step": 1000} {"logs": {"eval/loss": 5.356438159942627, "eval/runtime": 5.1939, "eval/samples_per_second": 36.966, "eval/steps_per_second": 1.155, "train/epoch": 1.01, "_timestamp": 1746900191, "_runtime": 2789}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746900191, "_runtime": 2789}, "step": 1000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 5.356438159942627, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 211.96860200268063, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1939, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.966, "train/epoch": 1.01, "_timestamp": 1746900191, "_runtime": 2789}, "step": 1000} {"train_info/time_between_train_steps": 18.606414794921875, "step": 1000} {"info/global_step": 1001, "train_info/time_within_train_step": 2.4472689628601074, "step": 1001} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 1001} {"info/global_step": 1002, "train_info/time_within_train_step": 2.4335765838623047, "step": 1002} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 1002} {"info/global_step": 1003, "train_info/time_within_train_step": 2.612456798553467, "step": 1003} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 1003} {"info/global_step": 1004, "train_info/time_within_train_step": 2.638897180557251, "step": 1004} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 1004} {"info/global_step": 1005, "train_info/time_within_train_step": 2.644315481185913, "step": 1005} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 1005} {"info/global_step": 1006, "train_info/time_within_train_step": 2.666828155517578, "step": 1006} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 1006} {"info/global_step": 1007, "train_info/time_within_train_step": 2.6844658851623535, "step": 1007} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 1007} {"info/global_step": 1008, "train_info/time_within_train_step": 2.667905330657959, "step": 1008} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 1008} {"info/global_step": 1009, "train_info/time_within_train_step": 2.6684443950653076, "step": 1009} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1009} {"info/global_step": 1010, "train_info/time_within_train_step": 2.64705753326416, "step": 1010} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1010} {"info/global_step": 1011, "train_info/time_within_train_step": 2.647733688354492, "step": 1011} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 1011} {"info/global_step": 1012, "train_info/time_within_train_step": 2.6630890369415283, "step": 1012} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 1012} {"info/global_step": 1013, "train_info/time_within_train_step": 2.6428987979888916, "step": 1013} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 1013} {"info/global_step": 1014, "train_info/time_within_train_step": 2.6430439949035645, "step": 1014} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 1014} {"info/global_step": 1015, "train_info/time_within_train_step": 2.655778408050537, "step": 1015} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 1015} {"info/global_step": 1016, "train_info/time_within_train_step": 2.6610186100006104, "step": 1016} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 1016} {"info/global_step": 1017, "train_info/time_within_train_step": 2.6736812591552734, "step": 1017} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 1017} {"info/global_step": 1018, "train_info/time_within_train_step": 2.6423699855804443, "step": 1018} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 1018} {"info/global_step": 1019, "train_info/time_within_train_step": 2.649021625518799, "step": 1019} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 1019} {"info/global_step": 1020, "train_info/time_within_train_step": 2.6628098487854004, "step": 1020} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 1020} {"info/global_step": 1021, "train_info/time_within_train_step": 2.6412806510925293, "step": 1021} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1021} {"info/global_step": 1022, "train_info/time_within_train_step": 2.6461262702941895, "step": 1022} {"train_info/time_between_train_steps": 0.003368854522705078, "step": 1022} {"info/global_step": 1023, "train_info/time_within_train_step": 2.6498920917510986, "step": 1023} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 1023} {"info/global_step": 1024, "train_info/time_within_train_step": 2.653266668319702, "step": 1024} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1024} {"info/global_step": 1025, "train_info/time_within_train_step": 2.6581616401672363, "step": 1025} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 1025} {"info/global_step": 1026, "train_info/time_within_train_step": 2.6758410930633545, "step": 1026} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 1026} {"info/global_step": 1027, "train_info/time_within_train_step": 2.7294118404388428, "step": 1027} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 1027} {"info/global_step": 1028, "train_info/time_within_train_step": 2.6647868156433105, "step": 1028} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 1028} {"info/global_step": 1029, "train_info/time_within_train_step": 2.6414759159088135, "step": 1029} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 1029} {"info/global_step": 1030, "train_info/time_within_train_step": 2.64530611038208, "step": 1030} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 1030} {"info/global_step": 1031, "train_info/time_within_train_step": 2.6525797843933105, "step": 1031} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 1031} {"info/global_step": 1032, "train_info/time_within_train_step": 2.6536927223205566, "step": 1032} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 1032} {"info/global_step": 1033, "train_info/time_within_train_step": 2.6448121070861816, "step": 1033} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 1033} {"info/global_step": 1034, "train_info/time_within_train_step": 2.650221824645996, "step": 1034} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 1034} {"info/global_step": 1035, "train_info/time_within_train_step": 2.6578924655914307, "step": 1035} {"train_info/time_between_train_steps": 0.003423452377319336, "step": 1035} {"info/global_step": 1036, "train_info/time_within_train_step": 2.6685638427734375, "step": 1036} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 1036} {"info/global_step": 1037, "train_info/time_within_train_step": 2.7239575386047363, "step": 1037} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 1037} {"info/global_step": 1038, "train_info/time_within_train_step": 2.6563968658447266, "step": 1038} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 1038} {"info/global_step": 1039, "train_info/time_within_train_step": 2.665098190307617, "step": 1039} {"train_info/time_between_train_steps": 0.003473997116088867, "step": 1039} {"info/global_step": 1040, "train_info/time_within_train_step": 2.6397645473480225, "step": 1040} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 1040} {"info/global_step": 1041, "train_info/time_within_train_step": 2.6539700031280518, "step": 1041} {"train_info/time_between_train_steps": 0.0031290054321289062, "step": 1041} {"info/global_step": 1042, "train_info/time_within_train_step": 2.661614179611206, "step": 1042} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 1042} {"info/global_step": 1043, "train_info/time_within_train_step": 2.64184308052063, "step": 1043} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 1043} {"info/global_step": 1044, "train_info/time_within_train_step": 2.6429827213287354, "step": 1044} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 1044} {"info/global_step": 1045, "train_info/time_within_train_step": 2.6639578342437744, "step": 1045} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 1045} {"info/global_step": 1046, "train_info/time_within_train_step": 2.6682815551757812, "step": 1046} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 1046} {"info/global_step": 1047, "train_info/time_within_train_step": 2.685713291168213, "step": 1047} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 1047} {"info/global_step": 1048, "train_info/time_within_train_step": 2.6507349014282227, "step": 1048} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 1048} {"info/global_step": 1049, "train_info/time_within_train_step": 2.6785545349121094, "step": 1049} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 1049} {"info/global_step": 1050, "train_info/time_within_train_step": 2.639496326446533, "step": 1050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746900338, "_runtime": 2936}, "step": 1050} {"logs": {"train/loss": 4.9272, "train/learning_rate": 0.0005966666666666667, "train/epoch": 1.02, "_timestamp": 1746900338, "_runtime": 2936}, "step": 1050} {"train_info/time_between_train_steps": 0.02472686767578125, "step": 1050} {"info/global_step": 1051, "train_info/time_within_train_step": 2.7671620845794678, "step": 1051} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 1051} {"info/global_step": 1052, "train_info/time_within_train_step": 2.641792058944702, "step": 1052} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 1052} {"info/global_step": 1053, "train_info/time_within_train_step": 2.8906750679016113, "step": 1053} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 1053} {"info/global_step": 1054, "train_info/time_within_train_step": 2.6502065658569336, "step": 1054} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 1054} {"info/global_step": 1055, "train_info/time_within_train_step": 2.6423587799072266, "step": 1055} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 1055} {"info/global_step": 1056, "train_info/time_within_train_step": 2.646456003189087, "step": 1056} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 1056} {"info/global_step": 1057, "train_info/time_within_train_step": 2.645915985107422, "step": 1057} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 1057} {"info/global_step": 1058, "train_info/time_within_train_step": 2.661412000656128, "step": 1058} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 1058} {"info/global_step": 1059, "train_info/time_within_train_step": 2.6631524562835693, "step": 1059} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 1059} {"info/global_step": 1060, "train_info/time_within_train_step": 2.6576061248779297, "step": 1060} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 1060} {"info/global_step": 1061, "train_info/time_within_train_step": 2.7082691192626953, "step": 1061} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 1061} {"info/global_step": 1062, "train_info/time_within_train_step": 2.6411290168762207, "step": 1062} {"train_info/time_between_train_steps": 0.003271341323852539, "step": 1062} {"info/global_step": 1063, "train_info/time_within_train_step": 2.639803886413574, "step": 1063} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 1063} {"info/global_step": 1064, "train_info/time_within_train_step": 2.6578259468078613, "step": 1064} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 1064} {"info/global_step": 1065, "train_info/time_within_train_step": 2.652765989303589, "step": 1065} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 1065} {"info/global_step": 1066, "train_info/time_within_train_step": 2.6434004306793213, "step": 1066} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 1066} {"info/global_step": 1067, "train_info/time_within_train_step": 2.660282611846924, "step": 1067} {"train_info/time_between_train_steps": 0.003521442413330078, "step": 1067} {"info/global_step": 1068, "train_info/time_within_train_step": 2.6513867378234863, "step": 1068} {"train_info/time_between_train_steps": 0.003531217575073242, "step": 1068} {"info/global_step": 1069, "train_info/time_within_train_step": 2.665142297744751, "step": 1069} {"train_info/time_between_train_steps": 0.0035407543182373047, "step": 1069} {"info/global_step": 1070, "train_info/time_within_train_step": 2.7215576171875, "step": 1070} {"train_info/time_between_train_steps": 0.0036382675170898438, "step": 1070} {"info/global_step": 1071, "train_info/time_within_train_step": 2.68918776512146, "step": 1071} {"train_info/time_between_train_steps": 0.003537893295288086, "step": 1071} {"info/global_step": 1072, "train_info/time_within_train_step": 2.6409473419189453, "step": 1072} {"train_info/time_between_train_steps": 0.0037581920623779297, "step": 1072} {"info/global_step": 1073, "train_info/time_within_train_step": 2.6423511505126953, "step": 1073} {"train_info/time_between_train_steps": 0.0036869049072265625, "step": 1073} {"info/global_step": 1074, "train_info/time_within_train_step": 2.661257028579712, "step": 1074} {"train_info/time_between_train_steps": 0.0036253929138183594, "step": 1074} {"info/global_step": 1075, "train_info/time_within_train_step": 2.655406951904297, "step": 1075} {"train_info/time_between_train_steps": 0.003676176071166992, "step": 1075} {"info/global_step": 1076, "train_info/time_within_train_step": 2.644139051437378, "step": 1076} {"train_info/time_between_train_steps": 0.0036504268646240234, "step": 1076} {"info/global_step": 1077, "train_info/time_within_train_step": 2.652179479598999, "step": 1077} {"train_info/time_between_train_steps": 0.0036230087280273438, "step": 1077} {"info/global_step": 1078, "train_info/time_within_train_step": 2.651282548904419, "step": 1078} {"train_info/time_between_train_steps": 0.0037441253662109375, "step": 1078} {"info/global_step": 1079, "train_info/time_within_train_step": 2.6702957153320312, "step": 1079} {"train_info/time_between_train_steps": 0.003655672073364258, "step": 1079} {"info/global_step": 1080, "train_info/time_within_train_step": 2.710885524749756, "step": 1080} {"train_info/time_between_train_steps": 0.0035581588745117188, "step": 1080} {"info/global_step": 1081, "train_info/time_within_train_step": 2.6467790603637695, "step": 1081} {"train_info/time_between_train_steps": 0.003561735153198242, "step": 1081} {"info/global_step": 1082, "train_info/time_within_train_step": 2.662130355834961, "step": 1082} {"train_info/time_between_train_steps": 0.003664255142211914, "step": 1082} {"info/global_step": 1083, "train_info/time_within_train_step": 2.6566855907440186, "step": 1083} {"train_info/time_between_train_steps": 0.003612041473388672, "step": 1083} {"info/global_step": 1084, "train_info/time_within_train_step": 2.6440956592559814, "step": 1084} {"train_info/time_between_train_steps": 0.003556966781616211, "step": 1084} {"info/global_step": 1085, "train_info/time_within_train_step": 2.6450390815734863, "step": 1085} {"train_info/time_between_train_steps": 0.0035812854766845703, "step": 1085} {"info/global_step": 1086, "train_info/time_within_train_step": 2.6709392070770264, "step": 1086} {"train_info/time_between_train_steps": 0.0036318302154541016, "step": 1086} {"info/global_step": 1087, "train_info/time_within_train_step": 2.6649961471557617, "step": 1087} {"train_info/time_between_train_steps": 0.003653287887573242, "step": 1087} {"info/global_step": 1088, "train_info/time_within_train_step": 2.6693360805511475, "step": 1088} {"train_info/time_between_train_steps": 0.0036640167236328125, "step": 1088} {"info/global_step": 1089, "train_info/time_within_train_step": 2.6697957515716553, "step": 1089} {"train_info/time_between_train_steps": 0.0035538673400878906, "step": 1089} {"info/global_step": 1090, "train_info/time_within_train_step": 2.646778106689453, "step": 1090} {"train_info/time_between_train_steps": 0.003571033477783203, "step": 1090} {"info/global_step": 1091, "train_info/time_within_train_step": 2.6543309688568115, "step": 1091} {"train_info/time_between_train_steps": 0.0034956932067871094, "step": 1091} {"info/global_step": 1092, "train_info/time_within_train_step": 2.6495683193206787, "step": 1092} {"train_info/time_between_train_steps": 0.003584146499633789, "step": 1092} {"info/global_step": 1093, "train_info/time_within_train_step": 2.6465377807617188, "step": 1093} {"train_info/time_between_train_steps": 0.0035486221313476562, "step": 1093} {"info/global_step": 1094, "train_info/time_within_train_step": 3.0088157653808594, "step": 1094} {"train_info/time_between_train_steps": 0.003477811813354492, "step": 1094} {"info/global_step": 1095, "train_info/time_within_train_step": 2.6499643325805664, "step": 1095} {"train_info/time_between_train_steps": 0.003438234329223633, "step": 1095} {"info/global_step": 1096, "train_info/time_within_train_step": 2.6513867378234863, "step": 1096} {"train_info/time_between_train_steps": 0.0035905838012695312, "step": 1096} {"info/global_step": 1097, "train_info/time_within_train_step": 2.6475069522857666, "step": 1097} {"train_info/time_between_train_steps": 0.0034797191619873047, "step": 1097} {"info/global_step": 1098, "train_info/time_within_train_step": 2.6503915786743164, "step": 1098} {"train_info/time_between_train_steps": 0.0038094520568847656, "step": 1098} {"info/global_step": 1099, "train_info/time_within_train_step": 2.6470224857330322, "step": 1099} {"train_info/time_between_train_steps": 0.003535032272338867, "step": 1099} {"info/global_step": 1100, "train_info/time_within_train_step": 2.6454999446868896, "step": 1100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746900473, "_runtime": 3071}, "step": 1100} {"logs": {"train/loss": 4.8651, "train/learning_rate": 0.0005933333333333333, "train/epoch": 1.02, "_timestamp": 1746900473, "_runtime": 3071}, "step": 1100} {"train_info/time_between_train_steps": 0.02470564842224121, "step": 1100} {"info/global_step": 1101, "train_info/time_within_train_step": 2.6552181243896484, "step": 1101} {"train_info/time_between_train_steps": 0.0035865306854248047, "step": 1101} {"info/global_step": 1102, "train_info/time_within_train_step": 2.679750919342041, "step": 1102} {"train_info/time_between_train_steps": 0.0034978389739990234, "step": 1102} {"info/global_step": 1103, "train_info/time_within_train_step": 2.6657865047454834, "step": 1103} {"train_info/time_between_train_steps": 0.00362396240234375, "step": 1103} {"info/global_step": 1104, "train_info/time_within_train_step": 2.674875020980835, "step": 1104} {"train_info/time_between_train_steps": 0.0035600662231445312, "step": 1104} {"info/global_step": 1105, "train_info/time_within_train_step": 2.7039895057678223, "step": 1105} {"train_info/time_between_train_steps": 0.003434419631958008, "step": 1105} {"info/global_step": 1106, "train_info/time_within_train_step": 2.6494266986846924, "step": 1106} {"train_info/time_between_train_steps": 0.0034821033477783203, "step": 1106} {"info/global_step": 1107, "train_info/time_within_train_step": 2.648362398147583, "step": 1107} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 1107} {"info/global_step": 1108, "train_info/time_within_train_step": 2.6505987644195557, "step": 1108} {"train_info/time_between_train_steps": 0.0035316944122314453, "step": 1108} {"info/global_step": 1109, "train_info/time_within_train_step": 2.6481666564941406, "step": 1109} {"train_info/time_between_train_steps": 0.0035355091094970703, "step": 1109} {"info/global_step": 1110, "train_info/time_within_train_step": 2.648733139038086, "step": 1110} {"train_info/time_between_train_steps": 0.003439188003540039, "step": 1110} {"info/global_step": 1111, "train_info/time_within_train_step": 2.6467928886413574, "step": 1111} {"train_info/time_between_train_steps": 0.0034923553466796875, "step": 1111} {"info/global_step": 1112, "train_info/time_within_train_step": 2.642199754714966, "step": 1112} {"train_info/time_between_train_steps": 0.0035696029663085938, "step": 1112} {"info/global_step": 1113, "train_info/time_within_train_step": 2.6504499912261963, "step": 1113} {"train_info/time_between_train_steps": 0.18081974983215332, "step": 1113} {"info/global_step": 1114, "train_info/time_within_train_step": 2.648519277572632, "step": 1114} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 1114} {"info/global_step": 1115, "train_info/time_within_train_step": 2.6458659172058105, "step": 1115} {"train_info/time_between_train_steps": 0.0034694671630859375, "step": 1115} {"info/global_step": 1116, "train_info/time_within_train_step": 2.644186019897461, "step": 1116} {"train_info/time_between_train_steps": 0.0036656856536865234, "step": 1116} {"info/global_step": 1117, "train_info/time_within_train_step": 2.645517349243164, "step": 1117} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 1117} {"info/global_step": 1118, "train_info/time_within_train_step": 2.6440470218658447, "step": 1118} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 1118} {"info/global_step": 1119, "train_info/time_within_train_step": 2.642868757247925, "step": 1119} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 1119} {"info/global_step": 1120, "train_info/time_within_train_step": 2.6695327758789062, "step": 1120} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 1120} {"info/global_step": 1121, "train_info/time_within_train_step": 2.6654675006866455, "step": 1121} {"train_info/time_between_train_steps": 0.003452301025390625, "step": 1121} {"info/global_step": 1122, "train_info/time_within_train_step": 2.642160654067993, "step": 1122} {"train_info/time_between_train_steps": 0.0034198760986328125, "step": 1122} {"info/global_step": 1123, "train_info/time_within_train_step": 2.669421911239624, "step": 1123} {"train_info/time_between_train_steps": 0.0034627914428710938, "step": 1123} {"info/global_step": 1124, "train_info/time_within_train_step": 2.6449010372161865, "step": 1124} {"train_info/time_between_train_steps": 0.003427743911743164, "step": 1124} {"info/global_step": 1125, "train_info/time_within_train_step": 2.6552767753601074, "step": 1125} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 1125} {"info/global_step": 1126, "train_info/time_within_train_step": 2.6580874919891357, "step": 1126} {"train_info/time_between_train_steps": 0.003448486328125, "step": 1126} {"info/global_step": 1127, "train_info/time_within_train_step": 2.654618978500366, "step": 1127} {"train_info/time_between_train_steps": 0.003512144088745117, "step": 1127} {"info/global_step": 1128, "train_info/time_within_train_step": 2.664477586746216, "step": 1128} {"train_info/time_between_train_steps": 0.0034797191619873047, "step": 1128} {"info/global_step": 1129, "train_info/time_within_train_step": 2.6656434535980225, "step": 1129} {"train_info/time_between_train_steps": 0.0035247802734375, "step": 1129} {"info/global_step": 1130, "train_info/time_within_train_step": 2.7246274948120117, "step": 1130} {"train_info/time_between_train_steps": 0.003554105758666992, "step": 1130} {"info/global_step": 1131, "train_info/time_within_train_step": 2.670246124267578, "step": 1131} {"train_info/time_between_train_steps": 0.003505706787109375, "step": 1131} {"info/global_step": 1132, "train_info/time_within_train_step": 2.639669418334961, "step": 1132} {"train_info/time_between_train_steps": 0.0034432411193847656, "step": 1132} {"info/global_step": 1133, "train_info/time_within_train_step": 2.6433823108673096, "step": 1133} {"train_info/time_between_train_steps": 0.0034780502319335938, "step": 1133} {"info/global_step": 1134, "train_info/time_within_train_step": 2.6549394130706787, "step": 1134} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 1134} {"info/global_step": 1135, "train_info/time_within_train_step": 2.6531457901000977, "step": 1135} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 1135} {"info/global_step": 1136, "train_info/time_within_train_step": 2.641610622406006, "step": 1136} {"train_info/time_between_train_steps": 0.003424406051635742, "step": 1136} {"info/global_step": 1137, "train_info/time_within_train_step": 2.6481266021728516, "step": 1137} {"train_info/time_between_train_steps": 0.0034928321838378906, "step": 1137} {"info/global_step": 1138, "train_info/time_within_train_step": 2.653714179992676, "step": 1138} {"train_info/time_between_train_steps": 0.0033915042877197266, "step": 1138} {"info/global_step": 1139, "train_info/time_within_train_step": 2.6498634815216064, "step": 1139} {"train_info/time_between_train_steps": 0.003912210464477539, "step": 1139} {"info/global_step": 1140, "train_info/time_within_train_step": 2.6513590812683105, "step": 1140} {"train_info/time_between_train_steps": 0.004173755645751953, "step": 1140} {"info/global_step": 1141, "train_info/time_within_train_step": 2.6501009464263916, "step": 1141} {"train_info/time_between_train_steps": 0.004178047180175781, "step": 1141} {"info/global_step": 1142, "train_info/time_within_train_step": 2.6468451023101807, "step": 1142} {"train_info/time_between_train_steps": 0.003810405731201172, "step": 1142} {"info/global_step": 1143, "train_info/time_within_train_step": 2.672826051712036, "step": 1143} {"train_info/time_between_train_steps": 0.003928184509277344, "step": 1143} {"info/global_step": 1144, "train_info/time_within_train_step": 2.6669840812683105, "step": 1144} {"train_info/time_between_train_steps": 0.003883838653564453, "step": 1144} {"info/global_step": 1145, "train_info/time_within_train_step": 2.673710346221924, "step": 1145} {"train_info/time_between_train_steps": 0.003812074661254883, "step": 1145} {"info/global_step": 1146, "train_info/time_within_train_step": 2.667508602142334, "step": 1146} {"train_info/time_between_train_steps": 0.0038864612579345703, "step": 1146} {"info/global_step": 1147, "train_info/time_within_train_step": 2.650956630706787, "step": 1147} {"train_info/time_between_train_steps": 0.0038449764251708984, "step": 1147} {"info/global_step": 1148, "train_info/time_within_train_step": 2.649851083755493, "step": 1148} {"train_info/time_between_train_steps": 0.0040585994720458984, "step": 1148} {"info/global_step": 1149, "train_info/time_within_train_step": 2.649308919906616, "step": 1149} {"train_info/time_between_train_steps": 0.003895282745361328, "step": 1149} {"info/global_step": 1150, "train_info/time_within_train_step": 2.653526782989502, "step": 1150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746900608, "_runtime": 3206}, "step": 1150} {"logs": {"train/loss": 4.8154, "train/learning_rate": 0.0005899999999999999, "train/epoch": 1.03, "_timestamp": 1746900608, "_runtime": 3206}, "step": 1150} {"train_info/time_between_train_steps": 0.02542901039123535, "step": 1150} {"info/global_step": 1151, "train_info/time_within_train_step": 2.6451711654663086, "step": 1151} {"train_info/time_between_train_steps": 0.003702402114868164, "step": 1151} {"info/global_step": 1152, "train_info/time_within_train_step": 2.644782543182373, "step": 1152} {"train_info/time_between_train_steps": 0.004019260406494141, "step": 1152} {"info/global_step": 1153, "train_info/time_within_train_step": 2.6576969623565674, "step": 1153} {"train_info/time_between_train_steps": 0.003868579864501953, "step": 1153} {"info/global_step": 1154, "train_info/time_within_train_step": 2.7129998207092285, "step": 1154} {"train_info/time_between_train_steps": 0.003717184066772461, "step": 1154} {"info/global_step": 1155, "train_info/time_within_train_step": 2.661001682281494, "step": 1155} {"train_info/time_between_train_steps": 0.0040929317474365234, "step": 1155} {"info/global_step": 1156, "train_info/time_within_train_step": 2.6463301181793213, "step": 1156} {"train_info/time_between_train_steps": 0.003766775131225586, "step": 1156} {"info/global_step": 1157, "train_info/time_within_train_step": 2.6432018280029297, "step": 1157} {"train_info/time_between_train_steps": 0.0038313865661621094, "step": 1157} {"info/global_step": 1158, "train_info/time_within_train_step": 2.658997058868408, "step": 1158} {"train_info/time_between_train_steps": 0.0038242340087890625, "step": 1158} {"info/global_step": 1159, "train_info/time_within_train_step": 2.653737783432007, "step": 1159} {"train_info/time_between_train_steps": 0.003875255584716797, "step": 1159} {"info/global_step": 1160, "train_info/time_within_train_step": 2.648336410522461, "step": 1160} {"train_info/time_between_train_steps": 0.0038428306579589844, "step": 1160} {"info/global_step": 1161, "train_info/time_within_train_step": 2.6616334915161133, "step": 1161} {"train_info/time_between_train_steps": 0.0036690235137939453, "step": 1161} {"info/global_step": 1162, "train_info/time_within_train_step": 2.6581335067749023, "step": 1162} {"train_info/time_between_train_steps": 0.0037827491760253906, "step": 1162} {"info/global_step": 1163, "train_info/time_within_train_step": 2.6612277030944824, "step": 1163} {"train_info/time_between_train_steps": 0.00400996208190918, "step": 1163} {"info/global_step": 1164, "train_info/time_within_train_step": 2.6936426162719727, "step": 1164} {"train_info/time_between_train_steps": 0.0037987232208251953, "step": 1164} {"info/global_step": 1165, "train_info/time_within_train_step": 2.72590708732605, "step": 1165} {"train_info/time_between_train_steps": 0.0038604736328125, "step": 1165} {"info/global_step": 1166, "train_info/time_within_train_step": 2.6564719676971436, "step": 1166} {"train_info/time_between_train_steps": 0.003775358200073242, "step": 1166} {"info/global_step": 1167, "train_info/time_within_train_step": 2.6423442363739014, "step": 1167} {"train_info/time_between_train_steps": 0.003762960433959961, "step": 1167} {"info/global_step": 1168, "train_info/time_within_train_step": 2.6523232460021973, "step": 1168} {"train_info/time_between_train_steps": 0.0038499832153320312, "step": 1168} {"info/global_step": 1169, "train_info/time_within_train_step": 2.6694869995117188, "step": 1169} {"train_info/time_between_train_steps": 0.0036416053771972656, "step": 1169} {"info/global_step": 1170, "train_info/time_within_train_step": 2.6584279537200928, "step": 1170} {"train_info/time_between_train_steps": 0.003640413284301758, "step": 1170} {"info/global_step": 1171, "train_info/time_within_train_step": 2.649433135986328, "step": 1171} {"train_info/time_between_train_steps": 0.0037298202514648438, "step": 1171} {"info/global_step": 1172, "train_info/time_within_train_step": 2.6456122398376465, "step": 1172} {"train_info/time_between_train_steps": 0.0037431716918945312, "step": 1172} {"info/global_step": 1173, "train_info/time_within_train_step": 2.667335271835327, "step": 1173} {"train_info/time_between_train_steps": 0.00363922119140625, "step": 1173} {"info/global_step": 1174, "train_info/time_within_train_step": 2.666687488555908, "step": 1174} {"train_info/time_between_train_steps": 0.003446340560913086, "step": 1174} {"info/global_step": 1175, "train_info/time_within_train_step": 2.711561918258667, "step": 1175} {"train_info/time_between_train_steps": 0.0036079883575439453, "step": 1175} {"info/global_step": 1176, "train_info/time_within_train_step": 2.810025930404663, "step": 1176} {"train_info/time_between_train_steps": 0.0033223628997802734, "step": 1176} {"info/global_step": 1177, "train_info/time_within_train_step": 2.6855053901672363, "step": 1177} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 1177} {"info/global_step": 1178, "train_info/time_within_train_step": 2.6774165630340576, "step": 1178} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 1178} {"info/global_step": 1179, "train_info/time_within_train_step": 2.658233880996704, "step": 1179} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 1179} {"info/global_step": 1180, "train_info/time_within_train_step": 2.6451010704040527, "step": 1180} {"train_info/time_between_train_steps": 0.0033063888549804688, "step": 1180} {"info/global_step": 1181, "train_info/time_within_train_step": 2.670438766479492, "step": 1181} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 1181} {"info/global_step": 1182, "train_info/time_within_train_step": 2.6641364097595215, "step": 1182} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 1182} {"info/global_step": 1183, "train_info/time_within_train_step": 2.684265375137329, "step": 1183} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 1183} {"info/global_step": 1184, "train_info/time_within_train_step": 2.6567604541778564, "step": 1184} {"train_info/time_between_train_steps": 0.003312349319458008, "step": 1184} {"info/global_step": 1185, "train_info/time_within_train_step": 2.659668207168579, "step": 1185} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 1185} {"info/global_step": 1186, "train_info/time_within_train_step": 2.6471498012542725, "step": 1186} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 1186} {"info/global_step": 1187, "train_info/time_within_train_step": 2.6434853076934814, "step": 1187} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 1187} {"info/global_step": 1188, "train_info/time_within_train_step": 3.0205883979797363, "step": 1188} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 1188} {"info/global_step": 1189, "train_info/time_within_train_step": 2.6522674560546875, "step": 1189} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 1189} {"info/global_step": 1190, "train_info/time_within_train_step": 2.6714282035827637, "step": 1190} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 1190} {"info/global_step": 1191, "train_info/time_within_train_step": 2.640172243118286, "step": 1191} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 1191} {"info/global_step": 1192, "train_info/time_within_train_step": 2.6412088871002197, "step": 1192} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 1192} {"info/global_step": 1193, "train_info/time_within_train_step": 2.686394691467285, "step": 1193} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 1193} {"info/global_step": 1194, "train_info/time_within_train_step": 2.6417651176452637, "step": 1194} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 1194} {"info/global_step": 1195, "train_info/time_within_train_step": 2.6528754234313965, "step": 1195} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 1195} {"info/global_step": 1196, "train_info/time_within_train_step": 2.6466360092163086, "step": 1196} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 1196} {"info/global_step": 1197, "train_info/time_within_train_step": 2.662834405899048, "step": 1197} {"train_info/time_between_train_steps": 0.0032355785369873047, "step": 1197} {"info/global_step": 1198, "train_info/time_within_train_step": 2.659907341003418, "step": 1198} {"train_info/time_between_train_steps": 0.00323486328125, "step": 1198} {"info/global_step": 1199, "train_info/time_within_train_step": 2.6553127765655518, "step": 1199} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 1199} {"info/global_step": 1200, "train_info/time_within_train_step": 2.7060530185699463, "step": 1200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746900743, "_runtime": 3341}, "step": 1200} {"logs": {"train/loss": 4.7609, "train/learning_rate": 0.0005866666666666665, "train/epoch": 1.03, "_timestamp": 1746900743, "_runtime": 3341}, "step": 1200} {"train_info/time_between_train_steps": 14.246984243392944, "step": 1200} {"info/global_step": 1201, "train_info/time_within_train_step": 2.4292752742767334, "step": 1201} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 1201} {"info/global_step": 1202, "train_info/time_within_train_step": 2.464423179626465, "step": 1202} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 1202} {"info/global_step": 1203, "train_info/time_within_train_step": 2.628488063812256, "step": 1203} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 1203} {"info/global_step": 1204, "train_info/time_within_train_step": 2.638899326324463, "step": 1204} {"train_info/time_between_train_steps": 0.0032830238342285156, "step": 1204} {"info/global_step": 1205, "train_info/time_within_train_step": 2.6505346298217773, "step": 1205} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 1205} {"info/global_step": 1206, "train_info/time_within_train_step": 2.6469595432281494, "step": 1206} {"train_info/time_between_train_steps": 0.0033080577850341797, "step": 1206} {"info/global_step": 1207, "train_info/time_within_train_step": 2.6670830249786377, "step": 1207} {"train_info/time_between_train_steps": 0.0035905838012695312, "step": 1207} {"info/global_step": 1208, "train_info/time_within_train_step": 2.6965606212615967, "step": 1208} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 1208} {"info/global_step": 1209, "train_info/time_within_train_step": 2.656702756881714, "step": 1209} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1209} {"info/global_step": 1210, "train_info/time_within_train_step": 2.6655166149139404, "step": 1210} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 1210} {"info/global_step": 1211, "train_info/time_within_train_step": 2.641301393508911, "step": 1211} {"train_info/time_between_train_steps": 0.0033254623413085938, "step": 1211} {"info/global_step": 1212, "train_info/time_within_train_step": 2.6449668407440186, "step": 1212} {"train_info/time_between_train_steps": 0.0035376548767089844, "step": 1212} {"info/global_step": 1213, "train_info/time_within_train_step": 2.644846200942993, "step": 1213} {"train_info/time_between_train_steps": 0.0035898685455322266, "step": 1213} {"info/global_step": 1214, "train_info/time_within_train_step": 2.6503522396087646, "step": 1214} {"train_info/time_between_train_steps": 0.003545045852661133, "step": 1214} {"info/global_step": 1215, "train_info/time_within_train_step": 2.6722381114959717, "step": 1215} {"train_info/time_between_train_steps": 0.0036482810974121094, "step": 1215} {"info/global_step": 1216, "train_info/time_within_train_step": 2.669795274734497, "step": 1216} {"train_info/time_between_train_steps": 0.0035996437072753906, "step": 1216} {"info/global_step": 1217, "train_info/time_within_train_step": 2.64943265914917, "step": 1217} {"train_info/time_between_train_steps": 0.0038046836853027344, "step": 1217} {"info/global_step": 1218, "train_info/time_within_train_step": 2.6791768074035645, "step": 1218} {"train_info/time_between_train_steps": 0.004122257232666016, "step": 1218} {"info/global_step": 1219, "train_info/time_within_train_step": 2.644054651260376, "step": 1219} {"train_info/time_between_train_steps": 0.00376129150390625, "step": 1219} {"info/global_step": 1220, "train_info/time_within_train_step": 2.650718927383423, "step": 1220} {"train_info/time_between_train_steps": 0.0036787986755371094, "step": 1220} {"info/global_step": 1221, "train_info/time_within_train_step": 2.6631720066070557, "step": 1221} {"train_info/time_between_train_steps": 0.003741025924682617, "step": 1221} {"info/global_step": 1222, "train_info/time_within_train_step": 2.6480836868286133, "step": 1222} {"train_info/time_between_train_steps": 0.003666400909423828, "step": 1222} {"info/global_step": 1223, "train_info/time_within_train_step": 2.64693284034729, "step": 1223} {"train_info/time_between_train_steps": 0.003881216049194336, "step": 1223} {"info/global_step": 1224, "train_info/time_within_train_step": 2.658369779586792, "step": 1224} {"train_info/time_between_train_steps": 0.0038115978240966797, "step": 1224} {"info/global_step": 1225, "train_info/time_within_train_step": 2.663001298904419, "step": 1225} {"train_info/time_between_train_steps": 0.00380706787109375, "step": 1225} {"info/global_step": 1226, "train_info/time_within_train_step": 2.67681884765625, "step": 1226} {"train_info/time_between_train_steps": 0.003737211227416992, "step": 1226} {"info/global_step": 1227, "train_info/time_within_train_step": 2.668363332748413, "step": 1227} {"train_info/time_between_train_steps": 0.0037338733673095703, "step": 1227} {"info/global_step": 1228, "train_info/time_within_train_step": 2.7070908546447754, "step": 1228} {"train_info/time_between_train_steps": 0.003679513931274414, "step": 1228} {"info/global_step": 1229, "train_info/time_within_train_step": 2.643761396408081, "step": 1229} {"train_info/time_between_train_steps": 0.0036172866821289062, "step": 1229} {"info/global_step": 1230, "train_info/time_within_train_step": 2.6488747596740723, "step": 1230} {"train_info/time_between_train_steps": 0.0036389827728271484, "step": 1230} {"info/global_step": 1231, "train_info/time_within_train_step": 2.67893123626709, "step": 1231} {"train_info/time_between_train_steps": 0.0036826133728027344, "step": 1231} {"info/global_step": 1232, "train_info/time_within_train_step": 2.648090362548828, "step": 1232} {"train_info/time_between_train_steps": 0.0035943984985351562, "step": 1232} {"info/global_step": 1233, "train_info/time_within_train_step": 3.05472731590271, "step": 1233} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 1233} {"info/global_step": 1234, "train_info/time_within_train_step": 2.707407236099243, "step": 1234} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 1234} {"info/global_step": 1235, "train_info/time_within_train_step": 2.651057004928589, "step": 1235} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 1235} {"info/global_step": 1236, "train_info/time_within_train_step": 2.6483781337738037, "step": 1236} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 1236} {"info/global_step": 1237, "train_info/time_within_train_step": 2.6567165851593018, "step": 1237} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 1237} {"info/global_step": 1238, "train_info/time_within_train_step": 2.6442618370056152, "step": 1238} {"train_info/time_between_train_steps": 0.1456754207611084, "step": 1238} {"info/global_step": 1239, "train_info/time_within_train_step": 2.65775728225708, "step": 1239} {"train_info/time_between_train_steps": 0.003391265869140625, "step": 1239} {"info/global_step": 1240, "train_info/time_within_train_step": 2.6429929733276367, "step": 1240} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 1240} {"info/global_step": 1241, "train_info/time_within_train_step": 2.6459529399871826, "step": 1241} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 1241} {"info/global_step": 1242, "train_info/time_within_train_step": 2.6497323513031006, "step": 1242} {"train_info/time_between_train_steps": 0.0034019947052001953, "step": 1242} {"info/global_step": 1243, "train_info/time_within_train_step": 2.6537065505981445, "step": 1243} {"train_info/time_between_train_steps": 0.0033419132232666016, "step": 1243} {"info/global_step": 1244, "train_info/time_within_train_step": 2.659329891204834, "step": 1244} {"train_info/time_between_train_steps": 0.003365039825439453, "step": 1244} {"info/global_step": 1245, "train_info/time_within_train_step": 2.6909029483795166, "step": 1245} {"train_info/time_between_train_steps": 0.003495454788208008, "step": 1245} {"info/global_step": 1246, "train_info/time_within_train_step": 2.7287633419036865, "step": 1246} {"train_info/time_between_train_steps": 0.003498077392578125, "step": 1246} {"info/global_step": 1247, "train_info/time_within_train_step": 2.649566888809204, "step": 1247} {"train_info/time_between_train_steps": 0.003576040267944336, "step": 1247} {"info/global_step": 1248, "train_info/time_within_train_step": 2.6420388221740723, "step": 1248} {"train_info/time_between_train_steps": 0.0034952163696289062, "step": 1248} {"info/global_step": 1249, "train_info/time_within_train_step": 2.6560049057006836, "step": 1249} {"train_info/time_between_train_steps": 0.003551006317138672, "step": 1249} {"info/global_step": 1250, "train_info/time_within_train_step": 3.1771812438964844, "step": 1250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746900892, "_runtime": 3490}, "step": 1250} {"logs": {"train/loss": 4.7109, "train/learning_rate": 0.0005833333333333333, "train/epoch": 1.04, "_timestamp": 1746900892, "_runtime": 3490}, "step": 1250} {"train_info/time_between_train_steps": 0.024940013885498047, "step": 1250} {"info/global_step": 1251, "train_info/time_within_train_step": 2.6598312854766846, "step": 1251} {"train_info/time_between_train_steps": 0.003556489944458008, "step": 1251} {"info/global_step": 1252, "train_info/time_within_train_step": 2.6531636714935303, "step": 1252} {"train_info/time_between_train_steps": 0.0035407543182373047, "step": 1252} {"info/global_step": 1253, "train_info/time_within_train_step": 2.6779561042785645, "step": 1253} {"train_info/time_between_train_steps": 0.0035858154296875, "step": 1253} {"info/global_step": 1254, "train_info/time_within_train_step": 2.684318780899048, "step": 1254} {"train_info/time_between_train_steps": 0.003468036651611328, "step": 1254} {"info/global_step": 1255, "train_info/time_within_train_step": 2.7060742378234863, "step": 1255} {"train_info/time_between_train_steps": 0.0035021305084228516, "step": 1255} {"info/global_step": 1256, "train_info/time_within_train_step": 2.6410839557647705, "step": 1256} {"train_info/time_between_train_steps": 0.0035200119018554688, "step": 1256} {"info/global_step": 1257, "train_info/time_within_train_step": 2.640772819519043, "step": 1257} {"train_info/time_between_train_steps": 0.0036089420318603516, "step": 1257} {"info/global_step": 1258, "train_info/time_within_train_step": 2.6578104496002197, "step": 1258} {"train_info/time_between_train_steps": 0.003551483154296875, "step": 1258} {"info/global_step": 1259, "train_info/time_within_train_step": 2.661687135696411, "step": 1259} {"train_info/time_between_train_steps": 0.0036025047302246094, "step": 1259} {"info/global_step": 1260, "train_info/time_within_train_step": 2.6436753273010254, "step": 1260} {"train_info/time_between_train_steps": 0.0035631656646728516, "step": 1260} {"info/global_step": 1261, "train_info/time_within_train_step": 2.652132511138916, "step": 1261} {"train_info/time_between_train_steps": 0.003492116928100586, "step": 1261} {"info/global_step": 1262, "train_info/time_within_train_step": 2.650313377380371, "step": 1262} {"train_info/time_between_train_steps": 0.0035567283630371094, "step": 1262} {"info/global_step": 1263, "train_info/time_within_train_step": 2.6685972213745117, "step": 1263} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 1263} {"info/global_step": 1264, "train_info/time_within_train_step": 2.7003989219665527, "step": 1264} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 1264} {"info/global_step": 1265, "train_info/time_within_train_step": 2.659367322921753, "step": 1265} {"train_info/time_between_train_steps": 0.0035054683685302734, "step": 1265} {"info/global_step": 1266, "train_info/time_within_train_step": 2.6645448207855225, "step": 1266} {"train_info/time_between_train_steps": 0.003465414047241211, "step": 1266} {"info/global_step": 1267, "train_info/time_within_train_step": 2.641512870788574, "step": 1267} {"train_info/time_between_train_steps": 0.0034520626068115234, "step": 1267} {"info/global_step": 1268, "train_info/time_within_train_step": 2.6630730628967285, "step": 1268} {"train_info/time_between_train_steps": 0.003552675247192383, "step": 1268} {"info/global_step": 1269, "train_info/time_within_train_step": 2.6661477088928223, "step": 1269} {"train_info/time_between_train_steps": 0.0035789012908935547, "step": 1269} {"info/global_step": 1270, "train_info/time_within_train_step": 2.6777350902557373, "step": 1270} {"train_info/time_between_train_steps": 0.0034427642822265625, "step": 1270} {"info/global_step": 1271, "train_info/time_within_train_step": 2.6466469764709473, "step": 1271} {"train_info/time_between_train_steps": 0.0035026073455810547, "step": 1271} {"info/global_step": 1272, "train_info/time_within_train_step": 2.6535117626190186, "step": 1272} {"train_info/time_between_train_steps": 0.0035104751586914062, "step": 1272} {"info/global_step": 1273, "train_info/time_within_train_step": 2.648461103439331, "step": 1273} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 1273} {"info/global_step": 1274, "train_info/time_within_train_step": 2.659827709197998, "step": 1274} {"train_info/time_between_train_steps": 0.003489255905151367, "step": 1274} {"info/global_step": 1275, "train_info/time_within_train_step": 2.651665210723877, "step": 1275} {"train_info/time_between_train_steps": 0.003501415252685547, "step": 1275} {"info/global_step": 1276, "train_info/time_within_train_step": 2.6655712127685547, "step": 1276} {"train_info/time_between_train_steps": 0.003574371337890625, "step": 1276} {"info/global_step": 1277, "train_info/time_within_train_step": 2.660881519317627, "step": 1277} {"train_info/time_between_train_steps": 0.003523588180541992, "step": 1277} {"info/global_step": 1278, "train_info/time_within_train_step": 2.7107019424438477, "step": 1278} {"train_info/time_between_train_steps": 0.003474712371826172, "step": 1278} {"info/global_step": 1279, "train_info/time_within_train_step": 2.6510918140411377, "step": 1279} {"train_info/time_between_train_steps": 0.003515958786010742, "step": 1279} {"info/global_step": 1280, "train_info/time_within_train_step": 2.6494054794311523, "step": 1280} {"train_info/time_between_train_steps": 0.0034646987915039062, "step": 1280} {"info/global_step": 1281, "train_info/time_within_train_step": 2.6471025943756104, "step": 1281} {"train_info/time_between_train_steps": 0.0034949779510498047, "step": 1281} {"info/global_step": 1282, "train_info/time_within_train_step": 2.649982213973999, "step": 1282} {"train_info/time_between_train_steps": 0.003498077392578125, "step": 1282} {"info/global_step": 1283, "train_info/time_within_train_step": 2.6534249782562256, "step": 1283} {"train_info/time_between_train_steps": 0.0035245418548583984, "step": 1283} {"info/global_step": 1284, "train_info/time_within_train_step": 2.6452481746673584, "step": 1284} {"train_info/time_between_train_steps": 0.0034265518188476562, "step": 1284} {"info/global_step": 1285, "train_info/time_within_train_step": 2.657316207885742, "step": 1285} {"train_info/time_between_train_steps": 0.0035400390625, "step": 1285} {"info/global_step": 1286, "train_info/time_within_train_step": 2.6536569595336914, "step": 1286} {"train_info/time_between_train_steps": 0.0034575462341308594, "step": 1286} {"info/global_step": 1287, "train_info/time_within_train_step": 2.6611549854278564, "step": 1287} {"train_info/time_between_train_steps": 0.0034847259521484375, "step": 1287} {"info/global_step": 1288, "train_info/time_within_train_step": 2.717693328857422, "step": 1288} {"train_info/time_between_train_steps": 0.003519773483276367, "step": 1288} {"info/global_step": 1289, "train_info/time_within_train_step": 2.703197479248047, "step": 1289} {"train_info/time_between_train_steps": 0.0035152435302734375, "step": 1289} {"info/global_step": 1290, "train_info/time_within_train_step": 2.6420297622680664, "step": 1290} {"train_info/time_between_train_steps": 0.0034897327423095703, "step": 1290} {"info/global_step": 1291, "train_info/time_within_train_step": 2.642063617706299, "step": 1291} {"train_info/time_between_train_steps": 0.003530740737915039, "step": 1291} {"info/global_step": 1292, "train_info/time_within_train_step": 2.664397716522217, "step": 1292} {"train_info/time_between_train_steps": 0.0034744739532470703, "step": 1292} {"info/global_step": 1293, "train_info/time_within_train_step": 2.6491763591766357, "step": 1293} {"train_info/time_between_train_steps": 0.003509521484375, "step": 1293} {"info/global_step": 1294, "train_info/time_within_train_step": 2.646470069885254, "step": 1294} {"train_info/time_between_train_steps": 0.0035784244537353516, "step": 1294} {"info/global_step": 1295, "train_info/time_within_train_step": 2.6489877700805664, "step": 1295} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 1295} {"info/global_step": 1296, "train_info/time_within_train_step": 2.6437015533447266, "step": 1296} {"train_info/time_between_train_steps": 0.0035169124603271484, "step": 1296} {"info/global_step": 1297, "train_info/time_within_train_step": 2.668704032897949, "step": 1297} {"train_info/time_between_train_steps": 0.0034189224243164062, "step": 1297} {"info/global_step": 1298, "train_info/time_within_train_step": 2.670893669128418, "step": 1298} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 1298} {"info/global_step": 1299, "train_info/time_within_train_step": 2.6536779403686523, "step": 1299} {"train_info/time_between_train_steps": 0.003445863723754883, "step": 1299} {"info/global_step": 1300, "train_info/time_within_train_step": 2.6626639366149902, "step": 1300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746901026, "_runtime": 3624}, "step": 1300} {"logs": {"train/loss": 4.6781, "train/learning_rate": 0.00058, "train/epoch": 1.04, "_timestamp": 1746901026, "_runtime": 3624}, "step": 1300} {"train_info/time_between_train_steps": 0.03257632255554199, "step": 1300} {"info/global_step": 1301, "train_info/time_within_train_step": 2.831622362136841, "step": 1301} {"train_info/time_between_train_steps": 0.0032958984375, "step": 1301} {"info/global_step": 1302, "train_info/time_within_train_step": 2.6514976024627686, "step": 1302} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 1302} {"info/global_step": 1303, "train_info/time_within_train_step": 2.664609670639038, "step": 1303} {"train_info/time_between_train_steps": 0.00328826904296875, "step": 1303} {"info/global_step": 1304, "train_info/time_within_train_step": 2.6408865451812744, "step": 1304} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 1304} {"info/global_step": 1305, "train_info/time_within_train_step": 2.649959087371826, "step": 1305} {"train_info/time_between_train_steps": 0.0032799243927001953, "step": 1305} {"info/global_step": 1306, "train_info/time_within_train_step": 2.660383701324463, "step": 1306} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 1306} {"info/global_step": 1307, "train_info/time_within_train_step": 2.6434552669525146, "step": 1307} {"train_info/time_between_train_steps": 0.0033249855041503906, "step": 1307} {"info/global_step": 1308, "train_info/time_within_train_step": 2.644101619720459, "step": 1308} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 1308} {"info/global_step": 1309, "train_info/time_within_train_step": 2.6612255573272705, "step": 1309} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 1309} {"info/global_step": 1310, "train_info/time_within_train_step": 2.6666512489318848, "step": 1310} {"train_info/time_between_train_steps": 0.0033757686614990234, "step": 1310} {"info/global_step": 1311, "train_info/time_within_train_step": 2.6861348152160645, "step": 1311} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 1311} {"info/global_step": 1312, "train_info/time_within_train_step": 2.6474995613098145, "step": 1312} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 1312} {"info/global_step": 1313, "train_info/time_within_train_step": 2.6851918697357178, "step": 1313} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 1313} {"info/global_step": 1314, "train_info/time_within_train_step": 2.6412644386291504, "step": 1314} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 1314} {"info/global_step": 1315, "train_info/time_within_train_step": 2.6474242210388184, "step": 1315} {"train_info/time_between_train_steps": 0.003294706344604492, "step": 1315} {"info/global_step": 1316, "train_info/time_within_train_step": 2.66120982170105, "step": 1316} {"train_info/time_between_train_steps": 0.0032868385314941406, "step": 1316} {"info/global_step": 1317, "train_info/time_within_train_step": 2.6436800956726074, "step": 1317} {"train_info/time_between_train_steps": 0.0033996105194091797, "step": 1317} {"info/global_step": 1318, "train_info/time_within_train_step": 2.643380880355835, "step": 1318} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 1318} {"info/global_step": 1319, "train_info/time_within_train_step": 2.643528938293457, "step": 1319} {"train_info/time_between_train_steps": 0.0034363269805908203, "step": 1319} {"info/global_step": 1320, "train_info/time_within_train_step": 2.735454797744751, "step": 1320} {"train_info/time_between_train_steps": 0.003613710403442383, "step": 1320} {"info/global_step": 1321, "train_info/time_within_train_step": 2.7596964836120605, "step": 1321} {"train_info/time_between_train_steps": 0.0034875869750976562, "step": 1321} {"info/global_step": 1322, "train_info/time_within_train_step": 2.6541287899017334, "step": 1322} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 1322} {"info/global_step": 1323, "train_info/time_within_train_step": 2.643066644668579, "step": 1323} {"train_info/time_between_train_steps": 0.003453969955444336, "step": 1323} {"info/global_step": 1324, "train_info/time_within_train_step": 2.6436760425567627, "step": 1324} {"train_info/time_between_train_steps": 0.003659486770629883, "step": 1324} {"info/global_step": 1325, "train_info/time_within_train_step": 2.6416897773742676, "step": 1325} {"train_info/time_between_train_steps": 0.0035805702209472656, "step": 1325} {"info/global_step": 1326, "train_info/time_within_train_step": 2.6430985927581787, "step": 1326} {"train_info/time_between_train_steps": 0.003634214401245117, "step": 1326} {"info/global_step": 1327, "train_info/time_within_train_step": 2.6430444717407227, "step": 1327} {"train_info/time_between_train_steps": 0.003434896469116211, "step": 1327} {"info/global_step": 1328, "train_info/time_within_train_step": 2.9831557273864746, "step": 1328} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1328} {"info/global_step": 1329, "train_info/time_within_train_step": 2.6388895511627197, "step": 1329} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 1329} {"info/global_step": 1330, "train_info/time_within_train_step": 2.6787993907928467, "step": 1330} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 1330} {"info/global_step": 1331, "train_info/time_within_train_step": 2.6506268978118896, "step": 1331} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 1331} {"info/global_step": 1332, "train_info/time_within_train_step": 2.647123098373413, "step": 1332} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 1332} {"info/global_step": 1333, "train_info/time_within_train_step": 2.6486504077911377, "step": 1333} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 1333} {"info/global_step": 1334, "train_info/time_within_train_step": 2.654942274093628, "step": 1334} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 1334} {"info/global_step": 1335, "train_info/time_within_train_step": 2.686310291290283, "step": 1335} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 1335} {"info/global_step": 1336, "train_info/time_within_train_step": 2.7055485248565674, "step": 1336} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 1336} {"info/global_step": 1337, "train_info/time_within_train_step": 2.638545513153076, "step": 1337} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 1337} {"info/global_step": 1338, "train_info/time_within_train_step": 2.6495590209960938, "step": 1338} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 1338} {"info/global_step": 1339, "train_info/time_within_train_step": 2.6500356197357178, "step": 1339} {"train_info/time_between_train_steps": 0.003249645233154297, "step": 1339} {"info/global_step": 1340, "train_info/time_within_train_step": 2.6467366218566895, "step": 1340} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 1340} {"info/global_step": 1341, "train_info/time_within_train_step": 2.647960662841797, "step": 1341} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 1341} {"info/global_step": 1342, "train_info/time_within_train_step": 2.6443536281585693, "step": 1342} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 1342} {"info/global_step": 1343, "train_info/time_within_train_step": 2.66841721534729, "step": 1343} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 1343} {"info/global_step": 1344, "train_info/time_within_train_step": 2.6947662830352783, "step": 1344} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 1344} {"info/global_step": 1345, "train_info/time_within_train_step": 2.6641921997070312, "step": 1345} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1345} {"info/global_step": 1346, "train_info/time_within_train_step": 2.6637487411499023, "step": 1346} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 1346} {"info/global_step": 1347, "train_info/time_within_train_step": 2.6538233757019043, "step": 1347} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1347} {"info/global_step": 1348, "train_info/time_within_train_step": 2.6564884185791016, "step": 1348} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 1348} {"info/global_step": 1349, "train_info/time_within_train_step": 2.679931879043579, "step": 1349} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 1349} {"info/global_step": 1350, "train_info/time_within_train_step": 2.6399130821228027, "step": 1350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746901164, "_runtime": 3762}, "step": 1350} {"logs": {"train/loss": 4.6524, "train/learning_rate": 0.0005766666666666666, "train/epoch": 1.05, "_timestamp": 1746901164, "_runtime": 3762}, "step": 1350} {"train_info/time_between_train_steps": 0.024998903274536133, "step": 1350} {"info/global_step": 1351, "train_info/time_within_train_step": 2.64563250541687, "step": 1351} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 1351} {"info/global_step": 1352, "train_info/time_within_train_step": 2.6429293155670166, "step": 1352} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 1352} {"info/global_step": 1353, "train_info/time_within_train_step": 2.6616790294647217, "step": 1353} {"train_info/time_between_train_steps": 0.0032525062561035156, "step": 1353} {"info/global_step": 1354, "train_info/time_within_train_step": 2.6487412452697754, "step": 1354} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 1354} {"info/global_step": 1355, "train_info/time_within_train_step": 2.643906831741333, "step": 1355} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 1355} {"info/global_step": 1356, "train_info/time_within_train_step": 2.664705991744995, "step": 1356} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 1356} {"info/global_step": 1357, "train_info/time_within_train_step": 2.658803939819336, "step": 1357} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 1357} {"info/global_step": 1358, "train_info/time_within_train_step": 2.65575909614563, "step": 1358} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 1358} {"info/global_step": 1359, "train_info/time_within_train_step": 2.709456443786621, "step": 1359} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 1359} {"info/global_step": 1360, "train_info/time_within_train_step": 2.644099235534668, "step": 1360} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 1360} {"info/global_step": 1361, "train_info/time_within_train_step": 2.648073673248291, "step": 1361} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 1361} {"info/global_step": 1362, "train_info/time_within_train_step": 2.659388303756714, "step": 1362} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 1362} {"info/global_step": 1363, "train_info/time_within_train_step": 2.643737554550171, "step": 1363} {"train_info/time_between_train_steps": 0.10892128944396973, "step": 1363} {"info/global_step": 1364, "train_info/time_within_train_step": 2.653244972229004, "step": 1364} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 1364} {"info/global_step": 1365, "train_info/time_within_train_step": 2.657580852508545, "step": 1365} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 1365} {"info/global_step": 1366, "train_info/time_within_train_step": 2.665794849395752, "step": 1366} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 1366} {"info/global_step": 1367, "train_info/time_within_train_step": 2.659937620162964, "step": 1367} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 1367} {"info/global_step": 1368, "train_info/time_within_train_step": 2.6525075435638428, "step": 1368} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 1368} {"info/global_step": 1369, "train_info/time_within_train_step": 2.661153793334961, "step": 1369} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 1369} {"info/global_step": 1370, "train_info/time_within_train_step": 2.717252492904663, "step": 1370} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 1370} {"info/global_step": 1371, "train_info/time_within_train_step": 2.668020486831665, "step": 1371} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 1371} {"info/global_step": 1372, "train_info/time_within_train_step": 2.6399049758911133, "step": 1372} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 1372} {"info/global_step": 1373, "train_info/time_within_train_step": 2.652578353881836, "step": 1373} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 1373} {"info/global_step": 1374, "train_info/time_within_train_step": 2.648353099822998, "step": 1374} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 1374} {"info/global_step": 1375, "train_info/time_within_train_step": 2.6508243083953857, "step": 1375} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 1375} {"info/global_step": 1376, "train_info/time_within_train_step": 2.645641803741455, "step": 1376} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 1376} {"info/global_step": 1377, "train_info/time_within_train_step": 2.6444718837738037, "step": 1377} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 1377} {"info/global_step": 1378, "train_info/time_within_train_step": 2.667086124420166, "step": 1378} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 1378} {"info/global_step": 1379, "train_info/time_within_train_step": 2.6699655055999756, "step": 1379} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 1379} {"info/global_step": 1380, "train_info/time_within_train_step": 2.678241729736328, "step": 1380} {"train_info/time_between_train_steps": 0.003289461135864258, "step": 1380} {"info/global_step": 1381, "train_info/time_within_train_step": 2.6520118713378906, "step": 1381} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 1381} {"info/global_step": 1382, "train_info/time_within_train_step": 2.684920072555542, "step": 1382} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 1382} {"info/global_step": 1383, "train_info/time_within_train_step": 2.6419577598571777, "step": 1383} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 1383} {"info/global_step": 1384, "train_info/time_within_train_step": 2.6438984870910645, "step": 1384} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 1384} {"info/global_step": 1385, "train_info/time_within_train_step": 2.899729013442993, "step": 1385} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 1385} {"info/global_step": 1386, "train_info/time_within_train_step": 2.6409542560577393, "step": 1386} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 1386} {"info/global_step": 1387, "train_info/time_within_train_step": 2.6501049995422363, "step": 1387} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1387} {"info/global_step": 1388, "train_info/time_within_train_step": 2.6604857444763184, "step": 1388} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 1388} {"info/global_step": 1389, "train_info/time_within_train_step": 2.643203020095825, "step": 1389} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 1389} {"info/global_step": 1390, "train_info/time_within_train_step": 2.643768787384033, "step": 1390} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 1390} {"info/global_step": 1391, "train_info/time_within_train_step": 2.6626555919647217, "step": 1391} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 1391} {"info/global_step": 1392, "train_info/time_within_train_step": 2.659080982208252, "step": 1392} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 1392} {"info/global_step": 1393, "train_info/time_within_train_step": 2.6707229614257812, "step": 1393} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 1393} {"info/global_step": 1394, "train_info/time_within_train_step": 2.6741256713867188, "step": 1394} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 1394} {"info/global_step": 1395, "train_info/time_within_train_step": 2.6724789142608643, "step": 1395} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 1395} {"info/global_step": 1396, "train_info/time_within_train_step": 2.6407930850982666, "step": 1396} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 1396} {"info/global_step": 1397, "train_info/time_within_train_step": 2.657625913619995, "step": 1397} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 1397} {"info/global_step": 1398, "train_info/time_within_train_step": 2.6423091888427734, "step": 1398} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 1398} {"info/global_step": 1399, "train_info/time_within_train_step": 2.6463544368743896, "step": 1399} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 1399} {"info/global_step": 1400, "train_info/time_within_train_step": 2.648275852203369, "step": 1400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746901298, "_runtime": 3896}, "step": 1400} {"logs": {"train/loss": 4.6041, "train/learning_rate": 0.0005733333333333334, "train/epoch": 1.05, "_timestamp": 1746901298, "_runtime": 3896}, "step": 1400} {"train_info/time_between_train_steps": 14.711772680282593, "step": 1400} {"info/global_step": 1401, "train_info/time_within_train_step": 2.4412245750427246, "step": 1401} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 1401} {"info/global_step": 1402, "train_info/time_within_train_step": 2.4429869651794434, "step": 1402} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 1402} {"info/global_step": 1403, "train_info/time_within_train_step": 2.590287208557129, "step": 1403} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 1403} {"info/global_step": 1404, "train_info/time_within_train_step": 2.6477208137512207, "step": 1404} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 1404} {"info/global_step": 1405, "train_info/time_within_train_step": 2.6419079303741455, "step": 1405} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 1405} {"info/global_step": 1406, "train_info/time_within_train_step": 2.643505573272705, "step": 1406} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 1406} {"info/global_step": 1407, "train_info/time_within_train_step": 2.6622395515441895, "step": 1407} {"train_info/time_between_train_steps": 0.0032553672790527344, "step": 1407} {"info/global_step": 1408, "train_info/time_within_train_step": 2.6682093143463135, "step": 1408} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 1408} {"info/global_step": 1409, "train_info/time_within_train_step": 2.6789791584014893, "step": 1409} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 1409} {"info/global_step": 1410, "train_info/time_within_train_step": 2.6553092002868652, "step": 1410} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 1410} {"info/global_step": 1411, "train_info/time_within_train_step": 2.6409847736358643, "step": 1411} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 1411} {"info/global_step": 1412, "train_info/time_within_train_step": 2.6570980548858643, "step": 1412} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 1412} {"info/global_step": 1413, "train_info/time_within_train_step": 2.655400514602661, "step": 1413} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 1413} {"info/global_step": 1414, "train_info/time_within_train_step": 2.6629018783569336, "step": 1414} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 1414} {"info/global_step": 1415, "train_info/time_within_train_step": 2.6435389518737793, "step": 1415} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 1415} {"info/global_step": 1416, "train_info/time_within_train_step": 2.6505701541900635, "step": 1416} {"train_info/time_between_train_steps": 0.0029296875, "step": 1416} {"info/global_step": 1417, "train_info/time_within_train_step": 2.668668508529663, "step": 1417} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 1417} {"info/global_step": 1418, "train_info/time_within_train_step": 2.685849666595459, "step": 1418} {"train_info/time_between_train_steps": 0.0028705596923828125, "step": 1418} {"info/global_step": 1419, "train_info/time_within_train_step": 2.651977300643921, "step": 1419} {"train_info/time_between_train_steps": 0.002897500991821289, "step": 1419} {"info/global_step": 1420, "train_info/time_within_train_step": 2.66512393951416, "step": 1420} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 1420} {"info/global_step": 1421, "train_info/time_within_train_step": 2.647454023361206, "step": 1421} {"train_info/time_between_train_steps": 0.002871990203857422, "step": 1421} {"info/global_step": 1422, "train_info/time_within_train_step": 2.644521474838257, "step": 1422} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 1422} {"info/global_step": 1423, "train_info/time_within_train_step": 2.65570068359375, "step": 1423} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 1423} {"info/global_step": 1424, "train_info/time_within_train_step": 2.649899482727051, "step": 1424} {"train_info/time_between_train_steps": 0.002915620803833008, "step": 1424} {"info/global_step": 1425, "train_info/time_within_train_step": 2.6510488986968994, "step": 1425} {"train_info/time_between_train_steps": 0.0028972625732421875, "step": 1425} {"info/global_step": 1426, "train_info/time_within_train_step": 2.6600465774536133, "step": 1426} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 1426} {"info/global_step": 1427, "train_info/time_within_train_step": 2.679147958755493, "step": 1427} {"train_info/time_between_train_steps": 0.0029120445251464844, "step": 1427} {"info/global_step": 1428, "train_info/time_within_train_step": 2.6760497093200684, "step": 1428} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 1428} {"info/global_step": 1429, "train_info/time_within_train_step": 2.6945130825042725, "step": 1429} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 1429} {"info/global_step": 1430, "train_info/time_within_train_step": 2.656222343444824, "step": 1430} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 1430} {"info/global_step": 1431, "train_info/time_within_train_step": 2.6475648880004883, "step": 1431} {"train_info/time_between_train_steps": 0.0028879642486572266, "step": 1431} {"info/global_step": 1432, "train_info/time_within_train_step": 2.645308494567871, "step": 1432} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 1432} {"info/global_step": 1433, "train_info/time_within_train_step": 2.654136896133423, "step": 1433} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 1433} {"info/global_step": 1434, "train_info/time_within_train_step": 2.6543660163879395, "step": 1434} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 1434} {"info/global_step": 1435, "train_info/time_within_train_step": 2.6458683013916016, "step": 1435} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 1435} {"info/global_step": 1436, "train_info/time_within_train_step": 2.6586475372314453, "step": 1436} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 1436} {"info/global_step": 1437, "train_info/time_within_train_step": 2.651677370071411, "step": 1437} {"train_info/time_between_train_steps": 0.0029642581939697266, "step": 1437} {"info/global_step": 1438, "train_info/time_within_train_step": 2.665227174758911, "step": 1438} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 1438} {"info/global_step": 1439, "train_info/time_within_train_step": 2.72259521484375, "step": 1439} {"train_info/time_between_train_steps": 0.0030705928802490234, "step": 1439} {"info/global_step": 1440, "train_info/time_within_train_step": 2.6400351524353027, "step": 1440} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 1440} {"info/global_step": 1441, "train_info/time_within_train_step": 2.6389119625091553, "step": 1441} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 1441} {"info/global_step": 1442, "train_info/time_within_train_step": 2.6603732109069824, "step": 1442} {"train_info/time_between_train_steps": 0.0031032562255859375, "step": 1442} {"info/global_step": 1443, "train_info/time_within_train_step": 2.6505327224731445, "step": 1443} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 1443} {"info/global_step": 1444, "train_info/time_within_train_step": 2.7080461978912354, "step": 1444} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 1444} {"info/global_step": 1445, "train_info/time_within_train_step": 2.6503958702087402, "step": 1445} {"train_info/time_between_train_steps": 0.0030357837677001953, "step": 1445} {"info/global_step": 1446, "train_info/time_within_train_step": 2.6665215492248535, "step": 1446} {"train_info/time_between_train_steps": 0.0030083656311035156, "step": 1446} {"info/global_step": 1447, "train_info/time_within_train_step": 2.6404592990875244, "step": 1447} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 1447} {"info/global_step": 1448, "train_info/time_within_train_step": 2.6477057933807373, "step": 1448} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 1448} {"info/global_step": 1449, "train_info/time_within_train_step": 2.6621344089508057, "step": 1449} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 1449} {"info/global_step": 1450, "train_info/time_within_train_step": 2.643725633621216, "step": 1450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746901446, "_runtime": 4044}, "step": 1450} {"logs": {"train/loss": 4.5805, "train/learning_rate": 0.00057, "train/epoch": 1.06, "_timestamp": 1746901446, "_runtime": 4044}, "step": 1450} {"train_info/time_between_train_steps": 0.024839401245117188, "step": 1450} {"info/global_step": 1451, "train_info/time_within_train_step": 2.641547203063965, "step": 1451} {"train_info/time_between_train_steps": 0.0030460357666015625, "step": 1451} {"info/global_step": 1452, "train_info/time_within_train_step": 2.647404193878174, "step": 1452} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 1452} {"info/global_step": 1453, "train_info/time_within_train_step": 2.6693367958068848, "step": 1453} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 1453} {"info/global_step": 1454, "train_info/time_within_train_step": 2.667970895767212, "step": 1454} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 1454} {"info/global_step": 1455, "train_info/time_within_train_step": 2.653864860534668, "step": 1455} {"train_info/time_between_train_steps": 0.003091096878051758, "step": 1455} {"info/global_step": 1456, "train_info/time_within_train_step": 2.686429977416992, "step": 1456} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 1456} {"info/global_step": 1457, "train_info/time_within_train_step": 2.641300678253174, "step": 1457} {"train_info/time_between_train_steps": 0.0031130313873291016, "step": 1457} {"info/global_step": 1458, "train_info/time_within_train_step": 2.654340982437134, "step": 1458} {"train_info/time_between_train_steps": 0.0031223297119140625, "step": 1458} {"info/global_step": 1459, "train_info/time_within_train_step": 2.655832052230835, "step": 1459} {"train_info/time_between_train_steps": 0.003107309341430664, "step": 1459} {"info/global_step": 1460, "train_info/time_within_train_step": 2.6421072483062744, "step": 1460} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 1460} {"info/global_step": 1461, "train_info/time_within_train_step": 2.644752025604248, "step": 1461} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 1461} {"info/global_step": 1462, "train_info/time_within_train_step": 2.66448974609375, "step": 1462} {"train_info/time_between_train_steps": 0.0030641555786132812, "step": 1462} {"info/global_step": 1463, "train_info/time_within_train_step": 2.6559152603149414, "step": 1463} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 1463} {"info/global_step": 1464, "train_info/time_within_train_step": 2.661128520965576, "step": 1464} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 1464} {"info/global_step": 1465, "train_info/time_within_train_step": 2.6934049129486084, "step": 1465} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 1465} {"info/global_step": 1466, "train_info/time_within_train_step": 2.6576573848724365, "step": 1466} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 1466} {"info/global_step": 1467, "train_info/time_within_train_step": 2.6465659141540527, "step": 1467} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 1467} {"info/global_step": 1468, "train_info/time_within_train_step": 2.6480929851531982, "step": 1468} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 1468} {"info/global_step": 1469, "train_info/time_within_train_step": 2.6589462757110596, "step": 1469} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 1469} {"info/global_step": 1470, "train_info/time_within_train_step": 2.9643516540527344, "step": 1470} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 1470} {"info/global_step": 1471, "train_info/time_within_train_step": 2.6392621994018555, "step": 1471} {"train_info/time_between_train_steps": 0.0029325485229492188, "step": 1471} {"info/global_step": 1472, "train_info/time_within_train_step": 2.6393816471099854, "step": 1472} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 1472} {"info/global_step": 1473, "train_info/time_within_train_step": 2.6554923057556152, "step": 1473} {"train_info/time_between_train_steps": 0.003017902374267578, "step": 1473} {"info/global_step": 1474, "train_info/time_within_train_step": 2.6508193016052246, "step": 1474} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 1474} {"info/global_step": 1475, "train_info/time_within_train_step": 2.642519474029541, "step": 1475} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 1475} {"info/global_step": 1476, "train_info/time_within_train_step": 2.649477005004883, "step": 1476} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 1476} {"info/global_step": 1477, "train_info/time_within_train_step": 2.6584084033966064, "step": 1477} {"train_info/time_between_train_steps": 0.003080606460571289, "step": 1477} {"info/global_step": 1478, "train_info/time_within_train_step": 2.695974111557007, "step": 1478} {"train_info/time_between_train_steps": 0.0030074119567871094, "step": 1478} {"info/global_step": 1479, "train_info/time_within_train_step": 2.6876630783081055, "step": 1479} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 1479} {"info/global_step": 1480, "train_info/time_within_train_step": 2.639467716217041, "step": 1480} {"train_info/time_between_train_steps": 0.003088712692260742, "step": 1480} {"info/global_step": 1481, "train_info/time_within_train_step": 2.639536142349243, "step": 1481} {"train_info/time_between_train_steps": 0.004033803939819336, "step": 1481} {"info/global_step": 1482, "train_info/time_within_train_step": 2.6602439880371094, "step": 1482} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 1482} {"info/global_step": 1483, "train_info/time_within_train_step": 2.654262065887451, "step": 1483} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 1483} {"info/global_step": 1484, "train_info/time_within_train_step": 2.6417975425720215, "step": 1484} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 1484} {"info/global_step": 1485, "train_info/time_within_train_step": 2.648451805114746, "step": 1485} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 1485} {"info/global_step": 1486, "train_info/time_within_train_step": 2.6505911350250244, "step": 1486} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 1486} {"info/global_step": 1487, "train_info/time_within_train_step": 2.6654956340789795, "step": 1487} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 1487} {"info/global_step": 1488, "train_info/time_within_train_step": 2.7070472240448, "step": 1488} {"train_info/time_between_train_steps": 0.0030584335327148438, "step": 1488} {"info/global_step": 1489, "train_info/time_within_train_step": 2.6397087574005127, "step": 1489} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 1489} {"info/global_step": 1490, "train_info/time_within_train_step": 2.6460113525390625, "step": 1490} {"train_info/time_between_train_steps": 0.003103494644165039, "step": 1490} {"info/global_step": 1491, "train_info/time_within_train_step": 2.6517221927642822, "step": 1491} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 1491} {"info/global_step": 1492, "train_info/time_within_train_step": 2.647456645965576, "step": 1492} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 1492} {"info/global_step": 1493, "train_info/time_within_train_step": 2.647892475128174, "step": 1493} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 1493} {"info/global_step": 1494, "train_info/time_within_train_step": 2.641859769821167, "step": 1494} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 1494} {"info/global_step": 1495, "train_info/time_within_train_step": 2.653262138366699, "step": 1495} {"train_info/time_between_train_steps": 0.003098011016845703, "step": 1495} {"info/global_step": 1496, "train_info/time_within_train_step": 2.6634247303009033, "step": 1496} {"train_info/time_between_train_steps": 0.003083944320678711, "step": 1496} {"info/global_step": 1497, "train_info/time_within_train_step": 2.680506706237793, "step": 1497} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 1497} {"info/global_step": 1498, "train_info/time_within_train_step": 2.658337116241455, "step": 1498} {"train_info/time_between_train_steps": 0.0030450820922851562, "step": 1498} {"info/global_step": 1499, "train_info/time_within_train_step": 2.6519761085510254, "step": 1499} {"train_info/time_between_train_steps": 0.0031113624572753906, "step": 1499} {"info/global_step": 1500, "train_info/time_within_train_step": 3.230394124984741, "step": 1500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746901581, "_runtime": 4179}, "step": 1500} {"logs": {"train/loss": 4.5365, "train/learning_rate": 0.0005666666666666666, "train/epoch": 1.06, "_timestamp": 1746901581, "_runtime": 4179}, "step": 1500} {"train_info/time_between_train_steps": 0.02426624298095703, "step": 1500} {"info/global_step": 1501, "train_info/time_within_train_step": 2.6552178859710693, "step": 1501} {"train_info/time_between_train_steps": 0.0031290054321289062, "step": 1501} {"info/global_step": 1502, "train_info/time_within_train_step": 2.641308307647705, "step": 1502} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 1502} {"info/global_step": 1503, "train_info/time_within_train_step": 2.6457741260528564, "step": 1503} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 1503} {"info/global_step": 1504, "train_info/time_within_train_step": 2.6684844493865967, "step": 1504} {"train_info/time_between_train_steps": 0.0030906200408935547, "step": 1504} {"info/global_step": 1505, "train_info/time_within_train_step": 2.670778512954712, "step": 1505} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1505} {"info/global_step": 1506, "train_info/time_within_train_step": 2.642127752304077, "step": 1506} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 1506} {"info/global_step": 1507, "train_info/time_within_train_step": 2.660303831100464, "step": 1507} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 1507} {"info/global_step": 1508, "train_info/time_within_train_step": 2.6465468406677246, "step": 1508} {"train_info/time_between_train_steps": 0.003091573715209961, "step": 1508} {"info/global_step": 1509, "train_info/time_within_train_step": 2.6420462131500244, "step": 1509} {"train_info/time_between_train_steps": 0.003780841827392578, "step": 1509} {"info/global_step": 1510, "train_info/time_within_train_step": 2.662360191345215, "step": 1510} {"train_info/time_between_train_steps": 0.003081083297729492, "step": 1510} {"info/global_step": 1511, "train_info/time_within_train_step": 2.6565144062042236, "step": 1511} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 1511} {"info/global_step": 1512, "train_info/time_within_train_step": 2.6642706394195557, "step": 1512} {"train_info/time_between_train_steps": 0.0031003952026367188, "step": 1512} {"info/global_step": 1513, "train_info/time_within_train_step": 2.685948371887207, "step": 1513} {"train_info/time_between_train_steps": 0.0030450820922851562, "step": 1513} {"info/global_step": 1514, "train_info/time_within_train_step": 2.676090955734253, "step": 1514} {"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1514} {"info/global_step": 1515, "train_info/time_within_train_step": 2.64031720161438, "step": 1515} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 1515} {"info/global_step": 1516, "train_info/time_within_train_step": 2.6403775215148926, "step": 1516} {"train_info/time_between_train_steps": 0.003053426742553711, "step": 1516} {"info/global_step": 1517, "train_info/time_within_train_step": 2.6547608375549316, "step": 1517} {"train_info/time_between_train_steps": 0.0030906200408935547, "step": 1517} {"info/global_step": 1518, "train_info/time_within_train_step": 2.652925729751587, "step": 1518} {"train_info/time_between_train_steps": 0.0030608177185058594, "step": 1518} {"info/global_step": 1519, "train_info/time_within_train_step": 2.64260196685791, "step": 1519} {"train_info/time_between_train_steps": 0.003081083297729492, "step": 1519} {"info/global_step": 1520, "train_info/time_within_train_step": 2.659559965133667, "step": 1520} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 1520} {"info/global_step": 1521, "train_info/time_within_train_step": 2.6508095264434814, "step": 1521} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 1521} {"info/global_step": 1522, "train_info/time_within_train_step": 2.661343574523926, "step": 1522} {"train_info/time_between_train_steps": 0.003270864486694336, "step": 1522} {"info/global_step": 1523, "train_info/time_within_train_step": 2.7110092639923096, "step": 1523} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 1523} {"info/global_step": 1524, "train_info/time_within_train_step": 2.6937716007232666, "step": 1524} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 1524} {"info/global_step": 1525, "train_info/time_within_train_step": 2.64089035987854, "step": 1525} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 1525} {"info/global_step": 1526, "train_info/time_within_train_step": 2.6404874324798584, "step": 1526} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 1526} {"info/global_step": 1527, "train_info/time_within_train_step": 2.6549665927886963, "step": 1527} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 1527} {"info/global_step": 1528, "train_info/time_within_train_step": 2.6449527740478516, "step": 1528} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 1528} {"info/global_step": 1529, "train_info/time_within_train_step": 2.6429591178894043, "step": 1529} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 1529} {"info/global_step": 1530, "train_info/time_within_train_step": 2.6490583419799805, "step": 1530} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 1530} {"info/global_step": 1531, "train_info/time_within_train_step": 2.6434457302093506, "step": 1531} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 1531} {"info/global_step": 1532, "train_info/time_within_train_step": 2.6424319744110107, "step": 1532} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 1532} {"info/global_step": 1533, "train_info/time_within_train_step": 2.891380548477173, "step": 1533} {"train_info/time_between_train_steps": 0.003002166748046875, "step": 1533} {"info/global_step": 1534, "train_info/time_within_train_step": 2.638598680496216, "step": 1534} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 1534} {"info/global_step": 1535, "train_info/time_within_train_step": 2.695629596710205, "step": 1535} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 1535} {"info/global_step": 1536, "train_info/time_within_train_step": 2.658550977706909, "step": 1536} {"train_info/time_between_train_steps": 0.003028392791748047, "step": 1536} {"info/global_step": 1537, "train_info/time_within_train_step": 2.677705764770508, "step": 1537} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 1537} {"info/global_step": 1538, "train_info/time_within_train_step": 2.6754605770111084, "step": 1538} {"train_info/time_between_train_steps": 0.0028879642486572266, "step": 1538} {"info/global_step": 1539, "train_info/time_within_train_step": 2.6608963012695312, "step": 1539} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 1539} {"info/global_step": 1540, "train_info/time_within_train_step": 2.6456997394561768, "step": 1540} {"train_info/time_between_train_steps": 0.0029964447021484375, "step": 1540} {"info/global_step": 1541, "train_info/time_within_train_step": 2.6567444801330566, "step": 1541} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 1541} {"info/global_step": 1542, "train_info/time_within_train_step": 2.641118288040161, "step": 1542} {"train_info/time_between_train_steps": 0.0030324459075927734, "step": 1542} {"info/global_step": 1543, "train_info/time_within_train_step": 2.642939329147339, "step": 1543} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 1543} {"info/global_step": 1544, "train_info/time_within_train_step": 2.651386260986328, "step": 1544} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 1544} {"info/global_step": 1545, "train_info/time_within_train_step": 2.650033473968506, "step": 1545} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 1545} {"info/global_step": 1546, "train_info/time_within_train_step": 2.6583685874938965, "step": 1546} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 1546} {"info/global_step": 1547, "train_info/time_within_train_step": 2.694338798522949, "step": 1547} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 1547} {"info/global_step": 1548, "train_info/time_within_train_step": 2.706329584121704, "step": 1548} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 1548} {"info/global_step": 1549, "train_info/time_within_train_step": 2.639718532562256, "step": 1549} {"train_info/time_between_train_steps": 0.003065824508666992, "step": 1549} {"info/global_step": 1550, "train_info/time_within_train_step": 2.6400723457336426, "step": 1550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746901716, "_runtime": 4314}, "step": 1550} {"logs": {"train/loss": 4.5209, "train/learning_rate": 0.0005633333333333333, "train/epoch": 1.07, "_timestamp": 1746901716, "_runtime": 4314}, "step": 1550} {"train_info/time_between_train_steps": 0.0248720645904541, "step": 1550} {"info/global_step": 1551, "train_info/time_within_train_step": 2.6594862937927246, "step": 1551} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 1551} {"info/global_step": 1552, "train_info/time_within_train_step": 2.6460275650024414, "step": 1552} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 1552} {"info/global_step": 1553, "train_info/time_within_train_step": 2.6434943675994873, "step": 1553} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 1553} {"info/global_step": 1554, "train_info/time_within_train_step": 2.648961067199707, "step": 1554} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 1554} {"info/global_step": 1555, "train_info/time_within_train_step": 2.6440677642822266, "step": 1555} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 1555} {"info/global_step": 1556, "train_info/time_within_train_step": 2.668151617050171, "step": 1556} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 1556} {"info/global_step": 1557, "train_info/time_within_train_step": 2.696385622024536, "step": 1557} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 1557} {"info/global_step": 1558, "train_info/time_within_train_step": 2.6589303016662598, "step": 1558} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 1558} {"info/global_step": 1559, "train_info/time_within_train_step": 2.6645350456237793, "step": 1559} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 1559} {"info/global_step": 1560, "train_info/time_within_train_step": 2.6411564350128174, "step": 1560} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 1560} {"info/global_step": 1561, "train_info/time_within_train_step": 2.653980255126953, "step": 1561} {"train_info/time_between_train_steps": 0.0030927658081054688, "step": 1561} {"info/global_step": 1562, "train_info/time_within_train_step": 2.667302131652832, "step": 1562} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 1562} {"info/global_step": 1563, "train_info/time_within_train_step": 2.6663007736206055, "step": 1563} {"train_info/time_between_train_steps": 0.003093719482421875, "step": 1563} {"info/global_step": 1564, "train_info/time_within_train_step": 2.6656625270843506, "step": 1564} {"train_info/time_between_train_steps": 0.003204345703125, "step": 1564} {"info/global_step": 1565, "train_info/time_within_train_step": 2.6653807163238525, "step": 1565} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 1565} {"info/global_step": 1566, "train_info/time_within_train_step": 2.6738007068634033, "step": 1566} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 1566} {"info/global_step": 1567, "train_info/time_within_train_step": 2.6417126655578613, "step": 1567} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 1567} {"info/global_step": 1568, "train_info/time_within_train_step": 2.652794361114502, "step": 1568} {"train_info/time_between_train_steps": 0.0030794143676757812, "step": 1568} {"info/global_step": 1569, "train_info/time_within_train_step": 2.653759241104126, "step": 1569} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 1569} {"info/global_step": 1570, "train_info/time_within_train_step": 2.6419780254364014, "step": 1570} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 1570} {"info/global_step": 1571, "train_info/time_within_train_step": 2.6418347358703613, "step": 1571} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 1571} {"info/global_step": 1572, "train_info/time_within_train_step": 2.6547398567199707, "step": 1572} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 1572} {"info/global_step": 1573, "train_info/time_within_train_step": 2.6598682403564453, "step": 1573} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 1573} {"info/global_step": 1574, "train_info/time_within_train_step": 2.672241687774658, "step": 1574} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 1574} {"info/global_step": 1575, "train_info/time_within_train_step": 2.8597426414489746, "step": 1575} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 1575} {"info/global_step": 1576, "train_info/time_within_train_step": 2.6536054611206055, "step": 1576} {"train_info/time_between_train_steps": 0.0029833316802978516, "step": 1576} {"info/global_step": 1577, "train_info/time_within_train_step": 2.656503915786743, "step": 1577} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 1577} {"info/global_step": 1578, "train_info/time_within_train_step": 2.702279567718506, "step": 1578} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 1578} {"info/global_step": 1579, "train_info/time_within_train_step": 2.6485652923583984, "step": 1579} {"train_info/time_between_train_steps": 0.0030558109283447266, "step": 1579} {"info/global_step": 1580, "train_info/time_within_train_step": 2.6457879543304443, "step": 1580} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 1580} {"info/global_step": 1581, "train_info/time_within_train_step": 2.6492393016815186, "step": 1581} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 1581} {"info/global_step": 1582, "train_info/time_within_train_step": 2.64892840385437, "step": 1582} {"train_info/time_between_train_steps": 0.0029222965240478516, "step": 1582} {"info/global_step": 1583, "train_info/time_within_train_step": 2.647508144378662, "step": 1583} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 1583} {"info/global_step": 1584, "train_info/time_within_train_step": 2.6580810546875, "step": 1584} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 1584} {"info/global_step": 1585, "train_info/time_within_train_step": 2.652327537536621, "step": 1585} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 1585} {"info/global_step": 1586, "train_info/time_within_train_step": 2.6598854064941406, "step": 1586} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 1586} {"info/global_step": 1587, "train_info/time_within_train_step": 2.7100560665130615, "step": 1587} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 1587} {"info/global_step": 1588, "train_info/time_within_train_step": 2.692314386367798, "step": 1588} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 1588} {"info/global_step": 1589, "train_info/time_within_train_step": 2.6444008350372314, "step": 1589} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 1589} {"info/global_step": 1590, "train_info/time_within_train_step": 2.638967275619507, "step": 1590} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 1590} {"info/global_step": 1591, "train_info/time_within_train_step": 2.6569066047668457, "step": 1591} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 1591} {"info/global_step": 1592, "train_info/time_within_train_step": 2.653757333755493, "step": 1592} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 1592} {"info/global_step": 1593, "train_info/time_within_train_step": 2.6418144702911377, "step": 1593} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 1593} {"info/global_step": 1594, "train_info/time_within_train_step": 2.6487884521484375, "step": 1594} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 1594} {"info/global_step": 1595, "train_info/time_within_train_step": 2.654615879058838, "step": 1595} {"train_info/time_between_train_steps": 0.002972841262817383, "step": 1595} {"info/global_step": 1596, "train_info/time_within_train_step": 2.6654891967773438, "step": 1596} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 1596} {"info/global_step": 1597, "train_info/time_within_train_step": 2.7094948291778564, "step": 1597} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 1597} {"info/global_step": 1598, "train_info/time_within_train_step": 2.64202880859375, "step": 1598} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 1598} {"info/global_step": 1599, "train_info/time_within_train_step": 2.652949094772339, "step": 1599} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 1599} {"info/global_step": 1600, "train_info/time_within_train_step": 2.647597312927246, "step": 1600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746901851, "_runtime": 4449}, "step": 1600} {"logs": {"train/loss": 4.4895, "train/learning_rate": 0.00056, "train/epoch": 1.07, "_timestamp": 1746901851, "_runtime": 4449}, "step": 1600} {"train_info/time_between_train_steps": 14.695259094238281, "step": 1600} {"info/global_step": 1601, "train_info/time_within_train_step": 2.440546989440918, "step": 1601} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 1601} {"info/global_step": 1602, "train_info/time_within_train_step": 2.4265527725219727, "step": 1602} {"train_info/time_between_train_steps": 0.002949237823486328, "step": 1602} {"info/global_step": 1603, "train_info/time_within_train_step": 2.59688138961792, "step": 1603} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 1603} {"info/global_step": 1604, "train_info/time_within_train_step": 2.6445209980010986, "step": 1604} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 1604} {"info/global_step": 1605, "train_info/time_within_train_step": 2.638906717300415, "step": 1605} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 1605} {"info/global_step": 1606, "train_info/time_within_train_step": 2.6630775928497314, "step": 1606} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 1606} {"info/global_step": 1607, "train_info/time_within_train_step": 2.6549265384674072, "step": 1607} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 1607} {"info/global_step": 1608, "train_info/time_within_train_step": 2.653616428375244, "step": 1608} {"train_info/time_between_train_steps": 0.002956867218017578, "step": 1608} {"info/global_step": 1609, "train_info/time_within_train_step": 2.69897723197937, "step": 1609} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 1609} {"info/global_step": 1610, "train_info/time_within_train_step": 2.652815341949463, "step": 1610} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 1610} {"info/global_step": 1611, "train_info/time_within_train_step": 2.646519899368286, "step": 1611} {"train_info/time_between_train_steps": 0.002994060516357422, "step": 1611} {"info/global_step": 1612, "train_info/time_within_train_step": 2.64664888381958, "step": 1612} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 1612} {"info/global_step": 1613, "train_info/time_within_train_step": 2.648804187774658, "step": 1613} {"train_info/time_between_train_steps": 0.0030007362365722656, "step": 1613} {"info/global_step": 1614, "train_info/time_within_train_step": 2.6563892364501953, "step": 1614} {"train_info/time_between_train_steps": 0.002974271774291992, "step": 1614} {"info/global_step": 1615, "train_info/time_within_train_step": 2.6458590030670166, "step": 1615} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 1615} {"info/global_step": 1616, "train_info/time_within_train_step": 2.6553502082824707, "step": 1616} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 1616} {"info/global_step": 1617, "train_info/time_within_train_step": 2.6530842781066895, "step": 1617} {"train_info/time_between_train_steps": 0.002997875213623047, "step": 1617} {"info/global_step": 1618, "train_info/time_within_train_step": 2.667604684829712, "step": 1618} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 1618} {"info/global_step": 1619, "train_info/time_within_train_step": 2.7246241569519043, "step": 1619} {"train_info/time_between_train_steps": 0.002986431121826172, "step": 1619} {"info/global_step": 1620, "train_info/time_within_train_step": 2.685699939727783, "step": 1620} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 1620} {"info/global_step": 1621, "train_info/time_within_train_step": 2.6406161785125732, "step": 1621} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 1621} {"info/global_step": 1622, "train_info/time_within_train_step": 2.6422557830810547, "step": 1622} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 1622} {"info/global_step": 1623, "train_info/time_within_train_step": 2.6555373668670654, "step": 1623} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 1623} {"info/global_step": 1624, "train_info/time_within_train_step": 2.6607322692871094, "step": 1624} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 1624} {"info/global_step": 1625, "train_info/time_within_train_step": 2.6443612575531006, "step": 1625} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 1625} {"info/global_step": 1626, "train_info/time_within_train_step": 2.6525983810424805, "step": 1626} {"train_info/time_between_train_steps": 0.003009319305419922, "step": 1626} {"info/global_step": 1627, "train_info/time_within_train_step": 2.64747953414917, "step": 1627} {"train_info/time_between_train_steps": 0.002960205078125, "step": 1627} {"info/global_step": 1628, "train_info/time_within_train_step": 2.669450044631958, "step": 1628} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 1628} {"info/global_step": 1629, "train_info/time_within_train_step": 2.6915688514709473, "step": 1629} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 1629} {"info/global_step": 1630, "train_info/time_within_train_step": 2.6657896041870117, "step": 1630} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 1630} {"info/global_step": 1631, "train_info/time_within_train_step": 2.670849084854126, "step": 1631} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 1631} {"info/global_step": 1632, "train_info/time_within_train_step": 2.647172212600708, "step": 1632} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 1632} {"info/global_step": 1633, "train_info/time_within_train_step": 2.654169797897339, "step": 1633} {"train_info/time_between_train_steps": 0.002956390380859375, "step": 1633} {"info/global_step": 1634, "train_info/time_within_train_step": 2.650707960128784, "step": 1634} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 1634} {"info/global_step": 1635, "train_info/time_within_train_step": 2.6459832191467285, "step": 1635} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 1635} {"info/global_step": 1636, "train_info/time_within_train_step": 2.647778034210205, "step": 1636} {"train_info/time_between_train_steps": 0.002949237823486328, "step": 1636} {"info/global_step": 1637, "train_info/time_within_train_step": 2.652231454849243, "step": 1637} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 1637} {"info/global_step": 1638, "train_info/time_within_train_step": 2.6595983505249023, "step": 1638} {"train_info/time_between_train_steps": 0.002977132797241211, "step": 1638} {"info/global_step": 1639, "train_info/time_within_train_step": 2.6858937740325928, "step": 1639} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 1639} {"info/global_step": 1640, "train_info/time_within_train_step": 2.6564395427703857, "step": 1640} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 1640} {"info/global_step": 1641, "train_info/time_within_train_step": 2.708184242248535, "step": 1641} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 1641} {"info/global_step": 1642, "train_info/time_within_train_step": 2.643381118774414, "step": 1642} {"train_info/time_between_train_steps": 0.002977609634399414, "step": 1642} {"info/global_step": 1643, "train_info/time_within_train_step": 2.647524118423462, "step": 1643} {"train_info/time_between_train_steps": 0.002980470657348633, "step": 1643} {"info/global_step": 1644, "train_info/time_within_train_step": 2.6562936305999756, "step": 1644} {"train_info/time_between_train_steps": 0.002903461456298828, "step": 1644} {"info/global_step": 1645, "train_info/time_within_train_step": 2.651848077774048, "step": 1645} {"train_info/time_between_train_steps": 0.002962350845336914, "step": 1645} {"info/global_step": 1646, "train_info/time_within_train_step": 2.648611068725586, "step": 1646} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 1646} {"info/global_step": 1647, "train_info/time_within_train_step": 2.64550518989563, "step": 1647} {"train_info/time_between_train_steps": 0.002948760986328125, "step": 1647} {"info/global_step": 1648, "train_info/time_within_train_step": 2.6518239974975586, "step": 1648} {"train_info/time_between_train_steps": 0.002995729446411133, "step": 1648} {"info/global_step": 1649, "train_info/time_within_train_step": 2.659271478652954, "step": 1649} {"train_info/time_between_train_steps": 0.0030732154846191406, "step": 1649} {"info/global_step": 1650, "train_info/time_within_train_step": 2.6782031059265137, "step": 1650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746901999, "_runtime": 4597}, "step": 1650} {"logs": {"train/loss": 4.4638, "train/learning_rate": 0.0005566666666666667, "train/epoch": 1.08, "_timestamp": 1746901999, "_runtime": 4597}, "step": 1650} {"train_info/time_between_train_steps": 0.024587154388427734, "step": 1650} {"info/global_step": 1651, "train_info/time_within_train_step": 2.7080578804016113, "step": 1651} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 1651} {"info/global_step": 1652, "train_info/time_within_train_step": 2.719871997833252, "step": 1652} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 1652} {"info/global_step": 1653, "train_info/time_within_train_step": 2.6443004608154297, "step": 1653} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 1653} {"info/global_step": 1654, "train_info/time_within_train_step": 2.6409902572631836, "step": 1654} {"train_info/time_between_train_steps": 0.0031108856201171875, "step": 1654} {"info/global_step": 1655, "train_info/time_within_train_step": 2.6595194339752197, "step": 1655} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 1655} {"info/global_step": 1656, "train_info/time_within_train_step": 2.6469473838806152, "step": 1656} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 1656} {"info/global_step": 1657, "train_info/time_within_train_step": 2.647233009338379, "step": 1657} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 1657} {"info/global_step": 1658, "train_info/time_within_train_step": 2.6487457752227783, "step": 1658} {"train_info/time_between_train_steps": 0.0030565261840820312, "step": 1658} {"info/global_step": 1659, "train_info/time_within_train_step": 2.645101547241211, "step": 1659} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 1659} {"info/global_step": 1660, "train_info/time_within_train_step": 2.668769359588623, "step": 1660} {"train_info/time_between_train_steps": 0.003098726272583008, "step": 1660} {"info/global_step": 1661, "train_info/time_within_train_step": 2.6819536685943604, "step": 1661} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 1661} {"info/global_step": 1662, "train_info/time_within_train_step": 2.6820716857910156, "step": 1662} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 1662} {"info/global_step": 1663, "train_info/time_within_train_step": 2.653892755508423, "step": 1663} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 1663} {"info/global_step": 1664, "train_info/time_within_train_step": 2.6403603553771973, "step": 1664} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 1664} {"info/global_step": 1665, "train_info/time_within_train_step": 2.655198574066162, "step": 1665} {"train_info/time_between_train_steps": 0.003065347671508789, "step": 1665} {"info/global_step": 1666, "train_info/time_within_train_step": 2.652855396270752, "step": 1666} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 1666} {"info/global_step": 1667, "train_info/time_within_train_step": 2.646228313446045, "step": 1667} {"train_info/time_between_train_steps": 0.003071308135986328, "step": 1667} {"info/global_step": 1668, "train_info/time_within_train_step": 2.643559217453003, "step": 1668} {"train_info/time_between_train_steps": 0.0031061172485351562, "step": 1668} {"info/global_step": 1669, "train_info/time_within_train_step": 2.646996021270752, "step": 1669} {"train_info/time_between_train_steps": 0.003044605255126953, "step": 1669} {"info/global_step": 1670, "train_info/time_within_train_step": 2.679408311843872, "step": 1670} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 1670} {"info/global_step": 1671, "train_info/time_within_train_step": 2.6643993854522705, "step": 1671} {"train_info/time_between_train_steps": 0.0030791759490966797, "step": 1671} {"info/global_step": 1672, "train_info/time_within_train_step": 2.6725332736968994, "step": 1672} {"train_info/time_between_train_steps": 0.003091573715209961, "step": 1672} {"info/global_step": 1673, "train_info/time_within_train_step": 2.664835214614868, "step": 1673} {"train_info/time_between_train_steps": 0.0030968189239501953, "step": 1673} {"info/global_step": 1674, "train_info/time_within_train_step": 2.648062229156494, "step": 1674} {"train_info/time_between_train_steps": 0.0030503273010253906, "step": 1674} {"info/global_step": 1675, "train_info/time_within_train_step": 2.650568962097168, "step": 1675} {"train_info/time_between_train_steps": 0.0030982494354248047, "step": 1675} {"info/global_step": 1676, "train_info/time_within_train_step": 2.646664619445801, "step": 1676} {"train_info/time_between_train_steps": 0.0030617713928222656, "step": 1676} {"info/global_step": 1677, "train_info/time_within_train_step": 2.650148868560791, "step": 1677} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 1677} {"info/global_step": 1678, "train_info/time_within_train_step": 2.6483986377716064, "step": 1678} {"train_info/time_between_train_steps": 0.003086566925048828, "step": 1678} {"info/global_step": 1679, "train_info/time_within_train_step": 2.6457462310791016, "step": 1679} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 1679} {"info/global_step": 1680, "train_info/time_within_train_step": 2.663869857788086, "step": 1680} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 1680} {"info/global_step": 1681, "train_info/time_within_train_step": 2.6655373573303223, "step": 1681} {"train_info/time_between_train_steps": 0.0030868053436279297, "step": 1681} {"info/global_step": 1682, "train_info/time_within_train_step": 2.7536559104919434, "step": 1682} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 1682} {"info/global_step": 1683, "train_info/time_within_train_step": 2.6619620323181152, "step": 1683} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 1683} {"info/global_step": 1684, "train_info/time_within_train_step": 2.7030298709869385, "step": 1684} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 1684} {"info/global_step": 1685, "train_info/time_within_train_step": 2.639411687850952, "step": 1685} {"train_info/time_between_train_steps": 0.0030219554901123047, "step": 1685} {"info/global_step": 1686, "train_info/time_within_train_step": 2.6450588703155518, "step": 1686} {"train_info/time_between_train_steps": 0.002992868423461914, "step": 1686} {"info/global_step": 1687, "train_info/time_within_train_step": 2.666110038757324, "step": 1687} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 1687} {"info/global_step": 1688, "train_info/time_within_train_step": 2.6418075561523438, "step": 1688} {"train_info/time_between_train_steps": 0.0030014514923095703, "step": 1688} {"info/global_step": 1689, "train_info/time_within_train_step": 2.643643856048584, "step": 1689} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 1689} {"info/global_step": 1690, "train_info/time_within_train_step": 2.6499431133270264, "step": 1690} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 1690} {"info/global_step": 1691, "train_info/time_within_train_step": 2.6525626182556152, "step": 1691} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 1691} {"info/global_step": 1692, "train_info/time_within_train_step": 2.65952730178833, "step": 1692} {"train_info/time_between_train_steps": 0.003042936325073242, "step": 1692} {"info/global_step": 1693, "train_info/time_within_train_step": 2.6780951023101807, "step": 1693} {"train_info/time_between_train_steps": 0.0030486583709716797, "step": 1693} {"info/global_step": 1694, "train_info/time_within_train_step": 2.7282352447509766, "step": 1694} {"train_info/time_between_train_steps": 0.002950429916381836, "step": 1694} {"info/global_step": 1695, "train_info/time_within_train_step": 2.6528592109680176, "step": 1695} {"train_info/time_between_train_steps": 0.0029833316802978516, "step": 1695} {"info/global_step": 1696, "train_info/time_within_train_step": 2.6402103900909424, "step": 1696} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 1696} {"info/global_step": 1697, "train_info/time_within_train_step": 2.6590707302093506, "step": 1697} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 1697} {"info/global_step": 1698, "train_info/time_within_train_step": 2.6477842330932617, "step": 1698} {"train_info/time_between_train_steps": 0.0030279159545898438, "step": 1698} {"info/global_step": 1699, "train_info/time_within_train_step": 2.6484575271606445, "step": 1699} {"train_info/time_between_train_steps": 0.0030202865600585938, "step": 1699} {"info/global_step": 1700, "train_info/time_within_train_step": 2.6471917629241943, "step": 1700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746902134, "_runtime": 4732}, "step": 1700} {"logs": {"train/loss": 4.438, "train/learning_rate": 0.0005533333333333333, "train/epoch": 1.08, "_timestamp": 1746902134, "_runtime": 4732}, "step": 1700} {"train_info/time_between_train_steps": 0.024869918823242188, "step": 1700} {"info/global_step": 1701, "train_info/time_within_train_step": 2.6493070125579834, "step": 1701} {"train_info/time_between_train_steps": 0.003328561782836914, "step": 1701} {"info/global_step": 1702, "train_info/time_within_train_step": 2.66709566116333, "step": 1702} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 1702} {"info/global_step": 1703, "train_info/time_within_train_step": 2.7096030712127686, "step": 1703} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 1703} {"info/global_step": 1704, "train_info/time_within_train_step": 2.6421496868133545, "step": 1704} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 1704} {"info/global_step": 1705, "train_info/time_within_train_step": 2.644505023956299, "step": 1705} {"train_info/time_between_train_steps": 0.0033240318298339844, "step": 1705} {"info/global_step": 1706, "train_info/time_within_train_step": 2.653761386871338, "step": 1706} {"train_info/time_between_train_steps": 0.003629446029663086, "step": 1706} {"info/global_step": 1707, "train_info/time_within_train_step": 2.6518502235412598, "step": 1707} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 1707} {"info/global_step": 1708, "train_info/time_within_train_step": 2.6505696773529053, "step": 1708} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 1708} {"info/global_step": 1709, "train_info/time_within_train_step": 2.644470453262329, "step": 1709} {"train_info/time_between_train_steps": 0.0034363269805908203, "step": 1709} {"info/global_step": 1710, "train_info/time_within_train_step": 2.6473052501678467, "step": 1710} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 1710} {"info/global_step": 1711, "train_info/time_within_train_step": 2.684807300567627, "step": 1711} {"train_info/time_between_train_steps": 0.003481149673461914, "step": 1711} {"info/global_step": 1712, "train_info/time_within_train_step": 2.6516273021698, "step": 1712} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 1712} {"info/global_step": 1713, "train_info/time_within_train_step": 2.7213521003723145, "step": 1713} {"train_info/time_between_train_steps": 0.0032639503479003906, "step": 1713} {"info/global_step": 1714, "train_info/time_within_train_step": 2.6531713008880615, "step": 1714} {"train_info/time_between_train_steps": 0.003517627716064453, "step": 1714} {"info/global_step": 1715, "train_info/time_within_train_step": 2.643738031387329, "step": 1715} {"train_info/time_between_train_steps": 0.00351715087890625, "step": 1715} {"info/global_step": 1716, "train_info/time_within_train_step": 2.644897699356079, "step": 1716} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 1716} {"info/global_step": 1717, "train_info/time_within_train_step": 2.649526834487915, "step": 1717} {"train_info/time_between_train_steps": 0.0035696029663085938, "step": 1717} {"info/global_step": 1718, "train_info/time_within_train_step": 2.66096830368042, "step": 1718} {"train_info/time_between_train_steps": 0.003947734832763672, "step": 1718} {"info/global_step": 1719, "train_info/time_within_train_step": 2.66806960105896, "step": 1719} {"train_info/time_between_train_steps": 0.0036368370056152344, "step": 1719} {"info/global_step": 1720, "train_info/time_within_train_step": 2.7117953300476074, "step": 1720} {"train_info/time_between_train_steps": 0.003917217254638672, "step": 1720} {"info/global_step": 1721, "train_info/time_within_train_step": 2.647570848464966, "step": 1721} {"train_info/time_between_train_steps": 0.0034248828887939453, "step": 1721} {"info/global_step": 1722, "train_info/time_within_train_step": 2.66165828704834, "step": 1722} {"train_info/time_between_train_steps": 0.004114389419555664, "step": 1722} {"info/global_step": 1723, "train_info/time_within_train_step": 2.6442031860351562, "step": 1723} {"train_info/time_between_train_steps": 0.003749370574951172, "step": 1723} {"info/global_step": 1724, "train_info/time_within_train_step": 2.651139497756958, "step": 1724} {"train_info/time_between_train_steps": 0.00418543815612793, "step": 1724} {"info/global_step": 1725, "train_info/time_within_train_step": 2.6660430431365967, "step": 1725} {"train_info/time_between_train_steps": 0.004776954650878906, "step": 1725} {"info/global_step": 1726, "train_info/time_within_train_step": 2.6466336250305176, "step": 1726} {"train_info/time_between_train_steps": 0.0035552978515625, "step": 1726} {"train_info/time_between_train_steps": 2.493161916732788, "step": 1726} {"info/global_step": 1727, "train_info/time_within_train_step": 2.6220176219940186, "step": 1727} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 1727} {"info/global_step": 1728, "train_info/time_within_train_step": 2.640591621398926, "step": 1728} {"train_info/time_between_train_steps": 0.00359344482421875, "step": 1728} {"info/global_step": 1729, "train_info/time_within_train_step": 2.652998208999634, "step": 1729} {"train_info/time_between_train_steps": 0.0033957958221435547, "step": 1729} {"info/global_step": 1730, "train_info/time_within_train_step": 2.6519763469696045, "step": 1730} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 1730} {"info/global_step": 1731, "train_info/time_within_train_step": 2.6410090923309326, "step": 1731} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 1731} {"info/global_step": 1732, "train_info/time_within_train_step": 2.645238161087036, "step": 1732} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 1732} {"info/global_step": 1733, "train_info/time_within_train_step": 2.6416001319885254, "step": 1733} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 1733} {"info/global_step": 1734, "train_info/time_within_train_step": 2.6360886096954346, "step": 1734} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 1734} {"info/global_step": 1735, "train_info/time_within_train_step": 3.050699472427368, "step": 1735} {"train_info/time_between_train_steps": 0.003246307373046875, "step": 1735} {"info/global_step": 1736, "train_info/time_within_train_step": 2.613797426223755, "step": 1736} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 1736} {"info/global_step": 1737, "train_info/time_within_train_step": 2.638763666152954, "step": 1737} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 1737} {"info/global_step": 1738, "train_info/time_within_train_step": 2.6230175495147705, "step": 1738} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 1738} {"info/global_step": 1739, "train_info/time_within_train_step": 2.638197660446167, "step": 1739} {"train_info/time_between_train_steps": 0.003294706344604492, "step": 1739} {"info/global_step": 1740, "train_info/time_within_train_step": 2.637002468109131, "step": 1740} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 1740} {"info/global_step": 1741, "train_info/time_within_train_step": 2.6350631713867188, "step": 1741} {"train_info/time_between_train_steps": 0.0034737586975097656, "step": 1741} {"info/global_step": 1742, "train_info/time_within_train_step": 2.622889280319214, "step": 1742} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 1742} {"info/global_step": 1743, "train_info/time_within_train_step": 2.5860774517059326, "step": 1743} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 1743} {"info/global_step": 1744, "train_info/time_within_train_step": 2.614912271499634, "step": 1744} {"train_info/time_between_train_steps": 0.003313302993774414, "step": 1744} {"info/global_step": 1745, "train_info/time_within_train_step": 2.5965194702148438, "step": 1745} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 1745} {"info/global_step": 1746, "train_info/time_within_train_step": 2.6399521827697754, "step": 1746} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1746} {"info/global_step": 1747, "train_info/time_within_train_step": 2.6747756004333496, "step": 1747} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 1747} {"info/global_step": 1748, "train_info/time_within_train_step": 2.6428723335266113, "step": 1748} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 1748} {"info/global_step": 1749, "train_info/time_within_train_step": 2.649693012237549, "step": 1749} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 1749} {"info/global_step": 1750, "train_info/time_within_train_step": 3.2092831134796143, "step": 1750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746902280, "_runtime": 4878}, "step": 1750} {"logs": {"train/loss": 4.4473, "train/learning_rate": 0.0005499999999999999, "train/epoch": 2.0, "_timestamp": 1746902280, "_runtime": 4878}, "step": 1750} {"train_info/time_between_train_steps": 0.0235593318939209, "step": 1750} {"info/global_step": 1751, "train_info/time_within_train_step": 2.640550374984741, "step": 1751} {"train_info/time_between_train_steps": 0.0031108856201171875, "step": 1751} {"info/global_step": 1752, "train_info/time_within_train_step": 2.64207124710083, "step": 1752} {"train_info/time_between_train_steps": 0.0031120777130126953, "step": 1752} {"info/global_step": 1753, "train_info/time_within_train_step": 2.6689069271087646, "step": 1753} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 1753} {"info/global_step": 1754, "train_info/time_within_train_step": 2.6442675590515137, "step": 1754} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 1754} {"info/global_step": 1755, "train_info/time_within_train_step": 2.6573123931884766, "step": 1755} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1755} {"info/global_step": 1756, "train_info/time_within_train_step": 2.6632778644561768, "step": 1756} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 1756} {"info/global_step": 1757, "train_info/time_within_train_step": 2.6594691276550293, "step": 1757} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 1757} {"info/global_step": 1758, "train_info/time_within_train_step": 2.6969244480133057, "step": 1758} {"train_info/time_between_train_steps": 0.0031223297119140625, "step": 1758} {"info/global_step": 1759, "train_info/time_within_train_step": 2.6385512351989746, "step": 1759} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 1759} {"info/global_step": 1760, "train_info/time_within_train_step": 2.6395158767700195, "step": 1760} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 1760} {"info/global_step": 1761, "train_info/time_within_train_step": 2.6604812145233154, "step": 1761} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 1761} {"info/global_step": 1762, "train_info/time_within_train_step": 2.6521530151367188, "step": 1762} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 1762} {"info/global_step": 1763, "train_info/time_within_train_step": 2.643685817718506, "step": 1763} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 1763} {"info/global_step": 1764, "train_info/time_within_train_step": 2.6561050415039062, "step": 1764} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 1764} {"info/global_step": 1765, "train_info/time_within_train_step": 2.6498587131500244, "step": 1765} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 1765} {"info/global_step": 1766, "train_info/time_within_train_step": 2.65861439704895, "step": 1766} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 1766} {"info/global_step": 1767, "train_info/time_within_train_step": 2.716427803039551, "step": 1767} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1767} {"info/global_step": 1768, "train_info/time_within_train_step": 2.691202163696289, "step": 1768} {"train_info/time_between_train_steps": 0.0031175613403320312, "step": 1768} {"info/global_step": 1769, "train_info/time_within_train_step": 2.654841661453247, "step": 1769} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1769} {"info/global_step": 1770, "train_info/time_within_train_step": 2.6403610706329346, "step": 1770} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 1770} {"info/global_step": 1771, "train_info/time_within_train_step": 2.6557724475860596, "step": 1771} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 1771} {"info/global_step": 1772, "train_info/time_within_train_step": 2.653808355331421, "step": 1772} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1772} {"info/global_step": 1773, "train_info/time_within_train_step": 2.643949508666992, "step": 1773} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 1773} {"info/global_step": 1774, "train_info/time_within_train_step": 2.652261734008789, "step": 1774} {"train_info/time_between_train_steps": 0.00312042236328125, "step": 1774} {"info/global_step": 1775, "train_info/time_within_train_step": 2.650658130645752, "step": 1775} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 1775} {"info/global_step": 1776, "train_info/time_within_train_step": 2.6557137966156006, "step": 1776} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 1776} {"info/global_step": 1777, "train_info/time_within_train_step": 2.663574457168579, "step": 1777} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 1777} {"info/global_step": 1778, "train_info/time_within_train_step": 2.6582818031311035, "step": 1778} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 1778} {"info/global_step": 1779, "train_info/time_within_train_step": 2.653698444366455, "step": 1779} {"train_info/time_between_train_steps": 0.003286600112915039, "step": 1779} {"info/global_step": 1780, "train_info/time_within_train_step": 2.879547119140625, "step": 1780} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 1780} {"info/global_step": 1781, "train_info/time_within_train_step": 2.644057035446167, "step": 1781} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 1781} {"info/global_step": 1782, "train_info/time_within_train_step": 2.6518497467041016, "step": 1782} {"train_info/time_between_train_steps": 0.003364086151123047, "step": 1782} {"info/global_step": 1783, "train_info/time_within_train_step": 2.6503546237945557, "step": 1783} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 1783} {"info/global_step": 1784, "train_info/time_within_train_step": 2.6694650650024414, "step": 1784} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 1784} {"info/global_step": 1785, "train_info/time_within_train_step": 2.690035343170166, "step": 1785} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 1785} {"info/global_step": 1786, "train_info/time_within_train_step": 2.663193702697754, "step": 1786} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1786} {"info/global_step": 1787, "train_info/time_within_train_step": 2.6634178161621094, "step": 1787} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 1787} {"info/global_step": 1788, "train_info/time_within_train_step": 2.6456973552703857, "step": 1788} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 1788} {"info/global_step": 1789, "train_info/time_within_train_step": 2.7682583332061768, "step": 1789} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 1789} {"info/global_step": 1790, "train_info/time_within_train_step": 2.6713855266571045, "step": 1790} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 1790} {"info/global_step": 1791, "train_info/time_within_train_step": 2.64962100982666, "step": 1791} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 1791} {"info/global_step": 1792, "train_info/time_within_train_step": 2.6878299713134766, "step": 1792} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 1792} {"info/global_step": 1793, "train_info/time_within_train_step": 2.64693021774292, "step": 1793} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 1793} {"info/global_step": 1794, "train_info/time_within_train_step": 2.6524221897125244, "step": 1794} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 1794} {"info/global_step": 1795, "train_info/time_within_train_step": 2.6595420837402344, "step": 1795} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 1795} {"info/global_step": 1796, "train_info/time_within_train_step": 2.663954973220825, "step": 1796} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 1796} {"info/global_step": 1797, "train_info/time_within_train_step": 2.644134044647217, "step": 1797} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 1797} {"info/global_step": 1798, "train_info/time_within_train_step": 2.6638195514678955, "step": 1798} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 1798} {"info/global_step": 1799, "train_info/time_within_train_step": 2.6762478351593018, "step": 1799} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 1799} {"info/global_step": 1800, "train_info/time_within_train_step": 2.6828787326812744, "step": 1800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746902415, "_runtime": 5013}, "step": 1800} {"logs": {"train/loss": 4.3935, "train/learning_rate": 0.0005466666666666667, "train/epoch": 2.01, "_timestamp": 1746902415, "_runtime": 5013}, "step": 1800} {"train_info/time_between_train_steps": 64.65532374382019, "step": 1800} {"info/global_step": 1801, "train_info/time_within_train_step": 2.436414957046509, "step": 1801} {"train_info/time_between_train_steps": 0.0034799575805664062, "step": 1801} {"info/global_step": 1802, "train_info/time_within_train_step": 2.418339252471924, "step": 1802} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 1802} {"info/global_step": 1803, "train_info/time_within_train_step": 2.5204038619995117, "step": 1803} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 1803} {"info/global_step": 1804, "train_info/time_within_train_step": 2.6298389434814453, "step": 1804} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 1804} {"info/global_step": 1805, "train_info/time_within_train_step": 2.6354000568389893, "step": 1805} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1805} {"info/global_step": 1806, "train_info/time_within_train_step": 2.6529829502105713, "step": 1806} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 1806} {"info/global_step": 1807, "train_info/time_within_train_step": 2.64860200881958, "step": 1807} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 1807} {"info/global_step": 1808, "train_info/time_within_train_step": 2.6559994220733643, "step": 1808} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 1808} {"info/global_step": 1809, "train_info/time_within_train_step": 2.697604179382324, "step": 1809} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 1809} {"info/global_step": 1810, "train_info/time_within_train_step": 2.701493263244629, "step": 1810} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 1810} {"info/global_step": 1811, "train_info/time_within_train_step": 2.6404528617858887, "step": 1811} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 1811} {"info/global_step": 1812, "train_info/time_within_train_step": 2.641467332839966, "step": 1812} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 1812} {"info/global_step": 1813, "train_info/time_within_train_step": 2.659761905670166, "step": 1813} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 1813} {"info/global_step": 1814, "train_info/time_within_train_step": 2.6530826091766357, "step": 1814} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 1814} {"info/global_step": 1815, "train_info/time_within_train_step": 2.643977165222168, "step": 1815} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 1815} {"info/global_step": 1816, "train_info/time_within_train_step": 2.642646312713623, "step": 1816} {"train_info/time_between_train_steps": 0.003116607666015625, "step": 1816} {"info/global_step": 1817, "train_info/time_within_train_step": 2.641134262084961, "step": 1817} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 1817} {"info/global_step": 1818, "train_info/time_within_train_step": 2.658088445663452, "step": 1818} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 1818} {"info/global_step": 1819, "train_info/time_within_train_step": 2.653075695037842, "step": 1819} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 1819} {"info/global_step": 1820, "train_info/time_within_train_step": 2.6443541049957275, "step": 1820} {"train_info/time_between_train_steps": 0.0031020641326904297, "step": 1820} {"info/global_step": 1821, "train_info/time_within_train_step": 2.6531643867492676, "step": 1821} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 1821} {"info/global_step": 1822, "train_info/time_within_train_step": 2.648466110229492, "step": 1822} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 1822} {"info/global_step": 1823, "train_info/time_within_train_step": 2.672401189804077, "step": 1823} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 1823} {"info/global_step": 1824, "train_info/time_within_train_step": 2.6670095920562744, "step": 1824} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 1824} {"info/global_step": 1825, "train_info/time_within_train_step": 2.657226085662842, "step": 1825} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 1825} {"info/global_step": 1826, "train_info/time_within_train_step": 2.685457944869995, "step": 1826} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 1826} {"info/global_step": 1827, "train_info/time_within_train_step": 2.6407649517059326, "step": 1827} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 1827} {"info/global_step": 1828, "train_info/time_within_train_step": 2.6556591987609863, "step": 1828} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 1828} {"info/global_step": 1829, "train_info/time_within_train_step": 2.658282995223999, "step": 1829} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 1829} {"info/global_step": 1830, "train_info/time_within_train_step": 2.6425483226776123, "step": 1830} {"train_info/time_between_train_steps": 0.0031223297119140625, "step": 1830} {"info/global_step": 1831, "train_info/time_within_train_step": 2.6430764198303223, "step": 1831} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 1831} {"info/global_step": 1832, "train_info/time_within_train_step": 2.6659882068634033, "step": 1832} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 1832} {"info/global_step": 1833, "train_info/time_within_train_step": 2.660020351409912, "step": 1833} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 1833} {"info/global_step": 1834, "train_info/time_within_train_step": 2.6620841026306152, "step": 1834} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 1834} {"info/global_step": 1835, "train_info/time_within_train_step": 2.704692840576172, "step": 1835} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 1835} {"info/global_step": 1836, "train_info/time_within_train_step": 2.661316156387329, "step": 1836} {"train_info/time_between_train_steps": 0.0031211376190185547, "step": 1836} {"info/global_step": 1837, "train_info/time_within_train_step": 2.665088653564453, "step": 1837} {"train_info/time_between_train_steps": 0.003109455108642578, "step": 1837} {"info/global_step": 1838, "train_info/time_within_train_step": 2.6545867919921875, "step": 1838} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 1838} {"info/global_step": 1839, "train_info/time_within_train_step": 2.643300771713257, "step": 1839} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 1839} {"info/global_step": 1840, "train_info/time_within_train_step": 2.65598201751709, "step": 1840} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 1840} {"info/global_step": 1841, "train_info/time_within_train_step": 2.651137590408325, "step": 1841} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 1841} {"info/global_step": 1842, "train_info/time_within_train_step": 2.6597557067871094, "step": 1842} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 1842} {"info/global_step": 1843, "train_info/time_within_train_step": 2.6938345432281494, "step": 1843} {"train_info/time_between_train_steps": 0.003204345703125, "step": 1843} {"info/global_step": 1844, "train_info/time_within_train_step": 2.7186756134033203, "step": 1844} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 1844} {"info/global_step": 1845, "train_info/time_within_train_step": 2.6451759338378906, "step": 1845} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1845} {"info/global_step": 1846, "train_info/time_within_train_step": 2.6423261165618896, "step": 1846} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1846} {"info/global_step": 1847, "train_info/time_within_train_step": 2.66074538230896, "step": 1847} {"train_info/time_between_train_steps": 0.003275156021118164, "step": 1847} {"info/global_step": 1848, "train_info/time_within_train_step": 2.647733449935913, "step": 1848} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 1848} {"info/global_step": 1849, "train_info/time_within_train_step": 2.6475796699523926, "step": 1849} {"train_info/time_between_train_steps": 0.0034017562866210938, "step": 1849} {"info/global_step": 1850, "train_info/time_within_train_step": 2.6486587524414062, "step": 1850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746902613, "_runtime": 5211}, "step": 1850} {"logs": {"train/loss": 4.3725, "train/learning_rate": 0.0005433333333333333, "train/epoch": 2.01, "_timestamp": 1746902613, "_runtime": 5211}, "step": 1850} {"train_info/time_between_train_steps": 0.02408599853515625, "step": 1850} {"info/global_step": 1851, "train_info/time_within_train_step": 2.651749849319458, "step": 1851} {"train_info/time_between_train_steps": 0.182142972946167, "step": 1851} {"info/global_step": 1852, "train_info/time_within_train_step": 2.6529552936553955, "step": 1852} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 1852} {"info/global_step": 1853, "train_info/time_within_train_step": 2.645312786102295, "step": 1853} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 1853} {"info/global_step": 1854, "train_info/time_within_train_step": 2.6487061977386475, "step": 1854} {"train_info/time_between_train_steps": 0.003396272659301758, "step": 1854} {"info/global_step": 1855, "train_info/time_within_train_step": 2.6606199741363525, "step": 1855} {"train_info/time_between_train_steps": 0.003543376922607422, "step": 1855} {"info/global_step": 1856, "train_info/time_within_train_step": 2.669412136077881, "step": 1856} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 1856} {"info/global_step": 1857, "train_info/time_within_train_step": 2.671708106994629, "step": 1857} {"train_info/time_between_train_steps": 0.003460407257080078, "step": 1857} {"info/global_step": 1858, "train_info/time_within_train_step": 2.6877284049987793, "step": 1858} {"train_info/time_between_train_steps": 0.0034058094024658203, "step": 1858} {"info/global_step": 1859, "train_info/time_within_train_step": 2.6516268253326416, "step": 1859} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 1859} {"info/global_step": 1860, "train_info/time_within_train_step": 2.642021417617798, "step": 1860} {"train_info/time_between_train_steps": 0.003510713577270508, "step": 1860} {"info/global_step": 1861, "train_info/time_within_train_step": 2.6550703048706055, "step": 1861} {"train_info/time_between_train_steps": 0.003518342971801758, "step": 1861} {"info/global_step": 1862, "train_info/time_within_train_step": 3.0196008682250977, "step": 1862} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 1862} {"info/global_step": 1863, "train_info/time_within_train_step": 2.702317953109741, "step": 1863} {"train_info/time_between_train_steps": 0.003494739532470703, "step": 1863} {"info/global_step": 1864, "train_info/time_within_train_step": 2.6421751976013184, "step": 1864} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 1864} {"info/global_step": 1865, "train_info/time_within_train_step": 2.643625020980835, "step": 1865} {"train_info/time_between_train_steps": 0.0035393238067626953, "step": 1865} {"info/global_step": 1866, "train_info/time_within_train_step": 2.648881196975708, "step": 1866} {"train_info/time_between_train_steps": 0.003445148468017578, "step": 1866} {"info/global_step": 1867, "train_info/time_within_train_step": 2.6629817485809326, "step": 1867} {"train_info/time_between_train_steps": 0.003508329391479492, "step": 1867} {"info/global_step": 1868, "train_info/time_within_train_step": 2.645258903503418, "step": 1868} {"train_info/time_between_train_steps": 0.0035750865936279297, "step": 1868} {"info/global_step": 1869, "train_info/time_within_train_step": 2.643775224685669, "step": 1869} {"train_info/time_between_train_steps": 0.003479480743408203, "step": 1869} {"info/global_step": 1870, "train_info/time_within_train_step": 2.665715217590332, "step": 1870} {"train_info/time_between_train_steps": 0.0034630298614501953, "step": 1870} {"info/global_step": 1871, "train_info/time_within_train_step": 2.6697964668273926, "step": 1871} {"train_info/time_between_train_steps": 0.003478527069091797, "step": 1871} {"info/global_step": 1872, "train_info/time_within_train_step": 2.6869313716888428, "step": 1872} {"train_info/time_between_train_steps": 0.0034837722778320312, "step": 1872} {"info/global_step": 1873, "train_info/time_within_train_step": 2.65000057220459, "step": 1873} {"train_info/time_between_train_steps": 0.0034377574920654297, "step": 1873} {"info/global_step": 1874, "train_info/time_within_train_step": 2.6829497814178467, "step": 1874} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 1874} {"info/global_step": 1875, "train_info/time_within_train_step": 2.6411666870117188, "step": 1875} {"train_info/time_between_train_steps": 0.0035452842712402344, "step": 1875} {"info/global_step": 1876, "train_info/time_within_train_step": 2.646742820739746, "step": 1876} {"train_info/time_between_train_steps": 0.003565549850463867, "step": 1876} {"info/global_step": 1877, "train_info/time_within_train_step": 2.667673349380493, "step": 1877} {"train_info/time_between_train_steps": 0.0036563873291015625, "step": 1877} {"info/global_step": 1878, "train_info/time_within_train_step": 2.6472280025482178, "step": 1878} {"train_info/time_between_train_steps": 0.003507852554321289, "step": 1878} {"info/global_step": 1879, "train_info/time_within_train_step": 2.6442222595214844, "step": 1879} {"train_info/time_between_train_steps": 0.0037534236907958984, "step": 1879} {"info/global_step": 1880, "train_info/time_within_train_step": 2.663767099380493, "step": 1880} {"train_info/time_between_train_steps": 0.0036344528198242188, "step": 1880} {"info/global_step": 1881, "train_info/time_within_train_step": 2.6678738594055176, "step": 1881} {"train_info/time_between_train_steps": 0.003582000732421875, "step": 1881} {"info/global_step": 1882, "train_info/time_within_train_step": 2.652918815612793, "step": 1882} {"train_info/time_between_train_steps": 0.003590106964111328, "step": 1882} {"info/global_step": 1883, "train_info/time_within_train_step": 2.6759939193725586, "step": 1883} {"train_info/time_between_train_steps": 0.0036344528198242188, "step": 1883} {"info/global_step": 1884, "train_info/time_within_train_step": 2.730703830718994, "step": 1884} {"train_info/time_between_train_steps": 0.0035309791564941406, "step": 1884} {"info/global_step": 1885, "train_info/time_within_train_step": 2.663684606552124, "step": 1885} {"train_info/time_between_train_steps": 0.003575563430786133, "step": 1885} {"info/global_step": 1886, "train_info/time_within_train_step": 2.6519060134887695, "step": 1886} {"train_info/time_between_train_steps": 0.0035867691040039062, "step": 1886} {"info/global_step": 1887, "train_info/time_within_train_step": 2.641893148422241, "step": 1887} {"train_info/time_between_train_steps": 0.0035712718963623047, "step": 1887} {"info/global_step": 1888, "train_info/time_within_train_step": 2.6699795722961426, "step": 1888} {"train_info/time_between_train_steps": 0.0035293102264404297, "step": 1888} {"info/global_step": 1889, "train_info/time_within_train_step": 2.6546175479888916, "step": 1889} {"train_info/time_between_train_steps": 0.003522157669067383, "step": 1889} {"info/global_step": 1890, "train_info/time_within_train_step": 2.645529270172119, "step": 1890} {"train_info/time_between_train_steps": 0.0035750865936279297, "step": 1890} {"info/global_step": 1891, "train_info/time_within_train_step": 2.6521754264831543, "step": 1891} {"train_info/time_between_train_steps": 0.0036814212799072266, "step": 1891} {"info/global_step": 1892, "train_info/time_within_train_step": 2.645961046218872, "step": 1892} {"train_info/time_between_train_steps": 0.0035064220428466797, "step": 1892} {"info/global_step": 1893, "train_info/time_within_train_step": 2.669055461883545, "step": 1893} {"train_info/time_between_train_steps": 0.003492116928100586, "step": 1893} {"info/global_step": 1894, "train_info/time_within_train_step": 2.669386863708496, "step": 1894} {"train_info/time_between_train_steps": 0.003452777862548828, "step": 1894} {"info/global_step": 1895, "train_info/time_within_train_step": 2.657292366027832, "step": 1895} {"train_info/time_between_train_steps": 0.0034782886505126953, "step": 1895} {"info/global_step": 1896, "train_info/time_within_train_step": 2.6665751934051514, "step": 1896} {"train_info/time_between_train_steps": 0.0034971237182617188, "step": 1896} {"info/global_step": 1897, "train_info/time_within_train_step": 2.6425750255584717, "step": 1897} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 1897} {"info/global_step": 1898, "train_info/time_within_train_step": 2.6559739112854004, "step": 1898} {"train_info/time_between_train_steps": 0.003461599349975586, "step": 1898} {"info/global_step": 1899, "train_info/time_within_train_step": 2.6600446701049805, "step": 1899} {"train_info/time_between_train_steps": 0.003398895263671875, "step": 1899} {"info/global_step": 1900, "train_info/time_within_train_step": 2.648481607437134, "step": 1900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746902747, "_runtime": 5345}, "step": 1900} {"logs": {"train/loss": 4.3503, "train/learning_rate": 0.00054, "train/epoch": 2.02, "_timestamp": 1746902747, "_runtime": 5345}, "step": 1900} {"train_info/time_between_train_steps": 0.02421092987060547, "step": 1900} {"info/global_step": 1901, "train_info/time_within_train_step": 2.659993886947632, "step": 1901} {"train_info/time_between_train_steps": 0.0035555362701416016, "step": 1901} {"info/global_step": 1902, "train_info/time_within_train_step": 2.674952268600464, "step": 1902} {"train_info/time_between_train_steps": 0.0034399032592773438, "step": 1902} {"info/global_step": 1903, "train_info/time_within_train_step": 2.6768734455108643, "step": 1903} {"train_info/time_between_train_steps": 0.0036013126373291016, "step": 1903} {"info/global_step": 1904, "train_info/time_within_train_step": 2.6515517234802246, "step": 1904} {"train_info/time_between_train_steps": 0.0036411285400390625, "step": 1904} {"info/global_step": 1905, "train_info/time_within_train_step": 2.6929931640625, "step": 1905} {"train_info/time_between_train_steps": 0.0034263134002685547, "step": 1905} {"info/global_step": 1906, "train_info/time_within_train_step": 2.642162561416626, "step": 1906} {"train_info/time_between_train_steps": 0.004613637924194336, "step": 1906} {"info/global_step": 1907, "train_info/time_within_train_step": 2.6557180881500244, "step": 1907} {"train_info/time_between_train_steps": 0.003499269485473633, "step": 1907} {"info/global_step": 1908, "train_info/time_within_train_step": 2.6587533950805664, "step": 1908} {"train_info/time_between_train_steps": 0.0034313201904296875, "step": 1908} {"info/global_step": 1909, "train_info/time_within_train_step": 2.643541097640991, "step": 1909} {"train_info/time_between_train_steps": 0.003487110137939453, "step": 1909} {"info/global_step": 1910, "train_info/time_within_train_step": 2.673013210296631, "step": 1910} {"train_info/time_between_train_steps": 0.003602743148803711, "step": 1910} {"info/global_step": 1911, "train_info/time_within_train_step": 2.6679787635803223, "step": 1911} {"train_info/time_between_train_steps": 0.0034360885620117188, "step": 1911} {"info/global_step": 1912, "train_info/time_within_train_step": 2.6975131034851074, "step": 1912} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 1912} {"info/global_step": 1913, "train_info/time_within_train_step": 2.641174554824829, "step": 1913} {"train_info/time_between_train_steps": 0.0034444332122802734, "step": 1913} {"info/global_step": 1914, "train_info/time_within_train_step": 2.8235909938812256, "step": 1914} {"train_info/time_between_train_steps": 0.0033004283905029297, "step": 1914} {"info/global_step": 1915, "train_info/time_within_train_step": 2.6532843112945557, "step": 1915} {"train_info/time_between_train_steps": 0.003299236297607422, "step": 1915} {"info/global_step": 1916, "train_info/time_within_train_step": 2.647144317626953, "step": 1916} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 1916} {"info/global_step": 1917, "train_info/time_within_train_step": 2.6463167667388916, "step": 1917} {"train_info/time_between_train_steps": 0.0032863616943359375, "step": 1917} {"info/global_step": 1918, "train_info/time_within_train_step": 2.6486804485321045, "step": 1918} {"train_info/time_between_train_steps": 0.003288745880126953, "step": 1918} {"info/global_step": 1919, "train_info/time_within_train_step": 2.6523091793060303, "step": 1919} {"train_info/time_between_train_steps": 0.0033195018768310547, "step": 1919} {"info/global_step": 1920, "train_info/time_within_train_step": 2.965089797973633, "step": 1920} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 1920} {"info/global_step": 1921, "train_info/time_within_train_step": 2.641298770904541, "step": 1921} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 1921} {"info/global_step": 1922, "train_info/time_within_train_step": 2.662916898727417, "step": 1922} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 1922} {"info/global_step": 1923, "train_info/time_within_train_step": 2.6473116874694824, "step": 1923} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 1923} {"info/global_step": 1924, "train_info/time_within_train_step": 2.643216371536255, "step": 1924} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 1924} {"info/global_step": 1925, "train_info/time_within_train_step": 2.6535842418670654, "step": 1925} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 1925} {"info/global_step": 1926, "train_info/time_within_train_step": 2.6506216526031494, "step": 1926} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 1926} {"info/global_step": 1927, "train_info/time_within_train_step": 2.658867835998535, "step": 1927} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 1927} {"info/global_step": 1928, "train_info/time_within_train_step": 2.694420576095581, "step": 1928} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 1928} {"info/global_step": 1929, "train_info/time_within_train_step": 2.711418867111206, "step": 1929} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 1929} {"info/global_step": 1930, "train_info/time_within_train_step": 2.638956069946289, "step": 1930} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 1930} {"info/global_step": 1931, "train_info/time_within_train_step": 2.6399073600769043, "step": 1931} {"train_info/time_between_train_steps": 0.003496885299682617, "step": 1931} {"info/global_step": 1932, "train_info/time_within_train_step": 2.6663036346435547, "step": 1932} {"train_info/time_between_train_steps": 0.0035238265991210938, "step": 1932} {"info/global_step": 1933, "train_info/time_within_train_step": 2.6475000381469727, "step": 1933} {"train_info/time_between_train_steps": 0.003561258316040039, "step": 1933} {"info/global_step": 1934, "train_info/time_within_train_step": 2.6473512649536133, "step": 1934} {"train_info/time_between_train_steps": 0.004022121429443359, "step": 1934} {"info/global_step": 1935, "train_info/time_within_train_step": 2.6513843536376953, "step": 1935} {"train_info/time_between_train_steps": 0.00408625602722168, "step": 1935} {"info/global_step": 1936, "train_info/time_within_train_step": 2.6446373462677, "step": 1936} {"train_info/time_between_train_steps": 0.0038220882415771484, "step": 1936} {"info/global_step": 1937, "train_info/time_within_train_step": 2.6484169960021973, "step": 1937} {"train_info/time_between_train_steps": 0.003952741622924805, "step": 1937} {"info/global_step": 1938, "train_info/time_within_train_step": 2.647010564804077, "step": 1938} {"train_info/time_between_train_steps": 0.004002094268798828, "step": 1938} {"info/global_step": 1939, "train_info/time_within_train_step": 2.68221116065979, "step": 1939} {"train_info/time_between_train_steps": 0.00391840934753418, "step": 1939} {"info/global_step": 1940, "train_info/time_within_train_step": 2.6467502117156982, "step": 1940} {"train_info/time_between_train_steps": 0.0037369728088378906, "step": 1940} {"info/global_step": 1941, "train_info/time_within_train_step": 2.6541247367858887, "step": 1941} {"train_info/time_between_train_steps": 0.0039484500885009766, "step": 1941} {"info/global_step": 1942, "train_info/time_within_train_step": 2.6481125354766846, "step": 1942} {"train_info/time_between_train_steps": 0.0038080215454101562, "step": 1942} {"info/global_step": 1943, "train_info/time_within_train_step": 2.667635440826416, "step": 1943} {"train_info/time_between_train_steps": 0.0037724971771240234, "step": 1943} {"info/global_step": 1944, "train_info/time_within_train_step": 2.6506283283233643, "step": 1944} {"train_info/time_between_train_steps": 0.003717660903930664, "step": 1944} {"info/global_step": 1945, "train_info/time_within_train_step": 2.645195960998535, "step": 1945} {"train_info/time_between_train_steps": 0.003826141357421875, "step": 1945} {"info/global_step": 1946, "train_info/time_within_train_step": 2.6606976985931396, "step": 1946} {"train_info/time_between_train_steps": 0.003694295883178711, "step": 1946} {"info/global_step": 1947, "train_info/time_within_train_step": 2.651317596435547, "step": 1947} {"train_info/time_between_train_steps": 0.0038068294525146484, "step": 1947} {"info/global_step": 1948, "train_info/time_within_train_step": 2.659992218017578, "step": 1948} {"train_info/time_between_train_steps": 0.00391840934753418, "step": 1948} {"info/global_step": 1949, "train_info/time_within_train_step": 2.691150426864624, "step": 1949} {"train_info/time_between_train_steps": 0.0037221908569335938, "step": 1949} {"info/global_step": 1950, "train_info/time_within_train_step": 2.732367992401123, "step": 1950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746902884, "_runtime": 5482}, "step": 1950} {"logs": {"train/loss": 4.325, "train/learning_rate": 0.0005366666666666666, "train/epoch": 2.02, "_timestamp": 1746902884, "_runtime": 5482}, "step": 1950} {"train_info/time_between_train_steps": 0.024324655532836914, "step": 1950} {"info/global_step": 1951, "train_info/time_within_train_step": 2.727384090423584, "step": 1951} {"train_info/time_between_train_steps": 0.003911018371582031, "step": 1951} {"info/global_step": 1952, "train_info/time_within_train_step": 2.6504464149475098, "step": 1952} {"train_info/time_between_train_steps": 0.0037698745727539062, "step": 1952} {"info/global_step": 1953, "train_info/time_within_train_step": 2.6431729793548584, "step": 1953} {"train_info/time_between_train_steps": 0.0038073062896728516, "step": 1953} {"info/global_step": 1954, "train_info/time_within_train_step": 2.6561789512634277, "step": 1954} {"train_info/time_between_train_steps": 0.0037772655487060547, "step": 1954} {"info/global_step": 1955, "train_info/time_within_train_step": 2.6503560543060303, "step": 1955} {"train_info/time_between_train_steps": 0.0037178993225097656, "step": 1955} {"info/global_step": 1956, "train_info/time_within_train_step": 2.6532247066497803, "step": 1956} {"train_info/time_between_train_steps": 0.003847360610961914, "step": 1956} {"info/global_step": 1957, "train_info/time_within_train_step": 2.645685911178589, "step": 1957} {"train_info/time_between_train_steps": 0.004098176956176758, "step": 1957} {"info/global_step": 1958, "train_info/time_within_train_step": 2.6510608196258545, "step": 1958} {"train_info/time_between_train_steps": 0.0037403106689453125, "step": 1958} {"info/global_step": 1959, "train_info/time_within_train_step": 2.6602044105529785, "step": 1959} {"train_info/time_between_train_steps": 0.003853321075439453, "step": 1959} {"info/global_step": 1960, "train_info/time_within_train_step": 2.668755292892456, "step": 1960} {"train_info/time_between_train_steps": 0.003638744354248047, "step": 1960} {"info/global_step": 1961, "train_info/time_within_train_step": 3.070380449295044, "step": 1961} {"train_info/time_between_train_steps": 0.003332853317260742, "step": 1961} {"info/global_step": 1962, "train_info/time_within_train_step": 2.644247531890869, "step": 1962} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 1962} {"info/global_step": 1963, "train_info/time_within_train_step": 2.648669481277466, "step": 1963} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 1963} {"info/global_step": 1964, "train_info/time_within_train_step": 2.6435012817382812, "step": 1964} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 1964} {"info/global_step": 1965, "train_info/time_within_train_step": 2.667783498764038, "step": 1965} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 1965} {"info/global_step": 1966, "train_info/time_within_train_step": 2.680725336074829, "step": 1966} {"train_info/time_between_train_steps": 0.003639698028564453, "step": 1966} {"info/global_step": 1967, "train_info/time_within_train_step": 2.6824426651000977, "step": 1967} {"train_info/time_between_train_steps": 0.003268003463745117, "step": 1967} {"info/global_step": 1968, "train_info/time_within_train_step": 2.654680013656616, "step": 1968} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 1968} {"info/global_step": 1969, "train_info/time_within_train_step": 2.6461293697357178, "step": 1969} {"train_info/time_between_train_steps": 0.0032958984375, "step": 1969} {"info/global_step": 1970, "train_info/time_within_train_step": 2.6565983295440674, "step": 1970} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 1970} {"info/global_step": 1971, "train_info/time_within_train_step": 2.644416093826294, "step": 1971} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 1971} {"info/global_step": 1972, "train_info/time_within_train_step": 2.6455929279327393, "step": 1972} {"train_info/time_between_train_steps": 0.0032501220703125, "step": 1972} {"info/global_step": 1973, "train_info/time_within_train_step": 2.670436143875122, "step": 1973} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 1973} {"info/global_step": 1974, "train_info/time_within_train_step": 2.667625904083252, "step": 1974} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 1974} {"info/global_step": 1975, "train_info/time_within_train_step": 2.657393217086792, "step": 1975} {"train_info/time_between_train_steps": 0.0032837390899658203, "step": 1975} {"info/global_step": 1976, "train_info/time_within_train_step": 2.7077150344848633, "step": 1976} {"train_info/time_between_train_steps": 0.14865875244140625, "step": 1976} {"info/global_step": 1977, "train_info/time_within_train_step": 2.679926872253418, "step": 1977} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 1977} {"info/global_step": 1978, "train_info/time_within_train_step": 2.651681423187256, "step": 1978} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 1978} {"info/global_step": 1979, "train_info/time_within_train_step": 2.68501877784729, "step": 1979} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 1979} {"info/global_step": 1980, "train_info/time_within_train_step": 2.640441656112671, "step": 1980} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 1980} {"info/global_step": 1981, "train_info/time_within_train_step": 2.647897720336914, "step": 1981} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 1981} {"info/global_step": 1982, "train_info/time_within_train_step": 2.6658570766448975, "step": 1982} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 1982} {"info/global_step": 1983, "train_info/time_within_train_step": 2.646624803543091, "step": 1983} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 1983} {"info/global_step": 1984, "train_info/time_within_train_step": 2.643436908721924, "step": 1984} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 1984} {"info/global_step": 1985, "train_info/time_within_train_step": 2.660979747772217, "step": 1985} {"train_info/time_between_train_steps": 0.004474639892578125, "step": 1985} {"info/global_step": 1986, "train_info/time_within_train_step": 2.6601154804229736, "step": 1986} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 1986} {"info/global_step": 1987, "train_info/time_within_train_step": 2.672212600708008, "step": 1987} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 1987} {"info/global_step": 1988, "train_info/time_within_train_step": 2.6688482761383057, "step": 1988} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 1988} {"info/global_step": 1989, "train_info/time_within_train_step": 2.6954755783081055, "step": 1989} {"train_info/time_between_train_steps": 0.003204345703125, "step": 1989} {"info/global_step": 1990, "train_info/time_within_train_step": 2.64711594581604, "step": 1990} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 1990} {"info/global_step": 1991, "train_info/time_within_train_step": 2.652665376663208, "step": 1991} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 1991} {"info/global_step": 1992, "train_info/time_within_train_step": 2.6689679622650146, "step": 1992} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 1992} {"info/global_step": 1993, "train_info/time_within_train_step": 2.728776454925537, "step": 1993} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 1993} {"info/global_step": 1994, "train_info/time_within_train_step": 2.6703951358795166, "step": 1994} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 1994} {"info/global_step": 1995, "train_info/time_within_train_step": 2.6404824256896973, "step": 1995} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 1995} {"info/global_step": 1996, "train_info/time_within_train_step": 2.6409988403320312, "step": 1996} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 1996} {"info/global_step": 1997, "train_info/time_within_train_step": 2.659804582595825, "step": 1997} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 1997} {"info/global_step": 1998, "train_info/time_within_train_step": 2.6555416584014893, "step": 1998} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 1998} {"info/global_step": 1999, "train_info/time_within_train_step": 2.643099784851074, "step": 1999} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 1999} {"info/global_step": 2000, "train_info/time_within_train_step": 3.2568557262420654, "step": 2000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903019, "_runtime": 5617}, "step": 2000} {"logs": {"train/loss": 4.3075, "train/learning_rate": 0.0005333333333333333, "train/epoch": 2.03, "_timestamp": 1746903019, "_runtime": 5617}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903024, "_runtime": 5622}, "step": 2000} {"logs": {"eval/loss": 4.778219223022461, "eval/runtime": 5.1712, "eval/samples_per_second": 37.129, "eval/steps_per_second": 1.16, "train/epoch": 2.03, "_timestamp": 1746903024, "_runtime": 5622}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903024, "_runtime": 5622}, "step": 2000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.778219223022461, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 118.89244049815034, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1712, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.129, "train/epoch": 2.03, "_timestamp": 1746903024, "_runtime": 5622}, "step": 2000} {"train_info/time_between_train_steps": 18.43690538406372, "step": 2000} {"info/global_step": 2001, "train_info/time_within_train_step": 2.45688796043396, "step": 2001} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 2001} {"info/global_step": 2002, "train_info/time_within_train_step": 2.4684488773345947, "step": 2002} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 2002} {"info/global_step": 2003, "train_info/time_within_train_step": 2.6576836109161377, "step": 2003} {"train_info/time_between_train_steps": 0.0032651424407958984, "step": 2003} {"info/global_step": 2004, "train_info/time_within_train_step": 2.658285617828369, "step": 2004} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 2004} {"info/global_step": 2005, "train_info/time_within_train_step": 2.697594404220581, "step": 2005} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 2005} {"info/global_step": 2006, "train_info/time_within_train_step": 2.6398065090179443, "step": 2006} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 2006} {"info/global_step": 2007, "train_info/time_within_train_step": 2.6384315490722656, "step": 2007} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 2007} {"info/global_step": 2008, "train_info/time_within_train_step": 2.6653120517730713, "step": 2008} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 2008} {"info/global_step": 2009, "train_info/time_within_train_step": 2.6470630168914795, "step": 2009} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 2009} {"info/global_step": 2010, "train_info/time_within_train_step": 2.643282413482666, "step": 2010} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 2010} {"info/global_step": 2011, "train_info/time_within_train_step": 2.654366970062256, "step": 2011} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 2011} {"info/global_step": 2012, "train_info/time_within_train_step": 2.6515274047851562, "step": 2012} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 2012} {"info/global_step": 2013, "train_info/time_within_train_step": 2.6610846519470215, "step": 2013} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 2013} {"info/global_step": 2014, "train_info/time_within_train_step": 2.690549612045288, "step": 2014} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 2014} {"info/global_step": 2015, "train_info/time_within_train_step": 2.6617472171783447, "step": 2015} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 2015} {"info/global_step": 2016, "train_info/time_within_train_step": 2.642446756362915, "step": 2016} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 2016} {"info/global_step": 2017, "train_info/time_within_train_step": 2.6541218757629395, "step": 2017} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 2017} {"info/global_step": 2018, "train_info/time_within_train_step": 2.652799606323242, "step": 2018} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 2018} {"info/global_step": 2019, "train_info/time_within_train_step": 2.6555166244506836, "step": 2019} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 2019} {"info/global_step": 2020, "train_info/time_within_train_step": 2.6455278396606445, "step": 2020} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 2020} {"info/global_step": 2021, "train_info/time_within_train_step": 2.650155544281006, "step": 2021} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2021} {"info/global_step": 2022, "train_info/time_within_train_step": 2.6602365970611572, "step": 2022} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 2022} {"info/global_step": 2023, "train_info/time_within_train_step": 2.675306797027588, "step": 2023} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 2023} {"info/global_step": 2024, "train_info/time_within_train_step": 2.7112085819244385, "step": 2024} {"train_info/time_between_train_steps": 0.003173828125, "step": 2024} {"info/global_step": 2025, "train_info/time_within_train_step": 2.6506764888763428, "step": 2025} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 2025} {"info/global_step": 2026, "train_info/time_within_train_step": 2.671487808227539, "step": 2026} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 2026} {"info/global_step": 2027, "train_info/time_within_train_step": 2.6609432697296143, "step": 2027} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 2027} {"info/global_step": 2028, "train_info/time_within_train_step": 2.649543046951294, "step": 2028} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 2028} {"info/global_step": 2029, "train_info/time_within_train_step": 2.6460721492767334, "step": 2029} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 2029} {"info/global_step": 2030, "train_info/time_within_train_step": 2.672199010848999, "step": 2030} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 2030} {"info/global_step": 2031, "train_info/time_within_train_step": 2.6694271564483643, "step": 2031} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 2031} {"info/global_step": 2032, "train_info/time_within_train_step": 2.9122042655944824, "step": 2032} {"train_info/time_between_train_steps": 0.003271341323852539, "step": 2032} {"info/global_step": 2033, "train_info/time_within_train_step": 2.645275592803955, "step": 2033} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 2033} {"info/global_step": 2034, "train_info/time_within_train_step": 2.6712069511413574, "step": 2034} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 2034} {"info/global_step": 2035, "train_info/time_within_train_step": 2.6709580421447754, "step": 2035} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 2035} {"info/global_step": 2036, "train_info/time_within_train_step": 2.660696506500244, "step": 2036} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 2036} {"info/global_step": 2037, "train_info/time_within_train_step": 2.6814005374908447, "step": 2037} {"train_info/time_between_train_steps": 0.003246307373046875, "step": 2037} {"info/global_step": 2038, "train_info/time_within_train_step": 2.6467056274414062, "step": 2038} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 2038} {"info/global_step": 2039, "train_info/time_within_train_step": 2.761705160140991, "step": 2039} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 2039} {"info/global_step": 2040, "train_info/time_within_train_step": 2.6409904956817627, "step": 2040} {"train_info/time_between_train_steps": 0.003248929977416992, "step": 2040} {"info/global_step": 2041, "train_info/time_within_train_step": 2.648820638656616, "step": 2041} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 2041} {"info/global_step": 2042, "train_info/time_within_train_step": 2.6554877758026123, "step": 2042} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 2042} {"info/global_step": 2043, "train_info/time_within_train_step": 2.6736738681793213, "step": 2043} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 2043} {"info/global_step": 2044, "train_info/time_within_train_step": 2.6970930099487305, "step": 2044} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 2044} {"info/global_step": 2045, "train_info/time_within_train_step": 2.642653465270996, "step": 2045} {"train_info/time_between_train_steps": 0.003269672393798828, "step": 2045} {"info/global_step": 2046, "train_info/time_within_train_step": 2.6431446075439453, "step": 2046} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 2046} {"info/global_step": 2047, "train_info/time_within_train_step": 2.664832353591919, "step": 2047} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 2047} {"info/global_step": 2048, "train_info/time_within_train_step": 2.649940013885498, "step": 2048} {"train_info/time_between_train_steps": 0.0034279823303222656, "step": 2048} {"info/global_step": 2049, "train_info/time_within_train_step": 2.6446831226348877, "step": 2049} {"train_info/time_between_train_steps": 0.003777742385864258, "step": 2049} {"info/global_step": 2050, "train_info/time_within_train_step": 2.655431032180786, "step": 2050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903172, "_runtime": 5770}, "step": 2050} {"logs": {"train/loss": 4.292, "train/learning_rate": 0.00053, "train/epoch": 2.03, "_timestamp": 1746903172, "_runtime": 5770}, "step": 2050} {"train_info/time_between_train_steps": 0.02526092529296875, "step": 2050} {"info/global_step": 2051, "train_info/time_within_train_step": 2.661207914352417, "step": 2051} {"train_info/time_between_train_steps": 0.0039823055267333984, "step": 2051} {"info/global_step": 2052, "train_info/time_within_train_step": 2.654697895050049, "step": 2052} {"train_info/time_between_train_steps": 0.003922939300537109, "step": 2052} {"info/global_step": 2053, "train_info/time_within_train_step": 2.6627285480499268, "step": 2053} {"train_info/time_between_train_steps": 0.003611326217651367, "step": 2053} {"info/global_step": 2054, "train_info/time_within_train_step": 2.712559461593628, "step": 2054} {"train_info/time_between_train_steps": 0.003718852996826172, "step": 2054} {"info/global_step": 2055, "train_info/time_within_train_step": 2.698657751083374, "step": 2055} {"train_info/time_between_train_steps": 0.0036165714263916016, "step": 2055} {"info/global_step": 2056, "train_info/time_within_train_step": 2.6433377265930176, "step": 2056} {"train_info/time_between_train_steps": 0.003968238830566406, "step": 2056} {"info/global_step": 2057, "train_info/time_within_train_step": 2.642322540283203, "step": 2057} {"train_info/time_between_train_steps": 0.0036773681640625, "step": 2057} {"info/global_step": 2058, "train_info/time_within_train_step": 2.667236804962158, "step": 2058} {"train_info/time_between_train_steps": 0.003784656524658203, "step": 2058} {"info/global_step": 2059, "train_info/time_within_train_step": 2.64910888671875, "step": 2059} {"train_info/time_between_train_steps": 0.003622293472290039, "step": 2059} {"info/global_step": 2060, "train_info/time_within_train_step": 2.6446585655212402, "step": 2060} {"train_info/time_between_train_steps": 0.003778696060180664, "step": 2060} {"info/global_step": 2061, "train_info/time_within_train_step": 2.6502864360809326, "step": 2061} {"train_info/time_between_train_steps": 0.003816366195678711, "step": 2061} {"info/global_step": 2062, "train_info/time_within_train_step": 2.6462037563323975, "step": 2062} {"train_info/time_between_train_steps": 0.003573179244995117, "step": 2062} {"info/global_step": 2063, "train_info/time_within_train_step": 2.6692283153533936, "step": 2063} {"train_info/time_between_train_steps": 0.0036602020263671875, "step": 2063} {"info/global_step": 2064, "train_info/time_within_train_step": 2.670527219772339, "step": 2064} {"train_info/time_between_train_steps": 0.0037021636962890625, "step": 2064} {"info/global_step": 2065, "train_info/time_within_train_step": 2.6922247409820557, "step": 2065} {"train_info/time_between_train_steps": 0.003652334213256836, "step": 2065} {"info/global_step": 2066, "train_info/time_within_train_step": 2.651343584060669, "step": 2066} {"train_info/time_between_train_steps": 0.0037088394165039062, "step": 2066} {"info/global_step": 2067, "train_info/time_within_train_step": 2.6459484100341797, "step": 2067} {"train_info/time_between_train_steps": 0.0036039352416992188, "step": 2067} {"info/global_step": 2068, "train_info/time_within_train_step": 2.6561715602874756, "step": 2068} {"train_info/time_between_train_steps": 0.003545045852661133, "step": 2068} {"info/global_step": 2069, "train_info/time_within_train_step": 2.651383638381958, "step": 2069} {"train_info/time_between_train_steps": 0.0036869049072265625, "step": 2069} {"info/global_step": 2070, "train_info/time_within_train_step": 2.6510426998138428, "step": 2070} {"train_info/time_between_train_steps": 0.003629446029663086, "step": 2070} {"info/global_step": 2071, "train_info/time_within_train_step": 2.6440131664276123, "step": 2071} {"train_info/time_between_train_steps": 0.003715991973876953, "step": 2071} {"info/global_step": 2072, "train_info/time_within_train_step": 2.648465633392334, "step": 2072} {"train_info/time_between_train_steps": 0.0036003589630126953, "step": 2072} {"info/global_step": 2073, "train_info/time_within_train_step": 2.671076774597168, "step": 2073} {"train_info/time_between_train_steps": 0.0037424564361572266, "step": 2073} {"info/global_step": 2074, "train_info/time_within_train_step": 2.6712048053741455, "step": 2074} {"train_info/time_between_train_steps": 0.0037424564361572266, "step": 2074} {"info/global_step": 2075, "train_info/time_within_train_step": 3.0694596767425537, "step": 2075} {"train_info/time_between_train_steps": 0.003266572952270508, "step": 2075} {"info/global_step": 2076, "train_info/time_within_train_step": 2.6587772369384766, "step": 2076} {"train_info/time_between_train_steps": 0.0035517215728759766, "step": 2076} {"info/global_step": 2077, "train_info/time_within_train_step": 2.6442313194274902, "step": 2077} {"train_info/time_between_train_steps": 0.003457784652709961, "step": 2077} {"info/global_step": 2078, "train_info/time_within_train_step": 2.6585235595703125, "step": 2078} {"train_info/time_between_train_steps": 0.003453493118286133, "step": 2078} {"info/global_step": 2079, "train_info/time_within_train_step": 2.6656599044799805, "step": 2079} {"train_info/time_between_train_steps": 0.0034132003784179688, "step": 2079} {"info/global_step": 2080, "train_info/time_within_train_step": 2.6685891151428223, "step": 2080} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 2080} {"info/global_step": 2081, "train_info/time_within_train_step": 2.6881697177886963, "step": 2081} {"train_info/time_between_train_steps": 0.0034503936767578125, "step": 2081} {"info/global_step": 2082, "train_info/time_within_train_step": 2.6523964405059814, "step": 2082} {"train_info/time_between_train_steps": 0.003415346145629883, "step": 2082} {"info/global_step": 2083, "train_info/time_within_train_step": 2.684802293777466, "step": 2083} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 2083} {"info/global_step": 2084, "train_info/time_within_train_step": 2.6421732902526855, "step": 2084} {"train_info/time_between_train_steps": 0.0035185813903808594, "step": 2084} {"info/global_step": 2085, "train_info/time_within_train_step": 2.6597626209259033, "step": 2085} {"train_info/time_between_train_steps": 0.0035855770111083984, "step": 2085} {"info/global_step": 2086, "train_info/time_within_train_step": 2.660825490951538, "step": 2086} {"train_info/time_between_train_steps": 0.0035953521728515625, "step": 2086} {"info/global_step": 2087, "train_info/time_within_train_step": 2.6745810508728027, "step": 2087} {"train_info/time_between_train_steps": 0.003579378128051758, "step": 2087} {"info/global_step": 2088, "train_info/time_within_train_step": 2.66646409034729, "step": 2088} {"train_info/time_between_train_steps": 0.0035288333892822266, "step": 2088} {"info/global_step": 2089, "train_info/time_within_train_step": 2.704723596572876, "step": 2089} {"train_info/time_between_train_steps": 0.003525972366333008, "step": 2089} {"info/global_step": 2090, "train_info/time_within_train_step": 2.65419864654541, "step": 2090} {"train_info/time_between_train_steps": 0.0034780502319335938, "step": 2090} {"info/global_step": 2091, "train_info/time_within_train_step": 2.6487839221954346, "step": 2091} {"train_info/time_between_train_steps": 0.003527402877807617, "step": 2091} {"info/global_step": 2092, "train_info/time_within_train_step": 2.653974771499634, "step": 2092} {"train_info/time_between_train_steps": 0.003512144088745117, "step": 2092} {"info/global_step": 2093, "train_info/time_within_train_step": 2.653071641921997, "step": 2093} {"train_info/time_between_train_steps": 0.0034379959106445312, "step": 2093} {"info/global_step": 2094, "train_info/time_within_train_step": 2.655221462249756, "step": 2094} {"train_info/time_between_train_steps": 0.0034852027893066406, "step": 2094} {"info/global_step": 2095, "train_info/time_within_train_step": 2.6632633209228516, "step": 2095} {"train_info/time_between_train_steps": 0.0034351348876953125, "step": 2095} {"info/global_step": 2096, "train_info/time_within_train_step": 2.682223320007324, "step": 2096} {"train_info/time_between_train_steps": 0.0035576820373535156, "step": 2096} {"info/global_step": 2097, "train_info/time_within_train_step": 2.7369544506073, "step": 2097} {"train_info/time_between_train_steps": 0.003579854965209961, "step": 2097} {"info/global_step": 2098, "train_info/time_within_train_step": 2.6728498935699463, "step": 2098} {"train_info/time_between_train_steps": 0.0035042762756347656, "step": 2098} {"info/global_step": 2099, "train_info/time_within_train_step": 2.6449227333068848, "step": 2099} {"train_info/time_between_train_steps": 0.003545522689819336, "step": 2099} {"info/global_step": 2100, "train_info/time_within_train_step": 2.6512563228607178, "step": 2100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903306, "_runtime": 5904}, "step": 2100} {"logs": {"train/loss": 4.2619, "train/learning_rate": 0.0005266666666666666, "train/epoch": 2.04, "_timestamp": 1746903306, "_runtime": 5904}, "step": 2100} {"train_info/time_between_train_steps": 0.0246427059173584, "step": 2100} {"info/global_step": 2101, "train_info/time_within_train_step": 2.660689115524292, "step": 2101} {"train_info/time_between_train_steps": 0.16617536544799805, "step": 2101} {"info/global_step": 2102, "train_info/time_within_train_step": 2.643540620803833, "step": 2102} {"train_info/time_between_train_steps": 0.0033860206604003906, "step": 2102} {"info/global_step": 2103, "train_info/time_within_train_step": 2.660963296890259, "step": 2103} {"train_info/time_between_train_steps": 0.0033919811248779297, "step": 2103} {"info/global_step": 2104, "train_info/time_within_train_step": 2.653587818145752, "step": 2104} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 2104} {"info/global_step": 2105, "train_info/time_within_train_step": 2.643265962600708, "step": 2105} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 2105} {"info/global_step": 2106, "train_info/time_within_train_step": 2.653442144393921, "step": 2106} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 2106} {"info/global_step": 2107, "train_info/time_within_train_step": 2.6483561992645264, "step": 2107} {"train_info/time_between_train_steps": 0.0034706592559814453, "step": 2107} {"info/global_step": 2108, "train_info/time_within_train_step": 2.6718053817749023, "step": 2108} {"train_info/time_between_train_steps": 0.003654003143310547, "step": 2108} {"info/global_step": 2109, "train_info/time_within_train_step": 2.6902923583984375, "step": 2109} {"train_info/time_between_train_steps": 0.0034339427947998047, "step": 2109} {"info/global_step": 2110, "train_info/time_within_train_step": 2.680159091949463, "step": 2110} {"train_info/time_between_train_steps": 0.0035123825073242188, "step": 2110} {"info/global_step": 2111, "train_info/time_within_train_step": 2.658869743347168, "step": 2111} {"train_info/time_between_train_steps": 0.0036296844482421875, "step": 2111} {"info/global_step": 2112, "train_info/time_within_train_step": 2.643009901046753, "step": 2112} {"train_info/time_between_train_steps": 0.003526926040649414, "step": 2112} {"info/global_step": 2113, "train_info/time_within_train_step": 2.6600401401519775, "step": 2113} {"train_info/time_between_train_steps": 0.003608226776123047, "step": 2113} {"info/global_step": 2114, "train_info/time_within_train_step": 2.654902458190918, "step": 2114} {"train_info/time_between_train_steps": 0.003559112548828125, "step": 2114} {"info/global_step": 2115, "train_info/time_within_train_step": 2.647223472595215, "step": 2115} {"train_info/time_between_train_steps": 0.004018306732177734, "step": 2115} {"info/global_step": 2116, "train_info/time_within_train_step": 2.648022413253784, "step": 2116} {"train_info/time_between_train_steps": 0.0035104751586914062, "step": 2116} {"info/global_step": 2117, "train_info/time_within_train_step": 2.6564948558807373, "step": 2117} {"train_info/time_between_train_steps": 0.0035414695739746094, "step": 2117} {"info/global_step": 2118, "train_info/time_within_train_step": 2.6745553016662598, "step": 2118} {"train_info/time_between_train_steps": 0.0035457611083984375, "step": 2118} {"info/global_step": 2119, "train_info/time_within_train_step": 2.677811861038208, "step": 2119} {"train_info/time_between_train_steps": 0.0035715103149414062, "step": 2119} {"info/global_step": 2120, "train_info/time_within_train_step": 2.653810501098633, "step": 2120} {"train_info/time_between_train_steps": 0.0036056041717529297, "step": 2120} {"info/global_step": 2121, "train_info/time_within_train_step": 2.691767692565918, "step": 2121} {"train_info/time_between_train_steps": 0.003529071807861328, "step": 2121} {"info/global_step": 2122, "train_info/time_within_train_step": 2.6410951614379883, "step": 2122} {"train_info/time_between_train_steps": 0.0034668445587158203, "step": 2122} {"info/global_step": 2123, "train_info/time_within_train_step": 2.6537039279937744, "step": 2123} {"train_info/time_between_train_steps": 0.003503084182739258, "step": 2123} {"info/global_step": 2124, "train_info/time_within_train_step": 2.6612777709960938, "step": 2124} {"train_info/time_between_train_steps": 0.003469228744506836, "step": 2124} {"info/global_step": 2125, "train_info/time_within_train_step": 2.6450347900390625, "step": 2125} {"train_info/time_between_train_steps": 0.0035109519958496094, "step": 2125} {"info/global_step": 2126, "train_info/time_within_train_step": 2.6445107460021973, "step": 2126} {"train_info/time_between_train_steps": 0.0034818649291992188, "step": 2126} {"info/global_step": 2127, "train_info/time_within_train_step": 2.6819875240325928, "step": 2127} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 2127} {"info/global_step": 2128, "train_info/time_within_train_step": 2.6404876708984375, "step": 2128} {"train_info/time_between_train_steps": 0.003487825393676758, "step": 2128} {"info/global_step": 2129, "train_info/time_within_train_step": 2.64267897605896, "step": 2129} {"train_info/time_between_train_steps": 0.0034830570220947266, "step": 2129} {"info/global_step": 2130, "train_info/time_within_train_step": 2.673135995864868, "step": 2130} {"train_info/time_between_train_steps": 0.003561258316040039, "step": 2130} {"info/global_step": 2131, "train_info/time_within_train_step": 2.648726463317871, "step": 2131} {"train_info/time_between_train_steps": 0.003589153289794922, "step": 2131} {"info/global_step": 2132, "train_info/time_within_train_step": 2.644918441772461, "step": 2132} {"train_info/time_between_train_steps": 0.0034558773040771484, "step": 2132} {"info/global_step": 2133, "train_info/time_within_train_step": 2.653808116912842, "step": 2133} {"train_info/time_between_train_steps": 0.0034942626953125, "step": 2133} {"info/global_step": 2134, "train_info/time_within_train_step": 2.6532514095306396, "step": 2134} {"train_info/time_between_train_steps": 0.0036029815673828125, "step": 2134} {"info/global_step": 2135, "train_info/time_within_train_step": 2.660645008087158, "step": 2135} {"train_info/time_between_train_steps": 0.003463268280029297, "step": 2135} {"info/global_step": 2136, "train_info/time_within_train_step": 2.6841304302215576, "step": 2136} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 2136} {"info/global_step": 2137, "train_info/time_within_train_step": 2.6441497802734375, "step": 2137} {"train_info/time_between_train_steps": 0.0035257339477539062, "step": 2137} {"info/global_step": 2138, "train_info/time_within_train_step": 2.654449462890625, "step": 2138} {"train_info/time_between_train_steps": 0.0035390853881835938, "step": 2138} {"info/global_step": 2139, "train_info/time_within_train_step": 2.648221254348755, "step": 2139} {"train_info/time_between_train_steps": 0.003759145736694336, "step": 2139} {"info/global_step": 2140, "train_info/time_within_train_step": 2.683631420135498, "step": 2140} {"train_info/time_between_train_steps": 0.0037386417388916016, "step": 2140} {"info/global_step": 2141, "train_info/time_within_train_step": 2.647076368331909, "step": 2141} {"train_info/time_between_train_steps": 0.003763437271118164, "step": 2141} {"info/global_step": 2142, "train_info/time_within_train_step": 2.6484146118164062, "step": 2142} {"train_info/time_between_train_steps": 0.003643512725830078, "step": 2142} {"info/global_step": 2143, "train_info/time_within_train_step": 2.6470515727996826, "step": 2143} {"train_info/time_between_train_steps": 0.003674745559692383, "step": 2143} {"info/global_step": 2144, "train_info/time_within_train_step": 2.6491692066192627, "step": 2144} {"train_info/time_between_train_steps": 0.0034933090209960938, "step": 2144} {"info/global_step": 2145, "train_info/time_within_train_step": 2.669261932373047, "step": 2145} {"train_info/time_between_train_steps": 0.003450632095336914, "step": 2145} {"info/global_step": 2146, "train_info/time_within_train_step": 2.6736972332000732, "step": 2146} {"train_info/time_between_train_steps": 0.003503084182739258, "step": 2146} {"info/global_step": 2147, "train_info/time_within_train_step": 2.646176338195801, "step": 2147} {"train_info/time_between_train_steps": 0.00344085693359375, "step": 2147} {"info/global_step": 2148, "train_info/time_within_train_step": 2.649949312210083, "step": 2148} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 2148} {"info/global_step": 2149, "train_info/time_within_train_step": 2.644843578338623, "step": 2149} {"train_info/time_between_train_steps": 0.003451824188232422, "step": 2149} {"info/global_step": 2150, "train_info/time_within_train_step": 2.66878080368042, "step": 2150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903441, "_runtime": 6039}, "step": 2150} {"logs": {"train/loss": 4.2555, "train/learning_rate": 0.0005233333333333333, "train/epoch": 2.04, "_timestamp": 1746903441, "_runtime": 6039}, "step": 2150} {"train_info/time_between_train_steps": 0.02587413787841797, "step": 2150} {"info/global_step": 2151, "train_info/time_within_train_step": 2.670529842376709, "step": 2151} {"train_info/time_between_train_steps": 0.003472566604614258, "step": 2151} {"info/global_step": 2152, "train_info/time_within_train_step": 2.6840405464172363, "step": 2152} {"train_info/time_between_train_steps": 0.003480195999145508, "step": 2152} {"info/global_step": 2153, "train_info/time_within_train_step": 2.697006940841675, "step": 2153} {"train_info/time_between_train_steps": 0.0034487247467041016, "step": 2153} {"info/global_step": 2154, "train_info/time_within_train_step": 2.648171901702881, "step": 2154} {"train_info/time_between_train_steps": 0.0034723281860351562, "step": 2154} {"info/global_step": 2155, "train_info/time_within_train_step": 2.64483904838562, "step": 2155} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 2155} {"info/global_step": 2156, "train_info/time_within_train_step": 2.6545987129211426, "step": 2156} {"train_info/time_between_train_steps": 0.0034477710723876953, "step": 2156} {"info/global_step": 2157, "train_info/time_within_train_step": 2.652740240097046, "step": 2157} {"train_info/time_between_train_steps": 0.003599405288696289, "step": 2157} {"info/global_step": 2158, "train_info/time_within_train_step": 2.6505746841430664, "step": 2158} {"train_info/time_between_train_steps": 0.003396272659301758, "step": 2158} {"info/global_step": 2159, "train_info/time_within_train_step": 2.645320177078247, "step": 2159} {"train_info/time_between_train_steps": 0.0034580230712890625, "step": 2159} {"info/global_step": 2160, "train_info/time_within_train_step": 2.649662494659424, "step": 2160} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 2160} {"info/global_step": 2161, "train_info/time_within_train_step": 2.6616203784942627, "step": 2161} {"train_info/time_between_train_steps": 0.003355264663696289, "step": 2161} {"info/global_step": 2162, "train_info/time_within_train_step": 2.6818535327911377, "step": 2162} {"train_info/time_between_train_steps": 0.0034673213958740234, "step": 2162} {"info/global_step": 2163, "train_info/time_within_train_step": 2.642298936843872, "step": 2163} {"train_info/time_between_train_steps": 0.003415822982788086, "step": 2163} {"info/global_step": 2164, "train_info/time_within_train_step": 2.771153450012207, "step": 2164} {"train_info/time_between_train_steps": 0.0032639503479003906, "step": 2164} {"info/global_step": 2165, "train_info/time_within_train_step": 2.6417245864868164, "step": 2165} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 2165} {"info/global_step": 2166, "train_info/time_within_train_step": 2.6493237018585205, "step": 2166} {"train_info/time_between_train_steps": 0.00341033935546875, "step": 2166} {"info/global_step": 2167, "train_info/time_within_train_step": 2.66412091255188, "step": 2167} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 2167} {"info/global_step": 2168, "train_info/time_within_train_step": 2.647611618041992, "step": 2168} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 2168} {"info/global_step": 2169, "train_info/time_within_train_step": 2.645253896713257, "step": 2169} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 2169} {"info/global_step": 2170, "train_info/time_within_train_step": 2.6653378009796143, "step": 2170} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 2170} {"info/global_step": 2171, "train_info/time_within_train_step": 2.661362886428833, "step": 2171} {"train_info/time_between_train_steps": 0.0033020973205566406, "step": 2171} {"info/global_step": 2172, "train_info/time_within_train_step": 2.9872641563415527, "step": 2172} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 2172} {"info/global_step": 2173, "train_info/time_within_train_step": 2.648634433746338, "step": 2173} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 2173} {"info/global_step": 2174, "train_info/time_within_train_step": 2.644238233566284, "step": 2174} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 2174} {"info/global_step": 2175, "train_info/time_within_train_step": 2.6655094623565674, "step": 2175} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 2175} {"info/global_step": 2176, "train_info/time_within_train_step": 2.6591172218322754, "step": 2176} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 2176} {"info/global_step": 2177, "train_info/time_within_train_step": 2.667217969894409, "step": 2177} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 2177} {"info/global_step": 2178, "train_info/time_within_train_step": 2.6798951625823975, "step": 2178} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 2178} {"info/global_step": 2179, "train_info/time_within_train_step": 2.666195869445801, "step": 2179} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 2179} {"info/global_step": 2180, "train_info/time_within_train_step": 2.64530348777771, "step": 2180} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2180} {"info/global_step": 2181, "train_info/time_within_train_step": 2.6427581310272217, "step": 2181} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 2181} {"info/global_step": 2182, "train_info/time_within_train_step": 2.654453754425049, "step": 2182} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 2182} {"info/global_step": 2183, "train_info/time_within_train_step": 2.6544809341430664, "step": 2183} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 2183} {"info/global_step": 2184, "train_info/time_within_train_step": 2.645491361618042, "step": 2184} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 2184} {"info/global_step": 2185, "train_info/time_within_train_step": 2.6551244258880615, "step": 2185} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 2185} {"info/global_step": 2186, "train_info/time_within_train_step": 2.6573283672332764, "step": 2186} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 2186} {"info/global_step": 2187, "train_info/time_within_train_step": 2.671265125274658, "step": 2187} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 2187} {"info/global_step": 2188, "train_info/time_within_train_step": 2.7282769680023193, "step": 2188} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 2188} {"info/global_step": 2189, "train_info/time_within_train_step": 2.665527582168579, "step": 2189} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 2189} {"info/global_step": 2190, "train_info/time_within_train_step": 2.647110939025879, "step": 2190} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 2190} {"info/global_step": 2191, "train_info/time_within_train_step": 2.6623377799987793, "step": 2191} {"train_info/time_between_train_steps": 0.00672149658203125, "step": 2191} {"info/global_step": 2192, "train_info/time_within_train_step": 2.662288188934326, "step": 2192} {"train_info/time_between_train_steps": 0.0066699981689453125, "step": 2192} {"info/global_step": 2193, "train_info/time_within_train_step": 2.6673429012298584, "step": 2193} {"train_info/time_between_train_steps": 0.0033850669860839844, "step": 2193} {"info/global_step": 2194, "train_info/time_within_train_step": 2.6590166091918945, "step": 2194} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 2194} {"info/global_step": 2195, "train_info/time_within_train_step": 2.647596836090088, "step": 2195} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 2195} {"info/global_step": 2196, "train_info/time_within_train_step": 2.6729767322540283, "step": 2196} {"train_info/time_between_train_steps": 0.003463268280029297, "step": 2196} {"info/global_step": 2197, "train_info/time_within_train_step": 2.674379825592041, "step": 2197} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 2197} {"info/global_step": 2198, "train_info/time_within_train_step": 2.7000367641448975, "step": 2198} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 2198} {"info/global_step": 2199, "train_info/time_within_train_step": 2.6534688472747803, "step": 2199} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 2199} {"info/global_step": 2200, "train_info/time_within_train_step": 2.648249864578247, "step": 2200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903576, "_runtime": 6174}, "step": 2200} {"logs": {"train/loss": 4.2472, "train/learning_rate": 0.00052, "train/epoch": 2.05, "_timestamp": 1746903576, "_runtime": 6174}, "step": 2200} {"train_info/time_between_train_steps": 13.171848773956299, "step": 2200} {"info/global_step": 2201, "train_info/time_within_train_step": 2.4443674087524414, "step": 2201} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 2201} {"info/global_step": 2202, "train_info/time_within_train_step": 2.485534191131592, "step": 2202} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 2202} {"info/global_step": 2203, "train_info/time_within_train_step": 2.647484064102173, "step": 2203} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 2203} {"info/global_step": 2204, "train_info/time_within_train_step": 2.645840883255005, "step": 2204} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 2204} {"info/global_step": 2205, "train_info/time_within_train_step": 2.6479744911193848, "step": 2205} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 2205} {"info/global_step": 2206, "train_info/time_within_train_step": 2.6597325801849365, "step": 2206} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 2206} {"info/global_step": 2207, "train_info/time_within_train_step": 2.6533262729644775, "step": 2207} {"train_info/time_between_train_steps": 0.0032651424407958984, "step": 2207} {"info/global_step": 2208, "train_info/time_within_train_step": 2.659532308578491, "step": 2208} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 2208} {"info/global_step": 2209, "train_info/time_within_train_step": 2.7001867294311523, "step": 2209} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 2209} {"info/global_step": 2210, "train_info/time_within_train_step": 2.7016665935516357, "step": 2210} {"train_info/time_between_train_steps": 0.0032787322998046875, "step": 2210} {"info/global_step": 2211, "train_info/time_within_train_step": 2.642345905303955, "step": 2211} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 2211} {"info/global_step": 2212, "train_info/time_within_train_step": 2.6430001258850098, "step": 2212} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 2212} {"info/global_step": 2213, "train_info/time_within_train_step": 2.666449546813965, "step": 2213} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 2213} {"info/global_step": 2214, "train_info/time_within_train_step": 2.6494219303131104, "step": 2214} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 2214} {"info/global_step": 2215, "train_info/time_within_train_step": 2.6472480297088623, "step": 2215} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 2215} {"info/global_step": 2216, "train_info/time_within_train_step": 2.6503095626831055, "step": 2216} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 2216} {"info/global_step": 2217, "train_info/time_within_train_step": 2.6449732780456543, "step": 2217} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 2217} {"info/global_step": 2218, "train_info/time_within_train_step": 2.669792413711548, "step": 2218} {"train_info/time_between_train_steps": 0.003259420394897461, "step": 2218} {"info/global_step": 2219, "train_info/time_within_train_step": 2.6600441932678223, "step": 2219} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 2219} {"info/global_step": 2220, "train_info/time_within_train_step": 2.6527700424194336, "step": 2220} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 2220} {"info/global_step": 2221, "train_info/time_within_train_step": 2.6649277210235596, "step": 2221} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 2221} {"info/global_step": 2222, "train_info/time_within_train_step": 2.6706337928771973, "step": 2222} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 2222} {"info/global_step": 2223, "train_info/time_within_train_step": 2.682466506958008, "step": 2223} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 2223} {"info/global_step": 2224, "train_info/time_within_train_step": 2.6552679538726807, "step": 2224} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 2224} {"info/global_step": 2225, "train_info/time_within_train_step": 2.689689874649048, "step": 2225} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 2225} {"info/global_step": 2226, "train_info/time_within_train_step": 2.6473515033721924, "step": 2226} {"train_info/time_between_train_steps": 0.10913658142089844, "step": 2226} {"info/global_step": 2227, "train_info/time_within_train_step": 2.6871113777160645, "step": 2227} {"train_info/time_between_train_steps": 0.0032787322998046875, "step": 2227} {"info/global_step": 2228, "train_info/time_within_train_step": 2.642889976501465, "step": 2228} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 2228} {"info/global_step": 2229, "train_info/time_within_train_step": 2.650054693222046, "step": 2229} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 2229} {"info/global_step": 2230, "train_info/time_within_train_step": 2.6631217002868652, "step": 2230} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 2230} {"info/global_step": 2231, "train_info/time_within_train_step": 2.6450893878936768, "step": 2231} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 2231} {"info/global_step": 2232, "train_info/time_within_train_step": 2.6461896896362305, "step": 2232} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 2232} {"info/global_step": 2233, "train_info/time_within_train_step": 2.6545562744140625, "step": 2233} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 2233} {"info/global_step": 2234, "train_info/time_within_train_step": 2.6608386039733887, "step": 2234} {"train_info/time_between_train_steps": 0.003290414810180664, "step": 2234} {"info/global_step": 2235, "train_info/time_within_train_step": 2.6757702827453613, "step": 2235} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 2235} {"info/global_step": 2236, "train_info/time_within_train_step": 2.6748692989349365, "step": 2236} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 2236} {"info/global_step": 2237, "train_info/time_within_train_step": 2.7068333625793457, "step": 2237} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 2237} {"info/global_step": 2238, "train_info/time_within_train_step": 2.6442906856536865, "step": 2238} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 2238} {"info/global_step": 2239, "train_info/time_within_train_step": 2.649625301361084, "step": 2239} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 2239} {"info/global_step": 2240, "train_info/time_within_train_step": 2.6603729724884033, "step": 2240} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 2240} {"info/global_step": 2241, "train_info/time_within_train_step": 2.643045663833618, "step": 2241} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 2241} {"info/global_step": 2242, "train_info/time_within_train_step": 2.6465048789978027, "step": 2242} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 2242} {"info/global_step": 2243, "train_info/time_within_train_step": 2.659802198410034, "step": 2243} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2243} {"info/global_step": 2244, "train_info/time_within_train_step": 2.655336618423462, "step": 2244} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 2244} {"info/global_step": 2245, "train_info/time_within_train_step": 2.660994529724121, "step": 2245} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 2245} {"info/global_step": 2246, "train_info/time_within_train_step": 2.709972620010376, "step": 2246} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 2246} {"info/global_step": 2247, "train_info/time_within_train_step": 2.7166290283203125, "step": 2247} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 2247} {"info/global_step": 2248, "train_info/time_within_train_step": 2.9495253562927246, "step": 2248} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 2248} {"info/global_step": 2249, "train_info/time_within_train_step": 2.653773546218872, "step": 2249} {"train_info/time_between_train_steps": 0.003489971160888672, "step": 2249} {"info/global_step": 2250, "train_info/time_within_train_step": 3.2671918869018555, "step": 2250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903724, "_runtime": 6322}, "step": 2250} {"logs": {"train/loss": 4.22, "train/learning_rate": 0.0005166666666666667, "train/epoch": 2.05, "_timestamp": 1746903724, "_runtime": 6322}, "step": 2250} {"train_info/time_between_train_steps": 0.025299787521362305, "step": 2250} {"info/global_step": 2251, "train_info/time_within_train_step": 2.708041191101074, "step": 2251} {"train_info/time_between_train_steps": 0.0034677982330322266, "step": 2251} {"info/global_step": 2252, "train_info/time_within_train_step": 2.6495091915130615, "step": 2252} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 2252} {"info/global_step": 2253, "train_info/time_within_train_step": 2.6478939056396484, "step": 2253} {"train_info/time_between_train_steps": 0.0035054683685302734, "step": 2253} {"info/global_step": 2254, "train_info/time_within_train_step": 2.651444911956787, "step": 2254} {"train_info/time_between_train_steps": 0.0034818649291992188, "step": 2254} {"info/global_step": 2255, "train_info/time_within_train_step": 2.64979887008667, "step": 2255} {"train_info/time_between_train_steps": 0.0034263134002685547, "step": 2255} {"info/global_step": 2256, "train_info/time_within_train_step": 2.6506574153900146, "step": 2256} {"train_info/time_between_train_steps": 0.003444194793701172, "step": 2256} {"info/global_step": 2257, "train_info/time_within_train_step": 2.6465768814086914, "step": 2257} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 2257} {"info/global_step": 2258, "train_info/time_within_train_step": 2.6639254093170166, "step": 2258} {"train_info/time_between_train_steps": 0.0034089088439941406, "step": 2258} {"info/global_step": 2259, "train_info/time_within_train_step": 2.6573169231414795, "step": 2259} {"train_info/time_between_train_steps": 0.0035467147827148438, "step": 2259} {"info/global_step": 2260, "train_info/time_within_train_step": 2.6672585010528564, "step": 2260} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 2260} {"info/global_step": 2261, "train_info/time_within_train_step": 2.723606824874878, "step": 2261} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 2261} {"info/global_step": 2262, "train_info/time_within_train_step": 2.68985915184021, "step": 2262} {"train_info/time_between_train_steps": 0.0034973621368408203, "step": 2262} {"info/global_step": 2263, "train_info/time_within_train_step": 2.6422927379608154, "step": 2263} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 2263} {"info/global_step": 2264, "train_info/time_within_train_step": 2.6436524391174316, "step": 2264} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 2264} {"info/global_step": 2265, "train_info/time_within_train_step": 2.659679889678955, "step": 2265} {"train_info/time_between_train_steps": 0.0034055709838867188, "step": 2265} {"info/global_step": 2266, "train_info/time_within_train_step": 2.655714988708496, "step": 2266} {"train_info/time_between_train_steps": 0.0034685134887695312, "step": 2266} {"info/global_step": 2267, "train_info/time_within_train_step": 2.6474530696868896, "step": 2267} {"train_info/time_between_train_steps": 0.0034608840942382812, "step": 2267} {"info/global_step": 2268, "train_info/time_within_train_step": 2.652541160583496, "step": 2268} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 2268} {"info/global_step": 2269, "train_info/time_within_train_step": 2.651930093765259, "step": 2269} {"train_info/time_between_train_steps": 0.003525257110595703, "step": 2269} {"info/global_step": 2270, "train_info/time_within_train_step": 2.67091703414917, "step": 2270} {"train_info/time_between_train_steps": 0.003491640090942383, "step": 2270} {"info/global_step": 2271, "train_info/time_within_train_step": 2.6964428424835205, "step": 2271} {"train_info/time_between_train_steps": 0.0034487247467041016, "step": 2271} {"info/global_step": 2272, "train_info/time_within_train_step": 2.669796943664551, "step": 2272} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 2272} {"info/global_step": 2273, "train_info/time_within_train_step": 2.660214424133301, "step": 2273} {"train_info/time_between_train_steps": 0.0036172866821289062, "step": 2273} {"info/global_step": 2274, "train_info/time_within_train_step": 2.6427409648895264, "step": 2274} {"train_info/time_between_train_steps": 0.003508329391479492, "step": 2274} {"info/global_step": 2275, "train_info/time_within_train_step": 2.6631338596343994, "step": 2275} {"train_info/time_between_train_steps": 0.003509044647216797, "step": 2275} {"info/global_step": 2276, "train_info/time_within_train_step": 2.6557064056396484, "step": 2276} {"train_info/time_between_train_steps": 0.0036020278930664062, "step": 2276} {"info/global_step": 2277, "train_info/time_within_train_step": 2.6925301551818848, "step": 2277} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 2277} {"info/global_step": 2278, "train_info/time_within_train_step": 2.667201042175293, "step": 2278} {"train_info/time_between_train_steps": 0.003099203109741211, "step": 2278} {"info/global_step": 2279, "train_info/time_within_train_step": 2.6663756370544434, "step": 2279} {"train_info/time_between_train_steps": 0.0031104087829589844, "step": 2279} {"info/global_step": 2280, "train_info/time_within_train_step": 2.672877311706543, "step": 2280} {"train_info/time_between_train_steps": 0.003094196319580078, "step": 2280} {"info/global_step": 2281, "train_info/time_within_train_step": 2.647207260131836, "step": 2281} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 2281} {"info/global_step": 2282, "train_info/time_within_train_step": 2.6554653644561768, "step": 2282} {"train_info/time_between_train_steps": 0.0030906200408935547, "step": 2282} {"info/global_step": 2283, "train_info/time_within_train_step": 2.656644582748413, "step": 2283} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 2283} {"info/global_step": 2284, "train_info/time_within_train_step": 2.6442389488220215, "step": 2284} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 2284} {"info/global_step": 2285, "train_info/time_within_train_step": 2.6470701694488525, "step": 2285} {"train_info/time_between_train_steps": 0.0030813217163085938, "step": 2285} {"info/global_step": 2286, "train_info/time_within_train_step": 2.647784471511841, "step": 2286} {"train_info/time_between_train_steps": 0.0031104087829589844, "step": 2286} {"info/global_step": 2287, "train_info/time_within_train_step": 2.6649229526519775, "step": 2287} {"train_info/time_between_train_steps": 0.003109455108642578, "step": 2287} {"info/global_step": 2288, "train_info/time_within_train_step": 2.6642708778381348, "step": 2288} {"train_info/time_between_train_steps": 0.0030989646911621094, "step": 2288} {"info/global_step": 2289, "train_info/time_within_train_step": 2.6561920642852783, "step": 2289} {"train_info/time_between_train_steps": 0.0030803680419921875, "step": 2289} {"info/global_step": 2290, "train_info/time_within_train_step": 2.7073655128479004, "step": 2290} {"train_info/time_between_train_steps": 0.003082752227783203, "step": 2290} {"info/global_step": 2291, "train_info/time_within_train_step": 2.646623373031616, "step": 2291} {"train_info/time_between_train_steps": 0.0030765533447265625, "step": 2291} {"info/global_step": 2292, "train_info/time_within_train_step": 2.6432526111602783, "step": 2292} {"train_info/time_between_train_steps": 0.003103017807006836, "step": 2292} {"info/global_step": 2293, "train_info/time_within_train_step": 2.656609296798706, "step": 2293} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 2293} {"info/global_step": 2294, "train_info/time_within_train_step": 2.65394926071167, "step": 2294} {"train_info/time_between_train_steps": 0.0031015872955322266, "step": 2294} {"info/global_step": 2295, "train_info/time_within_train_step": 2.644282341003418, "step": 2295} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 2295} {"info/global_step": 2296, "train_info/time_within_train_step": 2.6564671993255615, "step": 2296} {"train_info/time_between_train_steps": 0.003105640411376953, "step": 2296} {"info/global_step": 2297, "train_info/time_within_train_step": 2.6526358127593994, "step": 2297} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 2297} {"info/global_step": 2298, "train_info/time_within_train_step": 2.664395809173584, "step": 2298} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 2298} {"info/global_step": 2299, "train_info/time_within_train_step": 2.724860906600952, "step": 2299} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 2299} {"info/global_step": 2300, "train_info/time_within_train_step": 2.6771960258483887, "step": 2300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903859, "_runtime": 6457}, "step": 2300} {"logs": {"train/loss": 4.2107, "train/learning_rate": 0.0005133333333333333, "train/epoch": 2.06, "_timestamp": 1746903859, "_runtime": 6457}, "step": 2300} {"train_info/time_between_train_steps": 0.03091716766357422, "step": 2300} {"info/global_step": 2301, "train_info/time_within_train_step": 2.6408331394195557, "step": 2301} {"train_info/time_between_train_steps": 0.0030596256256103516, "step": 2301} {"info/global_step": 2302, "train_info/time_within_train_step": 2.642218589782715, "step": 2302} {"train_info/time_between_train_steps": 0.0031006336212158203, "step": 2302} {"info/global_step": 2303, "train_info/time_within_train_step": 2.665255069732666, "step": 2303} {"train_info/time_between_train_steps": 0.0030934810638427734, "step": 2303} {"info/global_step": 2304, "train_info/time_within_train_step": 2.647599220275879, "step": 2304} {"train_info/time_between_train_steps": 0.0030629634857177734, "step": 2304} {"info/global_step": 2305, "train_info/time_within_train_step": 2.647237539291382, "step": 2305} {"train_info/time_between_train_steps": 0.003093719482421875, "step": 2305} {"info/global_step": 2306, "train_info/time_within_train_step": 2.6499040126800537, "step": 2306} {"train_info/time_between_train_steps": 0.0030524730682373047, "step": 2306} {"info/global_step": 2307, "train_info/time_within_train_step": 2.643899917602539, "step": 2307} {"train_info/time_between_train_steps": 0.003073453903198242, "step": 2307} {"info/global_step": 2308, "train_info/time_within_train_step": 2.6670689582824707, "step": 2308} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 2308} {"info/global_step": 2309, "train_info/time_within_train_step": 2.963914155960083, "step": 2309} {"train_info/time_between_train_steps": 0.003006458282470703, "step": 2309} {"info/global_step": 2310, "train_info/time_within_train_step": 2.6492743492126465, "step": 2310} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 2310} {"info/global_step": 2311, "train_info/time_within_train_step": 2.6481521129608154, "step": 2311} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 2311} {"info/global_step": 2312, "train_info/time_within_train_step": 2.645514726638794, "step": 2312} {"train_info/time_between_train_steps": 0.002996683120727539, "step": 2312} {"info/global_step": 2313, "train_info/time_within_train_step": 2.6623828411102295, "step": 2313} {"train_info/time_between_train_steps": 0.0030298233032226562, "step": 2313} {"info/global_step": 2314, "train_info/time_within_train_step": 2.6748387813568115, "step": 2314} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 2314} {"info/global_step": 2315, "train_info/time_within_train_step": 2.7177140712738037, "step": 2315} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 2315} {"info/global_step": 2316, "train_info/time_within_train_step": 2.6602706909179688, "step": 2316} {"train_info/time_between_train_steps": 0.003021240234375, "step": 2316} {"info/global_step": 2317, "train_info/time_within_train_step": 2.6765170097351074, "step": 2317} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 2317} {"info/global_step": 2318, "train_info/time_within_train_step": 2.6426753997802734, "step": 2318} {"train_info/time_between_train_steps": 0.0029833316802978516, "step": 2318} {"info/global_step": 2319, "train_info/time_within_train_step": 2.6590192317962646, "step": 2319} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 2319} {"info/global_step": 2320, "train_info/time_within_train_step": 2.666151285171509, "step": 2320} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 2320} {"info/global_step": 2321, "train_info/time_within_train_step": 2.650176763534546, "step": 2321} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 2321} {"info/global_step": 2322, "train_info/time_within_train_step": 2.642033576965332, "step": 2322} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 2322} {"info/global_step": 2323, "train_info/time_within_train_step": 2.6525025367736816, "step": 2323} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 2323} {"info/global_step": 2324, "train_info/time_within_train_step": 2.6875483989715576, "step": 2324} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 2324} {"info/global_step": 2325, "train_info/time_within_train_step": 2.641239881515503, "step": 2325} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 2325} {"info/global_step": 2326, "train_info/time_within_train_step": 2.655979633331299, "step": 2326} {"train_info/time_between_train_steps": 0.0029883384704589844, "step": 2326} {"info/global_step": 2327, "train_info/time_within_train_step": 2.656604290008545, "step": 2327} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 2327} {"info/global_step": 2328, "train_info/time_within_train_step": 2.6427414417266846, "step": 2328} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 2328} {"info/global_step": 2329, "train_info/time_within_train_step": 2.6454341411590576, "step": 2329} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 2329} {"info/global_step": 2330, "train_info/time_within_train_step": 2.6507863998413086, "step": 2330} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 2330} {"info/global_step": 2331, "train_info/time_within_train_step": 2.6630406379699707, "step": 2331} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 2331} {"info/global_step": 2332, "train_info/time_within_train_step": 2.664623498916626, "step": 2332} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 2332} {"info/global_step": 2333, "train_info/time_within_train_step": 2.659160614013672, "step": 2333} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 2333} {"info/global_step": 2334, "train_info/time_within_train_step": 2.710325241088867, "step": 2334} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 2334} {"info/global_step": 2335, "train_info/time_within_train_step": 2.645965099334717, "step": 2335} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 2335} {"info/global_step": 2336, "train_info/time_within_train_step": 2.648517370223999, "step": 2336} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 2336} {"info/global_step": 2337, "train_info/time_within_train_step": 2.651973247528076, "step": 2337} {"train_info/time_between_train_steps": 0.0029108524322509766, "step": 2337} {"info/global_step": 2338, "train_info/time_within_train_step": 2.6476895809173584, "step": 2338} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 2338} {"info/global_step": 2339, "train_info/time_within_train_step": 2.6535961627960205, "step": 2339} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 2339} {"info/global_step": 2340, "train_info/time_within_train_step": 2.6446611881256104, "step": 2340} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 2340} {"info/global_step": 2341, "train_info/time_within_train_step": 2.6579864025115967, "step": 2341} {"train_info/time_between_train_steps": 0.0033004283905029297, "step": 2341} {"info/global_step": 2342, "train_info/time_within_train_step": 2.653635263442993, "step": 2342} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 2342} {"info/global_step": 2343, "train_info/time_within_train_step": 2.6655073165893555, "step": 2343} {"train_info/time_between_train_steps": 0.0030853748321533203, "step": 2343} {"info/global_step": 2344, "train_info/time_within_train_step": 2.668792247772217, "step": 2344} {"train_info/time_between_train_steps": 0.003069639205932617, "step": 2344} {"info/global_step": 2345, "train_info/time_within_train_step": 2.643718957901001, "step": 2345} {"train_info/time_between_train_steps": 0.0033872127532958984, "step": 2345} {"info/global_step": 2346, "train_info/time_within_train_step": 2.6453449726104736, "step": 2346} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 2346} {"info/global_step": 2347, "train_info/time_within_train_step": 2.643458843231201, "step": 2347} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 2347} {"info/global_step": 2348, "train_info/time_within_train_step": 2.644167900085449, "step": 2348} {"train_info/time_between_train_steps": 0.0030858516693115234, "step": 2348} {"info/global_step": 2349, "train_info/time_within_train_step": 2.643765449523926, "step": 2349} {"train_info/time_between_train_steps": 0.003067493438720703, "step": 2349} {"info/global_step": 2350, "train_info/time_within_train_step": 2.643242597579956, "step": 2350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746903996, "_runtime": 6594}, "step": 2350} {"logs": {"train/loss": 4.1856, "train/learning_rate": 0.0005099999999999999, "train/epoch": 2.06, "_timestamp": 1746903996, "_runtime": 6594}, "step": 2350} {"train_info/time_between_train_steps": 0.5308599472045898, "step": 2350} {"info/global_step": 2351, "train_info/time_within_train_step": 2.623363733291626, "step": 2351} {"train_info/time_between_train_steps": 0.002948760986328125, "step": 2351} {"info/global_step": 2352, "train_info/time_within_train_step": 2.6675891876220703, "step": 2352} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 2352} {"info/global_step": 2353, "train_info/time_within_train_step": 2.6664862632751465, "step": 2353} {"train_info/time_between_train_steps": 0.0030221939086914062, "step": 2353} {"info/global_step": 2354, "train_info/time_within_train_step": 2.83069109916687, "step": 2354} {"train_info/time_between_train_steps": 0.0029718875885009766, "step": 2354} {"info/global_step": 2355, "train_info/time_within_train_step": 2.6841650009155273, "step": 2355} {"train_info/time_between_train_steps": 0.003001689910888672, "step": 2355} {"info/global_step": 2356, "train_info/time_within_train_step": 2.6619300842285156, "step": 2356} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 2356} {"info/global_step": 2357, "train_info/time_within_train_step": 2.7046093940734863, "step": 2357} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 2357} {"info/global_step": 2358, "train_info/time_within_train_step": 2.6391923427581787, "step": 2358} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 2358} {"info/global_step": 2359, "train_info/time_within_train_step": 2.6398110389709473, "step": 2359} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 2359} {"info/global_step": 2360, "train_info/time_within_train_step": 2.66329026222229, "step": 2360} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 2360} {"info/global_step": 2361, "train_info/time_within_train_step": 2.6479592323303223, "step": 2361} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 2361} {"info/global_step": 2362, "train_info/time_within_train_step": 2.643923282623291, "step": 2362} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 2362} {"info/global_step": 2363, "train_info/time_within_train_step": 2.6578757762908936, "step": 2363} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 2363} {"info/global_step": 2364, "train_info/time_within_train_step": 2.650304079055786, "step": 2364} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 2364} {"info/global_step": 2365, "train_info/time_within_train_step": 2.6691551208496094, "step": 2365} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 2365} {"info/global_step": 2366, "train_info/time_within_train_step": 2.7110002040863037, "step": 2366} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 2366} {"info/global_step": 2367, "train_info/time_within_train_step": 2.6893155574798584, "step": 2367} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 2367} {"info/global_step": 2368, "train_info/time_within_train_step": 2.641216278076172, "step": 2368} {"train_info/time_between_train_steps": 0.0029730796813964844, "step": 2368} {"info/global_step": 2369, "train_info/time_within_train_step": 2.640381097793579, "step": 2369} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 2369} {"info/global_step": 2370, "train_info/time_within_train_step": 2.6537959575653076, "step": 2370} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 2370} {"info/global_step": 2371, "train_info/time_within_train_step": 2.65820050239563, "step": 2371} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 2371} {"info/global_step": 2372, "train_info/time_within_train_step": 2.645228385925293, "step": 2372} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 2372} {"info/global_step": 2373, "train_info/time_within_train_step": 2.6485321521759033, "step": 2373} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 2373} {"info/global_step": 2374, "train_info/time_within_train_step": 2.653252363204956, "step": 2374} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 2374} {"info/global_step": 2375, "train_info/time_within_train_step": 2.67048978805542, "step": 2375} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 2375} {"info/global_step": 2376, "train_info/time_within_train_step": 2.70967173576355, "step": 2376} {"train_info/time_between_train_steps": 0.0030601024627685547, "step": 2376} {"info/global_step": 2377, "train_info/time_within_train_step": 2.640937089920044, "step": 2377} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 2377} {"info/global_step": 2378, "train_info/time_within_train_step": 2.6570546627044678, "step": 2378} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 2378} {"info/global_step": 2379, "train_info/time_within_train_step": 2.648193836212158, "step": 2379} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 2379} {"info/global_step": 2380, "train_info/time_within_train_step": 2.6466917991638184, "step": 2380} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 2380} {"info/global_step": 2381, "train_info/time_within_train_step": 2.6568055152893066, "step": 2381} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 2381} {"info/global_step": 2382, "train_info/time_within_train_step": 2.6451361179351807, "step": 2382} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 2382} {"info/global_step": 2383, "train_info/time_within_train_step": 2.6516458988189697, "step": 2383} {"train_info/time_between_train_steps": 0.003014802932739258, "step": 2383} {"info/global_step": 2384, "train_info/time_within_train_step": 2.672211170196533, "step": 2384} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 2384} {"info/global_step": 2385, "train_info/time_within_train_step": 2.6660048961639404, "step": 2385} {"train_info/time_between_train_steps": 0.0029773712158203125, "step": 2385} {"info/global_step": 2386, "train_info/time_within_train_step": 2.658172130584717, "step": 2386} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 2386} {"info/global_step": 2387, "train_info/time_within_train_step": 2.6434779167175293, "step": 2387} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 2387} {"info/global_step": 2388, "train_info/time_within_train_step": 2.6613004207611084, "step": 2388} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 2388} {"info/global_step": 2389, "train_info/time_within_train_step": 2.6513571739196777, "step": 2389} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 2389} {"info/global_step": 2390, "train_info/time_within_train_step": 2.64508056640625, "step": 2390} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 2390} {"info/global_step": 2391, "train_info/time_within_train_step": 2.6671547889709473, "step": 2391} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 2391} {"info/global_step": 2392, "train_info/time_within_train_step": 2.655745506286621, "step": 2392} {"train_info/time_between_train_steps": 0.002936124801635742, "step": 2392} {"info/global_step": 2393, "train_info/time_within_train_step": 2.656015634536743, "step": 2393} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 2393} {"info/global_step": 2394, "train_info/time_within_train_step": 2.706432580947876, "step": 2394} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 2394} {"info/global_step": 2395, "train_info/time_within_train_step": 2.649263381958008, "step": 2395} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 2395} {"info/global_step": 2396, "train_info/time_within_train_step": 2.646691083908081, "step": 2396} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 2396} {"info/global_step": 2397, "train_info/time_within_train_step": 2.656773328781128, "step": 2397} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 2397} {"info/global_step": 2398, "train_info/time_within_train_step": 2.643627882003784, "step": 2398} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 2398} {"info/global_step": 2399, "train_info/time_within_train_step": 2.6439478397369385, "step": 2399} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 2399} {"info/global_step": 2400, "train_info/time_within_train_step": 2.6539552211761475, "step": 2400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746904131, "_runtime": 6729}, "step": 2400} {"logs": {"train/loss": 4.1802, "train/learning_rate": 0.0005066666666666667, "train/epoch": 2.07, "_timestamp": 1746904131, "_runtime": 6729}, "step": 2400} {"train_info/time_between_train_steps": 25.794679880142212, "step": 2400} {"info/global_step": 2401, "train_info/time_within_train_step": 2.457505226135254, "step": 2401} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 2401} {"info/global_step": 2402, "train_info/time_within_train_step": 2.4241538047790527, "step": 2402} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 2402} {"info/global_step": 2403, "train_info/time_within_train_step": 2.5542266368865967, "step": 2403} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 2403} {"info/global_step": 2404, "train_info/time_within_train_step": 2.6550893783569336, "step": 2404} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 2404} {"info/global_step": 2405, "train_info/time_within_train_step": 2.6429038047790527, "step": 2405} {"train_info/time_between_train_steps": 0.002939939498901367, "step": 2405} {"info/global_step": 2406, "train_info/time_within_train_step": 2.654031753540039, "step": 2406} {"train_info/time_between_train_steps": 0.0030181407928466797, "step": 2406} {"info/global_step": 2407, "train_info/time_within_train_step": 2.6525027751922607, "step": 2407} {"train_info/time_between_train_steps": 0.0029108524322509766, "step": 2407} {"info/global_step": 2408, "train_info/time_within_train_step": 2.6433165073394775, "step": 2408} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 2408} {"info/global_step": 2409, "train_info/time_within_train_step": 2.644667863845825, "step": 2409} {"train_info/time_between_train_steps": 0.00299072265625, "step": 2409} {"info/global_step": 2410, "train_info/time_within_train_step": 2.653630018234253, "step": 2410} {"train_info/time_between_train_steps": 0.0029642581939697266, "step": 2410} {"info/global_step": 2411, "train_info/time_within_train_step": 2.660801649093628, "step": 2411} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 2411} {"info/global_step": 2412, "train_info/time_within_train_step": 2.6692559719085693, "step": 2412} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 2412} {"info/global_step": 2413, "train_info/time_within_train_step": 2.6614537239074707, "step": 2413} {"train_info/time_between_train_steps": 0.0029387474060058594, "step": 2413} {"info/global_step": 2414, "train_info/time_within_train_step": 2.711007833480835, "step": 2414} {"train_info/time_between_train_steps": 0.002972841262817383, "step": 2414} {"info/global_step": 2415, "train_info/time_within_train_step": 2.6542861461639404, "step": 2415} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 2415} {"info/global_step": 2416, "train_info/time_within_train_step": 2.649432897567749, "step": 2416} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 2416} {"info/global_step": 2417, "train_info/time_within_train_step": 2.652658462524414, "step": 2417} {"train_info/time_between_train_steps": 0.0029747486114501953, "step": 2417} {"info/global_step": 2418, "train_info/time_within_train_step": 2.651519775390625, "step": 2418} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 2418} {"info/global_step": 2419, "train_info/time_within_train_step": 2.654305934906006, "step": 2419} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 2419} {"info/global_step": 2420, "train_info/time_within_train_step": 2.650491952896118, "step": 2420} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 2420} {"info/global_step": 2421, "train_info/time_within_train_step": 2.655280113220215, "step": 2421} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 2421} {"info/global_step": 2422, "train_info/time_within_train_step": 2.6591005325317383, "step": 2422} {"train_info/time_between_train_steps": 0.0030133724212646484, "step": 2422} {"info/global_step": 2423, "train_info/time_within_train_step": 2.6868677139282227, "step": 2423} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 2423} {"info/global_step": 2424, "train_info/time_within_train_step": 2.7223494052886963, "step": 2424} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 2424} {"info/global_step": 2425, "train_info/time_within_train_step": 2.7308430671691895, "step": 2425} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 2425} {"info/global_step": 2426, "train_info/time_within_train_step": 2.6514792442321777, "step": 2426} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 2426} {"info/global_step": 2427, "train_info/time_within_train_step": 2.6418137550354004, "step": 2427} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 2427} {"info/global_step": 2428, "train_info/time_within_train_step": 2.6612493991851807, "step": 2428} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 2428} {"info/global_step": 2429, "train_info/time_within_train_step": 2.649233818054199, "step": 2429} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 2429} {"info/global_step": 2430, "train_info/time_within_train_step": 2.650242567062378, "step": 2430} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 2430} {"info/global_step": 2431, "train_info/time_within_train_step": 2.648421049118042, "step": 2431} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 2431} {"info/global_step": 2432, "train_info/time_within_train_step": 2.6438815593719482, "step": 2432} {"train_info/time_between_train_steps": 0.0030128955841064453, "step": 2432} {"info/global_step": 2433, "train_info/time_within_train_step": 2.6696619987487793, "step": 2433} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 2433} {"info/global_step": 2434, "train_info/time_within_train_step": 2.671067953109741, "step": 2434} {"train_info/time_between_train_steps": 0.002950429916381836, "step": 2434} {"info/global_step": 2435, "train_info/time_within_train_step": 2.6945486068725586, "step": 2435} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 2435} {"info/global_step": 2436, "train_info/time_within_train_step": 2.647855281829834, "step": 2436} {"train_info/time_between_train_steps": 0.0029370784759521484, "step": 2436} {"info/global_step": 2437, "train_info/time_within_train_step": 2.6449475288391113, "step": 2437} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 2437} {"info/global_step": 2438, "train_info/time_within_train_step": 2.658306121826172, "step": 2438} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 2438} {"info/global_step": 2439, "train_info/time_within_train_step": 2.6576900482177734, "step": 2439} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 2439} {"info/global_step": 2440, "train_info/time_within_train_step": 2.6457526683807373, "step": 2440} {"train_info/time_between_train_steps": 0.002934694290161133, "step": 2440} {"info/global_step": 2441, "train_info/time_within_train_step": 2.6462504863739014, "step": 2441} {"train_info/time_between_train_steps": 0.002953767776489258, "step": 2441} {"info/global_step": 2442, "train_info/time_within_train_step": 2.6561925411224365, "step": 2442} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 2442} {"info/global_step": 2443, "train_info/time_within_train_step": 2.691553831100464, "step": 2443} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 2443} {"info/global_step": 2444, "train_info/time_within_train_step": 2.6713361740112305, "step": 2444} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 2444} {"info/global_step": 2445, "train_info/time_within_train_step": 2.6595957279205322, "step": 2445} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 2445} {"info/global_step": 2446, "train_info/time_within_train_step": 2.677503824234009, "step": 2446} {"train_info/time_between_train_steps": 0.0029144287109375, "step": 2446} {"info/global_step": 2447, "train_info/time_within_train_step": 2.649090051651001, "step": 2447} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 2447} {"info/global_step": 2448, "train_info/time_within_train_step": 2.647012710571289, "step": 2448} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 2448} {"info/global_step": 2449, "train_info/time_within_train_step": 2.6517295837402344, "step": 2449} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 2449} {"info/global_step": 2450, "train_info/time_within_train_step": 2.6516270637512207, "step": 2450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746904291, "_runtime": 6889}, "step": 2450} {"logs": {"train/loss": 4.1641, "train/learning_rate": 0.0005033333333333333, "train/epoch": 2.07, "_timestamp": 1746904291, "_runtime": 6889}, "step": 2450} {"train_info/time_between_train_steps": 0.023088455200195312, "step": 2450} {"info/global_step": 2451, "train_info/time_within_train_step": 2.644974708557129, "step": 2451} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 2451} {"info/global_step": 2452, "train_info/time_within_train_step": 2.665165424346924, "step": 2452} {"train_info/time_between_train_steps": 0.0029544830322265625, "step": 2452} {"info/global_step": 2453, "train_info/time_within_train_step": 2.657318115234375, "step": 2453} {"train_info/time_between_train_steps": 0.0030176639556884766, "step": 2453} {"info/global_step": 2454, "train_info/time_within_train_step": 2.6650946140289307, "step": 2454} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 2454} {"info/global_step": 2455, "train_info/time_within_train_step": 2.687223434448242, "step": 2455} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 2455} {"info/global_step": 2456, "train_info/time_within_train_step": 2.648550510406494, "step": 2456} {"train_info/time_between_train_steps": 0.002993345260620117, "step": 2456} {"info/global_step": 2457, "train_info/time_within_train_step": 2.6501903533935547, "step": 2457} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 2457} {"info/global_step": 2458, "train_info/time_within_train_step": 2.659799098968506, "step": 2458} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 2458} {"info/global_step": 2459, "train_info/time_within_train_step": 2.6433191299438477, "step": 2459} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 2459} {"info/global_step": 2460, "train_info/time_within_train_step": 2.6490163803100586, "step": 2460} {"train_info/time_between_train_steps": 0.0029320716857910156, "step": 2460} {"info/global_step": 2461, "train_info/time_within_train_step": 2.660329580307007, "step": 2461} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 2461} {"info/global_step": 2462, "train_info/time_within_train_step": 2.6528913974761963, "step": 2462} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 2462} {"info/global_step": 2463, "train_info/time_within_train_step": 2.660071611404419, "step": 2463} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 2463} {"info/global_step": 2464, "train_info/time_within_train_step": 2.6795244216918945, "step": 2464} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 2464} {"info/global_step": 2465, "train_info/time_within_train_step": 2.8292884826660156, "step": 2465} {"train_info/time_between_train_steps": 0.003039836883544922, "step": 2465} {"info/global_step": 2466, "train_info/time_within_train_step": 2.677600622177124, "step": 2466} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 2466} {"info/global_step": 2467, "train_info/time_within_train_step": 2.728867292404175, "step": 2467} {"train_info/time_between_train_steps": 0.003012418746948242, "step": 2467} {"info/global_step": 2468, "train_info/time_within_train_step": 2.651562213897705, "step": 2468} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 2468} {"info/global_step": 2469, "train_info/time_within_train_step": 2.641148090362549, "step": 2469} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 2469} {"info/global_step": 2470, "train_info/time_within_train_step": 2.6591856479644775, "step": 2470} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 2470} {"info/global_step": 2471, "train_info/time_within_train_step": 2.6479806900024414, "step": 2471} {"train_info/time_between_train_steps": 0.0029451847076416016, "step": 2471} {"info/global_step": 2472, "train_info/time_within_train_step": 2.651061534881592, "step": 2472} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 2472} {"info/global_step": 2473, "train_info/time_within_train_step": 2.648376941680908, "step": 2473} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 2473} {"info/global_step": 2474, "train_info/time_within_train_step": 2.643079996109009, "step": 2474} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 2474} {"info/global_step": 2475, "train_info/time_within_train_step": 2.6695806980133057, "step": 2475} {"train_info/time_between_train_steps": 0.0029642581939697266, "step": 2475} {"info/global_step": 2476, "train_info/time_within_train_step": 2.691315174102783, "step": 2476} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 2476} {"info/global_step": 2477, "train_info/time_within_train_step": 2.648791790008545, "step": 2477} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 2477} {"info/global_step": 2478, "train_info/time_within_train_step": 2.6636953353881836, "step": 2478} {"train_info/time_between_train_steps": 0.0029501914978027344, "step": 2478} {"info/global_step": 2479, "train_info/time_within_train_step": 2.6478614807128906, "step": 2479} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 2479} {"info/global_step": 2480, "train_info/time_within_train_step": 2.6475493907928467, "step": 2480} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 2480} {"info/global_step": 2481, "train_info/time_within_train_step": 2.6614835262298584, "step": 2481} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 2481} {"info/global_step": 2482, "train_info/time_within_train_step": 2.6453797817230225, "step": 2482} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 2482} {"info/global_step": 2483, "train_info/time_within_train_step": 2.645258903503418, "step": 2483} {"train_info/time_between_train_steps": 0.002940654754638672, "step": 2483} {"info/global_step": 2484, "train_info/time_within_train_step": 2.6691839694976807, "step": 2484} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 2484} {"info/global_step": 2485, "train_info/time_within_train_step": 2.654423236846924, "step": 2485} {"train_info/time_between_train_steps": 0.003026247024536133, "step": 2485} {"info/global_step": 2486, "train_info/time_within_train_step": 2.649214267730713, "step": 2486} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 2486} {"info/global_step": 2487, "train_info/time_within_train_step": 2.6539347171783447, "step": 2487} {"train_info/time_between_train_steps": 0.0030374526977539062, "step": 2487} {"info/global_step": 2488, "train_info/time_within_train_step": 2.649609088897705, "step": 2488} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 2488} {"info/global_step": 2489, "train_info/time_within_train_step": 2.6440556049346924, "step": 2489} {"train_info/time_between_train_steps": 0.003095865249633789, "step": 2489} {"info/global_step": 2490, "train_info/time_within_train_step": 2.6482818126678467, "step": 2490} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 2490} {"info/global_step": 2491, "train_info/time_within_train_step": 2.650770902633667, "step": 2491} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 2491} {"info/global_step": 2492, "train_info/time_within_train_step": 2.6633224487304688, "step": 2492} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 2492} {"info/global_step": 2493, "train_info/time_within_train_step": 2.6641757488250732, "step": 2493} {"train_info/time_between_train_steps": 0.0030133724212646484, "step": 2493} {"info/global_step": 2494, "train_info/time_within_train_step": 2.6575865745544434, "step": 2494} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 2494} {"info/global_step": 2495, "train_info/time_within_train_step": 2.7070963382720947, "step": 2495} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 2495} {"info/global_step": 2496, "train_info/time_within_train_step": 2.6569674015045166, "step": 2496} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 2496} {"info/global_step": 2497, "train_info/time_within_train_step": 2.6487722396850586, "step": 2497} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 2497} {"info/global_step": 2498, "train_info/time_within_train_step": 2.6658966541290283, "step": 2498} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 2498} {"info/global_step": 2499, "train_info/time_within_train_step": 2.648488759994507, "step": 2499} {"train_info/time_between_train_steps": 0.002966642379760742, "step": 2499} {"info/global_step": 2500, "train_info/time_within_train_step": 3.252974033355713, "step": 2500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746904426, "_runtime": 7024}, "step": 2500} {"logs": {"train/loss": 4.1474, "train/learning_rate": 0.0005, "train/epoch": 2.08, "_timestamp": 1746904426, "_runtime": 7024}, "step": 2500} {"train_info/time_between_train_steps": 0.02979278564453125, "step": 2500} {"info/global_step": 2501, "train_info/time_within_train_step": 2.6653850078582764, "step": 2501} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 2501} {"info/global_step": 2502, "train_info/time_within_train_step": 2.6604673862457275, "step": 2502} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 2502} {"info/global_step": 2503, "train_info/time_within_train_step": 2.6646018028259277, "step": 2503} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 2503} {"info/global_step": 2504, "train_info/time_within_train_step": 2.684368371963501, "step": 2504} {"train_info/time_between_train_steps": 0.0029718875885009766, "step": 2504} {"info/global_step": 2505, "train_info/time_within_train_step": 2.6681838035583496, "step": 2505} {"train_info/time_between_train_steps": 0.0029354095458984375, "step": 2505} {"info/global_step": 2506, "train_info/time_within_train_step": 2.6463429927825928, "step": 2506} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 2506} {"info/global_step": 2507, "train_info/time_within_train_step": 2.6438443660736084, "step": 2507} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 2507} {"info/global_step": 2508, "train_info/time_within_train_step": 2.6513047218322754, "step": 2508} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 2508} {"info/global_step": 2509, "train_info/time_within_train_step": 2.653186082839966, "step": 2509} {"train_info/time_between_train_steps": 0.002903461456298828, "step": 2509} {"info/global_step": 2510, "train_info/time_within_train_step": 2.657618999481201, "step": 2510} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 2510} {"info/global_step": 2511, "train_info/time_within_train_step": 2.665219783782959, "step": 2511} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 2511} {"info/global_step": 2512, "train_info/time_within_train_step": 2.6521615982055664, "step": 2512} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 2512} {"info/global_step": 2513, "train_info/time_within_train_step": 2.6615278720855713, "step": 2513} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 2513} {"info/global_step": 2514, "train_info/time_within_train_step": 2.715245246887207, "step": 2514} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 2514} {"info/global_step": 2515, "train_info/time_within_train_step": 2.688906669616699, "step": 2515} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 2515} {"info/global_step": 2516, "train_info/time_within_train_step": 2.640925168991089, "step": 2516} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 2516} {"info/global_step": 2517, "train_info/time_within_train_step": 2.641526222229004, "step": 2517} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 2517} {"info/global_step": 2518, "train_info/time_within_train_step": 2.66054368019104, "step": 2518} {"train_info/time_between_train_steps": 0.002972841262817383, "step": 2518} {"info/global_step": 2519, "train_info/time_within_train_step": 2.6548688411712646, "step": 2519} {"train_info/time_between_train_steps": 0.002984285354614258, "step": 2519} {"info/global_step": 2520, "train_info/time_within_train_step": 2.644559144973755, "step": 2520} {"train_info/time_between_train_steps": 0.0028905868530273438, "step": 2520} {"info/global_step": 2521, "train_info/time_within_train_step": 2.654108762741089, "step": 2521} {"train_info/time_between_train_steps": 0.002953767776489258, "step": 2521} {"info/global_step": 2522, "train_info/time_within_train_step": 2.6476287841796875, "step": 2522} {"train_info/time_between_train_steps": 0.002940654754638672, "step": 2522} {"info/global_step": 2523, "train_info/time_within_train_step": 2.667069435119629, "step": 2523} {"train_info/time_between_train_steps": 0.0029501914978027344, "step": 2523} {"info/global_step": 2524, "train_info/time_within_train_step": 2.7655582427978516, "step": 2524} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 2524} {"info/global_step": 2525, "train_info/time_within_train_step": 2.6965880393981934, "step": 2525} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 2525} {"info/global_step": 2526, "train_info/time_within_train_step": 2.6569602489471436, "step": 2526} {"train_info/time_between_train_steps": 0.002944469451904297, "step": 2526} {"info/global_step": 2527, "train_info/time_within_train_step": 2.6637203693389893, "step": 2527} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 2527} {"info/global_step": 2528, "train_info/time_within_train_step": 2.63983416557312, "step": 2528} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 2528} {"info/global_step": 2529, "train_info/time_within_train_step": 2.6544950008392334, "step": 2529} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 2529} {"info/global_step": 2530, "train_info/time_within_train_step": 2.659339427947998, "step": 2530} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 2530} {"info/global_step": 2531, "train_info/time_within_train_step": 2.644357442855835, "step": 2531} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 2531} {"info/global_step": 2532, "train_info/time_within_train_step": 2.64497447013855, "step": 2532} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 2532} {"info/global_step": 2533, "train_info/time_within_train_step": 2.6533868312835693, "step": 2533} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 2533} {"info/global_step": 2534, "train_info/time_within_train_step": 2.6715242862701416, "step": 2534} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 2534} {"info/global_step": 2535, "train_info/time_within_train_step": 2.6816155910491943, "step": 2535} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 2535} {"info/global_step": 2536, "train_info/time_within_train_step": 2.6528046131134033, "step": 2536} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 2536} {"info/global_step": 2537, "train_info/time_within_train_step": 2.684816837310791, "step": 2537} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 2537} {"info/global_step": 2538, "train_info/time_within_train_step": 2.641098737716675, "step": 2538} {"train_info/time_between_train_steps": 0.0030171871185302734, "step": 2538} {"info/global_step": 2539, "train_info/time_within_train_step": 2.6483640670776367, "step": 2539} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 2539} {"info/global_step": 2540, "train_info/time_within_train_step": 2.6616129875183105, "step": 2540} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 2540} {"info/global_step": 2541, "train_info/time_within_train_step": 2.642261266708374, "step": 2541} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 2541} {"info/global_step": 2542, "train_info/time_within_train_step": 2.64446759223938, "step": 2542} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 2542} {"info/global_step": 2543, "train_info/time_within_train_step": 2.6569137573242188, "step": 2543} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 2543} {"info/global_step": 2544, "train_info/time_within_train_step": 2.6764538288116455, "step": 2544} {"train_info/time_between_train_steps": 0.0029337406158447266, "step": 2544} {"info/global_step": 2545, "train_info/time_within_train_step": 2.6668505668640137, "step": 2545} {"train_info/time_between_train_steps": 0.0030279159545898438, "step": 2545} {"info/global_step": 2546, "train_info/time_within_train_step": 2.7082905769348145, "step": 2546} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 2546} {"info/global_step": 2547, "train_info/time_within_train_step": 2.6529834270477295, "step": 2547} {"train_info/time_between_train_steps": 0.0029718875885009766, "step": 2547} {"info/global_step": 2548, "train_info/time_within_train_step": 2.643968343734741, "step": 2548} {"train_info/time_between_train_steps": 0.0030355453491210938, "step": 2548} {"info/global_step": 2549, "train_info/time_within_train_step": 2.643479585647583, "step": 2549} {"train_info/time_between_train_steps": 0.0031020641326904297, "step": 2549} {"info/global_step": 2550, "train_info/time_within_train_step": 2.6438560485839844, "step": 2550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746904561, "_runtime": 7159}, "step": 2550} {"logs": {"train/loss": 4.1362, "train/learning_rate": 0.0004966666666666666, "train/epoch": 2.08, "_timestamp": 1746904561, "_runtime": 7159}, "step": 2550} {"train_info/time_between_train_steps": 0.41367483139038086, "step": 2550} {"info/global_step": 2551, "train_info/time_within_train_step": 2.6443960666656494, "step": 2551} {"train_info/time_between_train_steps": 0.003103971481323242, "step": 2551} {"info/global_step": 2552, "train_info/time_within_train_step": 2.646196126937866, "step": 2552} {"train_info/time_between_train_steps": 0.004267692565917969, "step": 2552} {"info/global_step": 2553, "train_info/time_within_train_step": 2.647918224334717, "step": 2553} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 2553} {"info/global_step": 2554, "train_info/time_within_train_step": 2.6437947750091553, "step": 2554} {"train_info/time_between_train_steps": 0.003072023391723633, "step": 2554} {"info/global_step": 2555, "train_info/time_within_train_step": 2.6428396701812744, "step": 2555} {"train_info/time_between_train_steps": 0.003069162368774414, "step": 2555} {"info/global_step": 2556, "train_info/time_within_train_step": 2.6411917209625244, "step": 2556} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 2556} {"info/global_step": 2557, "train_info/time_within_train_step": 2.6378917694091797, "step": 2557} {"train_info/time_between_train_steps": 0.0029773712158203125, "step": 2557} {"info/global_step": 2558, "train_info/time_within_train_step": 2.673516035079956, "step": 2558} {"train_info/time_between_train_steps": 0.0030090808868408203, "step": 2558} {"info/global_step": 2559, "train_info/time_within_train_step": 2.6413776874542236, "step": 2559} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 2559} {"info/global_step": 2560, "train_info/time_within_train_step": 2.6629838943481445, "step": 2560} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 2560} {"info/global_step": 2561, "train_info/time_within_train_step": 2.654538154602051, "step": 2561} {"train_info/time_between_train_steps": 0.0030477046966552734, "step": 2561} {"info/global_step": 2562, "train_info/time_within_train_step": 2.647756814956665, "step": 2562} {"train_info/time_between_train_steps": 0.003042459487915039, "step": 2562} {"info/global_step": 2563, "train_info/time_within_train_step": 2.648303508758545, "step": 2563} {"train_info/time_between_train_steps": 0.003061056137084961, "step": 2563} {"info/global_step": 2564, "train_info/time_within_train_step": 2.6483006477355957, "step": 2564} {"train_info/time_between_train_steps": 0.0030281543731689453, "step": 2564} {"info/global_step": 2565, "train_info/time_within_train_step": 2.703550338745117, "step": 2565} {"train_info/time_between_train_steps": 0.0030231475830078125, "step": 2565} {"info/global_step": 2566, "train_info/time_within_train_step": 2.6443543434143066, "step": 2566} {"train_info/time_between_train_steps": 0.0030107498168945312, "step": 2566} {"info/global_step": 2567, "train_info/time_within_train_step": 2.6667749881744385, "step": 2567} {"train_info/time_between_train_steps": 0.0030858516693115234, "step": 2567} {"info/global_step": 2568, "train_info/time_within_train_step": 2.7020299434661865, "step": 2568} {"train_info/time_between_train_steps": 0.003088712692260742, "step": 2568} {"info/global_step": 2569, "train_info/time_within_train_step": 2.6473615169525146, "step": 2569} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 2569} {"info/global_step": 2570, "train_info/time_within_train_step": 2.6582696437835693, "step": 2570} {"train_info/time_between_train_steps": 0.0031130313873291016, "step": 2570} {"info/global_step": 2571, "train_info/time_within_train_step": 2.649944305419922, "step": 2571} {"train_info/time_between_train_steps": 0.0031363964080810547, "step": 2571} {"info/global_step": 2572, "train_info/time_within_train_step": 2.6498429775238037, "step": 2572} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2572} {"info/global_step": 2573, "train_info/time_within_train_step": 2.645465135574341, "step": 2573} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2573} {"info/global_step": 2574, "train_info/time_within_train_step": 2.645488977432251, "step": 2574} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 2574} {"info/global_step": 2575, "train_info/time_within_train_step": 2.6503164768218994, "step": 2575} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 2575} {"info/global_step": 2576, "train_info/time_within_train_step": 2.6691203117370605, "step": 2576} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 2576} {"info/global_step": 2577, "train_info/time_within_train_step": 2.6771388053894043, "step": 2577} {"train_info/time_between_train_steps": 0.003359079360961914, "step": 2577} {"info/global_step": 2578, "train_info/time_within_train_step": 2.6526834964752197, "step": 2578} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 2578} {"info/global_step": 2579, "train_info/time_within_train_step": 2.6883199214935303, "step": 2579} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 2579} {"info/global_step": 2580, "train_info/time_within_train_step": 2.6431329250335693, "step": 2580} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 2580} {"info/global_step": 2581, "train_info/time_within_train_step": 2.6485025882720947, "step": 2581} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 2581} {"info/global_step": 2582, "train_info/time_within_train_step": 2.662564754486084, "step": 2582} {"train_info/time_between_train_steps": 0.003539562225341797, "step": 2582} {"info/global_step": 2583, "train_info/time_within_train_step": 2.645815134048462, "step": 2583} {"train_info/time_between_train_steps": 0.003797769546508789, "step": 2583} {"info/global_step": 2584, "train_info/time_within_train_step": 2.646432399749756, "step": 2584} {"train_info/time_between_train_steps": 0.003830432891845703, "step": 2584} {"info/global_step": 2585, "train_info/time_within_train_step": 2.65399169921875, "step": 2585} {"train_info/time_between_train_steps": 0.003844022750854492, "step": 2585} {"info/global_step": 2586, "train_info/time_within_train_step": 2.664273500442505, "step": 2586} {"train_info/time_between_train_steps": 0.0038933753967285156, "step": 2586} {"info/global_step": 2587, "train_info/time_within_train_step": 2.6707606315612793, "step": 2587} {"train_info/time_between_train_steps": 0.0043087005615234375, "step": 2587} {"info/global_step": 2588, "train_info/time_within_train_step": 2.663648843765259, "step": 2588} {"train_info/time_between_train_steps": 0.004596710205078125, "step": 2588} {"info/global_step": 2589, "train_info/time_within_train_step": 2.712681293487549, "step": 2589} {"train_info/time_between_train_steps": 0.0038421154022216797, "step": 2589} {"train_info/time_between_train_steps": 2.350055694580078, "step": 2589} {"info/global_step": 2590, "train_info/time_within_train_step": 2.629443407058716, "step": 2590} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 2590} {"info/global_step": 2591, "train_info/time_within_train_step": 2.6605944633483887, "step": 2591} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 2591} {"info/global_step": 2592, "train_info/time_within_train_step": 2.6825733184814453, "step": 2592} {"train_info/time_between_train_steps": 0.00311279296875, "step": 2592} {"info/global_step": 2593, "train_info/time_within_train_step": 2.9274115562438965, "step": 2593} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 2593} {"info/global_step": 2594, "train_info/time_within_train_step": 2.6595187187194824, "step": 2594} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 2594} {"info/global_step": 2595, "train_info/time_within_train_step": 2.66797137260437, "step": 2595} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 2595} {"info/global_step": 2596, "train_info/time_within_train_step": 2.7141356468200684, "step": 2596} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 2596} {"info/global_step": 2597, "train_info/time_within_train_step": 2.6586086750030518, "step": 2597} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 2597} {"info/global_step": 2598, "train_info/time_within_train_step": 2.647630214691162, "step": 2598} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 2598} {"info/global_step": 2599, "train_info/time_within_train_step": 2.647892951965332, "step": 2599} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 2599} {"info/global_step": 2600, "train_info/time_within_train_step": 2.648143768310547, "step": 2600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746904701, "_runtime": 7299}, "step": 2600} {"logs": {"train/loss": 4.1513, "train/learning_rate": 0.0004933333333333333, "train/epoch": 3.0, "_timestamp": 1746904701, "_runtime": 7299}, "step": 2600} {"train_info/time_between_train_steps": 28.358619451522827, "step": 2600} {"info/global_step": 2601, "train_info/time_within_train_step": 2.442563056945801, "step": 2601} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 2601} {"info/global_step": 2602, "train_info/time_within_train_step": 2.438835382461548, "step": 2602} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 2602} {"info/global_step": 2603, "train_info/time_within_train_step": 2.5571956634521484, "step": 2603} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 2603} {"info/global_step": 2604, "train_info/time_within_train_step": 2.633791446685791, "step": 2604} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 2604} {"info/global_step": 2605, "train_info/time_within_train_step": 2.6361353397369385, "step": 2605} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 2605} {"info/global_step": 2606, "train_info/time_within_train_step": 2.6585237979888916, "step": 2606} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 2606} {"info/global_step": 2607, "train_info/time_within_train_step": 2.6530227661132812, "step": 2607} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 2607} {"info/global_step": 2608, "train_info/time_within_train_step": 2.643357992172241, "step": 2608} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 2608} {"info/global_step": 2609, "train_info/time_within_train_step": 2.662120819091797, "step": 2609} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 2609} {"info/global_step": 2610, "train_info/time_within_train_step": 2.652688980102539, "step": 2610} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 2610} {"info/global_step": 2611, "train_info/time_within_train_step": 2.6625545024871826, "step": 2611} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 2611} {"info/global_step": 2612, "train_info/time_within_train_step": 2.71907114982605, "step": 2612} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 2612} {"info/global_step": 2613, "train_info/time_within_train_step": 2.6868269443511963, "step": 2613} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 2613} {"info/global_step": 2614, "train_info/time_within_train_step": 2.6430811882019043, "step": 2614} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 2614} {"info/global_step": 2615, "train_info/time_within_train_step": 2.643030881881714, "step": 2615} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2615} {"info/global_step": 2616, "train_info/time_within_train_step": 2.657832145690918, "step": 2616} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 2616} {"info/global_step": 2617, "train_info/time_within_train_step": 2.6574928760528564, "step": 2617} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 2617} {"info/global_step": 2618, "train_info/time_within_train_step": 2.6460392475128174, "step": 2618} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 2618} {"info/global_step": 2619, "train_info/time_within_train_step": 2.6525115966796875, "step": 2619} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2619} {"info/global_step": 2620, "train_info/time_within_train_step": 2.6584300994873047, "step": 2620} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 2620} {"info/global_step": 2621, "train_info/time_within_train_step": 2.6690263748168945, "step": 2621} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 2621} {"info/global_step": 2622, "train_info/time_within_train_step": 2.7112207412719727, "step": 2622} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 2622} {"info/global_step": 2623, "train_info/time_within_train_step": 2.6428160667419434, "step": 2623} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 2623} {"info/global_step": 2624, "train_info/time_within_train_step": 2.653184175491333, "step": 2624} {"train_info/time_between_train_steps": 0.003109455108642578, "step": 2624} {"info/global_step": 2625, "train_info/time_within_train_step": 2.6496617794036865, "step": 2625} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 2625} {"info/global_step": 2626, "train_info/time_within_train_step": 2.64856219291687, "step": 2626} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 2626} {"info/global_step": 2627, "train_info/time_within_train_step": 2.6596624851226807, "step": 2627} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 2627} {"info/global_step": 2628, "train_info/time_within_train_step": 2.6440811157226562, "step": 2628} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 2628} {"info/global_step": 2629, "train_info/time_within_train_step": 2.647007942199707, "step": 2629} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 2629} {"info/global_step": 2630, "train_info/time_within_train_step": 2.6738345623016357, "step": 2630} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 2630} {"info/global_step": 2631, "train_info/time_within_train_step": 2.6681947708129883, "step": 2631} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 2631} {"info/global_step": 2632, "train_info/time_within_train_step": 2.691663980484009, "step": 2632} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 2632} {"info/global_step": 2633, "train_info/time_within_train_step": 2.655684232711792, "step": 2633} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 2633} {"info/global_step": 2634, "train_info/time_within_train_step": 2.6826601028442383, "step": 2634} {"train_info/time_between_train_steps": 0.00311279296875, "step": 2634} {"info/global_step": 2635, "train_info/time_within_train_step": 2.646228313446045, "step": 2635} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 2635} {"info/global_step": 2636, "train_info/time_within_train_step": 2.645967721939087, "step": 2636} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 2636} {"info/global_step": 2637, "train_info/time_within_train_step": 2.66477108001709, "step": 2637} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 2637} {"info/global_step": 2638, "train_info/time_within_train_step": 2.662762403488159, "step": 2638} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 2638} {"info/global_step": 2639, "train_info/time_within_train_step": 2.674684524536133, "step": 2639} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 2639} {"info/global_step": 2640, "train_info/time_within_train_step": 2.674593210220337, "step": 2640} {"train_info/time_between_train_steps": 0.0032274723052978516, "step": 2640} {"info/global_step": 2641, "train_info/time_within_train_step": 2.695091962814331, "step": 2641} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 2641} {"info/global_step": 2642, "train_info/time_within_train_step": 2.6422595977783203, "step": 2642} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 2642} {"info/global_step": 2643, "train_info/time_within_train_step": 2.642498016357422, "step": 2643} {"train_info/time_between_train_steps": 0.0033278465270996094, "step": 2643} {"info/global_step": 2644, "train_info/time_within_train_step": 2.668778896331787, "step": 2644} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 2644} {"info/global_step": 2645, "train_info/time_within_train_step": 2.6493351459503174, "step": 2645} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 2645} {"info/global_step": 2646, "train_info/time_within_train_step": 2.646517753601074, "step": 2646} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 2646} {"info/global_step": 2647, "train_info/time_within_train_step": 2.660417318344116, "step": 2647} {"train_info/time_between_train_steps": 0.0031249523162841797, "step": 2647} {"info/global_step": 2648, "train_info/time_within_train_step": 2.8611714839935303, "step": 2648} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 2648} {"info/global_step": 2649, "train_info/time_within_train_step": 2.6442556381225586, "step": 2649} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 2649} {"info/global_step": 2650, "train_info/time_within_train_step": 2.6508736610412598, "step": 2650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746904863, "_runtime": 7461}, "step": 2650} {"logs": {"train/loss": 4.1101, "train/learning_rate": 0.00049, "train/epoch": 3.01, "_timestamp": 1746904863, "_runtime": 7461}, "step": 2650} {"train_info/time_between_train_steps": 0.024379491806030273, "step": 2650} {"info/global_step": 2651, "train_info/time_within_train_step": 2.6497857570648193, "step": 2651} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 2651} {"info/global_step": 2652, "train_info/time_within_train_step": 2.7741024494171143, "step": 2652} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 2652} {"info/global_step": 2653, "train_info/time_within_train_step": 2.669116973876953, "step": 2653} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 2653} {"info/global_step": 2654, "train_info/time_within_train_step": 2.71109938621521, "step": 2654} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 2654} {"info/global_step": 2655, "train_info/time_within_train_step": 2.643528699874878, "step": 2655} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 2655} {"info/global_step": 2656, "train_info/time_within_train_step": 2.656015396118164, "step": 2656} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 2656} {"info/global_step": 2657, "train_info/time_within_train_step": 2.6468217372894287, "step": 2657} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 2657} {"info/global_step": 2658, "train_info/time_within_train_step": 2.648590564727783, "step": 2658} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 2658} {"info/global_step": 2659, "train_info/time_within_train_step": 2.661240339279175, "step": 2659} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 2659} {"info/global_step": 2660, "train_info/time_within_train_step": 2.6444435119628906, "step": 2660} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 2660} {"info/global_step": 2661, "train_info/time_within_train_step": 2.646367311477661, "step": 2661} {"train_info/time_between_train_steps": 0.00492095947265625, "step": 2661} {"info/global_step": 2662, "train_info/time_within_train_step": 2.6758487224578857, "step": 2662} {"train_info/time_between_train_steps": 0.003173828125, "step": 2662} {"info/global_step": 2663, "train_info/time_within_train_step": 2.6660592555999756, "step": 2663} {"train_info/time_between_train_steps": 0.003173828125, "step": 2663} {"info/global_step": 2664, "train_info/time_within_train_step": 2.6620595455169678, "step": 2664} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 2664} {"info/global_step": 2665, "train_info/time_within_train_step": 2.6811277866363525, "step": 2665} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 2665} {"info/global_step": 2666, "train_info/time_within_train_step": 2.6420555114746094, "step": 2666} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 2666} {"info/global_step": 2667, "train_info/time_within_train_step": 2.652482032775879, "step": 2667} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 2667} {"info/global_step": 2668, "train_info/time_within_train_step": 2.661179304122925, "step": 2668} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 2668} {"info/global_step": 2669, "train_info/time_within_train_step": 2.645362377166748, "step": 2669} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 2669} {"info/global_step": 2670, "train_info/time_within_train_step": 2.643751382827759, "step": 2670} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 2670} {"info/global_step": 2671, "train_info/time_within_train_step": 2.6749320030212402, "step": 2671} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 2671} {"info/global_step": 2672, "train_info/time_within_train_step": 2.660235643386841, "step": 2672} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 2672} {"info/global_step": 2673, "train_info/time_within_train_step": 2.6782636642456055, "step": 2673} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 2673} {"info/global_step": 2674, "train_info/time_within_train_step": 2.672401189804077, "step": 2674} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 2674} {"info/global_step": 2675, "train_info/time_within_train_step": 2.67164945602417, "step": 2675} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 2675} {"info/global_step": 2676, "train_info/time_within_train_step": 2.6469473838806152, "step": 2676} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 2676} {"info/global_step": 2677, "train_info/time_within_train_step": 2.642688512802124, "step": 2677} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 2677} {"info/global_step": 2678, "train_info/time_within_train_step": 2.6576008796691895, "step": 2678} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 2678} {"info/global_step": 2679, "train_info/time_within_train_step": 2.66157603263855, "step": 2679} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 2679} {"info/global_step": 2680, "train_info/time_within_train_step": 2.654160976409912, "step": 2680} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 2680} {"info/global_step": 2681, "train_info/time_within_train_step": 2.660045862197876, "step": 2681} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 2681} {"info/global_step": 2682, "train_info/time_within_train_step": 2.6537821292877197, "step": 2682} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 2682} {"info/global_step": 2683, "train_info/time_within_train_step": 2.6623761653900146, "step": 2683} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 2683} {"info/global_step": 2684, "train_info/time_within_train_step": 2.725510835647583, "step": 2684} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 2684} {"info/global_step": 2685, "train_info/time_within_train_step": 2.671644926071167, "step": 2685} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 2685} {"info/global_step": 2686, "train_info/time_within_train_step": 2.6432342529296875, "step": 2686} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 2686} {"info/global_step": 2687, "train_info/time_within_train_step": 2.642427682876587, "step": 2687} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 2687} {"info/global_step": 2688, "train_info/time_within_train_step": 2.6571598052978516, "step": 2688} {"train_info/time_between_train_steps": 0.003249645233154297, "step": 2688} {"info/global_step": 2689, "train_info/time_within_train_step": 2.653670072555542, "step": 2689} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 2689} {"info/global_step": 2690, "train_info/time_within_train_step": 2.8718206882476807, "step": 2690} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 2690} {"info/global_step": 2691, "train_info/time_within_train_step": 2.658602237701416, "step": 2691} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 2691} {"info/global_step": 2692, "train_info/time_within_train_step": 2.654822587966919, "step": 2692} {"train_info/time_between_train_steps": 0.0032651424407958984, "step": 2692} {"info/global_step": 2693, "train_info/time_within_train_step": 2.644320487976074, "step": 2693} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 2693} {"info/global_step": 2694, "train_info/time_within_train_step": 2.6951370239257812, "step": 2694} {"train_info/time_between_train_steps": 0.003268003463745117, "step": 2694} {"info/global_step": 2695, "train_info/time_within_train_step": 2.6485321521759033, "step": 2695} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 2695} {"info/global_step": 2696, "train_info/time_within_train_step": 2.6417720317840576, "step": 2696} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 2696} {"info/global_step": 2697, "train_info/time_within_train_step": 2.656036138534546, "step": 2697} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 2697} {"info/global_step": 2698, "train_info/time_within_train_step": 2.654611110687256, "step": 2698} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 2698} {"info/global_step": 2699, "train_info/time_within_train_step": 2.6446754932403564, "step": 2699} {"train_info/time_between_train_steps": 0.0031290054321289062, "step": 2699} {"info/global_step": 2700, "train_info/time_within_train_step": 2.6496593952178955, "step": 2700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746904998, "_runtime": 7596}, "step": 2700} {"logs": {"train/loss": 4.095, "train/learning_rate": 0.0004866666666666666, "train/epoch": 3.01, "_timestamp": 1746904998, "_runtime": 7596}, "step": 2700} {"train_info/time_between_train_steps": 0.028499126434326172, "step": 2700} {"info/global_step": 2701, "train_info/time_within_train_step": 2.652045488357544, "step": 2701} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 2701} {"info/global_step": 2702, "train_info/time_within_train_step": 2.6714725494384766, "step": 2702} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 2702} {"info/global_step": 2703, "train_info/time_within_train_step": 2.6723806858062744, "step": 2703} {"train_info/time_between_train_steps": 0.003269195556640625, "step": 2703} {"info/global_step": 2704, "train_info/time_within_train_step": 2.6547963619232178, "step": 2704} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 2704} {"info/global_step": 2705, "train_info/time_within_train_step": 2.691084384918213, "step": 2705} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 2705} {"info/global_step": 2706, "train_info/time_within_train_step": 2.6415958404541016, "step": 2706} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 2706} {"info/global_step": 2707, "train_info/time_within_train_step": 2.6548585891723633, "step": 2707} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 2707} {"info/global_step": 2708, "train_info/time_within_train_step": 2.6593217849731445, "step": 2708} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 2708} {"info/global_step": 2709, "train_info/time_within_train_step": 2.6436355113983154, "step": 2709} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 2709} {"info/global_step": 2710, "train_info/time_within_train_step": 2.6448493003845215, "step": 2710} {"train_info/time_between_train_steps": 0.003118276596069336, "step": 2710} {"info/global_step": 2711, "train_info/time_within_train_step": 2.6547226905822754, "step": 2711} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 2711} {"info/global_step": 2712, "train_info/time_within_train_step": 2.6590938568115234, "step": 2712} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 2712} {"info/global_step": 2713, "train_info/time_within_train_step": 2.6757442951202393, "step": 2713} {"train_info/time_between_train_steps": 0.0036253929138183594, "step": 2713} {"info/global_step": 2714, "train_info/time_within_train_step": 2.6618893146514893, "step": 2714} {"train_info/time_between_train_steps": 0.12503266334533691, "step": 2714} {"info/global_step": 2715, "train_info/time_within_train_step": 2.6740944385528564, "step": 2715} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 2715} {"info/global_step": 2716, "train_info/time_within_train_step": 2.6763124465942383, "step": 2716} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 2716} {"info/global_step": 2717, "train_info/time_within_train_step": 2.644336223602295, "step": 2717} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 2717} {"info/global_step": 2718, "train_info/time_within_train_step": 2.6543967723846436, "step": 2718} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 2718} {"info/global_step": 2719, "train_info/time_within_train_step": 2.659252405166626, "step": 2719} {"train_info/time_between_train_steps": 0.003311634063720703, "step": 2719} {"info/global_step": 2720, "train_info/time_within_train_step": 2.648850202560425, "step": 2720} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 2720} {"info/global_step": 2721, "train_info/time_within_train_step": 2.6606171131134033, "step": 2721} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 2721} {"info/global_step": 2722, "train_info/time_within_train_step": 2.6559300422668457, "step": 2722} {"train_info/time_between_train_steps": 0.003246307373046875, "step": 2722} {"info/global_step": 2723, "train_info/time_within_train_step": 2.66683292388916, "step": 2723} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 2723} {"info/global_step": 2724, "train_info/time_within_train_step": 2.724978446960449, "step": 2724} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 2724} {"info/global_step": 2725, "train_info/time_within_train_step": 2.680187940597534, "step": 2725} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 2725} {"info/global_step": 2726, "train_info/time_within_train_step": 2.6422579288482666, "step": 2726} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 2726} {"info/global_step": 2727, "train_info/time_within_train_step": 2.6419408321380615, "step": 2727} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 2727} {"info/global_step": 2728, "train_info/time_within_train_step": 2.658243179321289, "step": 2728} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 2728} {"info/global_step": 2729, "train_info/time_within_train_step": 2.665376663208008, "step": 2729} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 2729} {"info/global_step": 2730, "train_info/time_within_train_step": 2.6453804969787598, "step": 2730} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 2730} {"info/global_step": 2731, "train_info/time_within_train_step": 2.655302047729492, "step": 2731} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 2731} {"info/global_step": 2732, "train_info/time_within_train_step": 2.647838592529297, "step": 2732} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 2732} {"info/global_step": 2733, "train_info/time_within_train_step": 2.6695144176483154, "step": 2733} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 2733} {"info/global_step": 2734, "train_info/time_within_train_step": 2.6699678897857666, "step": 2734} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 2734} {"info/global_step": 2735, "train_info/time_within_train_step": 2.701794147491455, "step": 2735} {"train_info/time_between_train_steps": 0.0034096240997314453, "step": 2735} {"info/global_step": 2736, "train_info/time_within_train_step": 2.649325370788574, "step": 2736} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 2736} {"info/global_step": 2737, "train_info/time_within_train_step": 2.6645612716674805, "step": 2737} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 2737} {"info/global_step": 2738, "train_info/time_within_train_step": 2.642205238342285, "step": 2738} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 2738} {"info/global_step": 2739, "train_info/time_within_train_step": 2.651568651199341, "step": 2739} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2739} {"info/global_step": 2740, "train_info/time_within_train_step": 2.6655070781707764, "step": 2740} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 2740} {"info/global_step": 2741, "train_info/time_within_train_step": 2.6477952003479004, "step": 2741} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 2741} {"info/global_step": 2742, "train_info/time_within_train_step": 2.643986225128174, "step": 2742} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 2742} {"info/global_step": 2743, "train_info/time_within_train_step": 2.6717584133148193, "step": 2743} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 2743} {"info/global_step": 2744, "train_info/time_within_train_step": 2.665493965148926, "step": 2744} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 2744} {"info/global_step": 2745, "train_info/time_within_train_step": 2.67991304397583, "step": 2745} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 2745} {"info/global_step": 2746, "train_info/time_within_train_step": 2.6672253608703613, "step": 2746} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 2746} {"info/global_step": 2747, "train_info/time_within_train_step": 2.6639344692230225, "step": 2747} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 2747} {"info/global_step": 2748, "train_info/time_within_train_step": 2.6482062339782715, "step": 2748} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 2748} {"info/global_step": 2749, "train_info/time_within_train_step": 2.6473023891448975, "step": 2749} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 2749} {"info/global_step": 2750, "train_info/time_within_train_step": 3.2507810592651367, "step": 2750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746905133, "_runtime": 7731}, "step": 2750} {"logs": {"train/loss": 4.0845, "train/learning_rate": 0.0004833333333333333, "train/epoch": 3.02, "_timestamp": 1746905133, "_runtime": 7731}, "step": 2750} {"train_info/time_between_train_steps": 0.029404878616333008, "step": 2750} {"info/global_step": 2751, "train_info/time_within_train_step": 2.6457231044769287, "step": 2751} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 2751} {"info/global_step": 2752, "train_info/time_within_train_step": 2.6425981521606445, "step": 2752} {"train_info/time_between_train_steps": 0.0034880638122558594, "step": 2752} {"info/global_step": 2753, "train_info/time_within_train_step": 2.644059896469116, "step": 2753} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 2753} {"info/global_step": 2754, "train_info/time_within_train_step": 2.643195867538452, "step": 2754} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 2754} {"info/global_step": 2755, "train_info/time_within_train_step": 2.647214651107788, "step": 2755} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 2755} {"info/global_step": 2756, "train_info/time_within_train_step": 2.647860527038574, "step": 2756} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 2756} {"info/global_step": 2757, "train_info/time_within_train_step": 2.6438140869140625, "step": 2757} {"train_info/time_between_train_steps": 0.0033457279205322266, "step": 2757} {"info/global_step": 2758, "train_info/time_within_train_step": 2.643549680709839, "step": 2758} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 2758} {"info/global_step": 2759, "train_info/time_within_train_step": 2.6423985958099365, "step": 2759} {"train_info/time_between_train_steps": 0.003468751907348633, "step": 2759} {"info/global_step": 2760, "train_info/time_within_train_step": 4.803624153137207, "step": 2760} {"train_info/time_between_train_steps": 0.003574848175048828, "step": 2760} {"info/global_step": 2761, "train_info/time_within_train_step": 2.561366319656372, "step": 2761} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 2761} {"info/global_step": 2762, "train_info/time_within_train_step": 2.5028700828552246, "step": 2762} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 2762} {"info/global_step": 2763, "train_info/time_within_train_step": 2.700540542602539, "step": 2763} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 2763} {"info/global_step": 2764, "train_info/time_within_train_step": 4.135347604751587, "step": 2764} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 2764} {"info/global_step": 2765, "train_info/time_within_train_step": 2.4455718994140625, "step": 2765} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 2765} {"info/global_step": 2766, "train_info/time_within_train_step": 2.617903232574463, "step": 2766} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 2766} {"info/global_step": 2767, "train_info/time_within_train_step": 2.636014938354492, "step": 2767} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 2767} {"info/global_step": 2768, "train_info/time_within_train_step": 2.6852831840515137, "step": 2768} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 2768} {"info/global_step": 2769, "train_info/time_within_train_step": 2.6607587337493896, "step": 2769} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 2769} {"info/global_step": 2770, "train_info/time_within_train_step": 2.6511716842651367, "step": 2770} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 2770} {"info/global_step": 2771, "train_info/time_within_train_step": 2.645427703857422, "step": 2771} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 2771} {"info/global_step": 2772, "train_info/time_within_train_step": 2.6670570373535156, "step": 2772} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 2772} {"info/global_step": 2773, "train_info/time_within_train_step": 2.697354555130005, "step": 2773} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 2773} {"info/global_step": 2774, "train_info/time_within_train_step": 2.6580018997192383, "step": 2774} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 2774} {"info/global_step": 2775, "train_info/time_within_train_step": 2.6630361080169678, "step": 2775} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 2775} {"info/global_step": 2776, "train_info/time_within_train_step": 2.640813112258911, "step": 2776} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 2776} {"info/global_step": 2777, "train_info/time_within_train_step": 2.7670063972473145, "step": 2777} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 2777} {"info/global_step": 2778, "train_info/time_within_train_step": 2.648942232131958, "step": 2778} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 2778} {"info/global_step": 2779, "train_info/time_within_train_step": 2.6506600379943848, "step": 2779} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 2779} {"info/global_step": 2780, "train_info/time_within_train_step": 2.6443958282470703, "step": 2780} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 2780} {"info/global_step": 2781, "train_info/time_within_train_step": 2.646291494369507, "step": 2781} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 2781} {"info/global_step": 2782, "train_info/time_within_train_step": 2.6515002250671387, "step": 2782} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 2782} {"info/global_step": 2783, "train_info/time_within_train_step": 2.6691668033599854, "step": 2783} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 2783} {"info/global_step": 2784, "train_info/time_within_train_step": 2.67871356010437, "step": 2784} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 2784} {"info/global_step": 2785, "train_info/time_within_train_step": 2.6501832008361816, "step": 2785} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 2785} {"info/global_step": 2786, "train_info/time_within_train_step": 2.9487974643707275, "step": 2786} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 2786} {"info/global_step": 2787, "train_info/time_within_train_step": 2.6690831184387207, "step": 2787} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 2787} {"info/global_step": 2788, "train_info/time_within_train_step": 2.677239418029785, "step": 2788} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 2788} {"info/global_step": 2789, "train_info/time_within_train_step": 2.653864860534668, "step": 2789} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 2789} {"info/global_step": 2790, "train_info/time_within_train_step": 2.6873199939727783, "step": 2790} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 2790} {"info/global_step": 2791, "train_info/time_within_train_step": 2.6411941051483154, "step": 2791} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 2791} {"info/global_step": 2792, "train_info/time_within_train_step": 2.6560046672821045, "step": 2792} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 2792} {"info/global_step": 2793, "train_info/time_within_train_step": 2.649029016494751, "step": 2793} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 2793} {"info/global_step": 2794, "train_info/time_within_train_step": 2.645547866821289, "step": 2794} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2794} {"info/global_step": 2795, "train_info/time_within_train_step": 2.6667237281799316, "step": 2795} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 2795} {"info/global_step": 2796, "train_info/time_within_train_step": 2.6619176864624023, "step": 2796} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 2796} {"info/global_step": 2797, "train_info/time_within_train_step": 2.67195725440979, "step": 2797} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 2797} {"info/global_step": 2798, "train_info/time_within_train_step": 2.6908702850341797, "step": 2798} {"train_info/time_between_train_steps": 0.0032625198364257812, "step": 2798} {"info/global_step": 2799, "train_info/time_within_train_step": 2.6639230251312256, "step": 2799} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 2799} {"info/global_step": 2800, "train_info/time_within_train_step": 2.645200252532959, "step": 2800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746905282, "_runtime": 7880}, "step": 2800} {"logs": {"train/loss": 4.0696, "train/learning_rate": 0.00047999999999999996, "train/epoch": 3.02, "_timestamp": 1746905282, "_runtime": 7880}, "step": 2800} {"train_info/time_between_train_steps": 26.27517008781433, "step": 2800} {"info/global_step": 2801, "train_info/time_within_train_step": 2.454678773880005, "step": 2801} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 2801} {"info/global_step": 2802, "train_info/time_within_train_step": 2.4338440895080566, "step": 2802} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 2802} {"info/global_step": 2803, "train_info/time_within_train_step": 2.5696487426757812, "step": 2803} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 2803} {"info/global_step": 2804, "train_info/time_within_train_step": 2.6339776515960693, "step": 2804} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 2804} {"info/global_step": 2805, "train_info/time_within_train_step": 2.644591808319092, "step": 2805} {"train_info/time_between_train_steps": 0.0032646656036376953, "step": 2805} {"info/global_step": 2806, "train_info/time_within_train_step": 2.6637425422668457, "step": 2806} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 2806} {"info/global_step": 2807, "train_info/time_within_train_step": 2.6435816287994385, "step": 2807} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 2807} {"info/global_step": 2808, "train_info/time_within_train_step": 2.646399736404419, "step": 2808} {"train_info/time_between_train_steps": 0.003416776657104492, "step": 2808} {"info/global_step": 2809, "train_info/time_within_train_step": 2.6674790382385254, "step": 2809} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 2809} {"info/global_step": 2810, "train_info/time_within_train_step": 2.661311149597168, "step": 2810} {"train_info/time_between_train_steps": 0.003473043441772461, "step": 2810} {"info/global_step": 2811, "train_info/time_within_train_step": 2.6611430644989014, "step": 2811} {"train_info/time_between_train_steps": 0.003619670867919922, "step": 2811} {"info/global_step": 2812, "train_info/time_within_train_step": 2.701138496398926, "step": 2812} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 2812} {"info/global_step": 2813, "train_info/time_within_train_step": 2.6698007583618164, "step": 2813} {"train_info/time_between_train_steps": 0.0039675235748291016, "step": 2813} {"info/global_step": 2814, "train_info/time_within_train_step": 2.6531858444213867, "step": 2814} {"train_info/time_between_train_steps": 0.0038268566131591797, "step": 2814} {"info/global_step": 2815, "train_info/time_within_train_step": 2.6489009857177734, "step": 2815} {"train_info/time_between_train_steps": 0.004196643829345703, "step": 2815} {"info/global_step": 2816, "train_info/time_within_train_step": 2.6631369590759277, "step": 2816} {"train_info/time_between_train_steps": 0.0038161277770996094, "step": 2816} {"info/global_step": 2817, "train_info/time_within_train_step": 2.655472755432129, "step": 2817} {"train_info/time_between_train_steps": 0.0042989253997802734, "step": 2817} {"info/global_step": 2818, "train_info/time_within_train_step": 2.663546323776245, "step": 2818} {"train_info/time_between_train_steps": 0.003684520721435547, "step": 2818} {"info/global_step": 2819, "train_info/time_within_train_step": 2.6891980171203613, "step": 2819} {"train_info/time_between_train_steps": 0.0038805007934570312, "step": 2819} {"info/global_step": 2820, "train_info/time_within_train_step": 2.7362751960754395, "step": 2820} {"train_info/time_between_train_steps": 0.003864288330078125, "step": 2820} {"info/global_step": 2821, "train_info/time_within_train_step": 2.6742043495178223, "step": 2821} {"train_info/time_between_train_steps": 0.0037746429443359375, "step": 2821} {"info/global_step": 2822, "train_info/time_within_train_step": 2.6444270610809326, "step": 2822} {"train_info/time_between_train_steps": 0.0038290023803710938, "step": 2822} {"info/global_step": 2823, "train_info/time_within_train_step": 2.6480045318603516, "step": 2823} {"train_info/time_between_train_steps": 0.0037767887115478516, "step": 2823} {"info/global_step": 2824, "train_info/time_within_train_step": 2.6654367446899414, "step": 2824} {"train_info/time_between_train_steps": 0.0037932395935058594, "step": 2824} {"info/global_step": 2825, "train_info/time_within_train_step": 2.6582374572753906, "step": 2825} {"train_info/time_between_train_steps": 0.004004001617431641, "step": 2825} {"info/global_step": 2826, "train_info/time_within_train_step": 2.6468799114227295, "step": 2826} {"train_info/time_between_train_steps": 0.003569364547729492, "step": 2826} {"info/global_step": 2827, "train_info/time_within_train_step": 2.6549086570739746, "step": 2827} {"train_info/time_between_train_steps": 0.0039010047912597656, "step": 2827} {"info/global_step": 2828, "train_info/time_within_train_step": 2.6490042209625244, "step": 2828} {"train_info/time_between_train_steps": 0.003691434860229492, "step": 2828} {"info/global_step": 2829, "train_info/time_within_train_step": 2.671969175338745, "step": 2829} {"train_info/time_between_train_steps": 0.0038194656372070312, "step": 2829} {"info/global_step": 2830, "train_info/time_within_train_step": 2.674856185913086, "step": 2830} {"train_info/time_between_train_steps": 0.0038442611694335938, "step": 2830} {"info/global_step": 2831, "train_info/time_within_train_step": 2.6982665061950684, "step": 2831} {"train_info/time_between_train_steps": 0.003601551055908203, "step": 2831} {"info/global_step": 2832, "train_info/time_within_train_step": 2.6501145362854004, "step": 2832} {"train_info/time_between_train_steps": 0.003781557083129883, "step": 2832} {"info/global_step": 2833, "train_info/time_within_train_step": 2.6543021202087402, "step": 2833} {"train_info/time_between_train_steps": 0.0038750171661376953, "step": 2833} {"info/global_step": 2834, "train_info/time_within_train_step": 2.6530773639678955, "step": 2834} {"train_info/time_between_train_steps": 0.003608226776123047, "step": 2834} {"info/global_step": 2835, "train_info/time_within_train_step": 2.6530721187591553, "step": 2835} {"train_info/time_between_train_steps": 0.003860950469970703, "step": 2835} {"info/global_step": 2836, "train_info/time_within_train_step": 2.6651978492736816, "step": 2836} {"train_info/time_between_train_steps": 0.003931760787963867, "step": 2836} {"info/global_step": 2837, "train_info/time_within_train_step": 2.648747444152832, "step": 2837} {"train_info/time_between_train_steps": 0.0037550926208496094, "step": 2837} {"info/global_step": 2838, "train_info/time_within_train_step": 2.646451473236084, "step": 2838} {"train_info/time_between_train_steps": 0.003778696060180664, "step": 2838} {"info/global_step": 2839, "train_info/time_within_train_step": 2.6652493476867676, "step": 2839} {"train_info/time_between_train_steps": 0.2092268466949463, "step": 2839} {"info/global_step": 2840, "train_info/time_within_train_step": 2.646585702896118, "step": 2840} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 2840} {"info/global_step": 2841, "train_info/time_within_train_step": 2.660369634628296, "step": 2841} {"train_info/time_between_train_steps": 0.003599882125854492, "step": 2841} {"info/global_step": 2842, "train_info/time_within_train_step": 2.649606943130493, "step": 2842} {"train_info/time_between_train_steps": 0.003584623336791992, "step": 2842} {"info/global_step": 2843, "train_info/time_within_train_step": 2.673696517944336, "step": 2843} {"train_info/time_between_train_steps": 0.0035791397094726562, "step": 2843} {"info/global_step": 2844, "train_info/time_within_train_step": 2.6674177646636963, "step": 2844} {"train_info/time_between_train_steps": 0.0037012100219726562, "step": 2844} {"info/global_step": 2845, "train_info/time_within_train_step": 2.675931930541992, "step": 2845} {"train_info/time_between_train_steps": 0.0035247802734375, "step": 2845} {"info/global_step": 2846, "train_info/time_within_train_step": 2.6733169555664062, "step": 2846} {"train_info/time_between_train_steps": 0.003419160842895508, "step": 2846} {"info/global_step": 2847, "train_info/time_within_train_step": 2.6617813110351562, "step": 2847} {"train_info/time_between_train_steps": 0.0035750865936279297, "step": 2847} {"info/global_step": 2848, "train_info/time_within_train_step": 2.6470108032226562, "step": 2848} {"train_info/time_between_train_steps": 0.0035588741302490234, "step": 2848} {"info/global_step": 2849, "train_info/time_within_train_step": 2.650725841522217, "step": 2849} {"train_info/time_between_train_steps": 0.0037102699279785156, "step": 2849} {"info/global_step": 2850, "train_info/time_within_train_step": 2.6469786167144775, "step": 2850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746905443, "_runtime": 8041}, "step": 2850} {"logs": {"train/loss": 4.0541, "train/learning_rate": 0.0004766666666666666, "train/epoch": 3.03, "_timestamp": 1746905443, "_runtime": 8041}, "step": 2850} {"train_info/time_between_train_steps": 0.025493621826171875, "step": 2850} {"info/global_step": 2851, "train_info/time_within_train_step": 2.658820152282715, "step": 2851} {"train_info/time_between_train_steps": 0.0036020278930664062, "step": 2851} {"info/global_step": 2852, "train_info/time_within_train_step": 2.6639657020568848, "step": 2852} {"train_info/time_between_train_steps": 0.0036666393280029297, "step": 2852} {"info/global_step": 2853, "train_info/time_within_train_step": 2.672124147415161, "step": 2853} {"train_info/time_between_train_steps": 0.0037000179290771484, "step": 2853} {"info/global_step": 2854, "train_info/time_within_train_step": 2.6630187034606934, "step": 2854} {"train_info/time_between_train_steps": 0.0035364627838134766, "step": 2854} {"info/global_step": 2855, "train_info/time_within_train_step": 2.7118079662323, "step": 2855} {"train_info/time_between_train_steps": 0.0035941600799560547, "step": 2855} {"info/global_step": 2856, "train_info/time_within_train_step": 2.646169900894165, "step": 2856} {"train_info/time_between_train_steps": 0.003634929656982422, "step": 2856} {"info/global_step": 2857, "train_info/time_within_train_step": 2.663104295730591, "step": 2857} {"train_info/time_between_train_steps": 0.0036280155181884766, "step": 2857} {"info/global_step": 2858, "train_info/time_within_train_step": 2.647150993347168, "step": 2858} {"train_info/time_between_train_steps": 0.003671884536743164, "step": 2858} {"info/global_step": 2859, "train_info/time_within_train_step": 2.6796340942382812, "step": 2859} {"train_info/time_between_train_steps": 0.0036554336547851562, "step": 2859} {"info/global_step": 2860, "train_info/time_within_train_step": 2.732468366622925, "step": 2860} {"train_info/time_between_train_steps": 0.0035042762756347656, "step": 2860} {"info/global_step": 2861, "train_info/time_within_train_step": 2.6610891819000244, "step": 2861} {"train_info/time_between_train_steps": 0.003540515899658203, "step": 2861} {"info/global_step": 2862, "train_info/time_within_train_step": 2.643819808959961, "step": 2862} {"train_info/time_between_train_steps": 0.0035789012908935547, "step": 2862} {"info/global_step": 2863, "train_info/time_within_train_step": 2.647364377975464, "step": 2863} {"train_info/time_between_train_steps": 0.0035681724548339844, "step": 2863} {"info/global_step": 2864, "train_info/time_within_train_step": 2.6585116386413574, "step": 2864} {"train_info/time_between_train_steps": 0.0034656524658203125, "step": 2864} {"info/global_step": 2865, "train_info/time_within_train_step": 2.6572349071502686, "step": 2865} {"train_info/time_between_train_steps": 0.003609895706176758, "step": 2865} {"info/global_step": 2866, "train_info/time_within_train_step": 2.6465325355529785, "step": 2866} {"train_info/time_between_train_steps": 0.0035729408264160156, "step": 2866} {"info/global_step": 2867, "train_info/time_within_train_step": 2.6532866954803467, "step": 2867} {"train_info/time_between_train_steps": 0.0036475658416748047, "step": 2867} {"info/global_step": 2868, "train_info/time_within_train_step": 2.6571624279022217, "step": 2868} {"train_info/time_between_train_steps": 0.003473520278930664, "step": 2868} {"info/global_step": 2869, "train_info/time_within_train_step": 2.6723761558532715, "step": 2869} {"train_info/time_between_train_steps": 0.0038971900939941406, "step": 2869} {"info/global_step": 2870, "train_info/time_within_train_step": 2.71329927444458, "step": 2870} {"train_info/time_between_train_steps": 0.003571033477783203, "step": 2870} {"info/global_step": 2871, "train_info/time_within_train_step": 2.651862382888794, "step": 2871} {"train_info/time_between_train_steps": 0.0035219192504882812, "step": 2871} {"info/global_step": 2872, "train_info/time_within_train_step": 3.035794496536255, "step": 2872} {"train_info/time_between_train_steps": 0.0033254623413085938, "step": 2872} {"info/global_step": 2873, "train_info/time_within_train_step": 2.650517463684082, "step": 2873} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 2873} {"info/global_step": 2874, "train_info/time_within_train_step": 2.6570608615875244, "step": 2874} {"train_info/time_between_train_steps": 0.0034322738647460938, "step": 2874} {"info/global_step": 2875, "train_info/time_within_train_step": 2.669590711593628, "step": 2875} {"train_info/time_between_train_steps": 0.003311634063720703, "step": 2875} {"info/global_step": 2876, "train_info/time_within_train_step": 2.6982223987579346, "step": 2876} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 2876} {"info/global_step": 2877, "train_info/time_within_train_step": 2.6613500118255615, "step": 2877} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 2877} {"info/global_step": 2878, "train_info/time_within_train_step": 2.665817975997925, "step": 2878} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 2878} {"info/global_step": 2879, "train_info/time_within_train_step": 2.643000841140747, "step": 2879} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 2879} {"info/global_step": 2880, "train_info/time_within_train_step": 2.6548593044281006, "step": 2880} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 2880} {"info/global_step": 2881, "train_info/time_within_train_step": 2.6690244674682617, "step": 2881} {"train_info/time_between_train_steps": 0.003281116485595703, "step": 2881} {"info/global_step": 2882, "train_info/time_within_train_step": 2.6450672149658203, "step": 2882} {"train_info/time_between_train_steps": 0.0032444000244140625, "step": 2882} {"info/global_step": 2883, "train_info/time_within_train_step": 2.645202159881592, "step": 2883} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 2883} {"info/global_step": 2884, "train_info/time_within_train_step": 2.657418727874756, "step": 2884} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 2884} {"info/global_step": 2885, "train_info/time_within_train_step": 2.6713359355926514, "step": 2885} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 2885} {"info/global_step": 2886, "train_info/time_within_train_step": 2.67927622795105, "step": 2886} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 2886} {"info/global_step": 2887, "train_info/time_within_train_step": 2.651249885559082, "step": 2887} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 2887} {"info/global_step": 2888, "train_info/time_within_train_step": 2.6853275299072266, "step": 2888} {"train_info/time_between_train_steps": 0.003338336944580078, "step": 2888} {"info/global_step": 2889, "train_info/time_within_train_step": 2.6413307189941406, "step": 2889} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 2889} {"info/global_step": 2890, "train_info/time_within_train_step": 2.649407386779785, "step": 2890} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 2890} {"info/global_step": 2891, "train_info/time_within_train_step": 2.66422438621521, "step": 2891} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 2891} {"info/global_step": 2892, "train_info/time_within_train_step": 2.643721103668213, "step": 2892} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 2892} {"info/global_step": 2893, "train_info/time_within_train_step": 2.644639253616333, "step": 2893} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 2893} {"info/global_step": 2894, "train_info/time_within_train_step": 2.65881085395813, "step": 2894} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 2894} {"info/global_step": 2895, "train_info/time_within_train_step": 2.6605520248413086, "step": 2895} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 2895} {"info/global_step": 2896, "train_info/time_within_train_step": 2.675075054168701, "step": 2896} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 2896} {"info/global_step": 2897, "train_info/time_within_train_step": 2.6673314571380615, "step": 2897} {"train_info/time_between_train_steps": 0.0035796165466308594, "step": 2897} {"info/global_step": 2898, "train_info/time_within_train_step": 2.6978466510772705, "step": 2898} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 2898} {"info/global_step": 2899, "train_info/time_within_train_step": 2.6415185928344727, "step": 2899} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 2899} {"info/global_step": 2900, "train_info/time_within_train_step": 2.646069049835205, "step": 2900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746905577, "_runtime": 8175}, "step": 2900} {"logs": {"train/loss": 4.0465, "train/learning_rate": 0.00047333333333333326, "train/epoch": 3.03, "_timestamp": 1746905577, "_runtime": 8175}, "step": 2900} {"train_info/time_between_train_steps": 0.02444934844970703, "step": 2900} {"info/global_step": 2901, "train_info/time_within_train_step": 2.6481852531433105, "step": 2901} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 2901} {"info/global_step": 2902, "train_info/time_within_train_step": 2.778846502304077, "step": 2902} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 2902} {"info/global_step": 2903, "train_info/time_within_train_step": 2.6611998081207275, "step": 2903} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 2903} {"info/global_step": 2904, "train_info/time_within_train_step": 2.6442534923553467, "step": 2904} {"train_info/time_between_train_steps": 0.0032570362091064453, "step": 2904} {"info/global_step": 2905, "train_info/time_within_train_step": 2.647273302078247, "step": 2905} {"train_info/time_between_train_steps": 0.003248929977416992, "step": 2905} {"info/global_step": 2906, "train_info/time_within_train_step": 2.6518306732177734, "step": 2906} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 2906} {"info/global_step": 2907, "train_info/time_within_train_step": 2.6540918350219727, "step": 2907} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 2907} {"info/global_step": 2908, "train_info/time_within_train_step": 2.6735987663269043, "step": 2908} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 2908} {"info/global_step": 2909, "train_info/time_within_train_step": 2.6746931076049805, "step": 2909} {"train_info/time_between_train_steps": 0.003296375274658203, "step": 2909} {"info/global_step": 2910, "train_info/time_within_train_step": 2.7222442626953125, "step": 2910} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 2910} {"info/global_step": 2911, "train_info/time_within_train_step": 2.6605310440063477, "step": 2911} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 2911} {"info/global_step": 2912, "train_info/time_within_train_step": 2.6653635501861572, "step": 2912} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 2912} {"info/global_step": 2913, "train_info/time_within_train_step": 2.6675829887390137, "step": 2913} {"train_info/time_between_train_steps": 0.003265380859375, "step": 2913} {"info/global_step": 2914, "train_info/time_within_train_step": 2.6556549072265625, "step": 2914} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 2914} {"info/global_step": 2915, "train_info/time_within_train_step": 2.664715528488159, "step": 2915} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 2915} {"info/global_step": 2916, "train_info/time_within_train_step": 2.6475157737731934, "step": 2916} {"train_info/time_between_train_steps": 0.0032761096954345703, "step": 2916} {"info/global_step": 2917, "train_info/time_within_train_step": 2.6430563926696777, "step": 2917} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 2917} {"info/global_step": 2918, "train_info/time_within_train_step": 2.6665945053100586, "step": 2918} {"train_info/time_between_train_steps": 0.003354310989379883, "step": 2918} {"info/global_step": 2919, "train_info/time_within_train_step": 2.650374412536621, "step": 2919} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 2919} {"info/global_step": 2920, "train_info/time_within_train_step": 2.6446776390075684, "step": 2920} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 2920} {"info/global_step": 2921, "train_info/time_within_train_step": 2.6694328784942627, "step": 2921} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 2921} {"info/global_step": 2922, "train_info/time_within_train_step": 2.660729169845581, "step": 2922} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 2922} {"info/global_step": 2923, "train_info/time_within_train_step": 2.6672732830047607, "step": 2923} {"train_info/time_between_train_steps": 0.003338336944580078, "step": 2923} {"info/global_step": 2924, "train_info/time_within_train_step": 2.6831068992614746, "step": 2924} {"train_info/time_between_train_steps": 0.003304004669189453, "step": 2924} {"info/global_step": 2925, "train_info/time_within_train_step": 2.6710586547851562, "step": 2925} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 2925} {"info/global_step": 2926, "train_info/time_within_train_step": 2.6423888206481934, "step": 2926} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 2926} {"info/global_step": 2927, "train_info/time_within_train_step": 2.6411705017089844, "step": 2927} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 2927} {"info/global_step": 2928, "train_info/time_within_train_step": 2.658179998397827, "step": 2928} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 2928} {"info/global_step": 2929, "train_info/time_within_train_step": 2.6552984714508057, "step": 2929} {"train_info/time_between_train_steps": 0.0032634735107421875, "step": 2929} {"info/global_step": 2930, "train_info/time_within_train_step": 2.9109694957733154, "step": 2930} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 2930} {"info/global_step": 2931, "train_info/time_within_train_step": 2.653069257736206, "step": 2931} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 2931} {"info/global_step": 2932, "train_info/time_within_train_step": 2.6554324626922607, "step": 2932} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 2932} {"info/global_step": 2933, "train_info/time_within_train_step": 2.660036563873291, "step": 2933} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 2933} {"info/global_step": 2934, "train_info/time_within_train_step": 2.6460447311401367, "step": 2934} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 2934} {"info/global_step": 2935, "train_info/time_within_train_step": 2.6556153297424316, "step": 2935} {"train_info/time_between_train_steps": 0.003355264663696289, "step": 2935} {"info/global_step": 2936, "train_info/time_within_train_step": 2.659144878387451, "step": 2936} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 2936} {"info/global_step": 2937, "train_info/time_within_train_step": 2.668809175491333, "step": 2937} {"train_info/time_between_train_steps": 0.00327301025390625, "step": 2937} {"info/global_step": 2938, "train_info/time_within_train_step": 2.7278645038604736, "step": 2938} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 2938} {"info/global_step": 2939, "train_info/time_within_train_step": 2.6628949642181396, "step": 2939} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 2939} {"info/global_step": 2940, "train_info/time_within_train_step": 2.6412572860717773, "step": 2940} {"train_info/time_between_train_steps": 0.0032699108123779297, "step": 2940} {"info/global_step": 2941, "train_info/time_within_train_step": 2.646901845932007, "step": 2941} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 2941} {"info/global_step": 2942, "train_info/time_within_train_step": 2.6554527282714844, "step": 2942} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 2942} {"info/global_step": 2943, "train_info/time_within_train_step": 2.6540186405181885, "step": 2943} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 2943} {"info/global_step": 2944, "train_info/time_within_train_step": 2.645536184310913, "step": 2944} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 2944} {"info/global_step": 2945, "train_info/time_within_train_step": 2.6460278034210205, "step": 2945} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 2945} {"info/global_step": 2946, "train_info/time_within_train_step": 2.667032241821289, "step": 2946} {"train_info/time_between_train_steps": 0.003439664840698242, "step": 2946} {"info/global_step": 2947, "train_info/time_within_train_step": 2.6704869270324707, "step": 2947} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 2947} {"info/global_step": 2948, "train_info/time_within_train_step": 2.7170557975769043, "step": 2948} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 2948} {"info/global_step": 2949, "train_info/time_within_train_step": 2.652850866317749, "step": 2949} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 2949} {"info/global_step": 2950, "train_info/time_within_train_step": 2.6641392707824707, "step": 2950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746905712, "_runtime": 8310}, "step": 2950} {"logs": {"train/loss": 4.0267, "train/learning_rate": 0.00046999999999999993, "train/epoch": 3.04, "_timestamp": 1746905712, "_runtime": 8310}, "step": 2950} {"train_info/time_between_train_steps": 0.02469468116760254, "step": 2950} {"info/global_step": 2951, "train_info/time_within_train_step": 2.6419034004211426, "step": 2951} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 2951} {"info/global_step": 2952, "train_info/time_within_train_step": 2.657522201538086, "step": 2952} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 2952} {"info/global_step": 2953, "train_info/time_within_train_step": 2.6523542404174805, "step": 2953} {"train_info/time_between_train_steps": 0.0032892227172851562, "step": 2953} {"info/global_step": 2954, "train_info/time_within_train_step": 2.6458160877227783, "step": 2954} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 2954} {"info/global_step": 2955, "train_info/time_within_train_step": 2.6489360332489014, "step": 2955} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 2955} {"info/global_step": 2956, "train_info/time_within_train_step": 2.6476287841796875, "step": 2956} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 2956} {"info/global_step": 2957, "train_info/time_within_train_step": 2.6419308185577393, "step": 2957} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 2957} {"info/global_step": 2958, "train_info/time_within_train_step": 2.661691188812256, "step": 2958} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 2958} {"info/global_step": 2959, "train_info/time_within_train_step": 2.64951229095459, "step": 2959} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 2959} {"info/global_step": 2960, "train_info/time_within_train_step": 2.650148630142212, "step": 2960} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 2960} {"info/global_step": 2961, "train_info/time_within_train_step": 2.6434783935546875, "step": 2961} {"train_info/time_between_train_steps": 0.003450155258178711, "step": 2961} {"info/global_step": 2962, "train_info/time_within_train_step": 2.644486427307129, "step": 2962} {"train_info/time_between_train_steps": 0.003488779067993164, "step": 2962} {"info/global_step": 2963, "train_info/time_within_train_step": 2.6426055431365967, "step": 2963} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 2963} {"info/global_step": 2964, "train_info/time_within_train_step": 2.645488739013672, "step": 2964} {"train_info/time_between_train_steps": 0.12461471557617188, "step": 2964} {"info/global_step": 2965, "train_info/time_within_train_step": 2.643155097961426, "step": 2965} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 2965} {"info/global_step": 2966, "train_info/time_within_train_step": 2.6447205543518066, "step": 2966} {"train_info/time_between_train_steps": 0.003574848175048828, "step": 2966} {"info/global_step": 2967, "train_info/time_within_train_step": 2.643213987350464, "step": 2967} {"train_info/time_between_train_steps": 0.0032961368560791016, "step": 2967} {"info/global_step": 2968, "train_info/time_within_train_step": 2.6437339782714844, "step": 2968} {"train_info/time_between_train_steps": 0.0034172534942626953, "step": 2968} {"info/global_step": 2969, "train_info/time_within_train_step": 2.6243057250976562, "step": 2969} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 2969} {"info/global_step": 2970, "train_info/time_within_train_step": 2.6402840614318848, "step": 2970} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 2970} {"info/global_step": 2971, "train_info/time_within_train_step": 2.6809329986572266, "step": 2971} {"train_info/time_between_train_steps": 0.003306865692138672, "step": 2971} {"info/global_step": 2972, "train_info/time_within_train_step": 2.8954362869262695, "step": 2972} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 2972} {"info/global_step": 2973, "train_info/time_within_train_step": 2.6675784587860107, "step": 2973} {"train_info/time_between_train_steps": 0.003514528274536133, "step": 2973} {"info/global_step": 2974, "train_info/time_within_train_step": 2.675755023956299, "step": 2974} {"train_info/time_between_train_steps": 0.003286600112915039, "step": 2974} {"info/global_step": 2975, "train_info/time_within_train_step": 2.6481730937957764, "step": 2975} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 2975} {"info/global_step": 2976, "train_info/time_within_train_step": 2.6510143280029297, "step": 2976} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 2976} {"info/global_step": 2977, "train_info/time_within_train_step": 2.6593880653381348, "step": 2977} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 2977} {"info/global_step": 2978, "train_info/time_within_train_step": 2.6955337524414062, "step": 2978} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 2978} {"info/global_step": 2979, "train_info/time_within_train_step": 2.692152738571167, "step": 2979} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 2979} {"info/global_step": 2980, "train_info/time_within_train_step": 2.643970489501953, "step": 2980} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 2980} {"info/global_step": 2981, "train_info/time_within_train_step": 2.6401777267456055, "step": 2981} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 2981} {"info/global_step": 2982, "train_info/time_within_train_step": 2.658661365509033, "step": 2982} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 2982} {"info/global_step": 2983, "train_info/time_within_train_step": 2.6556026935577393, "step": 2983} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 2983} {"info/global_step": 2984, "train_info/time_within_train_step": 2.643892526626587, "step": 2984} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 2984} {"info/global_step": 2985, "train_info/time_within_train_step": 2.642425775527954, "step": 2985} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 2985} {"info/global_step": 2986, "train_info/time_within_train_step": 2.7067558765411377, "step": 2986} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 2986} {"info/global_step": 2987, "train_info/time_within_train_step": 2.6465725898742676, "step": 2987} {"train_info/time_between_train_steps": 0.0032532215118408203, "step": 2987} {"info/global_step": 2988, "train_info/time_within_train_step": 2.6620020866394043, "step": 2988} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 2988} {"info/global_step": 2989, "train_info/time_within_train_step": 2.6436374187469482, "step": 2989} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 2989} {"info/global_step": 2990, "train_info/time_within_train_step": 2.6472251415252686, "step": 2990} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 2990} {"info/global_step": 2991, "train_info/time_within_train_step": 2.6704704761505127, "step": 2991} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 2991} {"info/global_step": 2992, "train_info/time_within_train_step": 2.6442086696624756, "step": 2992} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 2992} {"info/global_step": 2993, "train_info/time_within_train_step": 2.649522304534912, "step": 2993} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 2993} {"info/global_step": 2994, "train_info/time_within_train_step": 2.6685080528259277, "step": 2994} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 2994} {"info/global_step": 2995, "train_info/time_within_train_step": 2.6671302318573, "step": 2995} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 2995} {"info/global_step": 2996, "train_info/time_within_train_step": 2.7008323669433594, "step": 2996} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 2996} {"info/global_step": 2997, "train_info/time_within_train_step": 2.65310001373291, "step": 2997} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 2997} {"info/global_step": 2998, "train_info/time_within_train_step": 2.6675591468811035, "step": 2998} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 2998} {"info/global_step": 2999, "train_info/time_within_train_step": 2.6490206718444824, "step": 2999} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 2999} {"info/global_step": 3000, "train_info/time_within_train_step": 3.2640974521636963, "step": 3000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746905851, "_runtime": 8449}, "step": 3000} {"logs": {"train/loss": 4.0153, "train/learning_rate": 0.0004666666666666666, "train/epoch": 3.04, "_timestamp": 1746905851, "_runtime": 8449}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746905856, "_runtime": 8454}, "step": 3000} {"logs": {"eval/loss": 4.633265972137451, "eval/runtime": 5.1782, "eval/samples_per_second": 37.079, "eval/steps_per_second": 1.159, "train/epoch": 3.04, "_timestamp": 1746905856, "_runtime": 8454}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746905856, "_runtime": 8454}, "step": 3000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.633265972137451, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 102.84941952019629, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1782, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.079, "train/epoch": 3.04, "_timestamp": 1746905856, "_runtime": 8454}, "step": 3000} {"train_info/time_between_train_steps": 32.03795051574707, "step": 3000} {"info/global_step": 3001, "train_info/time_within_train_step": 2.432659387588501, "step": 3001} {"train_info/time_between_train_steps": 0.003352642059326172, "step": 3001} {"info/global_step": 3002, "train_info/time_within_train_step": 2.4321305751800537, "step": 3002} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 3002} {"info/global_step": 3003, "train_info/time_within_train_step": 2.5476198196411133, "step": 3003} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 3003} {"info/global_step": 3004, "train_info/time_within_train_step": 2.6486237049102783, "step": 3004} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 3004} {"info/global_step": 3005, "train_info/time_within_train_step": 2.649033308029175, "step": 3005} {"train_info/time_between_train_steps": 0.0042629241943359375, "step": 3005} {"info/global_step": 3006, "train_info/time_within_train_step": 2.6435182094573975, "step": 3006} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 3006} {"info/global_step": 3007, "train_info/time_within_train_step": 2.642896890640259, "step": 3007} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 3007} {"info/global_step": 3008, "train_info/time_within_train_step": 2.6514182090759277, "step": 3008} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 3008} {"info/global_step": 3009, "train_info/time_within_train_step": 2.6730709075927734, "step": 3009} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 3009} {"info/global_step": 3010, "train_info/time_within_train_step": 2.674191474914551, "step": 3010} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 3010} {"info/global_step": 3011, "train_info/time_within_train_step": 2.649446725845337, "step": 3011} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 3011} {"info/global_step": 3012, "train_info/time_within_train_step": 2.6595265865325928, "step": 3012} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 3012} {"info/global_step": 3013, "train_info/time_within_train_step": 2.650357723236084, "step": 3013} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 3013} {"info/global_step": 3014, "train_info/time_within_train_step": 2.649738073348999, "step": 3014} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 3014} {"info/global_step": 3015, "train_info/time_within_train_step": 2.655115842819214, "step": 3015} {"train_info/time_between_train_steps": 0.0034363269805908203, "step": 3015} {"info/global_step": 3016, "train_info/time_within_train_step": 2.6514320373535156, "step": 3016} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 3016} {"info/global_step": 3017, "train_info/time_within_train_step": 2.6484429836273193, "step": 3017} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 3017} {"info/global_step": 3018, "train_info/time_within_train_step": 2.6694211959838867, "step": 3018} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 3018} {"info/global_step": 3019, "train_info/time_within_train_step": 2.6596572399139404, "step": 3019} {"train_info/time_between_train_steps": 0.003263711929321289, "step": 3019} {"info/global_step": 3020, "train_info/time_within_train_step": 2.6577579975128174, "step": 3020} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 3020} {"info/global_step": 3021, "train_info/time_within_train_step": 2.70855712890625, "step": 3021} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 3021} {"info/global_step": 3022, "train_info/time_within_train_step": 2.6492843627929688, "step": 3022} {"train_info/time_between_train_steps": 0.0033681392669677734, "step": 3022} {"info/global_step": 3023, "train_info/time_within_train_step": 2.6488232612609863, "step": 3023} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 3023} {"info/global_step": 3024, "train_info/time_within_train_step": 2.6585047245025635, "step": 3024} {"train_info/time_between_train_steps": 0.003424406051635742, "step": 3024} {"info/global_step": 3025, "train_info/time_within_train_step": 2.6493098735809326, "step": 3025} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 3025} {"info/global_step": 3026, "train_info/time_within_train_step": 2.652147054672241, "step": 3026} {"train_info/time_between_train_steps": 0.003421306610107422, "step": 3026} {"info/global_step": 3027, "train_info/time_within_train_step": 2.8011536598205566, "step": 3027} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 3027} {"info/global_step": 3028, "train_info/time_within_train_step": 2.656641721725464, "step": 3028} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 3028} {"info/global_step": 3029, "train_info/time_within_train_step": 2.661966323852539, "step": 3029} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 3029} {"info/global_step": 3030, "train_info/time_within_train_step": 2.6620280742645264, "step": 3030} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 3030} {"info/global_step": 3031, "train_info/time_within_train_step": 2.664093017578125, "step": 3031} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 3031} {"info/global_step": 3032, "train_info/time_within_train_step": 2.6611649990081787, "step": 3032} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 3032} {"info/global_step": 3033, "train_info/time_within_train_step": 2.7004833221435547, "step": 3033} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 3033} {"info/global_step": 3034, "train_info/time_within_train_step": 2.707598924636841, "step": 3034} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 3034} {"info/global_step": 3035, "train_info/time_within_train_step": 2.6447653770446777, "step": 3035} {"train_info/time_between_train_steps": 0.003260374069213867, "step": 3035} {"info/global_step": 3036, "train_info/time_within_train_step": 2.643611192703247, "step": 3036} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 3036} {"info/global_step": 3037, "train_info/time_within_train_step": 2.6632156372070312, "step": 3037} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 3037} {"info/global_step": 3038, "train_info/time_within_train_step": 2.6555252075195312, "step": 3038} {"train_info/time_between_train_steps": 0.0034384727478027344, "step": 3038} {"info/global_step": 3039, "train_info/time_within_train_step": 2.652235507965088, "step": 3039} {"train_info/time_between_train_steps": 0.003259420394897461, "step": 3039} {"info/global_step": 3040, "train_info/time_within_train_step": 2.9262611865997314, "step": 3040} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 3040} {"info/global_step": 3041, "train_info/time_within_train_step": 2.643922805786133, "step": 3041} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 3041} {"info/global_step": 3042, "train_info/time_within_train_step": 2.656508684158325, "step": 3042} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 3042} {"info/global_step": 3043, "train_info/time_within_train_step": 2.6514971256256104, "step": 3043} {"train_info/time_between_train_steps": 0.003306865692138672, "step": 3043} {"info/global_step": 3044, "train_info/time_within_train_step": 2.6483943462371826, "step": 3044} {"train_info/time_between_train_steps": 0.0032575130462646484, "step": 3044} {"info/global_step": 3045, "train_info/time_within_train_step": 2.6583971977233887, "step": 3045} {"train_info/time_between_train_steps": 0.0033419132232666016, "step": 3045} {"info/global_step": 3046, "train_info/time_within_train_step": 2.646615743637085, "step": 3046} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 3046} {"info/global_step": 3047, "train_info/time_within_train_step": 2.6492083072662354, "step": 3047} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 3047} {"info/global_step": 3048, "train_info/time_within_train_step": 2.6732070446014404, "step": 3048} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 3048} {"info/global_step": 3049, "train_info/time_within_train_step": 2.6682963371276855, "step": 3049} {"train_info/time_between_train_steps": 0.0035676956176757812, "step": 3049} {"info/global_step": 3050, "train_info/time_within_train_step": 2.669949531555176, "step": 3050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746906017, "_runtime": 8615}, "step": 3050} {"logs": {"train/loss": 4.0167, "train/learning_rate": 0.00046333333333333334, "train/epoch": 3.05, "_timestamp": 1746906017, "_runtime": 8615}, "step": 3050} {"train_info/time_between_train_steps": 0.02456974983215332, "step": 3050} {"info/global_step": 3051, "train_info/time_within_train_step": 2.6596899032592773, "step": 3051} {"train_info/time_between_train_steps": 0.0035364627838134766, "step": 3051} {"info/global_step": 3052, "train_info/time_within_train_step": 2.6883835792541504, "step": 3052} {"train_info/time_between_train_steps": 0.003709554672241211, "step": 3052} {"info/global_step": 3053, "train_info/time_within_train_step": 2.644432306289673, "step": 3053} {"train_info/time_between_train_steps": 0.0035636425018310547, "step": 3053} {"info/global_step": 3054, "train_info/time_within_train_step": 2.64778995513916, "step": 3054} {"train_info/time_between_train_steps": 0.0035676956176757812, "step": 3054} {"info/global_step": 3055, "train_info/time_within_train_step": 2.6596286296844482, "step": 3055} {"train_info/time_between_train_steps": 0.0038025379180908203, "step": 3055} {"info/global_step": 3056, "train_info/time_within_train_step": 2.6513471603393555, "step": 3056} {"train_info/time_between_train_steps": 0.0038518905639648438, "step": 3056} {"info/global_step": 3057, "train_info/time_within_train_step": 2.6534016132354736, "step": 3057} {"train_info/time_between_train_steps": 0.0036406517028808594, "step": 3057} {"info/global_step": 3058, "train_info/time_within_train_step": 2.6685731410980225, "step": 3058} {"train_info/time_between_train_steps": 0.00370025634765625, "step": 3058} {"info/global_step": 3059, "train_info/time_within_train_step": 2.660324811935425, "step": 3059} {"train_info/time_between_train_steps": 0.0036492347717285156, "step": 3059} {"info/global_step": 3060, "train_info/time_within_train_step": 2.666959047317505, "step": 3060} {"train_info/time_between_train_steps": 0.003693819046020508, "step": 3060} {"info/global_step": 3061, "train_info/time_within_train_step": 2.6885035037994385, "step": 3061} {"train_info/time_between_train_steps": 0.003574848175048828, "step": 3061} {"info/global_step": 3062, "train_info/time_within_train_step": 2.661762237548828, "step": 3062} {"train_info/time_between_train_steps": 0.003718852996826172, "step": 3062} {"info/global_step": 3063, "train_info/time_within_train_step": 2.651052713394165, "step": 3063} {"train_info/time_between_train_steps": 0.0037126541137695312, "step": 3063} {"info/global_step": 3064, "train_info/time_within_train_step": 2.662985324859619, "step": 3064} {"train_info/time_between_train_steps": 0.0036890506744384766, "step": 3064} {"info/global_step": 3065, "train_info/time_within_train_step": 2.6606175899505615, "step": 3065} {"train_info/time_between_train_steps": 0.0036454200744628906, "step": 3065} {"info/global_step": 3066, "train_info/time_within_train_step": 2.6529831886291504, "step": 3066} {"train_info/time_between_train_steps": 0.0036356449127197266, "step": 3066} {"info/global_step": 3067, "train_info/time_within_train_step": 2.6478567123413086, "step": 3067} {"train_info/time_between_train_steps": 0.0035784244537353516, "step": 3067} {"info/global_step": 3068, "train_info/time_within_train_step": 2.656338930130005, "step": 3068} {"train_info/time_between_train_steps": 0.0035889148712158203, "step": 3068} {"info/global_step": 3069, "train_info/time_within_train_step": 2.6586577892303467, "step": 3069} {"train_info/time_between_train_steps": 0.0037283897399902344, "step": 3069} {"info/global_step": 3070, "train_info/time_within_train_step": 2.673891544342041, "step": 3070} {"train_info/time_between_train_steps": 0.0036466121673583984, "step": 3070} {"info/global_step": 3071, "train_info/time_within_train_step": 2.7295730113983154, "step": 3071} {"train_info/time_between_train_steps": 0.003504514694213867, "step": 3071} {"info/global_step": 3072, "train_info/time_within_train_step": 2.6751720905303955, "step": 3072} {"train_info/time_between_train_steps": 0.0035877227783203125, "step": 3072} {"info/global_step": 3073, "train_info/time_within_train_step": 2.643296241760254, "step": 3073} {"train_info/time_between_train_steps": 0.003560304641723633, "step": 3073} {"info/global_step": 3074, "train_info/time_within_train_step": 2.6451361179351807, "step": 3074} {"train_info/time_between_train_steps": 0.003624439239501953, "step": 3074} {"info/global_step": 3075, "train_info/time_within_train_step": 2.6569812297821045, "step": 3075} {"train_info/time_between_train_steps": 0.003571033477783203, "step": 3075} {"info/global_step": 3076, "train_info/time_within_train_step": 2.6612420082092285, "step": 3076} {"train_info/time_between_train_steps": 0.003668546676635742, "step": 3076} {"info/global_step": 3077, "train_info/time_within_train_step": 2.6461923122406006, "step": 3077} {"train_info/time_between_train_steps": 0.003612995147705078, "step": 3077} {"info/global_step": 3078, "train_info/time_within_train_step": 2.652385711669922, "step": 3078} {"train_info/time_between_train_steps": 0.0034873485565185547, "step": 3078} {"info/global_step": 3079, "train_info/time_within_train_step": 2.6592438220977783, "step": 3079} {"train_info/time_between_train_steps": 0.0037157535552978516, "step": 3079} {"info/global_step": 3080, "train_info/time_within_train_step": 2.6672377586364746, "step": 3080} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 3080} {"info/global_step": 3081, "train_info/time_within_train_step": 2.7058260440826416, "step": 3081} {"train_info/time_between_train_steps": 0.003690481185913086, "step": 3081} {"info/global_step": 3082, "train_info/time_within_train_step": 3.0215022563934326, "step": 3082} {"train_info/time_between_train_steps": 0.0033273696899414062, "step": 3082} {"info/global_step": 3083, "train_info/time_within_train_step": 2.64986252784729, "step": 3083} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 3083} {"info/global_step": 3084, "train_info/time_within_train_step": 2.646632194519043, "step": 3084} {"train_info/time_between_train_steps": 0.0037384033203125, "step": 3084} {"info/global_step": 3085, "train_info/time_within_train_step": 2.6702702045440674, "step": 3085} {"train_info/time_between_train_steps": 0.003331899642944336, "step": 3085} {"info/global_step": 3086, "train_info/time_within_train_step": 2.690737247467041, "step": 3086} {"train_info/time_between_train_steps": 0.0032813549041748047, "step": 3086} {"info/global_step": 3087, "train_info/time_within_train_step": 2.660876989364624, "step": 3087} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 3087} {"info/global_step": 3088, "train_info/time_within_train_step": 2.6641757488250732, "step": 3088} {"train_info/time_between_train_steps": 0.0033838748931884766, "step": 3088} {"info/global_step": 3089, "train_info/time_within_train_step": 2.6417794227600098, "step": 3089} {"train_info/time_between_train_steps": 0.12229180335998535, "step": 3089} {"info/global_step": 3090, "train_info/time_within_train_step": 2.6547813415527344, "step": 3090} {"train_info/time_between_train_steps": 0.003320932388305664, "step": 3090} {"info/global_step": 3091, "train_info/time_within_train_step": 2.6573445796966553, "step": 3091} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 3091} {"info/global_step": 3092, "train_info/time_within_train_step": 2.6545615196228027, "step": 3092} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 3092} {"info/global_step": 3093, "train_info/time_within_train_step": 2.649806261062622, "step": 3093} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 3093} {"info/global_step": 3094, "train_info/time_within_train_step": 2.6463348865509033, "step": 3094} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 3094} {"info/global_step": 3095, "train_info/time_within_train_step": 2.6520729064941406, "step": 3095} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 3095} {"info/global_step": 3096, "train_info/time_within_train_step": 2.6853907108306885, "step": 3096} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 3096} {"info/global_step": 3097, "train_info/time_within_train_step": 2.6736392974853516, "step": 3097} {"train_info/time_between_train_steps": 0.003268718719482422, "step": 3097} {"info/global_step": 3098, "train_info/time_within_train_step": 2.667130470275879, "step": 3098} {"train_info/time_between_train_steps": 0.0033025741577148438, "step": 3098} {"info/global_step": 3099, "train_info/time_within_train_step": 2.6781160831451416, "step": 3099} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 3099} {"info/global_step": 3100, "train_info/time_within_train_step": 2.6554179191589355, "step": 3100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746906152, "_runtime": 8750}, "step": 3100} {"logs": {"train/loss": 3.9947, "train/learning_rate": 0.00046, "train/epoch": 3.05, "_timestamp": 1746906152, "_runtime": 8750}, "step": 3100} {"train_info/time_between_train_steps": 0.031101703643798828, "step": 3100} {"info/global_step": 3101, "train_info/time_within_train_step": 2.6656112670898438, "step": 3101} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 3101} {"info/global_step": 3102, "train_info/time_within_train_step": 2.661844491958618, "step": 3102} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 3102} {"info/global_step": 3103, "train_info/time_within_train_step": 2.6511950492858887, "step": 3103} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 3103} {"info/global_step": 3104, "train_info/time_within_train_step": 2.6433918476104736, "step": 3104} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 3104} {"info/global_step": 3105, "train_info/time_within_train_step": 2.6424882411956787, "step": 3105} {"train_info/time_between_train_steps": 0.0033020973205566406, "step": 3105} {"info/global_step": 3106, "train_info/time_within_train_step": 2.659297466278076, "step": 3106} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 3106} {"info/global_step": 3107, "train_info/time_within_train_step": 2.654754400253296, "step": 3107} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 3107} {"info/global_step": 3108, "train_info/time_within_train_step": 2.647615671157837, "step": 3108} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 3108} {"info/global_step": 3109, "train_info/time_within_train_step": 2.6558878421783447, "step": 3109} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 3109} {"info/global_step": 3110, "train_info/time_within_train_step": 2.6568808555603027, "step": 3110} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 3110} {"info/global_step": 3111, "train_info/time_within_train_step": 2.6713860034942627, "step": 3111} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 3111} {"info/global_step": 3112, "train_info/time_within_train_step": 2.727632999420166, "step": 3112} {"train_info/time_between_train_steps": 0.0032465457916259766, "step": 3112} {"info/global_step": 3113, "train_info/time_within_train_step": 2.661721706390381, "step": 3113} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 3113} {"info/global_step": 3114, "train_info/time_within_train_step": 2.6412904262542725, "step": 3114} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 3114} {"info/global_step": 3115, "train_info/time_within_train_step": 2.6580638885498047, "step": 3115} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 3115} {"info/global_step": 3116, "train_info/time_within_train_step": 2.6531200408935547, "step": 3116} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 3116} {"info/global_step": 3117, "train_info/time_within_train_step": 2.645167112350464, "step": 3117} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 3117} {"info/global_step": 3118, "train_info/time_within_train_step": 2.6538703441619873, "step": 3118} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 3118} {"info/global_step": 3119, "train_info/time_within_train_step": 2.652364492416382, "step": 3119} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 3119} {"info/global_step": 3120, "train_info/time_within_train_step": 2.672987937927246, "step": 3120} {"train_info/time_between_train_steps": 0.0032677650451660156, "step": 3120} {"info/global_step": 3121, "train_info/time_within_train_step": 2.709238052368164, "step": 3121} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 3121} {"info/global_step": 3122, "train_info/time_within_train_step": 2.643500804901123, "step": 3122} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 3122} {"info/global_step": 3123, "train_info/time_within_train_step": 2.6518783569335938, "step": 3123} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 3123} {"info/global_step": 3124, "train_info/time_within_train_step": 2.655442714691162, "step": 3124} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 3124} {"info/global_step": 3125, "train_info/time_within_train_step": 2.652261972427368, "step": 3125} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 3125} {"info/global_step": 3126, "train_info/time_within_train_step": 2.6517393589019775, "step": 3126} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 3126} {"info/global_step": 3127, "train_info/time_within_train_step": 2.6462855339050293, "step": 3127} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 3127} {"info/global_step": 3128, "train_info/time_within_train_step": 2.650264263153076, "step": 3128} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 3128} {"info/global_step": 3129, "train_info/time_within_train_step": 2.6725587844848633, "step": 3129} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 3129} {"info/global_step": 3130, "train_info/time_within_train_step": 2.6692774295806885, "step": 3130} {"train_info/time_between_train_steps": 0.0033740997314453125, "step": 3130} {"info/global_step": 3131, "train_info/time_within_train_step": 2.6574766635894775, "step": 3131} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 3131} {"info/global_step": 3132, "train_info/time_within_train_step": 2.6995813846588135, "step": 3132} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 3132} {"info/global_step": 3133, "train_info/time_within_train_step": 2.6478559970855713, "step": 3133} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 3133} {"info/global_step": 3134, "train_info/time_within_train_step": 2.654742479324341, "step": 3134} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 3134} {"info/global_step": 3135, "train_info/time_within_train_step": 2.6577107906341553, "step": 3135} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 3135} {"info/global_step": 3136, "train_info/time_within_train_step": 2.644031524658203, "step": 3136} {"train_info/time_between_train_steps": 0.003427743911743164, "step": 3136} {"info/global_step": 3137, "train_info/time_within_train_step": 2.645425319671631, "step": 3137} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 3137} {"info/global_step": 3138, "train_info/time_within_train_step": 2.6601154804229736, "step": 3138} {"train_info/time_between_train_steps": 0.0032758712768554688, "step": 3138} {"info/global_step": 3139, "train_info/time_within_train_step": 2.6616952419281006, "step": 3139} {"train_info/time_between_train_steps": 0.003255605697631836, "step": 3139} {"info/global_step": 3140, "train_info/time_within_train_step": 2.694272041320801, "step": 3140} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 3140} {"info/global_step": 3141, "train_info/time_within_train_step": 2.670736074447632, "step": 3141} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 3141} {"info/global_step": 3142, "train_info/time_within_train_step": 2.6895413398742676, "step": 3142} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 3142} {"info/global_step": 3143, "train_info/time_within_train_step": 2.652958393096924, "step": 3143} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 3143} {"info/global_step": 3144, "train_info/time_within_train_step": 2.653123140335083, "step": 3144} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 3144} {"info/global_step": 3145, "train_info/time_within_train_step": 2.6578781604766846, "step": 3145} {"train_info/time_between_train_steps": 0.0030083656311035156, "step": 3145} {"info/global_step": 3146, "train_info/time_within_train_step": 2.678424835205078, "step": 3146} {"train_info/time_between_train_steps": 0.0029573440551757812, "step": 3146} {"info/global_step": 3147, "train_info/time_within_train_step": 2.7256968021392822, "step": 3147} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 3147} {"info/global_step": 3148, "train_info/time_within_train_step": 2.645935535430908, "step": 3148} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 3148} {"info/global_step": 3149, "train_info/time_within_train_step": 2.6414570808410645, "step": 3149} {"train_info/time_between_train_steps": 0.0029833316802978516, "step": 3149} {"info/global_step": 3150, "train_info/time_within_train_step": 2.6644375324249268, "step": 3150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746906286, "_runtime": 8884}, "step": 3150} {"logs": {"train/loss": 3.9842, "train/learning_rate": 0.0004566666666666666, "train/epoch": 3.06, "_timestamp": 1746906286, "_runtime": 8884}, "step": 3150} {"train_info/time_between_train_steps": 0.024410724639892578, "step": 3150} {"info/global_step": 3151, "train_info/time_within_train_step": 2.6491384506225586, "step": 3151} {"train_info/time_between_train_steps": 0.0029451847076416016, "step": 3151} {"info/global_step": 3152, "train_info/time_within_train_step": 2.6434173583984375, "step": 3152} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 3152} {"info/global_step": 3153, "train_info/time_within_train_step": 2.650920867919922, "step": 3153} {"train_info/time_between_train_steps": 0.0030364990234375, "step": 3153} {"info/global_step": 3154, "train_info/time_within_train_step": 2.645869016647339, "step": 3154} {"train_info/time_between_train_steps": 0.003072977066040039, "step": 3154} {"info/global_step": 3155, "train_info/time_within_train_step": 2.6700327396392822, "step": 3155} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 3155} {"info/global_step": 3156, "train_info/time_within_train_step": 2.6839661598205566, "step": 3156} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 3156} {"info/global_step": 3157, "train_info/time_within_train_step": 2.6627256870269775, "step": 3157} {"train_info/time_between_train_steps": 0.0029540061950683594, "step": 3157} {"info/global_step": 3158, "train_info/time_within_train_step": 2.6721386909484863, "step": 3158} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 3158} {"info/global_step": 3159, "train_info/time_within_train_step": 2.642828941345215, "step": 3159} {"train_info/time_between_train_steps": 0.002950429916381836, "step": 3159} {"info/global_step": 3160, "train_info/time_within_train_step": 2.6546905040740967, "step": 3160} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 3160} {"info/global_step": 3161, "train_info/time_within_train_step": 2.6596789360046387, "step": 3161} {"train_info/time_between_train_steps": 0.0029866695404052734, "step": 3161} {"info/global_step": 3162, "train_info/time_within_train_step": 2.6445369720458984, "step": 3162} {"train_info/time_between_train_steps": 0.002947568893432617, "step": 3162} {"info/global_step": 3163, "train_info/time_within_train_step": 2.645151138305664, "step": 3163} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 3163} {"info/global_step": 3164, "train_info/time_within_train_step": 2.6690354347229004, "step": 3164} {"train_info/time_between_train_steps": 0.002983570098876953, "step": 3164} {"info/global_step": 3165, "train_info/time_within_train_step": 2.6448395252227783, "step": 3165} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 3165} {"info/global_step": 3166, "train_info/time_within_train_step": 2.6583993434906006, "step": 3166} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 3166} {"info/global_step": 3167, "train_info/time_within_train_step": 2.6508731842041016, "step": 3167} {"train_info/time_between_train_steps": 0.0035161972045898438, "step": 3167} {"info/global_step": 3168, "train_info/time_within_train_step": 2.6437649726867676, "step": 3168} {"train_info/time_between_train_steps": 0.003061056137084961, "step": 3168} {"info/global_step": 3169, "train_info/time_within_train_step": 2.6435866355895996, "step": 3169} {"train_info/time_between_train_steps": 0.003016233444213867, "step": 3169} {"info/global_step": 3170, "train_info/time_within_train_step": 2.638478994369507, "step": 3170} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 3170} {"info/global_step": 3171, "train_info/time_within_train_step": 2.641160249710083, "step": 3171} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 3171} {"info/global_step": 3172, "train_info/time_within_train_step": 2.642392635345459, "step": 3172} {"train_info/time_between_train_steps": 0.0033795833587646484, "step": 3172} {"info/global_step": 3173, "train_info/time_within_train_step": 2.641822099685669, "step": 3173} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 3173} {"info/global_step": 3174, "train_info/time_within_train_step": 2.628915548324585, "step": 3174} {"train_info/time_between_train_steps": 0.003095388412475586, "step": 3174} {"info/global_step": 3175, "train_info/time_within_train_step": 2.6257236003875732, "step": 3175} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 3175} {"info/global_step": 3176, "train_info/time_within_train_step": 2.6075024604797363, "step": 3176} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 3176} {"info/global_step": 3177, "train_info/time_within_train_step": 2.7546160221099854, "step": 3177} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 3177} {"info/global_step": 3178, "train_info/time_within_train_step": 2.680114984512329, "step": 3178} {"train_info/time_between_train_steps": 0.003008127212524414, "step": 3178} {"info/global_step": 3179, "train_info/time_within_train_step": 2.6429684162139893, "step": 3179} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 3179} {"info/global_step": 3180, "train_info/time_within_train_step": 2.6570069789886475, "step": 3180} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 3180} {"info/global_step": 3181, "train_info/time_within_train_step": 2.645684242248535, "step": 3181} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 3181} {"info/global_step": 3182, "train_info/time_within_train_step": 2.6734578609466553, "step": 3182} {"train_info/time_between_train_steps": 0.002986431121826172, "step": 3182} {"info/global_step": 3183, "train_info/time_within_train_step": 2.6557037830352783, "step": 3183} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 3183} {"info/global_step": 3184, "train_info/time_within_train_step": 2.638918876647949, "step": 3184} {"train_info/time_between_train_steps": 0.0029790401458740234, "step": 3184} {"info/global_step": 3185, "train_info/time_within_train_step": 2.6529295444488525, "step": 3185} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 3185} {"info/global_step": 3186, "train_info/time_within_train_step": 2.6471548080444336, "step": 3186} {"train_info/time_between_train_steps": 0.003022909164428711, "step": 3186} {"info/global_step": 3187, "train_info/time_within_train_step": 2.8528664112091064, "step": 3187} {"train_info/time_between_train_steps": 0.002981424331665039, "step": 3187} {"info/global_step": 3188, "train_info/time_within_train_step": 2.662322521209717, "step": 3188} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 3188} {"info/global_step": 3189, "train_info/time_within_train_step": 2.650343656539917, "step": 3189} {"train_info/time_between_train_steps": 0.002945423126220703, "step": 3189} {"info/global_step": 3190, "train_info/time_within_train_step": 2.6428661346435547, "step": 3190} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 3190} {"info/global_step": 3191, "train_info/time_within_train_step": 2.650608777999878, "step": 3191} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 3191} {"info/global_step": 3192, "train_info/time_within_train_step": 2.6456384658813477, "step": 3192} {"train_info/time_between_train_steps": 0.002980470657348633, "step": 3192} {"info/global_step": 3193, "train_info/time_within_train_step": 2.6685616970062256, "step": 3193} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 3193} {"info/global_step": 3194, "train_info/time_within_train_step": 2.7009029388427734, "step": 3194} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 3194} {"info/global_step": 3195, "train_info/time_within_train_step": 2.654219627380371, "step": 3195} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 3195} {"info/global_step": 3196, "train_info/time_within_train_step": 2.664165496826172, "step": 3196} {"train_info/time_between_train_steps": 0.0029320716857910156, "step": 3196} {"info/global_step": 3197, "train_info/time_within_train_step": 2.641012191772461, "step": 3197} {"train_info/time_between_train_steps": 0.003080129623413086, "step": 3197} {"info/global_step": 3198, "train_info/time_within_train_step": 2.649847984313965, "step": 3198} {"train_info/time_between_train_steps": 0.0030126571655273438, "step": 3198} {"info/global_step": 3199, "train_info/time_within_train_step": 2.6622188091278076, "step": 3199} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 3199} {"info/global_step": 3200, "train_info/time_within_train_step": 2.646035671234131, "step": 3200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746906427, "_runtime": 9025}, "step": 3200} {"logs": {"train/loss": 3.9689, "train/learning_rate": 0.00045333333333333326, "train/epoch": 3.06, "_timestamp": 1746906427, "_runtime": 9025}, "step": 3200} {"train_info/time_between_train_steps": 28.933313846588135, "step": 3200} {"info/global_step": 3201, "train_info/time_within_train_step": 2.4554717540740967, "step": 3201} {"train_info/time_between_train_steps": 0.003029346466064453, "step": 3201} {"info/global_step": 3202, "train_info/time_within_train_step": 2.4294369220733643, "step": 3202} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 3202} {"info/global_step": 3203, "train_info/time_within_train_step": 2.556472063064575, "step": 3203} {"train_info/time_between_train_steps": 0.0029449462890625, "step": 3203} {"info/global_step": 3204, "train_info/time_within_train_step": 2.642498254776001, "step": 3204} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 3204} {"info/global_step": 3205, "train_info/time_within_train_step": 2.641711473464966, "step": 3205} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 3205} {"info/global_step": 3206, "train_info/time_within_train_step": 2.662837266921997, "step": 3206} {"train_info/time_between_train_steps": 0.0030167102813720703, "step": 3206} {"info/global_step": 3207, "train_info/time_within_train_step": 2.661280393600464, "step": 3207} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 3207} {"info/global_step": 3208, "train_info/time_within_train_step": 2.656818151473999, "step": 3208} {"train_info/time_between_train_steps": 0.003322601318359375, "step": 3208} {"info/global_step": 3209, "train_info/time_within_train_step": 2.7064292430877686, "step": 3209} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 3209} {"info/global_step": 3210, "train_info/time_within_train_step": 2.6417903900146484, "step": 3210} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 3210} {"info/global_step": 3211, "train_info/time_within_train_step": 2.643024444580078, "step": 3211} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 3211} {"info/global_step": 3212, "train_info/time_within_train_step": 2.664071798324585, "step": 3212} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 3212} {"info/global_step": 3213, "train_info/time_within_train_step": 2.6480321884155273, "step": 3213} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 3213} {"info/global_step": 3214, "train_info/time_within_train_step": 2.6462819576263428, "step": 3214} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 3214} {"info/global_step": 3215, "train_info/time_within_train_step": 2.654843330383301, "step": 3215} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 3215} {"info/global_step": 3216, "train_info/time_within_train_step": 2.6535229682922363, "step": 3216} {"train_info/time_between_train_steps": 0.002910614013671875, "step": 3216} {"info/global_step": 3217, "train_info/time_within_train_step": 2.6657278537750244, "step": 3217} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 3217} {"info/global_step": 3218, "train_info/time_within_train_step": 2.681814432144165, "step": 3218} {"train_info/time_between_train_steps": 0.0030121803283691406, "step": 3218} {"info/global_step": 3219, "train_info/time_within_train_step": 2.682208299636841, "step": 3219} {"train_info/time_between_train_steps": 0.0029897689819335938, "step": 3219} {"info/global_step": 3220, "train_info/time_within_train_step": 2.6430885791778564, "step": 3220} {"train_info/time_between_train_steps": 0.002910614013671875, "step": 3220} {"info/global_step": 3221, "train_info/time_within_train_step": 2.6609222888946533, "step": 3221} {"train_info/time_between_train_steps": 0.0029320716857910156, "step": 3221} {"info/global_step": 3222, "train_info/time_within_train_step": 2.649474620819092, "step": 3222} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 3222} {"info/global_step": 3223, "train_info/time_within_train_step": 2.6483588218688965, "step": 3223} {"train_info/time_between_train_steps": 0.002995729446411133, "step": 3223} {"info/global_step": 3224, "train_info/time_within_train_step": 2.6485066413879395, "step": 3224} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 3224} {"info/global_step": 3225, "train_info/time_within_train_step": 2.645125389099121, "step": 3225} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 3225} {"info/global_step": 3226, "train_info/time_within_train_step": 2.6689369678497314, "step": 3226} {"train_info/time_between_train_steps": 0.002972841262817383, "step": 3226} {"info/global_step": 3227, "train_info/time_within_train_step": 2.6707522869110107, "step": 3227} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 3227} {"info/global_step": 3228, "train_info/time_within_train_step": 2.6859445571899414, "step": 3228} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 3228} {"info/global_step": 3229, "train_info/time_within_train_step": 2.6526713371276855, "step": 3229} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 3229} {"info/global_step": 3230, "train_info/time_within_train_step": 2.641446828842163, "step": 3230} {"train_info/time_between_train_steps": 0.0029768943786621094, "step": 3230} {"info/global_step": 3231, "train_info/time_within_train_step": 2.659432888031006, "step": 3231} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 3231} {"info/global_step": 3232, "train_info/time_within_train_step": 2.656726360321045, "step": 3232} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 3232} {"info/global_step": 3233, "train_info/time_within_train_step": 2.6459619998931885, "step": 3233} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 3233} {"info/global_step": 3234, "train_info/time_within_train_step": 2.6444039344787598, "step": 3234} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 3234} {"info/global_step": 3235, "train_info/time_within_train_step": 2.657500743865967, "step": 3235} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 3235} {"info/global_step": 3236, "train_info/time_within_train_step": 2.670799732208252, "step": 3236} {"train_info/time_between_train_steps": 0.002936124801635742, "step": 3236} {"info/global_step": 3237, "train_info/time_within_train_step": 2.6856181621551514, "step": 3237} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 3237} {"info/global_step": 3238, "train_info/time_within_train_step": 2.6530380249023438, "step": 3238} {"train_info/time_between_train_steps": 0.002953767776489258, "step": 3238} {"info/global_step": 3239, "train_info/time_within_train_step": 2.6907553672790527, "step": 3239} {"train_info/time_between_train_steps": 0.002972126007080078, "step": 3239} {"info/global_step": 3240, "train_info/time_within_train_step": 2.6420822143554688, "step": 3240} {"train_info/time_between_train_steps": 0.0029714107513427734, "step": 3240} {"info/global_step": 3241, "train_info/time_within_train_step": 2.6478967666625977, "step": 3241} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 3241} {"info/global_step": 3242, "train_info/time_within_train_step": 2.6734094619750977, "step": 3242} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 3242} {"info/global_step": 3243, "train_info/time_within_train_step": 2.6439857482910156, "step": 3243} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 3243} {"info/global_step": 3244, "train_info/time_within_train_step": 2.64451265335083, "step": 3244} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 3244} {"info/global_step": 3245, "train_info/time_within_train_step": 2.6646080017089844, "step": 3245} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 3245} {"info/global_step": 3246, "train_info/time_within_train_step": 2.6601402759552, "step": 3246} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 3246} {"info/global_step": 3247, "train_info/time_within_train_step": 2.6763622760772705, "step": 3247} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 3247} {"info/global_step": 3248, "train_info/time_within_train_step": 2.6677074432373047, "step": 3248} {"train_info/time_between_train_steps": 0.003143310546875, "step": 3248} {"info/global_step": 3249, "train_info/time_within_train_step": 2.6958167552948, "step": 3249} {"train_info/time_between_train_steps": 0.003107786178588867, "step": 3249} {"info/global_step": 3250, "train_info/time_within_train_step": 3.2446186542510986, "step": 3250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746906590, "_runtime": 9188}, "step": 3250} {"logs": {"train/loss": 3.9672, "train/learning_rate": 0.00045, "train/epoch": 3.07, "_timestamp": 1746906590, "_runtime": 9188}, "step": 3250} {"train_info/time_between_train_steps": 0.024231672286987305, "step": 3250} {"info/global_step": 3251, "train_info/time_within_train_step": 2.651028633117676, "step": 3251} {"train_info/time_between_train_steps": 0.0031096935272216797, "step": 3251} {"info/global_step": 3252, "train_info/time_within_train_step": 2.6470043659210205, "step": 3252} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 3252} {"info/global_step": 3253, "train_info/time_within_train_step": 2.650158405303955, "step": 3253} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 3253} {"info/global_step": 3254, "train_info/time_within_train_step": 2.648336172103882, "step": 3254} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 3254} {"info/global_step": 3255, "train_info/time_within_train_step": 2.665940046310425, "step": 3255} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 3255} {"info/global_step": 3256, "train_info/time_within_train_step": 2.662642478942871, "step": 3256} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 3256} {"info/global_step": 3257, "train_info/time_within_train_step": 2.675117254257202, "step": 3257} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 3257} {"info/global_step": 3258, "train_info/time_within_train_step": 2.702054262161255, "step": 3258} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 3258} {"info/global_step": 3259, "train_info/time_within_train_step": 2.6518537998199463, "step": 3259} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 3259} {"info/global_step": 3260, "train_info/time_within_train_step": 2.6481735706329346, "step": 3260} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 3260} {"info/global_step": 3261, "train_info/time_within_train_step": 2.6524574756622314, "step": 3261} {"train_info/time_between_train_steps": 0.0032982826232910156, "step": 3261} {"info/global_step": 3262, "train_info/time_within_train_step": 2.6481220722198486, "step": 3262} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 3262} {"info/global_step": 3263, "train_info/time_within_train_step": 2.6503043174743652, "step": 3263} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 3263} {"info/global_step": 3264, "train_info/time_within_train_step": 2.651003837585449, "step": 3264} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 3264} {"info/global_step": 3265, "train_info/time_within_train_step": 2.652458429336548, "step": 3265} {"train_info/time_between_train_steps": 0.003290414810180664, "step": 3265} {"info/global_step": 3266, "train_info/time_within_train_step": 2.6595823764801025, "step": 3266} {"train_info/time_between_train_steps": 0.003298044204711914, "step": 3266} {"info/global_step": 3267, "train_info/time_within_train_step": 2.676452398300171, "step": 3267} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 3267} {"info/global_step": 3268, "train_info/time_within_train_step": 2.7313640117645264, "step": 3268} {"train_info/time_between_train_steps": 0.0033714771270751953, "step": 3268} {"info/global_step": 3269, "train_info/time_within_train_step": 2.6628434658050537, "step": 3269} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 3269} {"info/global_step": 3270, "train_info/time_within_train_step": 2.6412534713745117, "step": 3270} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 3270} {"info/global_step": 3271, "train_info/time_within_train_step": 2.6615848541259766, "step": 3271} {"train_info/time_between_train_steps": 0.0033102035522460938, "step": 3271} {"info/global_step": 3272, "train_info/time_within_train_step": 2.6523261070251465, "step": 3272} {"train_info/time_between_train_steps": 0.0033752918243408203, "step": 3272} {"info/global_step": 3273, "train_info/time_within_train_step": 2.644942283630371, "step": 3273} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 3273} {"info/global_step": 3274, "train_info/time_within_train_step": 2.653066873550415, "step": 3274} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 3274} {"info/global_step": 3275, "train_info/time_within_train_step": 2.6480793952941895, "step": 3275} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 3275} {"info/global_step": 3276, "train_info/time_within_train_step": 2.668787717819214, "step": 3276} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 3276} {"info/global_step": 3277, "train_info/time_within_train_step": 2.6939656734466553, "step": 3277} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 3277} {"info/global_step": 3278, "train_info/time_within_train_step": 2.664583921432495, "step": 3278} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 3278} {"info/global_step": 3279, "train_info/time_within_train_step": 2.664478302001953, "step": 3279} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 3279} {"info/global_step": 3280, "train_info/time_within_train_step": 2.643064498901367, "step": 3280} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 3280} {"info/global_step": 3281, "train_info/time_within_train_step": 2.655139207839966, "step": 3281} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 3281} {"info/global_step": 3282, "train_info/time_within_train_step": 2.6562750339508057, "step": 3282} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 3282} {"info/global_step": 3283, "train_info/time_within_train_step": 2.6440582275390625, "step": 3283} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 3283} {"info/global_step": 3284, "train_info/time_within_train_step": 2.6499743461608887, "step": 3284} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 3284} {"info/global_step": 3285, "train_info/time_within_train_step": 2.6540122032165527, "step": 3285} {"train_info/time_between_train_steps": 0.003268718719482422, "step": 3285} {"info/global_step": 3286, "train_info/time_within_train_step": 2.668569326400757, "step": 3286} {"train_info/time_between_train_steps": 0.0034046173095703125, "step": 3286} {"info/global_step": 3287, "train_info/time_within_train_step": 2.682673454284668, "step": 3287} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 3287} {"info/global_step": 3288, "train_info/time_within_train_step": 2.6512632369995117, "step": 3288} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 3288} {"info/global_step": 3289, "train_info/time_within_train_step": 2.685293674468994, "step": 3289} {"train_info/time_between_train_steps": 0.0033426284790039062, "step": 3289} {"info/global_step": 3290, "train_info/time_within_train_step": 2.641913652420044, "step": 3290} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 3290} {"info/global_step": 3291, "train_info/time_within_train_step": 2.899329900741577, "step": 3291} {"train_info/time_between_train_steps": 0.003027200698852539, "step": 3291} {"info/global_step": 3292, "train_info/time_within_train_step": 2.6603970527648926, "step": 3292} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 3292} {"info/global_step": 3293, "train_info/time_within_train_step": 2.6493263244628906, "step": 3293} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 3293} {"info/global_step": 3294, "train_info/time_within_train_step": 2.6504452228546143, "step": 3294} {"train_info/time_between_train_steps": 0.0029921531677246094, "step": 3294} {"info/global_step": 3295, "train_info/time_within_train_step": 2.64878249168396, "step": 3295} {"train_info/time_between_train_steps": 0.0030312538146972656, "step": 3295} {"info/global_step": 3296, "train_info/time_within_train_step": 2.6435606479644775, "step": 3296} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 3296} {"info/global_step": 3297, "train_info/time_within_train_step": 2.6462466716766357, "step": 3297} {"train_info/time_between_train_steps": 0.0030279159545898438, "step": 3297} {"info/global_step": 3298, "train_info/time_within_train_step": 2.663235902786255, "step": 3298} {"train_info/time_between_train_steps": 0.0030431747436523438, "step": 3298} {"info/global_step": 3299, "train_info/time_within_train_step": 2.6668918132781982, "step": 3299} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 3299} {"info/global_step": 3300, "train_info/time_within_train_step": 2.658562660217285, "step": 3300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746906724, "_runtime": 9322}, "step": 3300} {"logs": {"train/loss": 3.9562, "train/learning_rate": 0.00044666666666666666, "train/epoch": 3.07, "_timestamp": 1746906724, "_runtime": 9322}, "step": 3300} {"train_info/time_between_train_steps": 0.02424001693725586, "step": 3300} {"info/global_step": 3301, "train_info/time_within_train_step": 2.6757431030273438, "step": 3301} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 3301} {"info/global_step": 3302, "train_info/time_within_train_step": 2.6668789386749268, "step": 3302} {"train_info/time_between_train_steps": 0.0030820369720458984, "step": 3302} {"info/global_step": 3303, "train_info/time_within_train_step": 2.7023470401763916, "step": 3303} {"train_info/time_between_train_steps": 0.003062009811401367, "step": 3303} {"info/global_step": 3304, "train_info/time_within_train_step": 2.6446306705474854, "step": 3304} {"train_info/time_between_train_steps": 0.003082752227783203, "step": 3304} {"info/global_step": 3305, "train_info/time_within_train_step": 2.649473190307617, "step": 3305} {"train_info/time_between_train_steps": 0.003090381622314453, "step": 3305} {"info/global_step": 3306, "train_info/time_within_train_step": 2.6756680011749268, "step": 3306} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 3306} {"info/global_step": 3307, "train_info/time_within_train_step": 2.6576993465423584, "step": 3307} {"train_info/time_between_train_steps": 0.003042936325073242, "step": 3307} {"info/global_step": 3308, "train_info/time_within_train_step": 2.6496806144714355, "step": 3308} {"train_info/time_between_train_steps": 0.0030930042266845703, "step": 3308} {"info/global_step": 3309, "train_info/time_within_train_step": 2.6620383262634277, "step": 3309} {"train_info/time_between_train_steps": 0.0030078887939453125, "step": 3309} {"info/global_step": 3310, "train_info/time_within_train_step": 2.6581997871398926, "step": 3310} {"train_info/time_between_train_steps": 0.0030853748321533203, "step": 3310} {"info/global_step": 3311, "train_info/time_within_train_step": 2.661799430847168, "step": 3311} {"train_info/time_between_train_steps": 0.0030634403228759766, "step": 3311} {"info/global_step": 3312, "train_info/time_within_train_step": 2.7165327072143555, "step": 3312} {"train_info/time_between_train_steps": 0.003050565719604492, "step": 3312} {"info/global_step": 3313, "train_info/time_within_train_step": 2.7068376541137695, "step": 3313} {"train_info/time_between_train_steps": 0.0030460357666015625, "step": 3313} {"info/global_step": 3314, "train_info/time_within_train_step": 2.6518914699554443, "step": 3314} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 3314} {"info/global_step": 3315, "train_info/time_within_train_step": 2.6617307662963867, "step": 3315} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 3315} {"info/global_step": 3316, "train_info/time_within_train_step": 2.6515274047851562, "step": 3316} {"train_info/time_between_train_steps": 0.0030448436737060547, "step": 3316} {"info/global_step": 3317, "train_info/time_within_train_step": 2.6462130546569824, "step": 3317} {"train_info/time_between_train_steps": 0.003037691116333008, "step": 3317} {"info/global_step": 3318, "train_info/time_within_train_step": 2.671159505844116, "step": 3318} {"train_info/time_between_train_steps": 0.003030538558959961, "step": 3318} {"info/global_step": 3319, "train_info/time_within_train_step": 2.690545082092285, "step": 3319} {"train_info/time_between_train_steps": 0.0030341148376464844, "step": 3319} {"info/global_step": 3320, "train_info/time_within_train_step": 2.664595127105713, "step": 3320} {"train_info/time_between_train_steps": 0.0030379295349121094, "step": 3320} {"info/global_step": 3321, "train_info/time_within_train_step": 2.666219711303711, "step": 3321} {"train_info/time_between_train_steps": 0.003082275390625, "step": 3321} {"info/global_step": 3322, "train_info/time_within_train_step": 2.649350881576538, "step": 3322} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 3322} {"info/global_step": 3323, "train_info/time_within_train_step": 2.6506690979003906, "step": 3323} {"train_info/time_between_train_steps": 0.0030891895294189453, "step": 3323} {"info/global_step": 3324, "train_info/time_within_train_step": 2.6785569190979004, "step": 3324} {"train_info/time_between_train_steps": 0.003038167953491211, "step": 3324} {"info/global_step": 3325, "train_info/time_within_train_step": 2.649038553237915, "step": 3325} {"train_info/time_between_train_steps": 0.003038644790649414, "step": 3325} {"info/global_step": 3326, "train_info/time_within_train_step": 2.6488780975341797, "step": 3326} {"train_info/time_between_train_steps": 0.003046274185180664, "step": 3326} {"info/global_step": 3327, "train_info/time_within_train_step": 2.6704976558685303, "step": 3327} {"train_info/time_between_train_steps": 0.0030570030212402344, "step": 3327} {"info/global_step": 3328, "train_info/time_within_train_step": 2.6739256381988525, "step": 3328} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 3328} {"info/global_step": 3329, "train_info/time_within_train_step": 2.6906824111938477, "step": 3329} {"train_info/time_between_train_steps": 0.003085613250732422, "step": 3329} {"info/global_step": 3330, "train_info/time_within_train_step": 2.653886556625366, "step": 3330} {"train_info/time_between_train_steps": 0.002996206283569336, "step": 3330} {"info/global_step": 3331, "train_info/time_within_train_step": 2.6854774951934814, "step": 3331} {"train_info/time_between_train_steps": 0.0030744075775146484, "step": 3331} {"info/global_step": 3332, "train_info/time_within_train_step": 2.6424548625946045, "step": 3332} {"train_info/time_between_train_steps": 0.003073453903198242, "step": 3332} {"info/global_step": 3333, "train_info/time_within_train_step": 2.6462600231170654, "step": 3333} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 3333} {"info/global_step": 3334, "train_info/time_within_train_step": 2.6636886596679688, "step": 3334} {"train_info/time_between_train_steps": 0.0032761096954345703, "step": 3334} {"info/global_step": 3335, "train_info/time_within_train_step": 2.6465818881988525, "step": 3335} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 3335} {"info/global_step": 3336, "train_info/time_within_train_step": 2.644296646118164, "step": 3336} {"train_info/time_between_train_steps": 0.006551504135131836, "step": 3336} {"info/global_step": 3337, "train_info/time_within_train_step": 2.6745753288269043, "step": 3337} {"train_info/time_between_train_steps": 0.00529026985168457, "step": 3337} {"info/global_step": 3338, "train_info/time_within_train_step": 2.6627657413482666, "step": 3338} {"train_info/time_between_train_steps": 0.006552219390869141, "step": 3338} {"info/global_step": 3339, "train_info/time_within_train_step": 2.6760010719299316, "step": 3339} {"train_info/time_between_train_steps": 0.006676435470581055, "step": 3339} {"info/global_step": 3340, "train_info/time_within_train_step": 2.6643359661102295, "step": 3340} {"train_info/time_between_train_steps": 0.0064504146575927734, "step": 3340} {"info/global_step": 3341, "train_info/time_within_train_step": 2.7111289501190186, "step": 3341} {"train_info/time_between_train_steps": 0.006462812423706055, "step": 3341} {"info/global_step": 3342, "train_info/time_within_train_step": 2.649355173110962, "step": 3342} {"train_info/time_between_train_steps": 0.0064563751220703125, "step": 3342} {"info/global_step": 3343, "train_info/time_within_train_step": 2.6481878757476807, "step": 3343} {"train_info/time_between_train_steps": 0.0065460205078125, "step": 3343} {"info/global_step": 3344, "train_info/time_within_train_step": 2.6504809856414795, "step": 3344} {"train_info/time_between_train_steps": 0.0065004825592041016, "step": 3344} {"info/global_step": 3345, "train_info/time_within_train_step": 2.6511964797973633, "step": 3345} {"train_info/time_between_train_steps": 0.0064394474029541016, "step": 3345} {"info/global_step": 3346, "train_info/time_within_train_step": 2.6552231311798096, "step": 3346} {"train_info/time_between_train_steps": 0.0031158924102783203, "step": 3346} {"info/global_step": 3347, "train_info/time_within_train_step": 2.6443393230438232, "step": 3347} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 3347} {"info/global_step": 3348, "train_info/time_within_train_step": 2.661201000213623, "step": 3348} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 3348} {"info/global_step": 3349, "train_info/time_within_train_step": 2.6550655364990234, "step": 3349} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 3349} {"info/global_step": 3350, "train_info/time_within_train_step": 2.661680221557617, "step": 3350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746906859, "_runtime": 9457}, "step": 3350} {"logs": {"train/loss": 3.9346, "train/learning_rate": 0.00044333333333333334, "train/epoch": 3.08, "_timestamp": 1746906859, "_runtime": 9457}, "step": 3350} {"train_info/time_between_train_steps": 0.024647235870361328, "step": 3350} {"info/global_step": 3351, "train_info/time_within_train_step": 2.703275442123413, "step": 3351} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 3351} {"info/global_step": 3352, "train_info/time_within_train_step": 2.8649845123291016, "step": 3352} {"train_info/time_between_train_steps": 0.0030341148376464844, "step": 3352} {"info/global_step": 3353, "train_info/time_within_train_step": 2.660425901412964, "step": 3353} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 3353} {"info/global_step": 3354, "train_info/time_within_train_step": 2.706303358078003, "step": 3354} {"train_info/time_between_train_steps": 0.003013134002685547, "step": 3354} {"info/global_step": 3355, "train_info/time_within_train_step": 2.660867929458618, "step": 3355} {"train_info/time_between_train_steps": 0.003048419952392578, "step": 3355} {"info/global_step": 3356, "train_info/time_within_train_step": 2.6407666206359863, "step": 3356} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 3356} {"info/global_step": 3357, "train_info/time_within_train_step": 2.6511728763580322, "step": 3357} {"train_info/time_between_train_steps": 0.003012418746948242, "step": 3357} {"info/global_step": 3358, "train_info/time_within_train_step": 2.65000319480896, "step": 3358} {"train_info/time_between_train_steps": 0.003079652786254883, "step": 3358} {"info/global_step": 3359, "train_info/time_within_train_step": 2.655317544937134, "step": 3359} {"train_info/time_between_train_steps": 0.003000497817993164, "step": 3359} {"info/global_step": 3360, "train_info/time_within_train_step": 2.645289421081543, "step": 3360} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 3360} {"info/global_step": 3361, "train_info/time_within_train_step": 2.6440975666046143, "step": 3361} {"train_info/time_between_train_steps": 0.0029528141021728516, "step": 3361} {"info/global_step": 3362, "train_info/time_within_train_step": 2.6657896041870117, "step": 3362} {"train_info/time_between_train_steps": 0.003026723861694336, "step": 3362} {"info/global_step": 3363, "train_info/time_within_train_step": 2.6659255027770996, "step": 3363} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 3363} {"info/global_step": 3364, "train_info/time_within_train_step": 2.709195852279663, "step": 3364} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 3364} {"info/global_step": 3365, "train_info/time_within_train_step": 2.655621290206909, "step": 3365} {"train_info/time_between_train_steps": 0.0029993057250976562, "step": 3365} {"info/global_step": 3366, "train_info/time_within_train_step": 2.665274143218994, "step": 3366} {"train_info/time_between_train_steps": 0.003083467483520508, "step": 3366} {"info/global_step": 3367, "train_info/time_within_train_step": 2.641376256942749, "step": 3367} {"train_info/time_between_train_steps": 0.0030794143676757812, "step": 3367} {"info/global_step": 3368, "train_info/time_within_train_step": 2.6545825004577637, "step": 3368} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 3368} {"info/global_step": 3369, "train_info/time_within_train_step": 2.6627676486968994, "step": 3369} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 3369} {"info/global_step": 3370, "train_info/time_within_train_step": 2.6443846225738525, "step": 3370} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 3370} {"info/global_step": 3371, "train_info/time_within_train_step": 2.646271228790283, "step": 3371} {"train_info/time_between_train_steps": 0.0033490657806396484, "step": 3371} {"info/global_step": 3372, "train_info/time_within_train_step": 2.660348892211914, "step": 3372} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 3372} {"info/global_step": 3373, "train_info/time_within_train_step": 2.644968271255493, "step": 3373} {"train_info/time_between_train_steps": 0.003671407699584961, "step": 3373} {"info/global_step": 3374, "train_info/time_within_train_step": 2.6440634727478027, "step": 3374} {"train_info/time_between_train_steps": 0.003557443618774414, "step": 3374} {"info/global_step": 3375, "train_info/time_within_train_step": 2.644286632537842, "step": 3375} {"train_info/time_between_train_steps": 0.003306865692138672, "step": 3375} {"info/global_step": 3376, "train_info/time_within_train_step": 2.643156051635742, "step": 3376} {"train_info/time_between_train_steps": 0.0033142566680908203, "step": 3376} {"info/global_step": 3377, "train_info/time_within_train_step": 2.644073963165283, "step": 3377} {"train_info/time_between_train_steps": 0.0036559104919433594, "step": 3377} {"info/global_step": 3378, "train_info/time_within_train_step": 2.6465952396392822, "step": 3378} {"train_info/time_between_train_steps": 0.0035600662231445312, "step": 3378} {"info/global_step": 3379, "train_info/time_within_train_step": 2.64302134513855, "step": 3379} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 3379} {"info/global_step": 3380, "train_info/time_within_train_step": 2.642570734024048, "step": 3380} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 3380} {"info/global_step": 3381, "train_info/time_within_train_step": 2.63957142829895, "step": 3381} {"train_info/time_between_train_steps": 0.0033278465270996094, "step": 3381} {"info/global_step": 3382, "train_info/time_within_train_step": 2.6384165287017822, "step": 3382} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 3382} {"info/global_step": 3383, "train_info/time_within_train_step": 2.6698057651519775, "step": 3383} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 3383} {"info/global_step": 3384, "train_info/time_within_train_step": 2.67864990234375, "step": 3384} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 3384} {"info/global_step": 3385, "train_info/time_within_train_step": 2.6460647583007812, "step": 3385} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 3385} {"info/global_step": 3386, "train_info/time_within_train_step": 2.651445150375366, "step": 3386} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 3386} {"info/global_step": 3387, "train_info/time_within_train_step": 2.641401767730713, "step": 3387} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 3387} {"info/global_step": 3388, "train_info/time_within_train_step": 2.6392948627471924, "step": 3388} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 3388} {"info/global_step": 3389, "train_info/time_within_train_step": 2.6459951400756836, "step": 3389} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 3389} {"info/global_step": 3390, "train_info/time_within_train_step": 2.661968231201172, "step": 3390} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 3390} {"info/global_step": 3391, "train_info/time_within_train_step": 2.6433732509613037, "step": 3391} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 3391} {"info/global_step": 3392, "train_info/time_within_train_step": 2.6425390243530273, "step": 3392} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 3392} {"info/global_step": 3393, "train_info/time_within_train_step": 2.759176015853882, "step": 3393} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 3393} {"info/global_step": 3394, "train_info/time_within_train_step": 2.6436517238616943, "step": 3394} {"train_info/time_between_train_steps": 0.0030393600463867188, "step": 3394} {"info/global_step": 3395, "train_info/time_within_train_step": 2.662518262863159, "step": 3395} {"train_info/time_between_train_steps": 0.003016948699951172, "step": 3395} {"info/global_step": 3396, "train_info/time_within_train_step": 2.6560277938842773, "step": 3396} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 3396} {"info/global_step": 3397, "train_info/time_within_train_step": 2.6583259105682373, "step": 3397} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 3397} {"info/global_step": 3398, "train_info/time_within_train_step": 2.6949474811553955, "step": 3398} {"train_info/time_between_train_steps": 0.0030388832092285156, "step": 3398} {"info/global_step": 3399, "train_info/time_within_train_step": 2.652616024017334, "step": 3399} {"train_info/time_between_train_steps": 0.003084897994995117, "step": 3399} {"info/global_step": 3400, "train_info/time_within_train_step": 2.6523211002349854, "step": 3400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746906997, "_runtime": 9595}, "step": 3400} {"logs": {"train/loss": 3.9281, "train/learning_rate": 0.0004399999999999999, "train/epoch": 3.08, "_timestamp": 1746906997, "_runtime": 9595}, "step": 3400} {"train_info/time_between_train_steps": 30.722991228103638, "step": 3400} {"info/global_step": 3401, "train_info/time_within_train_step": 2.45524525642395, "step": 3401} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 3401} {"info/global_step": 3402, "train_info/time_within_train_step": 2.4229307174682617, "step": 3402} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 3402} {"info/global_step": 3403, "train_info/time_within_train_step": 2.518270969390869, "step": 3403} {"train_info/time_between_train_steps": 0.003305196762084961, "step": 3403} {"info/global_step": 3404, "train_info/time_within_train_step": 2.6367063522338867, "step": 3404} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 3404} {"info/global_step": 3405, "train_info/time_within_train_step": 2.659799814224243, "step": 3405} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 3405} {"info/global_step": 3406, "train_info/time_within_train_step": 2.6475377082824707, "step": 3406} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 3406} {"info/global_step": 3407, "train_info/time_within_train_step": 2.644005298614502, "step": 3407} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 3407} {"info/global_step": 3408, "train_info/time_within_train_step": 2.663858413696289, "step": 3408} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 3408} {"info/global_step": 3409, "train_info/time_within_train_step": 2.660991668701172, "step": 3409} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 3409} {"info/global_step": 3410, "train_info/time_within_train_step": 2.671618700027466, "step": 3410} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 3410} {"info/global_step": 3411, "train_info/time_within_train_step": 2.6734869480133057, "step": 3411} {"train_info/time_between_train_steps": 0.0031137466430664062, "step": 3411} {"info/global_step": 3412, "train_info/time_within_train_step": 2.6856849193573, "step": 3412} {"train_info/time_between_train_steps": 0.003040313720703125, "step": 3412} {"info/global_step": 3413, "train_info/time_within_train_step": 2.6416573524475098, "step": 3413} {"train_info/time_between_train_steps": 0.0030677318572998047, "step": 3413} {"info/global_step": 3414, "train_info/time_within_train_step": 2.6430768966674805, "step": 3414} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 3414} {"info/global_step": 3415, "train_info/time_within_train_step": 2.654378890991211, "step": 3415} {"train_info/time_between_train_steps": 0.0030765533447265625, "step": 3415} {"info/global_step": 3416, "train_info/time_within_train_step": 2.6463735103607178, "step": 3416} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 3416} {"info/global_step": 3417, "train_info/time_within_train_step": 2.6591763496398926, "step": 3417} {"train_info/time_between_train_steps": 0.0030667781829833984, "step": 3417} {"info/global_step": 3418, "train_info/time_within_train_step": 2.6525864601135254, "step": 3418} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 3418} {"info/global_step": 3419, "train_info/time_within_train_step": 2.6608145236968994, "step": 3419} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 3419} {"info/global_step": 3420, "train_info/time_within_train_step": 2.6955065727233887, "step": 3420} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 3420} {"info/global_step": 3421, "train_info/time_within_train_step": 2.7247493267059326, "step": 3421} {"train_info/time_between_train_steps": 0.0033142566680908203, "step": 3421} {"info/global_step": 3422, "train_info/time_within_train_step": 2.655665159225464, "step": 3422} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 3422} {"info/global_step": 3423, "train_info/time_within_train_step": 2.6472842693328857, "step": 3423} {"train_info/time_between_train_steps": 0.006549835205078125, "step": 3423} {"info/global_step": 3424, "train_info/time_within_train_step": 2.6562392711639404, "step": 3424} {"train_info/time_between_train_steps": 0.006293773651123047, "step": 3424} {"info/global_step": 3425, "train_info/time_within_train_step": 2.664102554321289, "step": 3425} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 3425} {"info/global_step": 3426, "train_info/time_within_train_step": 2.6563687324523926, "step": 3426} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 3426} {"info/global_step": 3427, "train_info/time_within_train_step": 2.6464951038360596, "step": 3427} {"train_info/time_between_train_steps": 0.003080129623413086, "step": 3427} {"info/global_step": 3428, "train_info/time_within_train_step": 2.6504926681518555, "step": 3428} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 3428} {"info/global_step": 3429, "train_info/time_within_train_step": 2.670426607131958, "step": 3429} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 3429} {"info/global_step": 3430, "train_info/time_within_train_step": 2.6708717346191406, "step": 3430} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 3430} {"info/global_step": 3431, "train_info/time_within_train_step": 2.6754491329193115, "step": 3431} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 3431} {"info/global_step": 3432, "train_info/time_within_train_step": 2.6893715858459473, "step": 3432} {"train_info/time_between_train_steps": 0.003551483154296875, "step": 3432} {"info/global_step": 3433, "train_info/time_within_train_step": 2.6577975749969482, "step": 3433} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 3433} {"info/global_step": 3434, "train_info/time_within_train_step": 2.666612148284912, "step": 3434} {"train_info/time_between_train_steps": 0.0030775070190429688, "step": 3434} {"info/global_step": 3435, "train_info/time_within_train_step": 2.643890619277954, "step": 3435} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 3435} {"info/global_step": 3436, "train_info/time_within_train_step": 2.6426305770874023, "step": 3436} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 3436} {"info/global_step": 3437, "train_info/time_within_train_step": 2.665386915206909, "step": 3437} {"train_info/time_between_train_steps": 0.003286600112915039, "step": 3437} {"info/global_step": 3438, "train_info/time_within_train_step": 2.650751829147339, "step": 3438} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 3438} {"info/global_step": 3439, "train_info/time_within_train_step": 2.6471290588378906, "step": 3439} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 3439} {"info/global_step": 3440, "train_info/time_within_train_step": 2.662928342819214, "step": 3440} {"train_info/time_between_train_steps": 0.0034465789794921875, "step": 3440} {"info/global_step": 3441, "train_info/time_within_train_step": 2.6623268127441406, "step": 3441} {"train_info/time_between_train_steps": 0.0033347606658935547, "step": 3441} {"info/global_step": 3442, "train_info/time_within_train_step": 2.690513849258423, "step": 3442} {"train_info/time_between_train_steps": 0.003391265869140625, "step": 3442} {"info/global_step": 3443, "train_info/time_within_train_step": 2.6616270542144775, "step": 3443} {"train_info/time_between_train_steps": 0.0034105777740478516, "step": 3443} {"info/global_step": 3444, "train_info/time_within_train_step": 2.7125611305236816, "step": 3444} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 3444} {"info/global_step": 3445, "train_info/time_within_train_step": 2.6521975994110107, "step": 3445} {"train_info/time_between_train_steps": 0.003401517868041992, "step": 3445} {"info/global_step": 3446, "train_info/time_within_train_step": 2.6516709327697754, "step": 3446} {"train_info/time_between_train_steps": 0.0037746429443359375, "step": 3446} {"info/global_step": 3447, "train_info/time_within_train_step": 2.6589341163635254, "step": 3447} {"train_info/time_between_train_steps": 0.003579854965209961, "step": 3447} {"info/global_step": 3448, "train_info/time_within_train_step": 2.649193286895752, "step": 3448} {"train_info/time_between_train_steps": 0.003917694091796875, "step": 3448} {"info/global_step": 3449, "train_info/time_within_train_step": 2.6525332927703857, "step": 3449} {"train_info/time_between_train_steps": 0.003838062286376953, "step": 3449} {"info/global_step": 3450, "train_info/time_within_train_step": 2.650858163833618, "step": 3450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746907162, "_runtime": 9760}, "step": 3450} {"logs": {"train/loss": 3.925, "train/learning_rate": 0.0004366666666666666, "train/epoch": 3.09, "_timestamp": 1746907162, "_runtime": 9760}, "step": 3450} {"train_info/time_between_train_steps": 0.02583622932434082, "step": 3450} {"info/global_step": 3451, "train_info/time_within_train_step": 2.6621992588043213, "step": 3451} {"train_info/time_between_train_steps": 0.004591703414916992, "step": 3451} {"info/global_step": 3452, "train_info/time_within_train_step": 2.65635347366333, "step": 3452} {"train_info/time_between_train_steps": 0.004286289215087891, "step": 3452} {"train_info/time_between_train_steps": 2.4364473819732666, "step": 3452} {"info/global_step": 3453, "train_info/time_within_train_step": 2.668356418609619, "step": 3453} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 3453} {"info/global_step": 3454, "train_info/time_within_train_step": 2.646932601928711, "step": 3454} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 3454} {"info/global_step": 3455, "train_info/time_within_train_step": 2.6476285457611084, "step": 3455} {"train_info/time_between_train_steps": 0.0032660961151123047, "step": 3455} {"info/global_step": 3456, "train_info/time_within_train_step": 2.6475441455841064, "step": 3456} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 3456} {"info/global_step": 3457, "train_info/time_within_train_step": 2.647183418273926, "step": 3457} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 3457} {"info/global_step": 3458, "train_info/time_within_train_step": 2.664174795150757, "step": 3458} {"train_info/time_between_train_steps": 0.0033614635467529297, "step": 3458} {"info/global_step": 3459, "train_info/time_within_train_step": 2.6693484783172607, "step": 3459} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 3459} {"info/global_step": 3460, "train_info/time_within_train_step": 2.711956739425659, "step": 3460} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 3460} {"info/global_step": 3461, "train_info/time_within_train_step": 2.6482205390930176, "step": 3461} {"train_info/time_between_train_steps": 0.005887269973754883, "step": 3461} {"info/global_step": 3462, "train_info/time_within_train_step": 2.6685869693756104, "step": 3462} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 3462} {"info/global_step": 3463, "train_info/time_within_train_step": 2.644313097000122, "step": 3463} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 3463} {"info/global_step": 3464, "train_info/time_within_train_step": 2.666189670562744, "step": 3464} {"train_info/time_between_train_steps": 0.006615638732910156, "step": 3464} {"info/global_step": 3465, "train_info/time_within_train_step": 2.6596784591674805, "step": 3465} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 3465} {"info/global_step": 3466, "train_info/time_within_train_step": 2.6468324661254883, "step": 3466} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 3466} {"info/global_step": 3467, "train_info/time_within_train_step": 2.643296718597412, "step": 3467} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 3467} {"info/global_step": 3468, "train_info/time_within_train_step": 2.6579787731170654, "step": 3468} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 3468} {"info/global_step": 3469, "train_info/time_within_train_step": 2.6681079864501953, "step": 3469} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 3469} {"info/global_step": 3470, "train_info/time_within_train_step": 2.686647415161133, "step": 3470} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 3470} {"info/global_step": 3471, "train_info/time_within_train_step": 2.6526103019714355, "step": 3471} {"train_info/time_between_train_steps": 0.0032668113708496094, "step": 3471} {"info/global_step": 3472, "train_info/time_within_train_step": 2.6796176433563232, "step": 3472} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 3472} {"info/global_step": 3473, "train_info/time_within_train_step": 2.643232822418213, "step": 3473} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 3473} {"info/global_step": 3474, "train_info/time_within_train_step": 2.6422951221466064, "step": 3474} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 3474} {"info/global_step": 3475, "train_info/time_within_train_step": 2.6621384620666504, "step": 3475} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 3475} {"info/global_step": 3476, "train_info/time_within_train_step": 2.6438634395599365, "step": 3476} {"train_info/time_between_train_steps": 0.003298044204711914, "step": 3476} {"info/global_step": 3477, "train_info/time_within_train_step": 2.6677112579345703, "step": 3477} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 3477} {"info/global_step": 3478, "train_info/time_within_train_step": 2.6433188915252686, "step": 3478} {"train_info/time_between_train_steps": 0.003204345703125, "step": 3478} {"info/global_step": 3479, "train_info/time_within_train_step": 2.6490049362182617, "step": 3479} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 3479} {"info/global_step": 3480, "train_info/time_within_train_step": 2.665060520172119, "step": 3480} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 3480} {"info/global_step": 3481, "train_info/time_within_train_step": 2.861717939376831, "step": 3481} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 3481} {"info/global_step": 3482, "train_info/time_within_train_step": 2.6567647457122803, "step": 3482} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 3482} {"info/global_step": 3483, "train_info/time_within_train_step": 2.6582202911376953, "step": 3483} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 3483} {"info/global_step": 3484, "train_info/time_within_train_step": 2.6455061435699463, "step": 3484} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 3484} {"info/global_step": 3485, "train_info/time_within_train_step": 2.644728899002075, "step": 3485} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 3485} {"info/global_step": 3486, "train_info/time_within_train_step": 2.66001558303833, "step": 3486} {"train_info/time_between_train_steps": 0.006536960601806641, "step": 3486} {"info/global_step": 3487, "train_info/time_within_train_step": 2.6776793003082275, "step": 3487} {"train_info/time_between_train_steps": 0.006432533264160156, "step": 3487} {"info/global_step": 3488, "train_info/time_within_train_step": 2.6658310890197754, "step": 3488} {"train_info/time_between_train_steps": 0.006493091583251953, "step": 3488} {"info/global_step": 3489, "train_info/time_within_train_step": 2.663961410522461, "step": 3489} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 3489} {"info/global_step": 3490, "train_info/time_within_train_step": 2.6725077629089355, "step": 3490} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 3490} {"info/global_step": 3491, "train_info/time_within_train_step": 2.649474859237671, "step": 3491} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 3491} {"info/global_step": 3492, "train_info/time_within_train_step": 2.648393154144287, "step": 3492} {"train_info/time_between_train_steps": 0.006455659866333008, "step": 3492} {"info/global_step": 3493, "train_info/time_within_train_step": 2.6479179859161377, "step": 3493} {"train_info/time_between_train_steps": 0.006407022476196289, "step": 3493} {"info/global_step": 3494, "train_info/time_within_train_step": 2.654121160507202, "step": 3494} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 3494} {"info/global_step": 3495, "train_info/time_within_train_step": 2.649465322494507, "step": 3495} {"train_info/time_between_train_steps": 0.0064852237701416016, "step": 3495} {"info/global_step": 3496, "train_info/time_within_train_step": 2.646202564239502, "step": 3496} {"train_info/time_between_train_steps": 0.006417989730834961, "step": 3496} {"info/global_step": 3497, "train_info/time_within_train_step": 2.6667838096618652, "step": 3497} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 3497} {"info/global_step": 3498, "train_info/time_within_train_step": 2.6573195457458496, "step": 3498} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 3498} {"info/global_step": 3499, "train_info/time_within_train_step": 3.300307035446167, "step": 3499} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 3499} {"info/global_step": 3500, "train_info/time_within_train_step": 2.6866116523742676, "step": 3500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746907299, "_runtime": 9897}, "step": 3500} {"logs": {"train/loss": 3.9359, "train/learning_rate": 0.0004333333333333333, "train/epoch": 4.0, "_timestamp": 1746907299, "_runtime": 9897}, "step": 3500} {"train_info/time_between_train_steps": 0.024810314178466797, "step": 3500} {"info/global_step": 3501, "train_info/time_within_train_step": 2.6674349308013916, "step": 3501} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 3501} {"info/global_step": 3502, "train_info/time_within_train_step": 2.650407075881958, "step": 3502} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 3502} {"info/global_step": 3503, "train_info/time_within_train_step": 2.6415560245513916, "step": 3503} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 3503} {"info/global_step": 3504, "train_info/time_within_train_step": 2.6630663871765137, "step": 3504} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 3504} {"info/global_step": 3505, "train_info/time_within_train_step": 2.6484720706939697, "step": 3505} {"train_info/time_between_train_steps": 0.003126382827758789, "step": 3505} {"info/global_step": 3506, "train_info/time_within_train_step": 2.644334316253662, "step": 3506} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 3506} {"info/global_step": 3507, "train_info/time_within_train_step": 2.6869661808013916, "step": 3507} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 3507} {"info/global_step": 3508, "train_info/time_within_train_step": 2.6496243476867676, "step": 3508} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 3508} {"info/global_step": 3509, "train_info/time_within_train_step": 2.6468706130981445, "step": 3509} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 3509} {"info/global_step": 3510, "train_info/time_within_train_step": 2.653491973876953, "step": 3510} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 3510} {"info/global_step": 3511, "train_info/time_within_train_step": 2.6486477851867676, "step": 3511} {"train_info/time_between_train_steps": 0.00311279296875, "step": 3511} {"info/global_step": 3512, "train_info/time_within_train_step": 2.6493265628814697, "step": 3512} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 3512} {"info/global_step": 3513, "train_info/time_within_train_step": 2.647150754928589, "step": 3513} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 3513} {"info/global_step": 3514, "train_info/time_within_train_step": 2.654421806335449, "step": 3514} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 3514} {"info/global_step": 3515, "train_info/time_within_train_step": 2.7793936729431152, "step": 3515} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 3515} {"info/global_step": 3516, "train_info/time_within_train_step": 2.6548047065734863, "step": 3516} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 3516} {"info/global_step": 3517, "train_info/time_within_train_step": 2.657933473587036, "step": 3517} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 3517} {"info/global_step": 3518, "train_info/time_within_train_step": 2.674515724182129, "step": 3518} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 3518} {"info/global_step": 3519, "train_info/time_within_train_step": 2.728466749191284, "step": 3519} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 3519} {"info/global_step": 3520, "train_info/time_within_train_step": 2.6686973571777344, "step": 3520} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 3520} {"info/global_step": 3521, "train_info/time_within_train_step": 2.6430962085723877, "step": 3521} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 3521} {"info/global_step": 3522, "train_info/time_within_train_step": 2.6546504497528076, "step": 3522} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 3522} {"info/global_step": 3523, "train_info/time_within_train_step": 2.655789375305176, "step": 3523} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 3523} {"info/global_step": 3524, "train_info/time_within_train_step": 2.6623053550720215, "step": 3524} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 3524} {"info/global_step": 3525, "train_info/time_within_train_step": 2.6494336128234863, "step": 3525} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 3525} {"info/global_step": 3526, "train_info/time_within_train_step": 2.6437225341796875, "step": 3526} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 3526} {"info/global_step": 3527, "train_info/time_within_train_step": 2.6678543090820312, "step": 3527} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 3527} {"info/global_step": 3528, "train_info/time_within_train_step": 2.6676411628723145, "step": 3528} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 3528} {"info/global_step": 3529, "train_info/time_within_train_step": 2.6815497875213623, "step": 3529} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 3529} {"info/global_step": 3530, "train_info/time_within_train_step": 2.6536948680877686, "step": 3530} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 3530} {"info/global_step": 3531, "train_info/time_within_train_step": 2.642564296722412, "step": 3531} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 3531} {"info/global_step": 3532, "train_info/time_within_train_step": 2.655949592590332, "step": 3532} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 3532} {"info/global_step": 3533, "train_info/time_within_train_step": 2.655039072036743, "step": 3533} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 3533} {"info/global_step": 3534, "train_info/time_within_train_step": 2.6448652744293213, "step": 3534} {"train_info/time_between_train_steps": 0.006590127944946289, "step": 3534} {"info/global_step": 3535, "train_info/time_within_train_step": 2.6438214778900146, "step": 3535} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 3535} {"info/global_step": 3536, "train_info/time_within_train_step": 2.6489930152893066, "step": 3536} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 3536} {"info/global_step": 3537, "train_info/time_within_train_step": 2.6694209575653076, "step": 3537} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 3537} {"info/global_step": 3538, "train_info/time_within_train_step": 2.671542167663574, "step": 3538} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 3538} {"info/global_step": 3539, "train_info/time_within_train_step": 2.654170274734497, "step": 3539} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 3539} {"info/global_step": 3540, "train_info/time_within_train_step": 2.9154980182647705, "step": 3540} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 3540} {"info/global_step": 3541, "train_info/time_within_train_step": 2.6501035690307617, "step": 3541} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 3541} {"info/global_step": 3542, "train_info/time_within_train_step": 2.681368112564087, "step": 3542} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 3542} {"info/global_step": 3543, "train_info/time_within_train_step": 2.6412415504455566, "step": 3543} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 3543} {"info/global_step": 3544, "train_info/time_within_train_step": 2.648620843887329, "step": 3544} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 3544} {"info/global_step": 3545, "train_info/time_within_train_step": 2.6646571159362793, "step": 3545} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 3545} {"info/global_step": 3546, "train_info/time_within_train_step": 2.6443307399749756, "step": 3546} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 3546} {"info/global_step": 3547, "train_info/time_within_train_step": 2.645219326019287, "step": 3547} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 3547} {"info/global_step": 3548, "train_info/time_within_train_step": 2.653860569000244, "step": 3548} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 3548} {"info/global_step": 3549, "train_info/time_within_train_step": 2.6632144451141357, "step": 3549} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 3549} {"info/global_step": 3550, "train_info/time_within_train_step": 2.6643483638763428, "step": 3550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746907434, "_runtime": 10032}, "step": 3550} {"logs": {"train/loss": 3.8935, "train/learning_rate": 0.00043, "train/epoch": 4.01, "_timestamp": 1746907434, "_runtime": 10032}, "step": 3550} {"train_info/time_between_train_steps": 0.023595571517944336, "step": 3550} {"info/global_step": 3551, "train_info/time_within_train_step": 2.6743881702423096, "step": 3551} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 3551} {"info/global_step": 3552, "train_info/time_within_train_step": 2.6670656204223633, "step": 3552} {"train_info/time_between_train_steps": 0.00324249267578125, "step": 3552} {"info/global_step": 3553, "train_info/time_within_train_step": 2.7018790245056152, "step": 3553} {"train_info/time_between_train_steps": 0.0035986900329589844, "step": 3553} {"info/global_step": 3554, "train_info/time_within_train_step": 2.6402947902679443, "step": 3554} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 3554} {"info/global_step": 3555, "train_info/time_within_train_step": 2.6463048458099365, "step": 3555} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 3555} {"info/global_step": 3556, "train_info/time_within_train_step": 2.6661617755889893, "step": 3556} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 3556} {"info/global_step": 3557, "train_info/time_within_train_step": 2.6475892066955566, "step": 3557} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 3557} {"info/global_step": 3558, "train_info/time_within_train_step": 2.645890712738037, "step": 3558} {"train_info/time_between_train_steps": 0.003231048583984375, "step": 3558} {"info/global_step": 3559, "train_info/time_within_train_step": 2.6525847911834717, "step": 3559} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 3559} {"info/global_step": 3560, "train_info/time_within_train_step": 2.6518971920013428, "step": 3560} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 3560} {"info/global_step": 3561, "train_info/time_within_train_step": 2.6595218181610107, "step": 3561} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 3561} {"info/global_step": 3562, "train_info/time_within_train_step": 2.6875076293945312, "step": 3562} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 3562} {"info/global_step": 3563, "train_info/time_within_train_step": 2.728545904159546, "step": 3563} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 3563} {"info/global_step": 3564, "train_info/time_within_train_step": 2.6501545906066895, "step": 3564} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 3564} {"info/global_step": 3565, "train_info/time_within_train_step": 2.6401286125183105, "step": 3565} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 3565} {"info/global_step": 3566, "train_info/time_within_train_step": 2.658998489379883, "step": 3566} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 3566} {"info/global_step": 3567, "train_info/time_within_train_step": 2.648669719696045, "step": 3567} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 3567} {"info/global_step": 3568, "train_info/time_within_train_step": 2.6517720222473145, "step": 3568} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 3568} {"info/global_step": 3569, "train_info/time_within_train_step": 2.6455154418945312, "step": 3569} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 3569} {"info/global_step": 3570, "train_info/time_within_train_step": 2.6474859714508057, "step": 3570} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 3570} {"info/global_step": 3571, "train_info/time_within_train_step": 2.661494016647339, "step": 3571} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 3571} {"info/global_step": 3572, "train_info/time_within_train_step": 2.6656653881073, "step": 3572} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 3572} {"info/global_step": 3573, "train_info/time_within_train_step": 2.7111246585845947, "step": 3573} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 3573} {"info/global_step": 3574, "train_info/time_within_train_step": 2.643496513366699, "step": 3574} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 3574} {"info/global_step": 3575, "train_info/time_within_train_step": 2.6584482192993164, "step": 3575} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 3575} {"info/global_step": 3576, "train_info/time_within_train_step": 2.6516048908233643, "step": 3576} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 3576} {"info/global_step": 3577, "train_info/time_within_train_step": 2.646609306335449, "step": 3577} {"train_info/time_between_train_steps": 0.12300395965576172, "step": 3577} {"info/global_step": 3578, "train_info/time_within_train_step": 2.671172618865967, "step": 3578} {"train_info/time_between_train_steps": 0.0035314559936523438, "step": 3578} {"info/global_step": 3579, "train_info/time_within_train_step": 2.6450605392456055, "step": 3579} {"train_info/time_between_train_steps": 0.0033011436462402344, "step": 3579} {"info/global_step": 3580, "train_info/time_within_train_step": 2.64388108253479, "step": 3580} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 3580} {"info/global_step": 3581, "train_info/time_within_train_step": 2.646925687789917, "step": 3581} {"train_info/time_between_train_steps": 0.0033752918243408203, "step": 3581} {"info/global_step": 3582, "train_info/time_within_train_step": 2.643465757369995, "step": 3582} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 3582} {"info/global_step": 3583, "train_info/time_within_train_step": 2.8676226139068604, "step": 3583} {"train_info/time_between_train_steps": 0.0064697265625, "step": 3583} {"info/global_step": 3584, "train_info/time_within_train_step": 2.7044899463653564, "step": 3584} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 3584} {"info/global_step": 3585, "train_info/time_within_train_step": 2.658064365386963, "step": 3585} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 3585} {"info/global_step": 3586, "train_info/time_within_train_step": 2.646618604660034, "step": 3586} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 3586} {"info/global_step": 3587, "train_info/time_within_train_step": 2.669166326522827, "step": 3587} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 3587} {"info/global_step": 3588, "train_info/time_within_train_step": 2.6446423530578613, "step": 3588} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 3588} {"info/global_step": 3589, "train_info/time_within_train_step": 2.64390230178833, "step": 3589} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 3589} {"info/global_step": 3590, "train_info/time_within_train_step": 2.6510303020477295, "step": 3590} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 3590} {"info/global_step": 3591, "train_info/time_within_train_step": 2.6691842079162598, "step": 3591} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 3591} {"info/global_step": 3592, "train_info/time_within_train_step": 2.6746432781219482, "step": 3592} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 3592} {"info/global_step": 3593, "train_info/time_within_train_step": 2.650714635848999, "step": 3593} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 3593} {"info/global_step": 3594, "train_info/time_within_train_step": 2.6837263107299805, "step": 3594} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 3594} {"info/global_step": 3595, "train_info/time_within_train_step": 2.6413910388946533, "step": 3595} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 3595} {"info/global_step": 3596, "train_info/time_within_train_step": 2.642463445663452, "step": 3596} {"train_info/time_between_train_steps": 0.0064809322357177734, "step": 3596} {"info/global_step": 3597, "train_info/time_within_train_step": 2.6650240421295166, "step": 3597} {"train_info/time_between_train_steps": 0.00653839111328125, "step": 3597} {"info/global_step": 3598, "train_info/time_within_train_step": 2.6573736667633057, "step": 3598} {"train_info/time_between_train_steps": 0.006566286087036133, "step": 3598} {"info/global_step": 3599, "train_info/time_within_train_step": 2.6652138233184814, "step": 3599} {"train_info/time_between_train_steps": 0.0065767765045166016, "step": 3599} {"info/global_step": 3600, "train_info/time_within_train_step": 2.6869633197784424, "step": 3600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746907570, "_runtime": 10168}, "step": 3600} {"logs": {"train/loss": 3.8942, "train/learning_rate": 0.00042666666666666667, "train/epoch": 4.01, "_timestamp": 1746907570, "_runtime": 10168}, "step": 3600} {"train_info/time_between_train_steps": 13.755591869354248, "step": 3600} {"info/global_step": 3601, "train_info/time_within_train_step": 2.4435923099517822, "step": 3601} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 3601} {"info/global_step": 3602, "train_info/time_within_train_step": 2.4306554794311523, "step": 3602} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 3602} {"info/global_step": 3603, "train_info/time_within_train_step": 2.5804853439331055, "step": 3603} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 3603} {"info/global_step": 3604, "train_info/time_within_train_step": 2.6652112007141113, "step": 3604} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 3604} {"info/global_step": 3605, "train_info/time_within_train_step": 2.6791341304779053, "step": 3605} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 3605} {"info/global_step": 3606, "train_info/time_within_train_step": 2.6648638248443604, "step": 3606} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 3606} {"info/global_step": 3607, "train_info/time_within_train_step": 2.6500258445739746, "step": 3607} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 3607} {"info/global_step": 3608, "train_info/time_within_train_step": 2.65204119682312, "step": 3608} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 3608} {"info/global_step": 3609, "train_info/time_within_train_step": 2.650099277496338, "step": 3609} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 3609} {"info/global_step": 3610, "train_info/time_within_train_step": 2.6453797817230225, "step": 3610} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 3610} {"info/global_step": 3611, "train_info/time_within_train_step": 2.650506019592285, "step": 3611} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 3611} {"info/global_step": 3612, "train_info/time_within_train_step": 2.6500751972198486, "step": 3612} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 3612} {"info/global_step": 3613, "train_info/time_within_train_step": 2.6615374088287354, "step": 3613} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 3613} {"info/global_step": 3614, "train_info/time_within_train_step": 2.6704905033111572, "step": 3614} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 3614} {"info/global_step": 3615, "train_info/time_within_train_step": 2.663019895553589, "step": 3615} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 3615} {"info/global_step": 3616, "train_info/time_within_train_step": 2.701766014099121, "step": 3616} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 3616} {"info/global_step": 3617, "train_info/time_within_train_step": 2.64802885055542, "step": 3617} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 3617} {"info/global_step": 3618, "train_info/time_within_train_step": 2.650171995162964, "step": 3618} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 3618} {"info/global_step": 3619, "train_info/time_within_train_step": 2.6658859252929688, "step": 3619} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 3619} {"info/global_step": 3620, "train_info/time_within_train_step": 2.6483688354492188, "step": 3620} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 3620} {"info/global_step": 3621, "train_info/time_within_train_step": 2.645986557006836, "step": 3621} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 3621} {"info/global_step": 3622, "train_info/time_within_train_step": 2.657872438430786, "step": 3622} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 3622} {"info/global_step": 3623, "train_info/time_within_train_step": 2.652635097503662, "step": 3623} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 3623} {"info/global_step": 3624, "train_info/time_within_train_step": 2.6613731384277344, "step": 3624} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 3624} {"info/global_step": 3625, "train_info/time_within_train_step": 2.6982953548431396, "step": 3625} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 3625} {"info/global_step": 3626, "train_info/time_within_train_step": 2.724433660507202, "step": 3626} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 3626} {"info/global_step": 3627, "train_info/time_within_train_step": 2.6494412422180176, "step": 3627} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 3627} {"info/global_step": 3628, "train_info/time_within_train_step": 2.6408636569976807, "step": 3628} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 3628} {"info/global_step": 3629, "train_info/time_within_train_step": 2.6558315753936768, "step": 3629} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 3629} {"info/global_step": 3630, "train_info/time_within_train_step": 2.655620813369751, "step": 3630} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 3630} {"info/global_step": 3631, "train_info/time_within_train_step": 2.6450724601745605, "step": 3631} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 3631} {"info/global_step": 3632, "train_info/time_within_train_step": 2.6522727012634277, "step": 3632} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 3632} {"info/global_step": 3633, "train_info/time_within_train_step": 2.649648666381836, "step": 3633} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 3633} {"info/global_step": 3634, "train_info/time_within_train_step": 2.668663740158081, "step": 3634} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 3634} {"info/global_step": 3635, "train_info/time_within_train_step": 2.882972240447998, "step": 3635} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 3635} {"info/global_step": 3636, "train_info/time_within_train_step": 2.644766092300415, "step": 3636} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 3636} {"info/global_step": 3637, "train_info/time_within_train_step": 2.6656148433685303, "step": 3637} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 3637} {"info/global_step": 3638, "train_info/time_within_train_step": 2.6698248386383057, "step": 3638} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 3638} {"info/global_step": 3639, "train_info/time_within_train_step": 2.6724162101745605, "step": 3639} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 3639} {"info/global_step": 3640, "train_info/time_within_train_step": 2.8052282333374023, "step": 3640} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 3640} {"info/global_step": 3641, "train_info/time_within_train_step": 2.6720046997070312, "step": 3641} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 3641} {"info/global_step": 3642, "train_info/time_within_train_step": 2.658804416656494, "step": 3642} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 3642} {"info/global_step": 3643, "train_info/time_within_train_step": 2.6405246257781982, "step": 3643} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 3643} {"info/global_step": 3644, "train_info/time_within_train_step": 2.655182123184204, "step": 3644} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 3644} {"info/global_step": 3645, "train_info/time_within_train_step": 2.662283182144165, "step": 3645} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 3645} {"info/global_step": 3646, "train_info/time_within_train_step": 2.6444203853607178, "step": 3646} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 3646} {"info/global_step": 3647, "train_info/time_within_train_step": 2.644649028778076, "step": 3647} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 3647} {"info/global_step": 3648, "train_info/time_within_train_step": 2.6653807163238525, "step": 3648} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 3648} {"info/global_step": 3649, "train_info/time_within_train_step": 2.6665079593658447, "step": 3649} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 3649} {"info/global_step": 3650, "train_info/time_within_train_step": 2.688934564590454, "step": 3650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746907717, "_runtime": 10315}, "step": 3650} {"logs": {"train/loss": 3.8737, "train/learning_rate": 0.00042333333333333334, "train/epoch": 4.02, "_timestamp": 1746907717, "_runtime": 10315}, "step": 3650} {"train_info/time_between_train_steps": 0.02509760856628418, "step": 3650} {"info/global_step": 3651, "train_info/time_within_train_step": 2.644254446029663, "step": 3651} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 3651} {"info/global_step": 3652, "train_info/time_within_train_step": 2.663252115249634, "step": 3652} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 3652} {"info/global_step": 3653, "train_info/time_within_train_step": 2.6484854221343994, "step": 3653} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 3653} {"info/global_step": 3654, "train_info/time_within_train_step": 2.6442158222198486, "step": 3654} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 3654} {"info/global_step": 3655, "train_info/time_within_train_step": 2.6650712490081787, "step": 3655} {"train_info/time_between_train_steps": 0.003326416015625, "step": 3655} {"info/global_step": 3656, "train_info/time_within_train_step": 2.658231735229492, "step": 3656} {"train_info/time_between_train_steps": 0.0032546520233154297, "step": 3656} {"info/global_step": 3657, "train_info/time_within_train_step": 2.654874086380005, "step": 3657} {"train_info/time_between_train_steps": 0.0032389163970947266, "step": 3657} {"info/global_step": 3658, "train_info/time_within_train_step": 2.706033945083618, "step": 3658} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 3658} {"info/global_step": 3659, "train_info/time_within_train_step": 2.648977518081665, "step": 3659} {"train_info/time_between_train_steps": 0.003291606903076172, "step": 3659} {"info/global_step": 3660, "train_info/time_within_train_step": 2.6480352878570557, "step": 3660} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 3660} {"info/global_step": 3661, "train_info/time_within_train_step": 2.6549527645111084, "step": 3661} {"train_info/time_between_train_steps": 0.003276348114013672, "step": 3661} {"info/global_step": 3662, "train_info/time_within_train_step": 2.645444631576538, "step": 3662} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 3662} {"info/global_step": 3663, "train_info/time_within_train_step": 2.6497714519500732, "step": 3663} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 3663} {"info/global_step": 3664, "train_info/time_within_train_step": 2.646528720855713, "step": 3664} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 3664} {"info/global_step": 3665, "train_info/time_within_train_step": 2.6583731174468994, "step": 3665} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 3665} {"info/global_step": 3666, "train_info/time_within_train_step": 2.655576705932617, "step": 3666} {"train_info/time_between_train_steps": 0.0033609867095947266, "step": 3666} {"info/global_step": 3667, "train_info/time_within_train_step": 2.6727259159088135, "step": 3667} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 3667} {"info/global_step": 3668, "train_info/time_within_train_step": 2.6825878620147705, "step": 3668} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 3668} {"info/global_step": 3669, "train_info/time_within_train_step": 2.6530799865722656, "step": 3669} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 3669} {"info/global_step": 3670, "train_info/time_within_train_step": 2.6483421325683594, "step": 3670} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 3670} {"info/global_step": 3671, "train_info/time_within_train_step": 2.6493122577667236, "step": 3671} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 3671} {"info/global_step": 3672, "train_info/time_within_train_step": 2.6477324962615967, "step": 3672} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 3672} {"info/global_step": 3673, "train_info/time_within_train_step": 2.6441116333007812, "step": 3673} {"train_info/time_between_train_steps": 0.0033118724822998047, "step": 3673} {"info/global_step": 3674, "train_info/time_within_train_step": 2.6658778190612793, "step": 3674} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 3674} {"info/global_step": 3675, "train_info/time_within_train_step": 2.6648709774017334, "step": 3675} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 3675} {"info/global_step": 3676, "train_info/time_within_train_step": 2.698101282119751, "step": 3676} {"train_info/time_between_train_steps": 0.0033576488494873047, "step": 3676} {"info/global_step": 3677, "train_info/time_within_train_step": 2.645679235458374, "step": 3677} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 3677} {"info/global_step": 3678, "train_info/time_within_train_step": 2.6470937728881836, "step": 3678} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 3678} {"info/global_step": 3679, "train_info/time_within_train_step": 2.6534008979797363, "step": 3679} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 3679} {"info/global_step": 3680, "train_info/time_within_train_step": 2.6489992141723633, "step": 3680} {"train_info/time_between_train_steps": 0.003265380859375, "step": 3680} {"info/global_step": 3681, "train_info/time_within_train_step": 2.656947612762451, "step": 3681} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 3681} {"info/global_step": 3682, "train_info/time_within_train_step": 2.6502256393432617, "step": 3682} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 3682} {"info/global_step": 3683, "train_info/time_within_train_step": 2.6437478065490723, "step": 3683} {"train_info/time_between_train_steps": 0.003264904022216797, "step": 3683} {"info/global_step": 3684, "train_info/time_within_train_step": 2.66996431350708, "step": 3684} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 3684} {"info/global_step": 3685, "train_info/time_within_train_step": 2.6702587604522705, "step": 3685} {"train_info/time_between_train_steps": 0.003263235092163086, "step": 3685} {"info/global_step": 3686, "train_info/time_within_train_step": 2.672356128692627, "step": 3686} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 3686} {"info/global_step": 3687, "train_info/time_within_train_step": 2.6635422706604004, "step": 3687} {"train_info/time_between_train_steps": 0.0032699108123779297, "step": 3687} {"info/global_step": 3688, "train_info/time_within_train_step": 2.7029147148132324, "step": 3688} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 3688} {"info/global_step": 3689, "train_info/time_within_train_step": 2.639270305633545, "step": 3689} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 3689} {"info/global_step": 3690, "train_info/time_within_train_step": 2.6525375843048096, "step": 3690} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 3690} {"info/global_step": 3691, "train_info/time_within_train_step": 2.6633148193359375, "step": 3691} {"train_info/time_between_train_steps": 0.003269195556640625, "step": 3691} {"info/global_step": 3692, "train_info/time_within_train_step": 2.645893096923828, "step": 3692} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 3692} {"info/global_step": 3693, "train_info/time_within_train_step": 2.6439006328582764, "step": 3693} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 3693} {"info/global_step": 3694, "train_info/time_within_train_step": 2.659836530685425, "step": 3694} {"train_info/time_between_train_steps": 0.0032994747161865234, "step": 3694} {"info/global_step": 3695, "train_info/time_within_train_step": 2.640197277069092, "step": 3695} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 3695} {"info/global_step": 3696, "train_info/time_within_train_step": 2.639699935913086, "step": 3696} {"train_info/time_between_train_steps": 0.0032806396484375, "step": 3696} {"info/global_step": 3697, "train_info/time_within_train_step": 2.6641507148742676, "step": 3697} {"train_info/time_between_train_steps": 0.003265380859375, "step": 3697} {"info/global_step": 3698, "train_info/time_within_train_step": 2.65043044090271, "step": 3698} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 3698} {"info/global_step": 3699, "train_info/time_within_train_step": 2.645087242126465, "step": 3699} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 3699} {"info/global_step": 3700, "train_info/time_within_train_step": 2.6497817039489746, "step": 3700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746907851, "_runtime": 10449}, "step": 3700} {"logs": {"train/loss": 3.8648, "train/learning_rate": 0.00041999999999999996, "train/epoch": 4.02, "_timestamp": 1746907851, "_runtime": 10449}, "step": 3700} {"train_info/time_between_train_steps": 0.025333881378173828, "step": 3700} {"info/global_step": 3701, "train_info/time_within_train_step": 2.6478168964385986, "step": 3701} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 3701} {"info/global_step": 3702, "train_info/time_within_train_step": 2.659453868865967, "step": 3702} {"train_info/time_between_train_steps": 0.13925576210021973, "step": 3702} {"info/global_step": 3703, "train_info/time_within_train_step": 2.6520209312438965, "step": 3703} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 3703} {"info/global_step": 3704, "train_info/time_within_train_step": 2.6514675617218018, "step": 3704} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 3704} {"info/global_step": 3705, "train_info/time_within_train_step": 2.66707444190979, "step": 3705} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 3705} {"info/global_step": 3706, "train_info/time_within_train_step": 2.7077505588531494, "step": 3706} {"train_info/time_between_train_steps": 0.0033643245697021484, "step": 3706} {"info/global_step": 3707, "train_info/time_within_train_step": 2.6415047645568848, "step": 3707} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 3707} {"info/global_step": 3708, "train_info/time_within_train_step": 2.654228687286377, "step": 3708} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 3708} {"info/global_step": 3709, "train_info/time_within_train_step": 2.6463184356689453, "step": 3709} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 3709} {"info/global_step": 3710, "train_info/time_within_train_step": 2.6468827724456787, "step": 3710} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 3710} {"info/global_step": 3711, "train_info/time_within_train_step": 2.65718936920166, "step": 3711} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 3711} {"info/global_step": 3712, "train_info/time_within_train_step": 2.6439709663391113, "step": 3712} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 3712} {"info/global_step": 3713, "train_info/time_within_train_step": 2.643754005432129, "step": 3713} {"train_info/time_between_train_steps": 0.006545305252075195, "step": 3713} {"info/global_step": 3714, "train_info/time_within_train_step": 2.6679606437683105, "step": 3714} {"train_info/time_between_train_steps": 0.006573677062988281, "step": 3714} {"info/global_step": 3715, "train_info/time_within_train_step": 2.6632485389709473, "step": 3715} {"train_info/time_between_train_steps": 0.00652766227722168, "step": 3715} {"info/global_step": 3716, "train_info/time_within_train_step": 2.6873667240142822, "step": 3716} {"train_info/time_between_train_steps": 0.006571292877197266, "step": 3716} {"info/global_step": 3717, "train_info/time_within_train_step": 2.6541202068328857, "step": 3717} {"train_info/time_between_train_steps": 0.006494283676147461, "step": 3717} {"info/global_step": 3718, "train_info/time_within_train_step": 2.6715469360351562, "step": 3718} {"train_info/time_between_train_steps": 0.006542682647705078, "step": 3718} {"info/global_step": 3719, "train_info/time_within_train_step": 2.6415274143218994, "step": 3719} {"train_info/time_between_train_steps": 0.006935596466064453, "step": 3719} {"info/global_step": 3720, "train_info/time_within_train_step": 2.6448230743408203, "step": 3720} {"train_info/time_between_train_steps": 0.004799604415893555, "step": 3720} {"info/global_step": 3721, "train_info/time_within_train_step": 2.666611909866333, "step": 3721} {"train_info/time_between_train_steps": 0.006448507308959961, "step": 3721} {"info/global_step": 3722, "train_info/time_within_train_step": 2.6427764892578125, "step": 3722} {"train_info/time_between_train_steps": 0.0065784454345703125, "step": 3722} {"info/global_step": 3723, "train_info/time_within_train_step": 2.6430211067199707, "step": 3723} {"train_info/time_between_train_steps": 0.003472566604614258, "step": 3723} {"info/global_step": 3724, "train_info/time_within_train_step": 2.654595375061035, "step": 3724} {"train_info/time_between_train_steps": 0.0065155029296875, "step": 3724} {"info/global_step": 3725, "train_info/time_within_train_step": 2.659208297729492, "step": 3725} {"train_info/time_between_train_steps": 0.006544351577758789, "step": 3725} {"info/global_step": 3726, "train_info/time_within_train_step": 2.6708149909973145, "step": 3726} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 3726} {"info/global_step": 3727, "train_info/time_within_train_step": 2.662679672241211, "step": 3727} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 3727} {"info/global_step": 3728, "train_info/time_within_train_step": 2.7068159580230713, "step": 3728} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 3728} {"info/global_step": 3729, "train_info/time_within_train_step": 2.64021897315979, "step": 3729} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 3729} {"info/global_step": 3730, "train_info/time_within_train_step": 2.6489596366882324, "step": 3730} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 3730} {"info/global_step": 3731, "train_info/time_within_train_step": 2.660177230834961, "step": 3731} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 3731} {"info/global_step": 3732, "train_info/time_within_train_step": 2.648130178451538, "step": 3732} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 3732} {"info/global_step": 3733, "train_info/time_within_train_step": 2.9170117378234863, "step": 3733} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 3733} {"info/global_step": 3734, "train_info/time_within_train_step": 2.6517183780670166, "step": 3734} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 3734} {"info/global_step": 3735, "train_info/time_within_train_step": 2.6450181007385254, "step": 3735} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 3735} {"info/global_step": 3736, "train_info/time_within_train_step": 2.6771445274353027, "step": 3736} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 3736} {"info/global_step": 3737, "train_info/time_within_train_step": 2.6546759605407715, "step": 3737} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 3737} {"info/global_step": 3738, "train_info/time_within_train_step": 2.658392906188965, "step": 3738} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 3738} {"info/global_step": 3739, "train_info/time_within_train_step": 2.692946195602417, "step": 3739} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 3739} {"info/global_step": 3740, "train_info/time_within_train_step": 2.7235374450683594, "step": 3740} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 3740} {"info/global_step": 3741, "train_info/time_within_train_step": 2.6478447914123535, "step": 3741} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 3741} {"info/global_step": 3742, "train_info/time_within_train_step": 2.6406311988830566, "step": 3742} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 3742} {"info/global_step": 3743, "train_info/time_within_train_step": 2.6601932048797607, "step": 3743} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 3743} {"info/global_step": 3744, "train_info/time_within_train_step": 2.647712230682373, "step": 3744} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 3744} {"info/global_step": 3745, "train_info/time_within_train_step": 2.6469688415527344, "step": 3745} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 3745} {"info/global_step": 3746, "train_info/time_within_train_step": 2.648200035095215, "step": 3746} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 3746} {"info/global_step": 3747, "train_info/time_within_train_step": 2.6441164016723633, "step": 3747} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 3747} {"info/global_step": 3748, "train_info/time_within_train_step": 2.6659178733825684, "step": 3748} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 3748} {"info/global_step": 3749, "train_info/time_within_train_step": 3.3117334842681885, "step": 3749} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 3749} {"info/global_step": 3750, "train_info/time_within_train_step": 2.6866965293884277, "step": 3750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746907987, "_runtime": 10585}, "step": 3750} {"logs": {"train/loss": 3.8523, "train/learning_rate": 0.00041666666666666664, "train/epoch": 4.03, "_timestamp": 1746907987, "_runtime": 10585}, "step": 3750} {"train_info/time_between_train_steps": 0.02456212043762207, "step": 3750} {"info/global_step": 3751, "train_info/time_within_train_step": 2.6452784538269043, "step": 3751} {"train_info/time_between_train_steps": 0.0034160614013671875, "step": 3751} {"info/global_step": 3752, "train_info/time_within_train_step": 2.6404733657836914, "step": 3752} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 3752} {"info/global_step": 3753, "train_info/time_within_train_step": 2.6593985557556152, "step": 3753} {"train_info/time_between_train_steps": 0.003248929977416992, "step": 3753} {"info/global_step": 3754, "train_info/time_within_train_step": 2.649202585220337, "step": 3754} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 3754} {"info/global_step": 3755, "train_info/time_within_train_step": 2.6464498043060303, "step": 3755} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 3755} {"info/global_step": 3756, "train_info/time_within_train_step": 2.6499862670898438, "step": 3756} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 3756} {"info/global_step": 3757, "train_info/time_within_train_step": 2.6446025371551514, "step": 3757} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 3757} {"info/global_step": 3758, "train_info/time_within_train_step": 2.6686818599700928, "step": 3758} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 3758} {"info/global_step": 3759, "train_info/time_within_train_step": 2.6723644733428955, "step": 3759} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 3759} {"info/global_step": 3760, "train_info/time_within_train_step": 2.685946226119995, "step": 3760} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 3760} {"info/global_step": 3761, "train_info/time_within_train_step": 2.6513402462005615, "step": 3761} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 3761} {"info/global_step": 3762, "train_info/time_within_train_step": 2.6404292583465576, "step": 3762} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 3762} {"info/global_step": 3763, "train_info/time_within_train_step": 2.6607041358947754, "step": 3763} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 3763} {"info/global_step": 3764, "train_info/time_within_train_step": 2.6533725261688232, "step": 3764} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 3764} {"info/global_step": 3765, "train_info/time_within_train_step": 2.7930681705474854, "step": 3765} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 3765} {"info/global_step": 3766, "train_info/time_within_train_step": 2.6545963287353516, "step": 3766} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 3766} {"info/global_step": 3767, "train_info/time_within_train_step": 2.646692991256714, "step": 3767} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 3767} {"info/global_step": 3768, "train_info/time_within_train_step": 2.6449334621429443, "step": 3768} {"train_info/time_between_train_steps": 0.0033545494079589844, "step": 3768} {"info/global_step": 3769, "train_info/time_within_train_step": 2.649973154067993, "step": 3769} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 3769} {"info/global_step": 3770, "train_info/time_within_train_step": 2.669822931289673, "step": 3770} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 3770} {"info/global_step": 3771, "train_info/time_within_train_step": 2.6862733364105225, "step": 3771} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 3771} {"info/global_step": 3772, "train_info/time_within_train_step": 2.671830177307129, "step": 3772} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 3772} {"info/global_step": 3773, "train_info/time_within_train_step": 2.6699023246765137, "step": 3773} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 3773} {"info/global_step": 3774, "train_info/time_within_train_step": 2.6485071182250977, "step": 3774} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 3774} {"info/global_step": 3775, "train_info/time_within_train_step": 2.65377140045166, "step": 3775} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 3775} {"info/global_step": 3776, "train_info/time_within_train_step": 2.6559479236602783, "step": 3776} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 3776} {"info/global_step": 3777, "train_info/time_within_train_step": 2.64327073097229, "step": 3777} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 3777} {"info/global_step": 3778, "train_info/time_within_train_step": 2.645113945007324, "step": 3778} {"train_info/time_between_train_steps": 0.003657102584838867, "step": 3778} {"info/global_step": 3779, "train_info/time_within_train_step": 2.6532998085021973, "step": 3779} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 3779} {"info/global_step": 3780, "train_info/time_within_train_step": 2.6616291999816895, "step": 3780} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 3780} {"info/global_step": 3781, "train_info/time_within_train_step": 2.6740427017211914, "step": 3781} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 3781} {"info/global_step": 3782, "train_info/time_within_train_step": 2.6723594665527344, "step": 3782} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 3782} {"info/global_step": 3783, "train_info/time_within_train_step": 2.6674399375915527, "step": 3783} {"train_info/time_between_train_steps": 0.0034017562866210938, "step": 3783} {"info/global_step": 3784, "train_info/time_within_train_step": 2.644174814224243, "step": 3784} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 3784} {"info/global_step": 3785, "train_info/time_within_train_step": 2.644399881362915, "step": 3785} {"train_info/time_between_train_steps": 0.0033631324768066406, "step": 3785} {"info/global_step": 3786, "train_info/time_within_train_step": 2.6456477642059326, "step": 3786} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 3786} {"info/global_step": 3787, "train_info/time_within_train_step": 2.6458239555358887, "step": 3787} {"train_info/time_between_train_steps": 0.0033588409423828125, "step": 3787} {"info/global_step": 3788, "train_info/time_within_train_step": 2.6494967937469482, "step": 3788} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 3788} {"info/global_step": 3789, "train_info/time_within_train_step": 2.6531190872192383, "step": 3789} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 3789} {"info/global_step": 3790, "train_info/time_within_train_step": 2.6410202980041504, "step": 3790} {"train_info/time_between_train_steps": 0.0033118724822998047, "step": 3790} {"info/global_step": 3791, "train_info/time_within_train_step": 2.6466457843780518, "step": 3791} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 3791} {"info/global_step": 3792, "train_info/time_within_train_step": 2.918588161468506, "step": 3792} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 3792} {"info/global_step": 3793, "train_info/time_within_train_step": 2.679762840270996, "step": 3793} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 3793} {"info/global_step": 3794, "train_info/time_within_train_step": 2.667449712753296, "step": 3794} {"train_info/time_between_train_steps": 0.003335714340209961, "step": 3794} {"info/global_step": 3795, "train_info/time_within_train_step": 2.6840274333953857, "step": 3795} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 3795} {"info/global_step": 3796, "train_info/time_within_train_step": 2.6491401195526123, "step": 3796} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 3796} {"info/global_step": 3797, "train_info/time_within_train_step": 2.669138193130493, "step": 3797} {"train_info/time_between_train_steps": 0.0031363964080810547, "step": 3797} {"info/global_step": 3798, "train_info/time_within_train_step": 2.647195339202881, "step": 3798} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 3798} {"info/global_step": 3799, "train_info/time_within_train_step": 2.6447136402130127, "step": 3799} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 3799} {"info/global_step": 3800, "train_info/time_within_train_step": 2.6511783599853516, "step": 3800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908122, "_runtime": 10720}, "step": 3800} {"logs": {"train/loss": 3.8479, "train/learning_rate": 0.0004133333333333333, "train/epoch": 4.03, "_timestamp": 1746908122, "_runtime": 10720}, "step": 3800} {"train_info/time_between_train_steps": 15.948989868164062, "step": 3800} {"info/global_step": 3801, "train_info/time_within_train_step": 2.425504446029663, "step": 3801} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 3801} {"info/global_step": 3802, "train_info/time_within_train_step": 2.4399819374084473, "step": 3802} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 3802} {"info/global_step": 3803, "train_info/time_within_train_step": 2.6053645610809326, "step": 3803} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 3803} {"info/global_step": 3804, "train_info/time_within_train_step": 2.651339054107666, "step": 3804} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 3804} {"info/global_step": 3805, "train_info/time_within_train_step": 2.6445722579956055, "step": 3805} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 3805} {"info/global_step": 3806, "train_info/time_within_train_step": 2.652704954147339, "step": 3806} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 3806} {"info/global_step": 3807, "train_info/time_within_train_step": 2.652022361755371, "step": 3807} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 3807} {"info/global_step": 3808, "train_info/time_within_train_step": 2.6421234607696533, "step": 3808} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 3808} {"info/global_step": 3809, "train_info/time_within_train_step": 2.643707036972046, "step": 3809} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 3809} {"info/global_step": 3810, "train_info/time_within_train_step": 2.6515955924987793, "step": 3810} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 3810} {"info/global_step": 3811, "train_info/time_within_train_step": 2.6602251529693604, "step": 3811} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 3811} {"info/global_step": 3812, "train_info/time_within_train_step": 2.673827886581421, "step": 3812} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 3812} {"info/global_step": 3813, "train_info/time_within_train_step": 2.6719303131103516, "step": 3813} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 3813} {"info/global_step": 3814, "train_info/time_within_train_step": 2.7100841999053955, "step": 3814} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 3814} {"info/global_step": 3815, "train_info/time_within_train_step": 2.650966167449951, "step": 3815} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 3815} {"info/global_step": 3816, "train_info/time_within_train_step": 2.649658441543579, "step": 3816} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 3816} {"info/global_step": 3817, "train_info/time_within_train_step": 2.652348279953003, "step": 3817} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 3817} {"info/global_step": 3818, "train_info/time_within_train_step": 2.6518781185150146, "step": 3818} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 3818} {"info/global_step": 3819, "train_info/time_within_train_step": 2.6512107849121094, "step": 3819} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 3819} {"info/global_step": 3820, "train_info/time_within_train_step": 2.649675130844116, "step": 3820} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 3820} {"info/global_step": 3821, "train_info/time_within_train_step": 2.6571359634399414, "step": 3821} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 3821} {"info/global_step": 3822, "train_info/time_within_train_step": 2.6830031871795654, "step": 3822} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 3822} {"info/global_step": 3823, "train_info/time_within_train_step": 2.6617374420166016, "step": 3823} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 3823} {"info/global_step": 3824, "train_info/time_within_train_step": 2.704406261444092, "step": 3824} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 3824} {"info/global_step": 3825, "train_info/time_within_train_step": 2.707224130630493, "step": 3825} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 3825} {"info/global_step": 3826, "train_info/time_within_train_step": 2.643077850341797, "step": 3826} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 3826} {"info/global_step": 3827, "train_info/time_within_train_step": 2.6428029537200928, "step": 3827} {"train_info/time_between_train_steps": 0.12656784057617188, "step": 3827} {"info/global_step": 3828, "train_info/time_within_train_step": 2.6433231830596924, "step": 3828} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 3828} {"info/global_step": 3829, "train_info/time_within_train_step": 2.6451539993286133, "step": 3829} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 3829} {"info/global_step": 3830, "train_info/time_within_train_step": 2.6505510807037354, "step": 3830} {"train_info/time_between_train_steps": 0.003361225128173828, "step": 3830} {"info/global_step": 3831, "train_info/time_within_train_step": 2.658273696899414, "step": 3831} {"train_info/time_between_train_steps": 0.0032873153686523438, "step": 3831} {"info/global_step": 3832, "train_info/time_within_train_step": 2.6665563583374023, "step": 3832} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 3832} {"info/global_step": 3833, "train_info/time_within_train_step": 2.710594654083252, "step": 3833} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 3833} {"info/global_step": 3834, "train_info/time_within_train_step": 2.641683340072632, "step": 3834} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 3834} {"info/global_step": 3835, "train_info/time_within_train_step": 2.641613483428955, "step": 3835} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 3835} {"info/global_step": 3836, "train_info/time_within_train_step": 2.658222198486328, "step": 3836} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 3836} {"info/global_step": 3837, "train_info/time_within_train_step": 2.6535987854003906, "step": 3837} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 3837} {"info/global_step": 3838, "train_info/time_within_train_step": 2.6452012062072754, "step": 3838} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 3838} {"info/global_step": 3839, "train_info/time_within_train_step": 2.6451609134674072, "step": 3839} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 3839} {"info/global_step": 3840, "train_info/time_within_train_step": 2.648987054824829, "step": 3840} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 3840} {"info/global_step": 3841, "train_info/time_within_train_step": 2.6712846755981445, "step": 3841} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 3841} {"info/global_step": 3842, "train_info/time_within_train_step": 2.6732311248779297, "step": 3842} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 3842} {"info/global_step": 3843, "train_info/time_within_train_step": 2.6619720458984375, "step": 3843} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 3843} {"info/global_step": 3844, "train_info/time_within_train_step": 2.6821303367614746, "step": 3844} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 3844} {"info/global_step": 3845, "train_info/time_within_train_step": 2.643552303314209, "step": 3845} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 3845} {"info/global_step": 3846, "train_info/time_within_train_step": 2.6483795642852783, "step": 3846} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 3846} {"info/global_step": 3847, "train_info/time_within_train_step": 2.665872097015381, "step": 3847} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 3847} {"info/global_step": 3848, "train_info/time_within_train_step": 2.646212100982666, "step": 3848} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 3848} {"info/global_step": 3849, "train_info/time_within_train_step": 2.644681692123413, "step": 3849} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 3849} {"info/global_step": 3850, "train_info/time_within_train_step": 2.6598806381225586, "step": 3850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908272, "_runtime": 10870}, "step": 3850} {"logs": {"train/loss": 3.8301, "train/learning_rate": 0.00041, "train/epoch": 4.04, "_timestamp": 1746908272, "_runtime": 10870}, "step": 3850} {"train_info/time_between_train_steps": 0.024731874465942383, "step": 3850} {"info/global_step": 3851, "train_info/time_within_train_step": 2.6655893325805664, "step": 3851} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 3851} {"info/global_step": 3852, "train_info/time_within_train_step": 2.6563446521759033, "step": 3852} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 3852} {"info/global_step": 3853, "train_info/time_within_train_step": 2.664217233657837, "step": 3853} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 3853} {"info/global_step": 3854, "train_info/time_within_train_step": 2.6901540756225586, "step": 3854} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 3854} {"info/global_step": 3855, "train_info/time_within_train_step": 2.662753105163574, "step": 3855} {"train_info/time_between_train_steps": 0.003265380859375, "step": 3855} {"info/global_step": 3856, "train_info/time_within_train_step": 2.648777961730957, "step": 3856} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 3856} {"info/global_step": 3857, "train_info/time_within_train_step": 2.6526710987091064, "step": 3857} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 3857} {"info/global_step": 3858, "train_info/time_within_train_step": 2.6472535133361816, "step": 3858} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 3858} {"info/global_step": 3859, "train_info/time_within_train_step": 2.6670851707458496, "step": 3859} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 3859} {"info/global_step": 3860, "train_info/time_within_train_step": 2.6520333290100098, "step": 3860} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 3860} {"info/global_step": 3861, "train_info/time_within_train_step": 2.660438060760498, "step": 3861} {"train_info/time_between_train_steps": 0.003249645233154297, "step": 3861} {"info/global_step": 3862, "train_info/time_within_train_step": 2.7133595943450928, "step": 3862} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 3862} {"info/global_step": 3863, "train_info/time_within_train_step": 2.6950337886810303, "step": 3863} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 3863} {"info/global_step": 3864, "train_info/time_within_train_step": 2.6417670249938965, "step": 3864} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 3864} {"info/global_step": 3865, "train_info/time_within_train_step": 2.6464412212371826, "step": 3865} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 3865} {"info/global_step": 3866, "train_info/time_within_train_step": 2.6583704948425293, "step": 3866} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 3866} {"info/global_step": 3867, "train_info/time_within_train_step": 2.6556029319763184, "step": 3867} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 3867} {"info/global_step": 3868, "train_info/time_within_train_step": 2.64581561088562, "step": 3868} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 3868} {"info/global_step": 3869, "train_info/time_within_train_step": 2.650920867919922, "step": 3869} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 3869} {"info/global_step": 3870, "train_info/time_within_train_step": 2.645711898803711, "step": 3870} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 3870} {"info/global_step": 3871, "train_info/time_within_train_step": 2.669356107711792, "step": 3871} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 3871} {"info/global_step": 3872, "train_info/time_within_train_step": 2.6532907485961914, "step": 3872} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 3872} {"info/global_step": 3873, "train_info/time_within_train_step": 2.6467478275299072, "step": 3873} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 3873} {"info/global_step": 3874, "train_info/time_within_train_step": 2.6554203033447266, "step": 3874} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 3874} {"info/global_step": 3875, "train_info/time_within_train_step": 2.6436009407043457, "step": 3875} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 3875} {"info/global_step": 3876, "train_info/time_within_train_step": 2.6465113162994385, "step": 3876} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 3876} {"info/global_step": 3877, "train_info/time_within_train_step": 2.9261789321899414, "step": 3877} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 3877} {"info/global_step": 3878, "train_info/time_within_train_step": 2.6556174755096436, "step": 3878} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 3878} {"info/global_step": 3879, "train_info/time_within_train_step": 2.6456167697906494, "step": 3879} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 3879} {"info/global_step": 3880, "train_info/time_within_train_step": 2.6470541954040527, "step": 3880} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 3880} {"info/global_step": 3881, "train_info/time_within_train_step": 2.6710102558135986, "step": 3881} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 3881} {"info/global_step": 3882, "train_info/time_within_train_step": 2.664012908935547, "step": 3882} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 3882} {"info/global_step": 3883, "train_info/time_within_train_step": 2.6806108951568604, "step": 3883} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 3883} {"info/global_step": 3884, "train_info/time_within_train_step": 2.660736083984375, "step": 3884} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 3884} {"info/global_step": 3885, "train_info/time_within_train_step": 2.661562204360962, "step": 3885} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 3885} {"info/global_step": 3886, "train_info/time_within_train_step": 2.6501824855804443, "step": 3886} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 3886} {"info/global_step": 3887, "train_info/time_within_train_step": 2.6584339141845703, "step": 3887} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 3887} {"info/global_step": 3888, "train_info/time_within_train_step": 2.6473348140716553, "step": 3888} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 3888} {"info/global_step": 3889, "train_info/time_within_train_step": 2.6452062129974365, "step": 3889} {"train_info/time_between_train_steps": 0.003204345703125, "step": 3889} {"info/global_step": 3890, "train_info/time_within_train_step": 2.7757580280303955, "step": 3890} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 3890} {"info/global_step": 3891, "train_info/time_within_train_step": 2.6459298133850098, "step": 3891} {"train_info/time_between_train_steps": 0.003216266632080078, "step": 3891} {"info/global_step": 3892, "train_info/time_within_train_step": 2.6627395153045654, "step": 3892} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 3892} {"info/global_step": 3893, "train_info/time_within_train_step": 2.660837411880493, "step": 3893} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 3893} {"info/global_step": 3894, "train_info/time_within_train_step": 2.673445224761963, "step": 3894} {"train_info/time_between_train_steps": 0.003248929977416992, "step": 3894} {"info/global_step": 3895, "train_info/time_within_train_step": 2.6724536418914795, "step": 3895} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 3895} {"info/global_step": 3896, "train_info/time_within_train_step": 2.6911990642547607, "step": 3896} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 3896} {"info/global_step": 3897, "train_info/time_within_train_step": 2.6411094665527344, "step": 3897} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 3897} {"info/global_step": 3898, "train_info/time_within_train_step": 2.6413657665252686, "step": 3898} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 3898} {"info/global_step": 3899, "train_info/time_within_train_step": 2.664717435836792, "step": 3899} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 3899} {"info/global_step": 3900, "train_info/time_within_train_step": 2.6505990028381348, "step": 3900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908406, "_runtime": 11004}, "step": 3900} {"logs": {"train/loss": 3.832, "train/learning_rate": 0.00040666666666666667, "train/epoch": 4.04, "_timestamp": 1746908406, "_runtime": 11004}, "step": 3900} {"train_info/time_between_train_steps": 0.024753093719482422, "step": 3900} {"info/global_step": 3901, "train_info/time_within_train_step": 2.64957332611084, "step": 3901} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 3901} {"info/global_step": 3902, "train_info/time_within_train_step": 2.647361993789673, "step": 3902} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 3902} {"info/global_step": 3903, "train_info/time_within_train_step": 2.662369966506958, "step": 3903} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 3903} {"info/global_step": 3904, "train_info/time_within_train_step": 2.655083179473877, "step": 3904} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 3904} {"info/global_step": 3905, "train_info/time_within_train_step": 2.6687326431274414, "step": 3905} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 3905} {"info/global_step": 3906, "train_info/time_within_train_step": 2.717193365097046, "step": 3906} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 3906} {"info/global_step": 3907, "train_info/time_within_train_step": 2.6996846199035645, "step": 3907} {"train_info/time_between_train_steps": 0.003281116485595703, "step": 3907} {"info/global_step": 3908, "train_info/time_within_train_step": 2.640469551086426, "step": 3908} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 3908} {"info/global_step": 3909, "train_info/time_within_train_step": 2.64111328125, "step": 3909} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 3909} {"info/global_step": 3910, "train_info/time_within_train_step": 2.6585209369659424, "step": 3910} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 3910} {"info/global_step": 3911, "train_info/time_within_train_step": 2.6551220417022705, "step": 3911} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 3911} {"info/global_step": 3912, "train_info/time_within_train_step": 2.6467673778533936, "step": 3912} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 3912} {"info/global_step": 3913, "train_info/time_within_train_step": 2.6527538299560547, "step": 3913} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 3913} {"info/global_step": 3914, "train_info/time_within_train_step": 2.647742748260498, "step": 3914} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 3914} {"info/global_step": 3915, "train_info/time_within_train_step": 2.6400809288024902, "step": 3915} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 3915} {"info/global_step": 3916, "train_info/time_within_train_step": 2.6562414169311523, "step": 3916} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 3916} {"info/global_step": 3917, "train_info/time_within_train_step": 2.6534290313720703, "step": 3917} {"train_info/time_between_train_steps": 0.0032806396484375, "step": 3917} {"info/global_step": 3918, "train_info/time_within_train_step": 2.6446831226348877, "step": 3918} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 3918} {"info/global_step": 3919, "train_info/time_within_train_step": 2.64369535446167, "step": 3919} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 3919} {"info/global_step": 3920, "train_info/time_within_train_step": 2.6500630378723145, "step": 3920} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 3920} {"info/global_step": 3921, "train_info/time_within_train_step": 2.670802593231201, "step": 3921} {"train_info/time_between_train_steps": 0.0032355785369873047, "step": 3921} {"info/global_step": 3922, "train_info/time_within_train_step": 2.671083450317383, "step": 3922} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 3922} {"info/global_step": 3923, "train_info/time_within_train_step": 2.6557798385620117, "step": 3923} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 3923} {"info/global_step": 3924, "train_info/time_within_train_step": 2.6539666652679443, "step": 3924} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 3924} {"info/global_step": 3925, "train_info/time_within_train_step": 2.6663897037506104, "step": 3925} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 3925} {"info/global_step": 3926, "train_info/time_within_train_step": 2.6432907581329346, "step": 3926} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 3926} {"info/global_step": 3927, "train_info/time_within_train_step": 2.6476807594299316, "step": 3927} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 3927} {"info/global_step": 3928, "train_info/time_within_train_step": 2.650907516479492, "step": 3928} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 3928} {"info/global_step": 3929, "train_info/time_within_train_step": 2.662170886993408, "step": 3929} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 3929} {"info/global_step": 3930, "train_info/time_within_train_step": 2.665799856185913, "step": 3930} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 3930} {"info/global_step": 3931, "train_info/time_within_train_step": 2.660891056060791, "step": 3931} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 3931} {"info/global_step": 3932, "train_info/time_within_train_step": 2.7017457485198975, "step": 3932} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 3932} {"info/global_step": 3933, "train_info/time_within_train_step": 2.640909194946289, "step": 3933} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 3933} {"info/global_step": 3934, "train_info/time_within_train_step": 2.64216685295105, "step": 3934} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 3934} {"info/global_step": 3935, "train_info/time_within_train_step": 2.6697375774383545, "step": 3935} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 3935} {"info/global_step": 3936, "train_info/time_within_train_step": 2.9044055938720703, "step": 3936} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 3936} {"info/global_step": 3937, "train_info/time_within_train_step": 2.6407222747802734, "step": 3937} {"train_info/time_between_train_steps": 0.003326416015625, "step": 3937} {"info/global_step": 3938, "train_info/time_within_train_step": 2.6403133869171143, "step": 3938} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 3938} {"info/global_step": 3939, "train_info/time_within_train_step": 2.660182237625122, "step": 3939} {"train_info/time_between_train_steps": 0.00334930419921875, "step": 3939} {"info/global_step": 3940, "train_info/time_within_train_step": 2.6536006927490234, "step": 3940} {"train_info/time_between_train_steps": 0.0033309459686279297, "step": 3940} {"info/global_step": 3941, "train_info/time_within_train_step": 2.645543098449707, "step": 3941} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 3941} {"info/global_step": 3942, "train_info/time_within_train_step": 2.6507115364074707, "step": 3942} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 3942} {"info/global_step": 3943, "train_info/time_within_train_step": 2.646981954574585, "step": 3943} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 3943} {"info/global_step": 3944, "train_info/time_within_train_step": 2.667811393737793, "step": 3944} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 3944} {"info/global_step": 3945, "train_info/time_within_train_step": 2.6868398189544678, "step": 3945} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 3945} {"info/global_step": 3946, "train_info/time_within_train_step": 2.6771302223205566, "step": 3946} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 3946} {"info/global_step": 3947, "train_info/time_within_train_step": 2.6556789875030518, "step": 3947} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 3947} {"info/global_step": 3948, "train_info/time_within_train_step": 2.640519142150879, "step": 3948} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 3948} {"info/global_step": 3949, "train_info/time_within_train_step": 2.658336639404297, "step": 3949} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 3949} {"info/global_step": 3950, "train_info/time_within_train_step": 2.656008005142212, "step": 3950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908541, "_runtime": 11139}, "step": 3950} {"logs": {"train/loss": 3.8167, "train/learning_rate": 0.00040333333333333334, "train/epoch": 4.05, "_timestamp": 1746908541, "_runtime": 11139}, "step": 3950} {"train_info/time_between_train_steps": 0.024903297424316406, "step": 3950} {"info/global_step": 3951, "train_info/time_within_train_step": 2.659050941467285, "step": 3951} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 3951} {"info/global_step": 3952, "train_info/time_within_train_step": 2.6451237201690674, "step": 3952} {"train_info/time_between_train_steps": 0.10882139205932617, "step": 3952} {"info/global_step": 3953, "train_info/time_within_train_step": 2.644097089767456, "step": 3953} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 3953} {"info/global_step": 3954, "train_info/time_within_train_step": 2.6445107460021973, "step": 3954} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 3954} {"info/global_step": 3955, "train_info/time_within_train_step": 2.6512391567230225, "step": 3955} {"train_info/time_between_train_steps": 0.003443479537963867, "step": 3955} {"info/global_step": 3956, "train_info/time_within_train_step": 2.670833110809326, "step": 3956} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 3956} {"info/global_step": 3957, "train_info/time_within_train_step": 2.6730332374572754, "step": 3957} {"train_info/time_between_train_steps": 0.0033791065216064453, "step": 3957} {"info/global_step": 3958, "train_info/time_within_train_step": 2.6550753116607666, "step": 3958} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 3958} {"info/global_step": 3959, "train_info/time_within_train_step": 2.648620843887329, "step": 3959} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 3959} {"info/global_step": 3960, "train_info/time_within_train_step": 2.649481773376465, "step": 3960} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 3960} {"info/global_step": 3961, "train_info/time_within_train_step": 2.645794630050659, "step": 3961} {"train_info/time_between_train_steps": 0.0032677650451660156, "step": 3961} {"info/global_step": 3962, "train_info/time_within_train_step": 2.6665549278259277, "step": 3962} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 3962} {"info/global_step": 3963, "train_info/time_within_train_step": 2.6566152572631836, "step": 3963} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 3963} {"info/global_step": 3964, "train_info/time_within_train_step": 2.6627719402313232, "step": 3964} {"train_info/time_between_train_steps": 0.0032796859741210938, "step": 3964} {"info/global_step": 3965, "train_info/time_within_train_step": 2.6958141326904297, "step": 3965} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 3965} {"info/global_step": 3966, "train_info/time_within_train_step": 2.659508466720581, "step": 3966} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 3966} {"info/global_step": 3967, "train_info/time_within_train_step": 2.646942138671875, "step": 3967} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 3967} {"info/global_step": 3968, "train_info/time_within_train_step": 2.646042823791504, "step": 3968} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 3968} {"info/global_step": 3969, "train_info/time_within_train_step": 2.649078607559204, "step": 3969} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 3969} {"info/global_step": 3970, "train_info/time_within_train_step": 2.650258779525757, "step": 3970} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 3970} {"info/global_step": 3971, "train_info/time_within_train_step": 2.6457200050354004, "step": 3971} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 3971} {"info/global_step": 3972, "train_info/time_within_train_step": 2.6557462215423584, "step": 3972} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 3972} {"info/global_step": 3973, "train_info/time_within_train_step": 2.6562812328338623, "step": 3973} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 3973} {"info/global_step": 3974, "train_info/time_within_train_step": 2.666189432144165, "step": 3974} {"train_info/time_between_train_steps": 0.0032575130462646484, "step": 3974} {"info/global_step": 3975, "train_info/time_within_train_step": 2.7237353324890137, "step": 3975} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 3975} {"info/global_step": 3976, "train_info/time_within_train_step": 2.6852641105651855, "step": 3976} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 3976} {"info/global_step": 3977, "train_info/time_within_train_step": 2.641132354736328, "step": 3977} {"train_info/time_between_train_steps": 0.00323486328125, "step": 3977} {"info/global_step": 3978, "train_info/time_within_train_step": 2.6410279273986816, "step": 3978} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 3978} {"info/global_step": 3979, "train_info/time_within_train_step": 2.954251289367676, "step": 3979} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 3979} {"info/global_step": 3980, "train_info/time_within_train_step": 2.720094680786133, "step": 3980} {"train_info/time_between_train_steps": 0.0032958984375, "step": 3980} {"info/global_step": 3981, "train_info/time_within_train_step": 2.6434993743896484, "step": 3981} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 3981} {"info/global_step": 3982, "train_info/time_within_train_step": 2.6399338245391846, "step": 3982} {"train_info/time_between_train_steps": 0.0032296180725097656, "step": 3982} {"info/global_step": 3983, "train_info/time_within_train_step": 2.661708354949951, "step": 3983} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 3983} {"info/global_step": 3984, "train_info/time_within_train_step": 2.6474015712738037, "step": 3984} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 3984} {"info/global_step": 3985, "train_info/time_within_train_step": 2.6491005420684814, "step": 3985} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 3985} {"info/global_step": 3986, "train_info/time_within_train_step": 2.6481518745422363, "step": 3986} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 3986} {"info/global_step": 3987, "train_info/time_within_train_step": 2.6441924571990967, "step": 3987} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 3987} {"info/global_step": 3988, "train_info/time_within_train_step": 2.6474411487579346, "step": 3988} {"train_info/time_between_train_steps": 0.003575563430786133, "step": 3988} {"info/global_step": 3989, "train_info/time_within_train_step": 2.6592490673065186, "step": 3989} {"train_info/time_between_train_steps": 0.0034646987915039062, "step": 3989} {"info/global_step": 3990, "train_info/time_within_train_step": 2.6460392475128174, "step": 3990} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 3990} {"info/global_step": 3991, "train_info/time_within_train_step": 2.6448709964752197, "step": 3991} {"train_info/time_between_train_steps": 0.0035631656646728516, "step": 3991} {"info/global_step": 3992, "train_info/time_within_train_step": 2.6553547382354736, "step": 3992} {"train_info/time_between_train_steps": 0.006554365158081055, "step": 3992} {"info/global_step": 3993, "train_info/time_within_train_step": 2.644606828689575, "step": 3993} {"train_info/time_between_train_steps": 0.006487846374511719, "step": 3993} {"info/global_step": 3994, "train_info/time_within_train_step": 2.651215076446533, "step": 3994} {"train_info/time_between_train_steps": 0.006488323211669922, "step": 3994} {"info/global_step": 3995, "train_info/time_within_train_step": 2.6412453651428223, "step": 3995} {"train_info/time_between_train_steps": 0.00651860237121582, "step": 3995} {"info/global_step": 3996, "train_info/time_within_train_step": 2.6881394386291504, "step": 3996} {"train_info/time_between_train_steps": 0.006483554840087891, "step": 3996} {"info/global_step": 3997, "train_info/time_within_train_step": 2.7056052684783936, "step": 3997} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 3997} {"info/global_step": 3998, "train_info/time_within_train_step": 2.649914264678955, "step": 3998} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 3998} {"info/global_step": 3999, "train_info/time_within_train_step": 3.255633592605591, "step": 3999} {"train_info/time_between_train_steps": 0.0032701492309570312, "step": 3999} {"info/global_step": 4000, "train_info/time_within_train_step": 2.654021739959717, "step": 4000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908677, "_runtime": 11275}, "step": 4000} {"logs": {"train/loss": 3.8037, "train/learning_rate": 0.00039999999999999996, "train/epoch": 4.05, "_timestamp": 1746908677, "_runtime": 11275}, "step": 4000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908682, "_runtime": 11280}, "step": 4000} {"logs": {"eval/loss": 4.595146656036377, "eval/runtime": 5.1938, "eval/samples_per_second": 36.967, "eval/steps_per_second": 1.155, "train/epoch": 4.05, "_timestamp": 1746908682, "_runtime": 11280}, "step": 4000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908682, "_runtime": 11280}, "step": 4000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.595146656036377, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 99.00265381984578, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1938, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.967, "train/epoch": 4.05, "_timestamp": 1746908682, "_runtime": 11280}, "step": 4000} {"train_info/time_between_train_steps": 18.415024995803833, "step": 4000} {"info/global_step": 4001, "train_info/time_within_train_step": 2.4519684314727783, "step": 4001} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 4001} {"info/global_step": 4002, "train_info/time_within_train_step": 2.4560458660125732, "step": 4002} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 4002} {"info/global_step": 4003, "train_info/time_within_train_step": 2.6429250240325928, "step": 4003} {"train_info/time_between_train_steps": 0.004256486892700195, "step": 4003} {"info/global_step": 4004, "train_info/time_within_train_step": 2.651235818862915, "step": 4004} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 4004} {"info/global_step": 4005, "train_info/time_within_train_step": 2.661423444747925, "step": 4005} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 4005} {"info/global_step": 4006, "train_info/time_within_train_step": 2.6822566986083984, "step": 4006} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 4006} {"info/global_step": 4007, "train_info/time_within_train_step": 2.6551003456115723, "step": 4007} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 4007} {"info/global_step": 4008, "train_info/time_within_train_step": 2.655050039291382, "step": 4008} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 4008} {"info/global_step": 4009, "train_info/time_within_train_step": 2.6528868675231934, "step": 4009} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 4009} {"info/global_step": 4010, "train_info/time_within_train_step": 2.649585485458374, "step": 4010} {"train_info/time_between_train_steps": 0.0028808116912841797, "step": 4010} {"info/global_step": 4011, "train_info/time_within_train_step": 2.644956111907959, "step": 4011} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 4011} {"info/global_step": 4012, "train_info/time_within_train_step": 2.6502022743225098, "step": 4012} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 4012} {"info/global_step": 4013, "train_info/time_within_train_step": 2.6466386318206787, "step": 4013} {"train_info/time_between_train_steps": 0.0028879642486572266, "step": 4013} {"info/global_step": 4014, "train_info/time_within_train_step": 2.661078453063965, "step": 4014} {"train_info/time_between_train_steps": 0.0028808116912841797, "step": 4014} {"info/global_step": 4015, "train_info/time_within_train_step": 2.6745827198028564, "step": 4015} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 4015} {"info/global_step": 4016, "train_info/time_within_train_step": 2.6931610107421875, "step": 4016} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 4016} {"info/global_step": 4017, "train_info/time_within_train_step": 2.705976724624634, "step": 4017} {"train_info/time_between_train_steps": 0.0028839111328125, "step": 4017} {"info/global_step": 4018, "train_info/time_within_train_step": 2.649885654449463, "step": 4018} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 4018} {"info/global_step": 4019, "train_info/time_within_train_step": 2.648599624633789, "step": 4019} {"train_info/time_between_train_steps": 0.002959728240966797, "step": 4019} {"info/global_step": 4020, "train_info/time_within_train_step": 2.650068759918213, "step": 4020} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 4020} {"info/global_step": 4021, "train_info/time_within_train_step": 2.649996280670166, "step": 4021} {"train_info/time_between_train_steps": 0.002864360809326172, "step": 4021} {"info/global_step": 4022, "train_info/time_within_train_step": 2.6514952182769775, "step": 4022} {"train_info/time_between_train_steps": 0.00286865234375, "step": 4022} {"info/global_step": 4023, "train_info/time_within_train_step": 2.64680814743042, "step": 4023} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 4023} {"info/global_step": 4024, "train_info/time_within_train_step": 2.6562533378601074, "step": 4024} {"train_info/time_between_train_steps": 0.002873659133911133, "step": 4024} {"info/global_step": 4025, "train_info/time_within_train_step": 2.6548266410827637, "step": 4025} {"train_info/time_between_train_steps": 0.0029747486114501953, "step": 4025} {"info/global_step": 4026, "train_info/time_within_train_step": 2.6513009071350098, "step": 4026} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 4026} {"info/global_step": 4027, "train_info/time_within_train_step": 2.6559393405914307, "step": 4027} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 4027} {"info/global_step": 4028, "train_info/time_within_train_step": 2.6570160388946533, "step": 4028} {"train_info/time_between_train_steps": 0.0028824806213378906, "step": 4028} {"info/global_step": 4029, "train_info/time_within_train_step": 2.646061897277832, "step": 4029} {"train_info/time_between_train_steps": 0.0028944015502929688, "step": 4029} {"info/global_step": 4030, "train_info/time_within_train_step": 2.6507790088653564, "step": 4030} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 4030} {"info/global_step": 4031, "train_info/time_within_train_step": 2.65450382232666, "step": 4031} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 4031} {"info/global_step": 4032, "train_info/time_within_train_step": 2.6732091903686523, "step": 4032} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 4032} {"info/global_step": 4033, "train_info/time_within_train_step": 2.709733247756958, "step": 4033} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 4033} {"info/global_step": 4034, "train_info/time_within_train_step": 2.6484694480895996, "step": 4034} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 4034} {"info/global_step": 4035, "train_info/time_within_train_step": 2.6511335372924805, "step": 4035} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 4035} {"info/global_step": 4036, "train_info/time_within_train_step": 2.6479170322418213, "step": 4036} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 4036} {"info/global_step": 4037, "train_info/time_within_train_step": 2.657010555267334, "step": 4037} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 4037} {"info/global_step": 4038, "train_info/time_within_train_step": 2.647341012954712, "step": 4038} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 4038} {"info/global_step": 4039, "train_info/time_within_train_step": 2.6460721492767334, "step": 4039} {"train_info/time_between_train_steps": 0.003093719482421875, "step": 4039} {"info/global_step": 4040, "train_info/time_within_train_step": 2.649721384048462, "step": 4040} {"train_info/time_between_train_steps": 0.0030798912048339844, "step": 4040} {"info/global_step": 4041, "train_info/time_within_train_step": 2.672093629837036, "step": 4041} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 4041} {"info/global_step": 4042, "train_info/time_within_train_step": 2.667128801345825, "step": 4042} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 4042} {"info/global_step": 4043, "train_info/time_within_train_step": 2.6740875244140625, "step": 4043} {"train_info/time_between_train_steps": 0.003281116485595703, "step": 4043} {"info/global_step": 4044, "train_info/time_within_train_step": 2.6686458587646484, "step": 4044} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 4044} {"info/global_step": 4045, "train_info/time_within_train_step": 2.6508989334106445, "step": 4045} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 4045} {"info/global_step": 4046, "train_info/time_within_train_step": 2.6496877670288086, "step": 4046} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 4046} {"info/global_step": 4047, "train_info/time_within_train_step": 2.646481513977051, "step": 4047} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 4047} {"info/global_step": 4048, "train_info/time_within_train_step": 2.6555263996124268, "step": 4048} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 4048} {"info/global_step": 4049, "train_info/time_within_train_step": 2.66554856300354, "step": 4049} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 4049} {"info/global_step": 4050, "train_info/time_within_train_step": 2.9769463539123535, "step": 4050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908829, "_runtime": 11427}, "step": 4050} {"logs": {"train/loss": 3.7946, "train/learning_rate": 0.00039666666666666664, "train/epoch": 4.06, "_timestamp": 1746908829, "_runtime": 11427}, "step": 4050} {"train_info/time_between_train_steps": 0.024523496627807617, "step": 4050} {"info/global_step": 4051, "train_info/time_within_train_step": 2.641085386276245, "step": 4051} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 4051} {"info/global_step": 4052, "train_info/time_within_train_step": 2.654632806777954, "step": 4052} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 4052} {"info/global_step": 4053, "train_info/time_within_train_step": 2.661161184310913, "step": 4053} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 4053} {"info/global_step": 4054, "train_info/time_within_train_step": 2.643279552459717, "step": 4054} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 4054} {"info/global_step": 4055, "train_info/time_within_train_step": 2.644049882888794, "step": 4055} {"train_info/time_between_train_steps": 0.002984762191772461, "step": 4055} {"info/global_step": 4056, "train_info/time_within_train_step": 2.6552796363830566, "step": 4056} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 4056} {"info/global_step": 4057, "train_info/time_within_train_step": 2.665797233581543, "step": 4057} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 4057} {"info/global_step": 4058, "train_info/time_within_train_step": 2.668717384338379, "step": 4058} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 4058} {"info/global_step": 4059, "train_info/time_within_train_step": 2.6604790687561035, "step": 4059} {"train_info/time_between_train_steps": 0.002979755401611328, "step": 4059} {"info/global_step": 4060, "train_info/time_within_train_step": 2.7102081775665283, "step": 4060} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 4060} {"info/global_step": 4061, "train_info/time_within_train_step": 2.6443803310394287, "step": 4061} {"train_info/time_between_train_steps": 0.002955913543701172, "step": 4061} {"info/global_step": 4062, "train_info/time_within_train_step": 2.6479287147521973, "step": 4062} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 4062} {"info/global_step": 4063, "train_info/time_within_train_step": 2.6581673622131348, "step": 4063} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 4063} {"info/global_step": 4064, "train_info/time_within_train_step": 2.6440768241882324, "step": 4064} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 4064} {"info/global_step": 4065, "train_info/time_within_train_step": 2.6486527919769287, "step": 4065} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 4065} {"info/global_step": 4066, "train_info/time_within_train_step": 2.6480839252471924, "step": 4066} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 4066} {"info/global_step": 4067, "train_info/time_within_train_step": 2.654740571975708, "step": 4067} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 4067} {"info/global_step": 4068, "train_info/time_within_train_step": 2.658538341522217, "step": 4068} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 4068} {"info/global_step": 4069, "train_info/time_within_train_step": 2.672771453857422, "step": 4069} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 4069} {"info/global_step": 4070, "train_info/time_within_train_step": 2.730462074279785, "step": 4070} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 4070} {"info/global_step": 4071, "train_info/time_within_train_step": 2.6720211505889893, "step": 4071} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 4071} {"info/global_step": 4072, "train_info/time_within_train_step": 2.6540956497192383, "step": 4072} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 4072} {"info/global_step": 4073, "train_info/time_within_train_step": 2.644761562347412, "step": 4073} {"train_info/time_between_train_steps": 0.0029845237731933594, "step": 4073} {"info/global_step": 4074, "train_info/time_within_train_step": 2.6505239009857178, "step": 4074} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 4074} {"info/global_step": 4075, "train_info/time_within_train_step": 2.647404432296753, "step": 4075} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 4075} {"info/global_step": 4076, "train_info/time_within_train_step": 2.6687681674957275, "step": 4076} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 4076} {"info/global_step": 4077, "train_info/time_within_train_step": 2.688936948776245, "step": 4077} {"train_info/time_between_train_steps": 0.0029032230377197266, "step": 4077} {"info/global_step": 4078, "train_info/time_within_train_step": 2.682523250579834, "step": 4078} {"train_info/time_between_train_steps": 0.002962827682495117, "step": 4078} {"info/global_step": 4079, "train_info/time_within_train_step": 2.652376651763916, "step": 4079} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 4079} {"info/global_step": 4080, "train_info/time_within_train_step": 2.6412763595581055, "step": 4080} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 4080} {"info/global_step": 4081, "train_info/time_within_train_step": 2.6549205780029297, "step": 4081} {"train_info/time_between_train_steps": 0.0029790401458740234, "step": 4081} {"info/global_step": 4082, "train_info/time_within_train_step": 2.651596784591675, "step": 4082} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 4082} {"info/global_step": 4083, "train_info/time_within_train_step": 2.646746873855591, "step": 4083} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 4083} {"info/global_step": 4084, "train_info/time_within_train_step": 2.6439049243927, "step": 4084} {"train_info/time_between_train_steps": 0.003022432327270508, "step": 4084} {"info/global_step": 4085, "train_info/time_within_train_step": 2.6478641033172607, "step": 4085} {"train_info/time_between_train_steps": 0.0029621124267578125, "step": 4085} {"info/global_step": 4086, "train_info/time_within_train_step": 2.671154737472534, "step": 4086} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 4086} {"info/global_step": 4087, "train_info/time_within_train_step": 2.666754961013794, "step": 4087} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 4087} {"info/global_step": 4088, "train_info/time_within_train_step": 2.6450510025024414, "step": 4088} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 4088} {"info/global_step": 4089, "train_info/time_within_train_step": 2.6820480823516846, "step": 4089} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 4089} {"info/global_step": 4090, "train_info/time_within_train_step": 2.640521764755249, "step": 4090} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 4090} {"info/global_step": 4091, "train_info/time_within_train_step": 2.647766590118408, "step": 4091} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 4091} {"info/global_step": 4092, "train_info/time_within_train_step": 2.6636672019958496, "step": 4092} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 4092} {"info/global_step": 4093, "train_info/time_within_train_step": 2.643888235092163, "step": 4093} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 4093} {"info/global_step": 4094, "train_info/time_within_train_step": 2.6450986862182617, "step": 4094} {"train_info/time_between_train_steps": 0.0031044483184814453, "step": 4094} {"info/global_step": 4095, "train_info/time_within_train_step": 2.9048516750335693, "step": 4095} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 4095} {"info/global_step": 4096, "train_info/time_within_train_step": 2.6622653007507324, "step": 4096} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 4096} {"info/global_step": 4097, "train_info/time_within_train_step": 2.6579134464263916, "step": 4097} {"train_info/time_between_train_steps": 0.0029501914978027344, "step": 4097} {"info/global_step": 4098, "train_info/time_within_train_step": 2.6432406902313232, "step": 4098} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 4098} {"info/global_step": 4099, "train_info/time_within_train_step": 2.6647143363952637, "step": 4099} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 4099} {"info/global_step": 4100, "train_info/time_within_train_step": 2.659980297088623, "step": 4100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746908963, "_runtime": 11561}, "step": 4100} {"logs": {"train/loss": 3.7826, "train/learning_rate": 0.0003933333333333333, "train/epoch": 4.06, "_timestamp": 1746908963, "_runtime": 11561}, "step": 4100} {"train_info/time_between_train_steps": 0.024374723434448242, "step": 4100} {"info/global_step": 4101, "train_info/time_within_train_step": 2.6611382961273193, "step": 4101} {"train_info/time_between_train_steps": 0.003011941909790039, "step": 4101} {"info/global_step": 4102, "train_info/time_within_train_step": 2.6552810668945312, "step": 4102} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 4102} {"info/global_step": 4103, "train_info/time_within_train_step": 2.705909252166748, "step": 4103} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 4103} {"info/global_step": 4104, "train_info/time_within_train_step": 2.6503543853759766, "step": 4104} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 4104} {"info/global_step": 4105, "train_info/time_within_train_step": 2.6466286182403564, "step": 4105} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 4105} {"info/global_step": 4106, "train_info/time_within_train_step": 2.6531496047973633, "step": 4106} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 4106} {"info/global_step": 4107, "train_info/time_within_train_step": 2.6453707218170166, "step": 4107} {"train_info/time_between_train_steps": 0.0061283111572265625, "step": 4107} {"info/global_step": 4108, "train_info/time_within_train_step": 2.6441650390625, "step": 4108} {"train_info/time_between_train_steps": 0.004918336868286133, "step": 4108} {"info/global_step": 4109, "train_info/time_within_train_step": 2.650662422180176, "step": 4109} {"train_info/time_between_train_steps": 0.006052494049072266, "step": 4109} {"info/global_step": 4110, "train_info/time_within_train_step": 2.652214527130127, "step": 4110} {"train_info/time_between_train_steps": 0.0062024593353271484, "step": 4110} {"info/global_step": 4111, "train_info/time_within_train_step": 2.658989667892456, "step": 4111} {"train_info/time_between_train_steps": 0.006072998046875, "step": 4111} {"info/global_step": 4112, "train_info/time_within_train_step": 2.6738839149475098, "step": 4112} {"train_info/time_between_train_steps": 0.006137847900390625, "step": 4112} {"info/global_step": 4113, "train_info/time_within_train_step": 2.7282073497772217, "step": 4113} {"train_info/time_between_train_steps": 0.006124973297119141, "step": 4113} {"info/global_step": 4114, "train_info/time_within_train_step": 2.669196128845215, "step": 4114} {"train_info/time_between_train_steps": 0.006101369857788086, "step": 4114} {"info/global_step": 4115, "train_info/time_within_train_step": 2.6404666900634766, "step": 4115} {"train_info/time_between_train_steps": 0.006089925765991211, "step": 4115} {"info/global_step": 4116, "train_info/time_within_train_step": 2.641221284866333, "step": 4116} {"train_info/time_between_train_steps": 0.00608062744140625, "step": 4116} {"info/global_step": 4117, "train_info/time_within_train_step": 2.656850814819336, "step": 4117} {"train_info/time_between_train_steps": 0.006075620651245117, "step": 4117} {"info/global_step": 4118, "train_info/time_within_train_step": 2.6622049808502197, "step": 4118} {"train_info/time_between_train_steps": 0.006290435791015625, "step": 4118} {"info/global_step": 4119, "train_info/time_within_train_step": 2.644003391265869, "step": 4119} {"train_info/time_between_train_steps": 0.006108760833740234, "step": 4119} {"info/global_step": 4120, "train_info/time_within_train_step": 2.651667356491089, "step": 4120} {"train_info/time_between_train_steps": 0.0065081119537353516, "step": 4120} {"info/global_step": 4121, "train_info/time_within_train_step": 2.646036148071289, "step": 4121} {"train_info/time_between_train_steps": 0.006192922592163086, "step": 4121} {"info/global_step": 4122, "train_info/time_within_train_step": 2.668593406677246, "step": 4122} {"train_info/time_between_train_steps": 0.006098270416259766, "step": 4122} {"info/global_step": 4123, "train_info/time_within_train_step": 2.6691689491271973, "step": 4123} {"train_info/time_between_train_steps": 0.006143093109130859, "step": 4123} {"info/global_step": 4124, "train_info/time_within_train_step": 2.6884427070617676, "step": 4124} {"train_info/time_between_train_steps": 0.006146430969238281, "step": 4124} {"info/global_step": 4125, "train_info/time_within_train_step": 2.64959454536438, "step": 4125} {"train_info/time_between_train_steps": 0.006194353103637695, "step": 4125} {"info/global_step": 4126, "train_info/time_within_train_step": 2.6490793228149414, "step": 4126} {"train_info/time_between_train_steps": 0.006116390228271484, "step": 4126} {"info/global_step": 4127, "train_info/time_within_train_step": 2.6505837440490723, "step": 4127} {"train_info/time_between_train_steps": 0.006089687347412109, "step": 4127} {"info/global_step": 4128, "train_info/time_within_train_step": 2.646698474884033, "step": 4128} {"train_info/time_between_train_steps": 0.0060977935791015625, "step": 4128} {"info/global_step": 4129, "train_info/time_within_train_step": 2.6580183506011963, "step": 4129} {"train_info/time_between_train_steps": 0.006138801574707031, "step": 4129} {"info/global_step": 4130, "train_info/time_within_train_step": 2.643444299697876, "step": 4130} {"train_info/time_between_train_steps": 0.006064891815185547, "step": 4130} {"info/global_step": 4131, "train_info/time_within_train_step": 2.6444711685180664, "step": 4131} {"train_info/time_between_train_steps": 0.0061190128326416016, "step": 4131} {"info/global_step": 4132, "train_info/time_within_train_step": 2.66610050201416, "step": 4132} {"train_info/time_between_train_steps": 0.006074666976928711, "step": 4132} {"info/global_step": 4133, "train_info/time_within_train_step": 2.6690852642059326, "step": 4133} {"train_info/time_between_train_steps": 0.00607609748840332, "step": 4133} {"info/global_step": 4134, "train_info/time_within_train_step": 2.680774450302124, "step": 4134} {"train_info/time_between_train_steps": 0.006103515625, "step": 4134} {"info/global_step": 4135, "train_info/time_within_train_step": 2.653088092803955, "step": 4135} {"train_info/time_between_train_steps": 0.00619053840637207, "step": 4135} {"info/global_step": 4136, "train_info/time_within_train_step": 2.6867988109588623, "step": 4136} {"train_info/time_between_train_steps": 0.00601649284362793, "step": 4136} {"info/global_step": 4137, "train_info/time_within_train_step": 2.641974449157715, "step": 4137} {"train_info/time_between_train_steps": 0.006190776824951172, "step": 4137} {"info/global_step": 4138, "train_info/time_within_train_step": 2.654109477996826, "step": 4138} {"train_info/time_between_train_steps": 0.006235599517822266, "step": 4138} {"info/global_step": 4139, "train_info/time_within_train_step": 2.6544909477233887, "step": 4139} {"train_info/time_between_train_steps": 0.006510019302368164, "step": 4139} {"info/global_step": 4140, "train_info/time_within_train_step": 2.644240617752075, "step": 4140} {"train_info/time_between_train_steps": 0.006459951400756836, "step": 4140} {"info/global_step": 4141, "train_info/time_within_train_step": 2.6442689895629883, "step": 4141} {"train_info/time_between_train_steps": 0.006398916244506836, "step": 4141} {"info/global_step": 4142, "train_info/time_within_train_step": 2.6562182903289795, "step": 4142} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 4142} {"info/global_step": 4143, "train_info/time_within_train_step": 2.6604647636413574, "step": 4143} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 4143} {"info/global_step": 4144, "train_info/time_within_train_step": 2.6660830974578857, "step": 4144} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 4144} {"info/global_step": 4145, "train_info/time_within_train_step": 2.657808780670166, "step": 4145} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 4145} {"info/global_step": 4146, "train_info/time_within_train_step": 2.7090229988098145, "step": 4146} {"train_info/time_between_train_steps": 0.0030977725982666016, "step": 4146} {"info/global_step": 4147, "train_info/time_within_train_step": 2.6480910778045654, "step": 4147} {"train_info/time_between_train_steps": 0.0030913352966308594, "step": 4147} {"info/global_step": 4148, "train_info/time_within_train_step": 2.6487646102905273, "step": 4148} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 4148} {"info/global_step": 4149, "train_info/time_within_train_step": 2.6544668674468994, "step": 4149} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 4149} {"info/global_step": 4150, "train_info/time_within_train_step": 2.6485860347747803, "step": 4150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746909098, "_runtime": 11696}, "step": 4150} {"logs": {"train/loss": 3.7826, "train/learning_rate": 0.00039, "train/epoch": 4.07, "_timestamp": 1746909098, "_runtime": 11696}, "step": 4150} {"train_info/time_between_train_steps": 0.02386641502380371, "step": 4150} {"info/global_step": 4151, "train_info/time_within_train_step": 2.650858163833618, "step": 4151} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 4151} {"info/global_step": 4152, "train_info/time_within_train_step": 2.6460494995117188, "step": 4152} {"train_info/time_between_train_steps": 0.0033462047576904297, "step": 4152} {"info/global_step": 4153, "train_info/time_within_train_step": 2.6590757369995117, "step": 4153} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 4153} {"info/global_step": 4154, "train_info/time_within_train_step": 2.652414321899414, "step": 4154} {"train_info/time_between_train_steps": 0.003076314926147461, "step": 4154} {"info/global_step": 4155, "train_info/time_within_train_step": 2.6597580909729004, "step": 4155} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 4155} {"info/global_step": 4156, "train_info/time_within_train_step": 2.696882486343384, "step": 4156} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 4156} {"info/global_step": 4157, "train_info/time_within_train_step": 2.718904733657837, "step": 4157} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 4157} {"info/global_step": 4158, "train_info/time_within_train_step": 2.6439778804779053, "step": 4158} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 4158} {"info/global_step": 4159, "train_info/time_within_train_step": 2.642040491104126, "step": 4159} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 4159} {"info/global_step": 4160, "train_info/time_within_train_step": 2.660296678543091, "step": 4160} {"train_info/time_between_train_steps": 0.0031087398529052734, "step": 4160} {"info/global_step": 4161, "train_info/time_within_train_step": 2.647758722305298, "step": 4161} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 4161} {"info/global_step": 4162, "train_info/time_within_train_step": 2.647073268890381, "step": 4162} {"train_info/time_between_train_steps": 0.003134012222290039, "step": 4162} {"info/global_step": 4163, "train_info/time_within_train_step": 2.649423360824585, "step": 4163} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 4163} {"info/global_step": 4164, "train_info/time_within_train_step": 2.6434903144836426, "step": 4164} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 4164} {"info/global_step": 4165, "train_info/time_within_train_step": 2.6667468547821045, "step": 4165} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 4165} {"info/global_step": 4166, "train_info/time_within_train_step": 2.67059588432312, "step": 4166} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 4166} {"info/global_step": 4167, "train_info/time_within_train_step": 2.686411142349243, "step": 4167} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 4167} {"info/global_step": 4168, "train_info/time_within_train_step": 2.6523020267486572, "step": 4168} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 4168} {"info/global_step": 4169, "train_info/time_within_train_step": 2.6430017948150635, "step": 4169} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 4169} {"info/global_step": 4170, "train_info/time_within_train_step": 2.654878854751587, "step": 4170} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 4170} {"info/global_step": 4171, "train_info/time_within_train_step": 2.652543544769287, "step": 4171} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 4171} {"info/global_step": 4172, "train_info/time_within_train_step": 2.6493241786956787, "step": 4172} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 4172} {"info/global_step": 4173, "train_info/time_within_train_step": 2.644456148147583, "step": 4173} {"train_info/time_between_train_steps": 0.00646519660949707, "step": 4173} {"info/global_step": 4174, "train_info/time_within_train_step": 2.6472010612487793, "step": 4174} {"train_info/time_between_train_steps": 0.006370067596435547, "step": 4174} {"info/global_step": 4175, "train_info/time_within_train_step": 2.6706149578094482, "step": 4175} {"train_info/time_between_train_steps": 0.006346225738525391, "step": 4175} {"info/global_step": 4176, "train_info/time_within_train_step": 2.6655845642089844, "step": 4176} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 4176} {"info/global_step": 4177, "train_info/time_within_train_step": 2.687511920928955, "step": 4177} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 4177} {"info/global_step": 4178, "train_info/time_within_train_step": 2.6551218032836914, "step": 4178} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 4178} {"info/global_step": 4179, "train_info/time_within_train_step": 2.667088270187378, "step": 4179} {"train_info/time_between_train_steps": 0.003275156021118164, "step": 4179} {"info/global_step": 4180, "train_info/time_within_train_step": 2.6427173614501953, "step": 4180} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 4180} {"info/global_step": 4181, "train_info/time_within_train_step": 2.6422994136810303, "step": 4181} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 4181} {"info/global_step": 4182, "train_info/time_within_train_step": 2.665705919265747, "step": 4182} {"train_info/time_between_train_steps": 0.00312042236328125, "step": 4182} {"info/global_step": 4183, "train_info/time_within_train_step": 2.6680095195770264, "step": 4183} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 4183} {"info/global_step": 4184, "train_info/time_within_train_step": 2.656693935394287, "step": 4184} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 4184} {"info/global_step": 4185, "train_info/time_within_train_step": 2.6625711917877197, "step": 4185} {"train_info/time_between_train_steps": 0.0031239986419677734, "step": 4185} {"info/global_step": 4186, "train_info/time_within_train_step": 2.6957950592041016, "step": 4186} {"train_info/time_between_train_steps": 0.0033745765686035156, "step": 4186} {"info/global_step": 4187, "train_info/time_within_train_step": 2.6583023071289062, "step": 4187} {"train_info/time_between_train_steps": 0.003094196319580078, "step": 4187} {"info/global_step": 4188, "train_info/time_within_train_step": 2.6476945877075195, "step": 4188} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 4188} {"info/global_step": 4189, "train_info/time_within_train_step": 2.6447489261627197, "step": 4189} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 4189} {"info/global_step": 4190, "train_info/time_within_train_step": 2.653085708618164, "step": 4190} {"train_info/time_between_train_steps": 0.003113269805908203, "step": 4190} {"info/global_step": 4191, "train_info/time_within_train_step": 2.6597936153411865, "step": 4191} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 4191} {"info/global_step": 4192, "train_info/time_within_train_step": 2.645627498626709, "step": 4192} {"train_info/time_between_train_steps": 0.0030727386474609375, "step": 4192} {"info/global_step": 4193, "train_info/time_within_train_step": 2.6455624103546143, "step": 4193} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 4193} {"info/global_step": 4194, "train_info/time_within_train_step": 2.645969867706299, "step": 4194} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 4194} {"info/global_step": 4195, "train_info/time_within_train_step": 2.646951675415039, "step": 4195} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 4195} {"info/global_step": 4196, "train_info/time_within_train_step": 2.645263195037842, "step": 4196} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 4196} {"info/global_step": 4197, "train_info/time_within_train_step": 2.6458985805511475, "step": 4197} {"train_info/time_between_train_steps": 0.0030906200408935547, "step": 4197} {"info/global_step": 4198, "train_info/time_within_train_step": 2.6845169067382812, "step": 4198} {"train_info/time_between_train_steps": 0.0031058788299560547, "step": 4198} {"info/global_step": 4199, "train_info/time_within_train_step": 2.6422481536865234, "step": 4199} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 4199} {"info/global_step": 4200, "train_info/time_within_train_step": 2.6535403728485107, "step": 4200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746909232, "_runtime": 11830}, "step": 4200} {"logs": {"train/loss": 3.7623, "train/learning_rate": 0.00038666666666666667, "train/epoch": 4.07, "_timestamp": 1746909232, "_runtime": 11830}, "step": 4200} {"train_info/time_between_train_steps": 12.879773378372192, "step": 4200} {"info/global_step": 4201, "train_info/time_within_train_step": 2.463157892227173, "step": 4201} {"train_info/time_between_train_steps": 0.003069639205932617, "step": 4201} {"info/global_step": 4202, "train_info/time_within_train_step": 2.423402786254883, "step": 4202} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 4202} {"info/global_step": 4203, "train_info/time_within_train_step": 2.6129908561706543, "step": 4203} {"train_info/time_between_train_steps": 0.003098011016845703, "step": 4203} {"info/global_step": 4204, "train_info/time_within_train_step": 2.6827690601348877, "step": 4204} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 4204} {"info/global_step": 4205, "train_info/time_within_train_step": 2.6525206565856934, "step": 4205} {"train_info/time_between_train_steps": 0.0030641555786132812, "step": 4205} {"info/global_step": 4206, "train_info/time_within_train_step": 2.657198667526245, "step": 4206} {"train_info/time_between_train_steps": 0.003093242645263672, "step": 4206} {"info/global_step": 4207, "train_info/time_within_train_step": 2.6473374366760254, "step": 4207} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 4207} {"info/global_step": 4208, "train_info/time_within_train_step": 2.806764841079712, "step": 4208} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 4208} {"info/global_step": 4209, "train_info/time_within_train_step": 2.6426024436950684, "step": 4209} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 4209} {"info/global_step": 4210, "train_info/time_within_train_step": 2.6409144401550293, "step": 4210} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 4210} {"info/global_step": 4211, "train_info/time_within_train_step": 2.662766695022583, "step": 4211} {"train_info/time_between_train_steps": 0.003070354461669922, "step": 4211} {"info/global_step": 4212, "train_info/time_within_train_step": 2.6501502990722656, "step": 4212} {"train_info/time_between_train_steps": 0.0031223297119140625, "step": 4212} {"info/global_step": 4213, "train_info/time_within_train_step": 2.643826723098755, "step": 4213} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 4213} {"info/global_step": 4214, "train_info/time_within_train_step": 2.6671018600463867, "step": 4214} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 4214} {"info/global_step": 4215, "train_info/time_within_train_step": 2.6587910652160645, "step": 4215} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 4215} {"info/global_step": 4216, "train_info/time_within_train_step": 2.6704416275024414, "step": 4216} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 4216} {"info/global_step": 4217, "train_info/time_within_train_step": 2.680044412612915, "step": 4217} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 4217} {"info/global_step": 4218, "train_info/time_within_train_step": 2.674238443374634, "step": 4218} {"train_info/time_between_train_steps": 0.003027677536010742, "step": 4218} {"info/global_step": 4219, "train_info/time_within_train_step": 2.6424381732940674, "step": 4219} {"train_info/time_between_train_steps": 0.003076314926147461, "step": 4219} {"info/global_step": 4220, "train_info/time_within_train_step": 2.643517255783081, "step": 4220} {"train_info/time_between_train_steps": 0.0030775070190429688, "step": 4220} {"info/global_step": 4221, "train_info/time_within_train_step": 2.666402578353882, "step": 4221} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 4221} {"info/global_step": 4222, "train_info/time_within_train_step": 2.652745008468628, "step": 4222} {"train_info/time_between_train_steps": 0.0030388832092285156, "step": 4222} {"info/global_step": 4223, "train_info/time_within_train_step": 2.644991874694824, "step": 4223} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 4223} {"info/global_step": 4224, "train_info/time_within_train_step": 2.658268928527832, "step": 4224} {"train_info/time_between_train_steps": 0.003098726272583008, "step": 4224} {"info/global_step": 4225, "train_info/time_within_train_step": 2.654146432876587, "step": 4225} {"train_info/time_between_train_steps": 0.0030863285064697266, "step": 4225} {"info/global_step": 4226, "train_info/time_within_train_step": 2.663064479827881, "step": 4226} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 4226} {"info/global_step": 4227, "train_info/time_within_train_step": 2.691903591156006, "step": 4227} {"train_info/time_between_train_steps": 0.003063678741455078, "step": 4227} {"info/global_step": 4228, "train_info/time_within_train_step": 2.6830334663391113, "step": 4228} {"train_info/time_between_train_steps": 0.003061056137084961, "step": 4228} {"info/global_step": 4229, "train_info/time_within_train_step": 2.6521761417388916, "step": 4229} {"train_info/time_between_train_steps": 0.003019094467163086, "step": 4229} {"info/global_step": 4230, "train_info/time_within_train_step": 2.6522927284240723, "step": 4230} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 4230} {"info/global_step": 4231, "train_info/time_within_train_step": 2.6452300548553467, "step": 4231} {"train_info/time_between_train_steps": 0.0030052661895751953, "step": 4231} {"info/global_step": 4232, "train_info/time_within_train_step": 2.6493589878082275, "step": 4232} {"train_info/time_between_train_steps": 0.003022909164428711, "step": 4232} {"info/global_step": 4233, "train_info/time_within_train_step": 2.6459715366363525, "step": 4233} {"train_info/time_between_train_steps": 0.0030891895294189453, "step": 4233} {"info/global_step": 4234, "train_info/time_within_train_step": 2.6703786849975586, "step": 4234} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 4234} {"info/global_step": 4235, "train_info/time_within_train_step": 2.6829755306243896, "step": 4235} {"train_info/time_between_train_steps": 0.0029954910278320312, "step": 4235} {"info/global_step": 4236, "train_info/time_within_train_step": 2.6952311992645264, "step": 4236} {"train_info/time_between_train_steps": 0.0030508041381835938, "step": 4236} {"info/global_step": 4237, "train_info/time_within_train_step": 2.647441864013672, "step": 4237} {"train_info/time_between_train_steps": 0.003056049346923828, "step": 4237} {"info/global_step": 4238, "train_info/time_within_train_step": 2.647064447402954, "step": 4238} {"train_info/time_between_train_steps": 0.0030601024627685547, "step": 4238} {"info/global_step": 4239, "train_info/time_within_train_step": 2.653508186340332, "step": 4239} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 4239} {"info/global_step": 4240, "train_info/time_within_train_step": 2.6488711833953857, "step": 4240} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 4240} {"info/global_step": 4241, "train_info/time_within_train_step": 2.6567299365997314, "step": 4241} {"train_info/time_between_train_steps": 0.003016233444213867, "step": 4241} {"info/global_step": 4242, "train_info/time_within_train_step": 2.6448614597320557, "step": 4242} {"train_info/time_between_train_steps": 0.0030291080474853516, "step": 4242} {"info/global_step": 4243, "train_info/time_within_train_step": 2.6467061042785645, "step": 4243} {"train_info/time_between_train_steps": 0.0030367374420166016, "step": 4243} {"info/global_step": 4244, "train_info/time_within_train_step": 2.6712758541107178, "step": 4244} {"train_info/time_between_train_steps": 0.0030858516693115234, "step": 4244} {"info/global_step": 4245, "train_info/time_within_train_step": 2.6740992069244385, "step": 4245} {"train_info/time_between_train_steps": 0.003088712692260742, "step": 4245} {"info/global_step": 4246, "train_info/time_within_train_step": 2.656568765640259, "step": 4246} {"train_info/time_between_train_steps": 0.0030028820037841797, "step": 4246} {"info/global_step": 4247, "train_info/time_within_train_step": 2.686619520187378, "step": 4247} {"train_info/time_between_train_steps": 0.0030527114868164062, "step": 4247} {"info/global_step": 4248, "train_info/time_within_train_step": 2.6425321102142334, "step": 4248} {"train_info/time_between_train_steps": 0.003062009811401367, "step": 4248} {"info/global_step": 4249, "train_info/time_within_train_step": 3.282301187515259, "step": 4249} {"train_info/time_between_train_steps": 0.0030710697174072266, "step": 4249} {"info/global_step": 4250, "train_info/time_within_train_step": 2.661900520324707, "step": 4250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746909380, "_runtime": 11978}, "step": 4250} {"logs": {"train/loss": 3.758, "train/learning_rate": 0.0003833333333333333, "train/epoch": 4.08, "_timestamp": 1746909380, "_runtime": 11978}, "step": 4250} {"train_info/time_between_train_steps": 0.02424001693725586, "step": 4250} {"info/global_step": 4251, "train_info/time_within_train_step": 2.649648427963257, "step": 4251} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 4251} {"info/global_step": 4252, "train_info/time_within_train_step": 2.644310712814331, "step": 4252} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 4252} {"info/global_step": 4253, "train_info/time_within_train_step": 2.6465706825256348, "step": 4253} {"train_info/time_between_train_steps": 0.0031211376190185547, "step": 4253} {"info/global_step": 4254, "train_info/time_within_train_step": 2.671449661254883, "step": 4254} {"train_info/time_between_train_steps": 0.003058195114135742, "step": 4254} {"info/global_step": 4255, "train_info/time_within_train_step": 2.6851561069488525, "step": 4255} {"train_info/time_between_train_steps": 0.003267526626586914, "step": 4255} {"info/global_step": 4256, "train_info/time_within_train_step": 2.6947858333587646, "step": 4256} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 4256} {"info/global_step": 4257, "train_info/time_within_train_step": 2.652385950088501, "step": 4257} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 4257} {"info/global_step": 4258, "train_info/time_within_train_step": 2.672759532928467, "step": 4258} {"train_info/time_between_train_steps": 0.003173828125, "step": 4258} {"info/global_step": 4259, "train_info/time_within_train_step": 2.641787052154541, "step": 4259} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 4259} {"info/global_step": 4260, "train_info/time_within_train_step": 2.647958517074585, "step": 4260} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 4260} {"info/global_step": 4261, "train_info/time_within_train_step": 2.669200897216797, "step": 4261} {"train_info/time_between_train_steps": 0.003086566925048828, "step": 4261} {"info/global_step": 4262, "train_info/time_within_train_step": 2.643413543701172, "step": 4262} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 4262} {"info/global_step": 4263, "train_info/time_within_train_step": 2.644792318344116, "step": 4263} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 4263} {"info/global_step": 4264, "train_info/time_within_train_step": 2.6547584533691406, "step": 4264} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 4264} {"info/global_step": 4265, "train_info/time_within_train_step": 2.6604318618774414, "step": 4265} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 4265} {"info/global_step": 4266, "train_info/time_within_train_step": 2.673063039779663, "step": 4266} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 4266} {"info/global_step": 4267, "train_info/time_within_train_step": 2.660719394683838, "step": 4267} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 4267} {"info/global_step": 4268, "train_info/time_within_train_step": 2.7634735107421875, "step": 4268} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 4268} {"info/global_step": 4269, "train_info/time_within_train_step": 2.6976523399353027, "step": 4269} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 4269} {"info/global_step": 4270, "train_info/time_within_train_step": 2.65738844871521, "step": 4270} {"train_info/time_between_train_steps": 0.002929210662841797, "step": 4270} {"info/global_step": 4271, "train_info/time_within_train_step": 2.655712127685547, "step": 4271} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 4271} {"info/global_step": 4272, "train_info/time_within_train_step": 2.6444194316864014, "step": 4272} {"train_info/time_between_train_steps": 0.0029897689819335938, "step": 4272} {"info/global_step": 4273, "train_info/time_within_train_step": 2.646846055984497, "step": 4273} {"train_info/time_between_train_steps": 0.002994060516357422, "step": 4273} {"info/global_step": 4274, "train_info/time_within_train_step": 2.646779775619507, "step": 4274} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 4274} {"info/global_step": 4275, "train_info/time_within_train_step": 2.6531713008880615, "step": 4275} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 4275} {"info/global_step": 4276, "train_info/time_within_train_step": 2.6579360961914062, "step": 4276} {"train_info/time_between_train_steps": 0.003010988235473633, "step": 4276} {"info/global_step": 4277, "train_info/time_within_train_step": 2.6766538619995117, "step": 4277} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 4277} {"info/global_step": 4278, "train_info/time_within_train_step": 2.727914571762085, "step": 4278} {"train_info/time_between_train_steps": 0.0029082298278808594, "step": 4278} {"info/global_step": 4279, "train_info/time_within_train_step": 2.6554794311523438, "step": 4279} {"train_info/time_between_train_steps": 0.0029077529907226562, "step": 4279} {"info/global_step": 4280, "train_info/time_within_train_step": 2.6397759914398193, "step": 4280} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 4280} {"info/global_step": 4281, "train_info/time_within_train_step": 2.6539900302886963, "step": 4281} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 4281} {"info/global_step": 4282, "train_info/time_within_train_step": 2.64913272857666, "step": 4282} {"train_info/time_between_train_steps": 0.003103017807006836, "step": 4282} {"info/global_step": 4283, "train_info/time_within_train_step": 2.648406505584717, "step": 4283} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 4283} {"info/global_step": 4284, "train_info/time_within_train_step": 2.6438541412353516, "step": 4284} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 4284} {"info/global_step": 4285, "train_info/time_within_train_step": 2.6463816165924072, "step": 4285} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 4285} {"info/global_step": 4286, "train_info/time_within_train_step": 2.6613540649414062, "step": 4286} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 4286} {"info/global_step": 4287, "train_info/time_within_train_step": 2.6682469844818115, "step": 4287} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 4287} {"info/global_step": 4288, "train_info/time_within_train_step": 2.711881399154663, "step": 4288} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 4288} {"info/global_step": 4289, "train_info/time_within_train_step": 2.6446902751922607, "step": 4289} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 4289} {"info/global_step": 4290, "train_info/time_within_train_step": 2.6573379039764404, "step": 4290} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 4290} {"info/global_step": 4291, "train_info/time_within_train_step": 2.6471006870269775, "step": 4291} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 4291} {"info/global_step": 4292, "train_info/time_within_train_step": 2.646883726119995, "step": 4292} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 4292} {"info/global_step": 4293, "train_info/time_within_train_step": 2.661832809448242, "step": 4293} {"train_info/time_between_train_steps": 0.003327608108520508, "step": 4293} {"info/global_step": 4294, "train_info/time_within_train_step": 2.644214391708374, "step": 4294} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 4294} {"info/global_step": 4295, "train_info/time_within_train_step": 2.646364688873291, "step": 4295} {"train_info/time_between_train_steps": 0.003265380859375, "step": 4295} {"info/global_step": 4296, "train_info/time_within_train_step": 2.6728439331054688, "step": 4296} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 4296} {"info/global_step": 4297, "train_info/time_within_train_step": 2.6650915145874023, "step": 4297} {"train_info/time_between_train_steps": 0.0033195018768310547, "step": 4297} {"info/global_step": 4298, "train_info/time_within_train_step": 2.6642682552337646, "step": 4298} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 4298} {"info/global_step": 4299, "train_info/time_within_train_step": 2.678640365600586, "step": 4299} {"train_info/time_between_train_steps": 0.0033516883850097656, "step": 4299} {"info/global_step": 4300, "train_info/time_within_train_step": 2.646198272705078, "step": 4300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746909514, "_runtime": 12112}, "step": 4300} {"logs": {"train/loss": 3.7516, "train/learning_rate": 0.00037999999999999997, "train/epoch": 4.08, "_timestamp": 1746909514, "_runtime": 12112}, "step": 4300} {"train_info/time_between_train_steps": 0.02462625503540039, "step": 4300} {"info/global_step": 4301, "train_info/time_within_train_step": 2.6414928436279297, "step": 4301} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 4301} {"info/global_step": 4302, "train_info/time_within_train_step": 2.6461095809936523, "step": 4302} {"train_info/time_between_train_steps": 0.0033845901489257812, "step": 4302} {"info/global_step": 4303, "train_info/time_within_train_step": 2.663116455078125, "step": 4303} {"train_info/time_between_train_steps": 0.0033838748931884766, "step": 4303} {"info/global_step": 4304, "train_info/time_within_train_step": 2.649881601333618, "step": 4304} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 4304} {"info/global_step": 4305, "train_info/time_within_train_step": 2.6454954147338867, "step": 4305} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 4305} {"info/global_step": 4306, "train_info/time_within_train_step": 2.6645431518554688, "step": 4306} {"train_info/time_between_train_steps": 0.00342559814453125, "step": 4306} {"info/global_step": 4307, "train_info/time_within_train_step": 2.6621978282928467, "step": 4307} {"train_info/time_between_train_steps": 0.003419637680053711, "step": 4307} {"info/global_step": 4308, "train_info/time_within_train_step": 2.711061716079712, "step": 4308} {"train_info/time_between_train_steps": 0.00345611572265625, "step": 4308} {"info/global_step": 4309, "train_info/time_within_train_step": 2.6619205474853516, "step": 4309} {"train_info/time_between_train_steps": 0.003983020782470703, "step": 4309} {"info/global_step": 4310, "train_info/time_within_train_step": 2.6983306407928467, "step": 4310} {"train_info/time_between_train_steps": 0.0037832260131835938, "step": 4310} {"info/global_step": 4311, "train_info/time_within_train_step": 2.668379306793213, "step": 4311} {"train_info/time_between_train_steps": 0.00390934944152832, "step": 4311} {"info/global_step": 4312, "train_info/time_within_train_step": 2.6446585655212402, "step": 4312} {"train_info/time_between_train_steps": 0.003941059112548828, "step": 4312} {"info/global_step": 4313, "train_info/time_within_train_step": 2.644082546234131, "step": 4313} {"train_info/time_between_train_steps": 0.004062175750732422, "step": 4313} {"info/global_step": 4314, "train_info/time_within_train_step": 2.6660964488983154, "step": 4314} {"train_info/time_between_train_steps": 0.004262208938598633, "step": 4314} {"info/global_step": 4315, "train_info/time_within_train_step": 2.6531693935394287, "step": 4315} {"train_info/time_between_train_steps": 0.0033156871795654297, "step": 4315} {"train_info/time_between_train_steps": 2.3627474308013916, "step": 4315} {"info/global_step": 4316, "train_info/time_within_train_step": 2.5990231037139893, "step": 4316} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 4316} {"info/global_step": 4317, "train_info/time_within_train_step": 2.654576539993286, "step": 4317} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 4317} {"info/global_step": 4318, "train_info/time_within_train_step": 2.6476824283599854, "step": 4318} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 4318} {"info/global_step": 4319, "train_info/time_within_train_step": 2.6489925384521484, "step": 4319} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 4319} {"info/global_step": 4320, "train_info/time_within_train_step": 2.6455092430114746, "step": 4320} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 4320} {"info/global_step": 4321, "train_info/time_within_train_step": 2.6450512409210205, "step": 4321} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 4321} {"info/global_step": 4322, "train_info/time_within_train_step": 2.664137125015259, "step": 4322} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 4322} {"info/global_step": 4323, "train_info/time_within_train_step": 2.6671946048736572, "step": 4323} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 4323} {"info/global_step": 4324, "train_info/time_within_train_step": 2.697364091873169, "step": 4324} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 4324} {"info/global_step": 4325, "train_info/time_within_train_step": 2.645857334136963, "step": 4325} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 4325} {"info/global_step": 4326, "train_info/time_within_train_step": 2.650196075439453, "step": 4326} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 4326} {"info/global_step": 4327, "train_info/time_within_train_step": 2.6504712104797363, "step": 4327} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 4327} {"info/global_step": 4328, "train_info/time_within_train_step": 2.8635149002075195, "step": 4328} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 4328} {"info/global_step": 4329, "train_info/time_within_train_step": 2.6578118801116943, "step": 4329} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 4329} {"info/global_step": 4330, "train_info/time_within_train_step": 2.649557590484619, "step": 4330} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 4330} {"info/global_step": 4331, "train_info/time_within_train_step": 2.6470935344696045, "step": 4331} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 4331} {"info/global_step": 4332, "train_info/time_within_train_step": 2.660893440246582, "step": 4332} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 4332} {"info/global_step": 4333, "train_info/time_within_train_step": 2.6438145637512207, "step": 4333} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 4333} {"info/global_step": 4334, "train_info/time_within_train_step": 2.643446207046509, "step": 4334} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 4334} {"info/global_step": 4335, "train_info/time_within_train_step": 2.6705851554870605, "step": 4335} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 4335} {"info/global_step": 4336, "train_info/time_within_train_step": 2.667983293533325, "step": 4336} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 4336} {"info/global_step": 4337, "train_info/time_within_train_step": 2.6722538471221924, "step": 4337} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 4337} {"info/global_step": 4338, "train_info/time_within_train_step": 2.671940803527832, "step": 4338} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 4338} {"info/global_step": 4339, "train_info/time_within_train_step": 2.652580976486206, "step": 4339} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 4339} {"info/global_step": 4340, "train_info/time_within_train_step": 2.6515491008758545, "step": 4340} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 4340} {"info/global_step": 4341, "train_info/time_within_train_step": 2.6506333351135254, "step": 4341} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 4341} {"info/global_step": 4342, "train_info/time_within_train_step": 2.6561601161956787, "step": 4342} {"train_info/time_between_train_steps": 0.003299236297607422, "step": 4342} {"info/global_step": 4343, "train_info/time_within_train_step": 2.652648687362671, "step": 4343} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 4343} {"info/global_step": 4344, "train_info/time_within_train_step": 2.6478159427642822, "step": 4344} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 4344} {"info/global_step": 4345, "train_info/time_within_train_step": 2.671708822250366, "step": 4345} {"train_info/time_between_train_steps": 0.0033195018768310547, "step": 4345} {"info/global_step": 4346, "train_info/time_within_train_step": 2.683659553527832, "step": 4346} {"train_info/time_between_train_steps": 0.0034270286560058594, "step": 4346} {"info/global_step": 4347, "train_info/time_within_train_step": 2.678619384765625, "step": 4347} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 4347} {"info/global_step": 4348, "train_info/time_within_train_step": 2.695403814315796, "step": 4348} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 4348} {"info/global_step": 4349, "train_info/time_within_train_step": 2.644195318222046, "step": 4349} {"train_info/time_between_train_steps": 0.003350973129272461, "step": 4349} {"info/global_step": 4350, "train_info/time_within_train_step": 2.6457996368408203, "step": 4350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746909651, "_runtime": 12249}, "step": 4350} {"logs": {"train/loss": 3.7609, "train/learning_rate": 0.00037666666666666664, "train/epoch": 5.0, "_timestamp": 1746909651, "_runtime": 12249}, "step": 4350} {"train_info/time_between_train_steps": 0.024459362030029297, "step": 4350} {"info/global_step": 4351, "train_info/time_within_train_step": 2.659775495529175, "step": 4351} {"train_info/time_between_train_steps": 0.0032553672790527344, "step": 4351} {"info/global_step": 4352, "train_info/time_within_train_step": 2.651384115219116, "step": 4352} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 4352} {"info/global_step": 4353, "train_info/time_within_train_step": 2.652498722076416, "step": 4353} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 4353} {"info/global_step": 4354, "train_info/time_within_train_step": 2.650164842605591, "step": 4354} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 4354} {"info/global_step": 4355, "train_info/time_within_train_step": 2.6538355350494385, "step": 4355} {"train_info/time_between_train_steps": 0.0032806396484375, "step": 4355} {"info/global_step": 4356, "train_info/time_within_train_step": 2.6501941680908203, "step": 4356} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 4356} {"info/global_step": 4357, "train_info/time_within_train_step": 2.668570041656494, "step": 4357} {"train_info/time_between_train_steps": 0.0034530162811279297, "step": 4357} {"info/global_step": 4358, "train_info/time_within_train_step": 2.647599697113037, "step": 4358} {"train_info/time_between_train_steps": 0.004007101058959961, "step": 4358} {"info/global_step": 4359, "train_info/time_within_train_step": 2.6522669792175293, "step": 4359} {"train_info/time_between_train_steps": 0.0037169456481933594, "step": 4359} {"info/global_step": 4360, "train_info/time_within_train_step": 2.652289628982544, "step": 4360} {"train_info/time_between_train_steps": 0.003806591033935547, "step": 4360} {"info/global_step": 4361, "train_info/time_within_train_step": 2.672201633453369, "step": 4361} {"train_info/time_between_train_steps": 0.004119157791137695, "step": 4361} {"info/global_step": 4362, "train_info/time_within_train_step": 2.662534236907959, "step": 4362} {"train_info/time_between_train_steps": 0.003943920135498047, "step": 4362} {"info/global_step": 4363, "train_info/time_within_train_step": 2.668529510498047, "step": 4363} {"train_info/time_between_train_steps": 0.0039288997650146484, "step": 4363} {"info/global_step": 4364, "train_info/time_within_train_step": 2.686028003692627, "step": 4364} {"train_info/time_between_train_steps": 0.0038480758666992188, "step": 4364} {"info/global_step": 4365, "train_info/time_within_train_step": 2.6815733909606934, "step": 4365} {"train_info/time_between_train_steps": 0.003873586654663086, "step": 4365} {"info/global_step": 4366, "train_info/time_within_train_step": 2.6470632553100586, "step": 4366} {"train_info/time_between_train_steps": 0.0040585994720458984, "step": 4366} {"info/global_step": 4367, "train_info/time_within_train_step": 2.6452062129974365, "step": 4367} {"train_info/time_between_train_steps": 0.003970146179199219, "step": 4367} {"info/global_step": 4368, "train_info/time_within_train_step": 2.6664328575134277, "step": 4368} {"train_info/time_between_train_steps": 0.003782987594604492, "step": 4368} {"info/global_step": 4369, "train_info/time_within_train_step": 2.6537559032440186, "step": 4369} {"train_info/time_between_train_steps": 0.004059314727783203, "step": 4369} {"info/global_step": 4370, "train_info/time_within_train_step": 2.6526286602020264, "step": 4370} {"train_info/time_between_train_steps": 0.003907918930053711, "step": 4370} {"info/global_step": 4371, "train_info/time_within_train_step": 2.6539502143859863, "step": 4371} {"train_info/time_between_train_steps": 0.0037322044372558594, "step": 4371} {"info/global_step": 4372, "train_info/time_within_train_step": 3.04426646232605, "step": 4372} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 4372} {"info/global_step": 4373, "train_info/time_within_train_step": 2.6430752277374268, "step": 4373} {"train_info/time_between_train_steps": 0.003306865692138672, "step": 4373} {"info/global_step": 4374, "train_info/time_within_train_step": 2.6640748977661133, "step": 4374} {"train_info/time_between_train_steps": 0.003357410430908203, "step": 4374} {"info/global_step": 4375, "train_info/time_within_train_step": 2.6491522789001465, "step": 4375} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 4375} {"info/global_step": 4376, "train_info/time_within_train_step": 2.6477625370025635, "step": 4376} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 4376} {"info/global_step": 4377, "train_info/time_within_train_step": 2.7091193199157715, "step": 4377} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 4377} {"info/global_step": 4378, "train_info/time_within_train_step": 2.8398547172546387, "step": 4378} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 4378} {"info/global_step": 4379, "train_info/time_within_train_step": 2.668029308319092, "step": 4379} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 4379} {"info/global_step": 4380, "train_info/time_within_train_step": 2.7271456718444824, "step": 4380} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 4380} {"info/global_step": 4381, "train_info/time_within_train_step": 2.6513102054595947, "step": 4381} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 4381} {"info/global_step": 4382, "train_info/time_within_train_step": 2.645272970199585, "step": 4382} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 4382} {"info/global_step": 4383, "train_info/time_within_train_step": 2.6579413414001465, "step": 4383} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 4383} {"info/global_step": 4384, "train_info/time_within_train_step": 2.650423288345337, "step": 4384} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 4384} {"info/global_step": 4385, "train_info/time_within_train_step": 2.6522254943847656, "step": 4385} {"train_info/time_between_train_steps": 0.003294706344604492, "step": 4385} {"info/global_step": 4386, "train_info/time_within_train_step": 2.646151065826416, "step": 4386} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 4386} {"info/global_step": 4387, "train_info/time_within_train_step": 2.649885892868042, "step": 4387} {"train_info/time_between_train_steps": 0.0032660961151123047, "step": 4387} {"info/global_step": 4388, "train_info/time_within_train_step": 2.6649138927459717, "step": 4388} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 4388} {"info/global_step": 4389, "train_info/time_within_train_step": 2.671238899230957, "step": 4389} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 4389} {"info/global_step": 4390, "train_info/time_within_train_step": 2.7110085487365723, "step": 4390} {"train_info/time_between_train_steps": 0.0033533573150634766, "step": 4390} {"info/global_step": 4391, "train_info/time_within_train_step": 2.64387845993042, "step": 4391} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 4391} {"info/global_step": 4392, "train_info/time_within_train_step": 2.6504907608032227, "step": 4392} {"train_info/time_between_train_steps": 0.0033087730407714844, "step": 4392} {"info/global_step": 4393, "train_info/time_within_train_step": 2.655280113220215, "step": 4393} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 4393} {"info/global_step": 4394, "train_info/time_within_train_step": 2.6493852138519287, "step": 4394} {"train_info/time_between_train_steps": 0.003345489501953125, "step": 4394} {"info/global_step": 4395, "train_info/time_within_train_step": 2.655803680419922, "step": 4395} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 4395} {"info/global_step": 4396, "train_info/time_within_train_step": 2.6450483798980713, "step": 4396} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 4396} {"info/global_step": 4397, "train_info/time_within_train_step": 2.6461734771728516, "step": 4397} {"train_info/time_between_train_steps": 0.0037610530853271484, "step": 4397} {"info/global_step": 4398, "train_info/time_within_train_step": 2.653489828109741, "step": 4398} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 4398} {"info/global_step": 4399, "train_info/time_within_train_step": 2.6556785106658936, "step": 4399} {"train_info/time_between_train_steps": 0.0038254261016845703, "step": 4399} {"info/global_step": 4400, "train_info/time_within_train_step": 2.649519681930542, "step": 4400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746909786, "_runtime": 12384}, "step": 4400} {"logs": {"train/loss": 3.7292, "train/learning_rate": 0.0003733333333333333, "train/epoch": 5.01, "_timestamp": 1746909786, "_runtime": 12384}, "step": 4400} {"train_info/time_between_train_steps": 14.72954249382019, "step": 4400} {"info/global_step": 4401, "train_info/time_within_train_step": 2.4472546577453613, "step": 4401} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 4401} {"info/global_step": 4402, "train_info/time_within_train_step": 2.4294180870056152, "step": 4402} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 4402} {"info/global_step": 4403, "train_info/time_within_train_step": 2.588562250137329, "step": 4403} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 4403} {"info/global_step": 4404, "train_info/time_within_train_step": 2.6402456760406494, "step": 4404} {"train_info/time_between_train_steps": 0.003300905227661133, "step": 4404} {"info/global_step": 4405, "train_info/time_within_train_step": 2.6679189205169678, "step": 4405} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 4405} {"info/global_step": 4406, "train_info/time_within_train_step": 2.66473126411438, "step": 4406} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 4406} {"info/global_step": 4407, "train_info/time_within_train_step": 2.683702230453491, "step": 4407} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 4407} {"info/global_step": 4408, "train_info/time_within_train_step": 2.6587445735931396, "step": 4408} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 4408} {"info/global_step": 4409, "train_info/time_within_train_step": 2.6482815742492676, "step": 4409} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 4409} {"info/global_step": 4410, "train_info/time_within_train_step": 2.6546831130981445, "step": 4410} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 4410} {"info/global_step": 4411, "train_info/time_within_train_step": 2.651965379714966, "step": 4411} {"train_info/time_between_train_steps": 0.003278970718383789, "step": 4411} {"info/global_step": 4412, "train_info/time_within_train_step": 2.647716999053955, "step": 4412} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 4412} {"info/global_step": 4413, "train_info/time_within_train_step": 2.6506099700927734, "step": 4413} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 4413} {"info/global_step": 4414, "train_info/time_within_train_step": 2.648085832595825, "step": 4414} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 4414} {"info/global_step": 4415, "train_info/time_within_train_step": 2.670107126235962, "step": 4415} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 4415} {"info/global_step": 4416, "train_info/time_within_train_step": 2.6595044136047363, "step": 4416} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 4416} {"info/global_step": 4417, "train_info/time_within_train_step": 2.666790723800659, "step": 4417} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 4417} {"info/global_step": 4418, "train_info/time_within_train_step": 2.685920476913452, "step": 4418} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 4418} {"info/global_step": 4419, "train_info/time_within_train_step": 2.676866054534912, "step": 4419} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 4419} {"info/global_step": 4420, "train_info/time_within_train_step": 2.666581869125366, "step": 4420} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 4420} {"info/global_step": 4421, "train_info/time_within_train_step": 2.645672082901001, "step": 4421} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 4421} {"info/global_step": 4422, "train_info/time_within_train_step": 2.6559243202209473, "step": 4422} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 4422} {"info/global_step": 4423, "train_info/time_within_train_step": 2.6477606296539307, "step": 4423} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 4423} {"info/global_step": 4424, "train_info/time_within_train_step": 2.654923439025879, "step": 4424} {"train_info/time_between_train_steps": 0.0034356117248535156, "step": 4424} {"info/global_step": 4425, "train_info/time_within_train_step": 2.6606719493865967, "step": 4425} {"train_info/time_between_train_steps": 0.0032558441162109375, "step": 4425} {"info/global_step": 4426, "train_info/time_within_train_step": 2.6710569858551025, "step": 4426} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 4426} {"info/global_step": 4427, "train_info/time_within_train_step": 2.7291128635406494, "step": 4427} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 4427} {"info/global_step": 4428, "train_info/time_within_train_step": 2.664538860321045, "step": 4428} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 4428} {"info/global_step": 4429, "train_info/time_within_train_step": 2.643106460571289, "step": 4429} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 4429} {"info/global_step": 4430, "train_info/time_within_train_step": 2.6511330604553223, "step": 4430} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 4430} {"info/global_step": 4431, "train_info/time_within_train_step": 2.6468448638916016, "step": 4431} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 4431} {"info/global_step": 4432, "train_info/time_within_train_step": 2.6701207160949707, "step": 4432} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 4432} {"info/global_step": 4433, "train_info/time_within_train_step": 2.6728415489196777, "step": 4433} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 4433} {"info/global_step": 4434, "train_info/time_within_train_step": 2.6894943714141846, "step": 4434} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 4434} {"info/global_step": 4435, "train_info/time_within_train_step": 2.6544272899627686, "step": 4435} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 4435} {"info/global_step": 4436, "train_info/time_within_train_step": 2.6446070671081543, "step": 4436} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 4436} {"info/global_step": 4437, "train_info/time_within_train_step": 2.656773090362549, "step": 4437} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 4437} {"info/global_step": 4438, "train_info/time_within_train_step": 2.6550185680389404, "step": 4438} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 4438} {"info/global_step": 4439, "train_info/time_within_train_step": 2.6477084159851074, "step": 4439} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 4439} {"info/global_step": 4440, "train_info/time_within_train_step": 2.6461403369903564, "step": 4440} {"train_info/time_between_train_steps": 0.12527799606323242, "step": 4440} {"info/global_step": 4441, "train_info/time_within_train_step": 2.6463465690612793, "step": 4441} {"train_info/time_between_train_steps": 0.0032951831817626953, "step": 4441} {"info/global_step": 4442, "train_info/time_within_train_step": 2.647383213043213, "step": 4442} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 4442} {"info/global_step": 4443, "train_info/time_within_train_step": 2.6603751182556152, "step": 4443} {"train_info/time_between_train_steps": 0.003355741500854492, "step": 4443} {"info/global_step": 4444, "train_info/time_within_train_step": 2.671649932861328, "step": 4444} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 4444} {"info/global_step": 4445, "train_info/time_within_train_step": 2.685931444168091, "step": 4445} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 4445} {"info/global_step": 4446, "train_info/time_within_train_step": 2.6514976024627686, "step": 4446} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 4446} {"info/global_step": 4447, "train_info/time_within_train_step": 2.6866607666015625, "step": 4447} {"train_info/time_between_train_steps": 0.00328826904296875, "step": 4447} {"info/global_step": 4448, "train_info/time_within_train_step": 2.6437902450561523, "step": 4448} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 4448} {"info/global_step": 4449, "train_info/time_within_train_step": 2.6495702266693115, "step": 4449} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 4449} {"info/global_step": 4450, "train_info/time_within_train_step": 2.6633925437927246, "step": 4450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746909935, "_runtime": 12533}, "step": 4450} {"logs": {"train/loss": 3.7229, "train/learning_rate": 0.00037, "train/epoch": 5.01, "_timestamp": 1746909935, "_runtime": 12533}, "step": 4450} {"train_info/time_between_train_steps": 0.024931669235229492, "step": 4450} {"info/global_step": 4451, "train_info/time_within_train_step": 2.6628994941711426, "step": 4451} {"train_info/time_between_train_steps": 0.0033457279205322266, "step": 4451} {"info/global_step": 4452, "train_info/time_within_train_step": 2.657449960708618, "step": 4452} {"train_info/time_between_train_steps": 0.003305196762084961, "step": 4452} {"info/global_step": 4453, "train_info/time_within_train_step": 2.6519718170166016, "step": 4453} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 4453} {"info/global_step": 4454, "train_info/time_within_train_step": 2.6573097705841064, "step": 4454} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 4454} {"info/global_step": 4455, "train_info/time_within_train_step": 2.661461591720581, "step": 4455} {"train_info/time_between_train_steps": 0.0032775402069091797, "step": 4455} {"info/global_step": 4456, "train_info/time_within_train_step": 2.6781423091888428, "step": 4456} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 4456} {"info/global_step": 4457, "train_info/time_within_train_step": 2.7299952507019043, "step": 4457} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 4457} {"info/global_step": 4458, "train_info/time_within_train_step": 2.666853904724121, "step": 4458} {"train_info/time_between_train_steps": 0.003368377685546875, "step": 4458} {"info/global_step": 4459, "train_info/time_within_train_step": 2.6459078788757324, "step": 4459} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 4459} {"info/global_step": 4460, "train_info/time_within_train_step": 2.644852638244629, "step": 4460} {"train_info/time_between_train_steps": 0.003472566604614258, "step": 4460} {"info/global_step": 4461, "train_info/time_within_train_step": 2.655576705932617, "step": 4461} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 4461} {"info/global_step": 4462, "train_info/time_within_train_step": 2.652984857559204, "step": 4462} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 4462} {"info/global_step": 4463, "train_info/time_within_train_step": 2.6447784900665283, "step": 4463} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 4463} {"info/global_step": 4464, "train_info/time_within_train_step": 2.650700569152832, "step": 4464} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 4464} {"info/global_step": 4465, "train_info/time_within_train_step": 2.6592648029327393, "step": 4465} {"train_info/time_between_train_steps": 0.003306865692138672, "step": 4465} {"info/global_step": 4466, "train_info/time_within_train_step": 2.6672253608703613, "step": 4466} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 4466} {"info/global_step": 4467, "train_info/time_within_train_step": 2.693394899368286, "step": 4467} {"train_info/time_between_train_steps": 0.0032935142517089844, "step": 4467} {"info/global_step": 4468, "train_info/time_within_train_step": 2.6499059200286865, "step": 4468} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 4468} {"info/global_step": 4469, "train_info/time_within_train_step": 2.891632318496704, "step": 4469} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 4469} {"info/global_step": 4470, "train_info/time_within_train_step": 2.69474720954895, "step": 4470} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 4470} {"info/global_step": 4471, "train_info/time_within_train_step": 2.6664347648620605, "step": 4471} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 4471} {"info/global_step": 4472, "train_info/time_within_train_step": 2.6617887020111084, "step": 4472} {"train_info/time_between_train_steps": 0.003249645233154297, "step": 4472} {"info/global_step": 4473, "train_info/time_within_train_step": 2.6415321826934814, "step": 4473} {"train_info/time_between_train_steps": 0.0034055709838867188, "step": 4473} {"info/global_step": 4474, "train_info/time_within_train_step": 2.6551835536956787, "step": 4474} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 4474} {"info/global_step": 4475, "train_info/time_within_train_step": 2.6805665493011475, "step": 4475} {"train_info/time_between_train_steps": 0.003247976303100586, "step": 4475} {"info/global_step": 4476, "train_info/time_within_train_step": 2.646794319152832, "step": 4476} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 4476} {"info/global_step": 4477, "train_info/time_within_train_step": 2.6442105770111084, "step": 4477} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 4477} {"info/global_step": 4478, "train_info/time_within_train_step": 2.648939847946167, "step": 4478} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 4478} {"info/global_step": 4479, "train_info/time_within_train_step": 2.673835277557373, "step": 4479} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 4479} {"info/global_step": 4480, "train_info/time_within_train_step": 2.667881488800049, "step": 4480} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 4480} {"info/global_step": 4481, "train_info/time_within_train_step": 2.6630778312683105, "step": 4481} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 4481} {"info/global_step": 4482, "train_info/time_within_train_step": 2.6814095973968506, "step": 4482} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 4482} {"info/global_step": 4483, "train_info/time_within_train_step": 2.6426384449005127, "step": 4483} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 4483} {"info/global_step": 4484, "train_info/time_within_train_step": 2.644012212753296, "step": 4484} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 4484} {"info/global_step": 4485, "train_info/time_within_train_step": 2.6447489261627197, "step": 4485} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 4485} {"info/global_step": 4486, "train_info/time_within_train_step": 2.658341407775879, "step": 4486} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 4486} {"info/global_step": 4487, "train_info/time_within_train_step": 2.6618127822875977, "step": 4487} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 4487} {"info/global_step": 4488, "train_info/time_within_train_step": 2.67667293548584, "step": 4488} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 4488} {"info/global_step": 4489, "train_info/time_within_train_step": 2.6675758361816406, "step": 4489} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 4489} {"info/global_step": 4490, "train_info/time_within_train_step": 2.6980388164520264, "step": 4490} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 4490} {"info/global_step": 4491, "train_info/time_within_train_step": 2.6422150135040283, "step": 4491} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 4491} {"info/global_step": 4492, "train_info/time_within_train_step": 2.6421401500701904, "step": 4492} {"train_info/time_between_train_steps": 0.0032701492309570312, "step": 4492} {"info/global_step": 4493, "train_info/time_within_train_step": 2.663468599319458, "step": 4493} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 4493} {"info/global_step": 4494, "train_info/time_within_train_step": 2.647578239440918, "step": 4494} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 4494} {"info/global_step": 4495, "train_info/time_within_train_step": 2.6448187828063965, "step": 4495} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 4495} {"info/global_step": 4496, "train_info/time_within_train_step": 2.6638498306274414, "step": 4496} {"train_info/time_between_train_steps": 0.003647327423095703, "step": 4496} {"info/global_step": 4497, "train_info/time_within_train_step": 2.652602195739746, "step": 4497} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 4497} {"info/global_step": 4498, "train_info/time_within_train_step": 2.6602702140808105, "step": 4498} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 4498} {"info/global_step": 4499, "train_info/time_within_train_step": 3.276209831237793, "step": 4499} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 4499} {"info/global_step": 4500, "train_info/time_within_train_step": 2.646401882171631, "step": 4500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746910070, "_runtime": 12668}, "step": 4500} {"logs": {"train/loss": 3.7126, "train/learning_rate": 0.00036666666666666667, "train/epoch": 5.02, "_timestamp": 1746910070, "_runtime": 12668}, "step": 4500} {"train_info/time_between_train_steps": 0.024684667587280273, "step": 4500} {"info/global_step": 4501, "train_info/time_within_train_step": 2.64734148979187, "step": 4501} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 4501} {"info/global_step": 4502, "train_info/time_within_train_step": 2.6497385501861572, "step": 4502} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 4502} {"info/global_step": 4503, "train_info/time_within_train_step": 2.790097951889038, "step": 4503} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 4503} {"info/global_step": 4504, "train_info/time_within_train_step": 2.6427161693573, "step": 4504} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 4504} {"info/global_step": 4505, "train_info/time_within_train_step": 2.646301746368408, "step": 4505} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 4505} {"info/global_step": 4506, "train_info/time_within_train_step": 2.650857448577881, "step": 4506} {"train_info/time_between_train_steps": 0.003277301788330078, "step": 4506} {"info/global_step": 4507, "train_info/time_within_train_step": 2.6521220207214355, "step": 4507} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 4507} {"info/global_step": 4508, "train_info/time_within_train_step": 2.661093235015869, "step": 4508} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 4508} {"info/global_step": 4509, "train_info/time_within_train_step": 2.681581974029541, "step": 4509} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 4509} {"info/global_step": 4510, "train_info/time_within_train_step": 2.7277302742004395, "step": 4510} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 4510} {"info/global_step": 4511, "train_info/time_within_train_step": 2.6480305194854736, "step": 4511} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 4511} {"info/global_step": 4512, "train_info/time_within_train_step": 2.6421451568603516, "step": 4512} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 4512} {"info/global_step": 4513, "train_info/time_within_train_step": 2.6606688499450684, "step": 4513} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 4513} {"info/global_step": 4514, "train_info/time_within_train_step": 2.648197650909424, "step": 4514} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 4514} {"info/global_step": 4515, "train_info/time_within_train_step": 2.6441681385040283, "step": 4515} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 4515} {"info/global_step": 4516, "train_info/time_within_train_step": 2.6521499156951904, "step": 4516} {"train_info/time_between_train_steps": 0.003269195556640625, "step": 4516} {"info/global_step": 4517, "train_info/time_within_train_step": 2.644002676010132, "step": 4517} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 4517} {"info/global_step": 4518, "train_info/time_within_train_step": 2.6680426597595215, "step": 4518} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 4518} {"info/global_step": 4519, "train_info/time_within_train_step": 2.7114295959472656, "step": 4519} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 4519} {"info/global_step": 4520, "train_info/time_within_train_step": 2.6493492126464844, "step": 4520} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 4520} {"info/global_step": 4521, "train_info/time_within_train_step": 2.662712574005127, "step": 4521} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 4521} {"info/global_step": 4522, "train_info/time_within_train_step": 2.641801595687866, "step": 4522} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 4522} {"info/global_step": 4523, "train_info/time_within_train_step": 2.6488983631134033, "step": 4523} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 4523} {"info/global_step": 4524, "train_info/time_within_train_step": 2.6629436016082764, "step": 4524} {"train_info/time_between_train_steps": 0.003246307373046875, "step": 4524} {"info/global_step": 4525, "train_info/time_within_train_step": 2.6434473991394043, "step": 4525} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 4525} {"info/global_step": 4526, "train_info/time_within_train_step": 2.6883902549743652, "step": 4526} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 4526} {"info/global_step": 4527, "train_info/time_within_train_step": 2.642544984817505, "step": 4527} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 4527} {"info/global_step": 4528, "train_info/time_within_train_step": 2.8975207805633545, "step": 4528} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 4528} {"info/global_step": 4529, "train_info/time_within_train_step": 2.6550848484039307, "step": 4529} {"train_info/time_between_train_steps": 0.0032389163970947266, "step": 4529} {"info/global_step": 4530, "train_info/time_within_train_step": 2.6736390590667725, "step": 4530} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 4530} {"info/global_step": 4531, "train_info/time_within_train_step": 2.6424336433410645, "step": 4531} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 4531} {"info/global_step": 4532, "train_info/time_within_train_step": 2.6444294452667236, "step": 4532} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 4532} {"info/global_step": 4533, "train_info/time_within_train_step": 2.667052984237671, "step": 4533} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 4533} {"info/global_step": 4534, "train_info/time_within_train_step": 2.647555351257324, "step": 4534} {"train_info/time_between_train_steps": 0.0032699108123779297, "step": 4534} {"info/global_step": 4535, "train_info/time_within_train_step": 2.6438791751861572, "step": 4535} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 4535} {"info/global_step": 4536, "train_info/time_within_train_step": 2.663123607635498, "step": 4536} {"train_info/time_between_train_steps": 0.003249645233154297, "step": 4536} {"info/global_step": 4537, "train_info/time_within_train_step": 2.661860942840576, "step": 4537} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 4537} {"info/global_step": 4538, "train_info/time_within_train_step": 2.673363447189331, "step": 4538} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 4538} {"info/global_step": 4539, "train_info/time_within_train_step": 2.6722729206085205, "step": 4539} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 4539} {"info/global_step": 4540, "train_info/time_within_train_step": 2.690068483352661, "step": 4540} {"train_info/time_between_train_steps": 0.0034949779510498047, "step": 4540} {"info/global_step": 4541, "train_info/time_within_train_step": 2.640761375427246, "step": 4541} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 4541} {"info/global_step": 4542, "train_info/time_within_train_step": 2.642345666885376, "step": 4542} {"train_info/time_between_train_steps": 0.003246784210205078, "step": 4542} {"info/global_step": 4543, "train_info/time_within_train_step": 2.664340019226074, "step": 4543} {"train_info/time_between_train_steps": 0.003387451171875, "step": 4543} {"info/global_step": 4544, "train_info/time_within_train_step": 2.6496644020080566, "step": 4544} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 4544} {"info/global_step": 4545, "train_info/time_within_train_step": 2.643023729324341, "step": 4545} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 4545} {"info/global_step": 4546, "train_info/time_within_train_step": 2.657611846923828, "step": 4546} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 4546} {"info/global_step": 4547, "train_info/time_within_train_step": 2.6510324478149414, "step": 4547} {"train_info/time_between_train_steps": 0.003270864486694336, "step": 4547} {"info/global_step": 4548, "train_info/time_within_train_step": 2.642333507537842, "step": 4548} {"train_info/time_between_train_steps": 0.0032944679260253906, "step": 4548} {"info/global_step": 4549, "train_info/time_within_train_step": 2.644766092300415, "step": 4549} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 4549} {"info/global_step": 4550, "train_info/time_within_train_step": 2.6544694900512695, "step": 4550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746910204, "_runtime": 12802}, "step": 4550} {"logs": {"train/loss": 3.6942, "train/learning_rate": 0.0003633333333333333, "train/epoch": 5.02, "_timestamp": 1746910204, "_runtime": 12802}, "step": 4550} {"train_info/time_between_train_steps": 0.024513721466064453, "step": 4550} {"info/global_step": 4551, "train_info/time_within_train_step": 2.6493773460388184, "step": 4551} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 4551} {"info/global_step": 4552, "train_info/time_within_train_step": 2.647723913192749, "step": 4552} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 4552} {"info/global_step": 4553, "train_info/time_within_train_step": 2.6467063426971436, "step": 4553} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 4553} {"info/global_step": 4554, "train_info/time_within_train_step": 2.6633455753326416, "step": 4554} {"train_info/time_between_train_steps": 0.0032296180725097656, "step": 4554} {"info/global_step": 4555, "train_info/time_within_train_step": 2.6675968170166016, "step": 4555} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 4555} {"info/global_step": 4556, "train_info/time_within_train_step": 2.701218605041504, "step": 4556} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 4556} {"info/global_step": 4557, "train_info/time_within_train_step": 2.643306016921997, "step": 4557} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 4557} {"info/global_step": 4558, "train_info/time_within_train_step": 2.650418281555176, "step": 4558} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 4558} {"info/global_step": 4559, "train_info/time_within_train_step": 2.6512014865875244, "step": 4559} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 4559} {"info/global_step": 4560, "train_info/time_within_train_step": 2.6471495628356934, "step": 4560} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 4560} {"info/global_step": 4561, "train_info/time_within_train_step": 2.6578288078308105, "step": 4561} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 4561} {"info/global_step": 4562, "train_info/time_within_train_step": 2.6444523334503174, "step": 4562} {"train_info/time_between_train_steps": 0.0032634735107421875, "step": 4562} {"info/global_step": 4563, "train_info/time_within_train_step": 2.6449007987976074, "step": 4563} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 4563} {"info/global_step": 4564, "train_info/time_within_train_step": 2.673654317855835, "step": 4564} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 4564} {"info/global_step": 4565, "train_info/time_within_train_step": 2.667193651199341, "step": 4565} {"train_info/time_between_train_steps": 0.12725067138671875, "step": 4565} {"info/global_step": 4566, "train_info/time_within_train_step": 2.6728405952453613, "step": 4566} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 4566} {"info/global_step": 4567, "train_info/time_within_train_step": 2.666565179824829, "step": 4567} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 4567} {"info/global_step": 4568, "train_info/time_within_train_step": 2.6630795001983643, "step": 4568} {"train_info/time_between_train_steps": 0.0032553672790527344, "step": 4568} {"info/global_step": 4569, "train_info/time_within_train_step": 2.677633285522461, "step": 4569} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 4569} {"info/global_step": 4570, "train_info/time_within_train_step": 2.6443405151367188, "step": 4570} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 4570} {"info/global_step": 4571, "train_info/time_within_train_step": 2.654496192932129, "step": 4571} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 4571} {"info/global_step": 4572, "train_info/time_within_train_step": 2.904885768890381, "step": 4572} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 4572} {"info/global_step": 4573, "train_info/time_within_train_step": 2.692578077316284, "step": 4573} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 4573} {"info/global_step": 4574, "train_info/time_within_train_step": 2.6427745819091797, "step": 4574} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 4574} {"info/global_step": 4575, "train_info/time_within_train_step": 2.6558284759521484, "step": 4575} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 4575} {"info/global_step": 4576, "train_info/time_within_train_step": 2.6593217849731445, "step": 4576} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 4576} {"info/global_step": 4577, "train_info/time_within_train_step": 2.645111560821533, "step": 4577} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 4577} {"info/global_step": 4578, "train_info/time_within_train_step": 2.64487624168396, "step": 4578} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 4578} {"info/global_step": 4579, "train_info/time_within_train_step": 2.660029411315918, "step": 4579} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 4579} {"info/global_step": 4580, "train_info/time_within_train_step": 2.6697559356689453, "step": 4580} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 4580} {"info/global_step": 4581, "train_info/time_within_train_step": 2.678506851196289, "step": 4581} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 4581} {"info/global_step": 4582, "train_info/time_within_train_step": 2.6700010299682617, "step": 4582} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 4582} {"info/global_step": 4583, "train_info/time_within_train_step": 2.7179269790649414, "step": 4583} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 4583} {"info/global_step": 4584, "train_info/time_within_train_step": 2.6676342487335205, "step": 4584} {"train_info/time_between_train_steps": 0.003258943557739258, "step": 4584} {"info/global_step": 4585, "train_info/time_within_train_step": 2.6585984230041504, "step": 4585} {"train_info/time_between_train_steps": 0.003266572952270508, "step": 4585} {"info/global_step": 4586, "train_info/time_within_train_step": 2.6585946083068848, "step": 4586} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 4586} {"info/global_step": 4587, "train_info/time_within_train_step": 2.663921356201172, "step": 4587} {"train_info/time_between_train_steps": 0.0033681392669677734, "step": 4587} {"info/global_step": 4588, "train_info/time_within_train_step": 2.7003655433654785, "step": 4588} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 4588} {"info/global_step": 4589, "train_info/time_within_train_step": 2.722935914993286, "step": 4589} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 4589} {"info/global_step": 4590, "train_info/time_within_train_step": 2.646449565887451, "step": 4590} {"train_info/time_between_train_steps": 0.003277301788330078, "step": 4590} {"info/global_step": 4591, "train_info/time_within_train_step": 2.6468236446380615, "step": 4591} {"train_info/time_between_train_steps": 0.003270864486694336, "step": 4591} {"info/global_step": 4592, "train_info/time_within_train_step": 2.6637916564941406, "step": 4592} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 4592} {"info/global_step": 4593, "train_info/time_within_train_step": 2.6492068767547607, "step": 4593} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 4593} {"info/global_step": 4594, "train_info/time_within_train_step": 2.649217128753662, "step": 4594} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 4594} {"info/global_step": 4595, "train_info/time_within_train_step": 2.6485114097595215, "step": 4595} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 4595} {"info/global_step": 4596, "train_info/time_within_train_step": 2.6445415019989014, "step": 4596} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 4596} {"info/global_step": 4597, "train_info/time_within_train_step": 2.669853925704956, "step": 4597} {"train_info/time_between_train_steps": 0.0032944679260253906, "step": 4597} {"info/global_step": 4598, "train_info/time_within_train_step": 2.684058666229248, "step": 4598} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 4598} {"info/global_step": 4599, "train_info/time_within_train_step": 2.687251329421997, "step": 4599} {"train_info/time_between_train_steps": 0.003299236297607422, "step": 4599} {"info/global_step": 4600, "train_info/time_within_train_step": 2.6532480716705322, "step": 4600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746910339, "_runtime": 12937}, "step": 4600} {"logs": {"train/loss": 3.6889, "train/learning_rate": 0.00035999999999999997, "train/epoch": 5.03, "_timestamp": 1746910339, "_runtime": 12937}, "step": 4600} {"train_info/time_between_train_steps": 24.303050756454468, "step": 4600} {"info/global_step": 4601, "train_info/time_within_train_step": 2.4408085346221924, "step": 4601} {"train_info/time_between_train_steps": 0.003357410430908203, "step": 4601} {"info/global_step": 4602, "train_info/time_within_train_step": 2.420776128768921, "step": 4602} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 4602} {"info/global_step": 4603, "train_info/time_within_train_step": 2.5259809494018555, "step": 4603} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 4603} {"info/global_step": 4604, "train_info/time_within_train_step": 2.6870102882385254, "step": 4604} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 4604} {"info/global_step": 4605, "train_info/time_within_train_step": 2.658992290496826, "step": 4605} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 4605} {"info/global_step": 4606, "train_info/time_within_train_step": 2.6466941833496094, "step": 4606} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 4606} {"info/global_step": 4607, "train_info/time_within_train_step": 2.6535964012145996, "step": 4607} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 4607} {"info/global_step": 4608, "train_info/time_within_train_step": 2.6495583057403564, "step": 4608} {"train_info/time_between_train_steps": 0.0033080577850341797, "step": 4608} {"info/global_step": 4609, "train_info/time_within_train_step": 2.668942928314209, "step": 4609} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 4609} {"info/global_step": 4610, "train_info/time_within_train_step": 2.7032899856567383, "step": 4610} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 4610} {"info/global_step": 4611, "train_info/time_within_train_step": 2.6531641483306885, "step": 4611} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 4611} {"info/global_step": 4612, "train_info/time_within_train_step": 2.6781883239746094, "step": 4612} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 4612} {"info/global_step": 4613, "train_info/time_within_train_step": 2.6578240394592285, "step": 4613} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 4613} {"info/global_step": 4614, "train_info/time_within_train_step": 2.649667263031006, "step": 4614} {"train_info/time_between_train_steps": 0.0033254623413085938, "step": 4614} {"info/global_step": 4615, "train_info/time_within_train_step": 2.6459250450134277, "step": 4615} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 4615} {"info/global_step": 4616, "train_info/time_within_train_step": 2.6576879024505615, "step": 4616} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 4616} {"info/global_step": 4617, "train_info/time_within_train_step": 2.6720550060272217, "step": 4617} {"train_info/time_between_train_steps": 0.0032944679260253906, "step": 4617} {"info/global_step": 4618, "train_info/time_within_train_step": 2.6848838329315186, "step": 4618} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 4618} {"info/global_step": 4619, "train_info/time_within_train_step": 2.6519148349761963, "step": 4619} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 4619} {"info/global_step": 4620, "train_info/time_within_train_step": 2.683544158935547, "step": 4620} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 4620} {"info/global_step": 4621, "train_info/time_within_train_step": 2.643533945083618, "step": 4621} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 4621} {"info/global_step": 4622, "train_info/time_within_train_step": 2.648897409439087, "step": 4622} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 4622} {"info/global_step": 4623, "train_info/time_within_train_step": 2.6627612113952637, "step": 4623} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 4623} {"info/global_step": 4624, "train_info/time_within_train_step": 2.6505565643310547, "step": 4624} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 4624} {"info/global_step": 4625, "train_info/time_within_train_step": 2.645948648452759, "step": 4625} {"train_info/time_between_train_steps": 0.0034749507904052734, "step": 4625} {"info/global_step": 4626, "train_info/time_within_train_step": 2.669724464416504, "step": 4626} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 4626} {"info/global_step": 4627, "train_info/time_within_train_step": 2.658686637878418, "step": 4627} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 4627} {"info/global_step": 4628, "train_info/time_within_train_step": 2.798691749572754, "step": 4628} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 4628} {"info/global_step": 4629, "train_info/time_within_train_step": 2.6426498889923096, "step": 4629} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 4629} {"info/global_step": 4630, "train_info/time_within_train_step": 2.895155906677246, "step": 4630} {"train_info/time_between_train_steps": 0.0033926963806152344, "step": 4630} {"info/global_step": 4631, "train_info/time_within_train_step": 2.6807031631469727, "step": 4631} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 4631} {"info/global_step": 4632, "train_info/time_within_train_step": 2.6703312397003174, "step": 4632} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 4632} {"info/global_step": 4633, "train_info/time_within_train_step": 2.644989252090454, "step": 4633} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 4633} {"info/global_step": 4634, "train_info/time_within_train_step": 2.644512891769409, "step": 4634} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 4634} {"info/global_step": 4635, "train_info/time_within_train_step": 2.657545328140259, "step": 4635} {"train_info/time_between_train_steps": 0.003615140914916992, "step": 4635} {"info/global_step": 4636, "train_info/time_within_train_step": 2.6553568840026855, "step": 4636} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 4636} {"info/global_step": 4637, "train_info/time_within_train_step": 2.646009922027588, "step": 4637} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 4637} {"info/global_step": 4638, "train_info/time_within_train_step": 2.6615891456604004, "step": 4638} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 4638} {"info/global_step": 4639, "train_info/time_within_train_step": 2.6547722816467285, "step": 4639} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 4639} {"info/global_step": 4640, "train_info/time_within_train_step": 2.6609647274017334, "step": 4640} {"train_info/time_between_train_steps": 0.003446817398071289, "step": 4640} {"info/global_step": 4641, "train_info/time_within_train_step": 2.718472957611084, "step": 4641} {"train_info/time_between_train_steps": 0.0035648345947265625, "step": 4641} {"info/global_step": 4642, "train_info/time_within_train_step": 2.6964242458343506, "step": 4642} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 4642} {"info/global_step": 4643, "train_info/time_within_train_step": 2.643763542175293, "step": 4643} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 4643} {"info/global_step": 4644, "train_info/time_within_train_step": 2.6435561180114746, "step": 4644} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 4644} {"info/global_step": 4645, "train_info/time_within_train_step": 2.6587986946105957, "step": 4645} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 4645} {"info/global_step": 4646, "train_info/time_within_train_step": 2.6544482707977295, "step": 4646} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 4646} {"info/global_step": 4647, "train_info/time_within_train_step": 2.6462795734405518, "step": 4647} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 4647} {"info/global_step": 4648, "train_info/time_within_train_step": 2.6547443866729736, "step": 4648} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 4648} {"info/global_step": 4649, "train_info/time_within_train_step": 2.650437831878662, "step": 4649} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 4649} {"info/global_step": 4650, "train_info/time_within_train_step": 2.6702072620391846, "step": 4650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746910497, "_runtime": 13095}, "step": 4650} {"logs": {"train/loss": 3.6846, "train/learning_rate": 0.00035666666666666664, "train/epoch": 5.03, "_timestamp": 1746910497, "_runtime": 13095}, "step": 4650} {"train_info/time_between_train_steps": 0.024682044982910156, "step": 4650} {"info/global_step": 4651, "train_info/time_within_train_step": 2.674581527709961, "step": 4651} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 4651} {"info/global_step": 4652, "train_info/time_within_train_step": 2.689964532852173, "step": 4652} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 4652} {"info/global_step": 4653, "train_info/time_within_train_step": 2.653050661087036, "step": 4653} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 4653} {"info/global_step": 4654, "train_info/time_within_train_step": 2.6420669555664062, "step": 4654} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 4654} {"info/global_step": 4655, "train_info/time_within_train_step": 2.6552066802978516, "step": 4655} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 4655} {"info/global_step": 4656, "train_info/time_within_train_step": 2.6609280109405518, "step": 4656} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 4656} {"info/global_step": 4657, "train_info/time_within_train_step": 2.645176410675049, "step": 4657} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 4657} {"info/global_step": 4658, "train_info/time_within_train_step": 2.644625663757324, "step": 4658} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 4658} {"info/global_step": 4659, "train_info/time_within_train_step": 2.6673812866210938, "step": 4659} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 4659} {"info/global_step": 4660, "train_info/time_within_train_step": 2.663944721221924, "step": 4660} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 4660} {"info/global_step": 4661, "train_info/time_within_train_step": 2.6811165809631348, "step": 4661} {"train_info/time_between_train_steps": 0.003269195556640625, "step": 4661} {"info/global_step": 4662, "train_info/time_within_train_step": 2.6658103466033936, "step": 4662} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 4662} {"info/global_step": 4663, "train_info/time_within_train_step": 2.6523802280426025, "step": 4663} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 4663} {"info/global_step": 4664, "train_info/time_within_train_step": 2.65455961227417, "step": 4664} {"train_info/time_between_train_steps": 0.0032570362091064453, "step": 4664} {"info/global_step": 4665, "train_info/time_within_train_step": 2.6521029472351074, "step": 4665} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 4665} {"info/global_step": 4666, "train_info/time_within_train_step": 2.646888494491577, "step": 4666} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 4666} {"info/global_step": 4667, "train_info/time_within_train_step": 2.6821584701538086, "step": 4667} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 4667} {"info/global_step": 4668, "train_info/time_within_train_step": 2.644118547439575, "step": 4668} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 4668} {"info/global_step": 4669, "train_info/time_within_train_step": 2.665372133255005, "step": 4669} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 4669} {"info/global_step": 4670, "train_info/time_within_train_step": 2.6576855182647705, "step": 4670} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 4670} {"info/global_step": 4671, "train_info/time_within_train_step": 2.6614091396331787, "step": 4671} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 4671} {"info/global_step": 4672, "train_info/time_within_train_step": 2.696765661239624, "step": 4672} {"train_info/time_between_train_steps": 0.003231048583984375, "step": 4672} {"info/global_step": 4673, "train_info/time_within_train_step": 2.6586594581604004, "step": 4673} {"train_info/time_between_train_steps": 0.0032646656036376953, "step": 4673} {"info/global_step": 4674, "train_info/time_within_train_step": 2.649325370788574, "step": 4674} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 4674} {"info/global_step": 4675, "train_info/time_within_train_step": 2.6468982696533203, "step": 4675} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 4675} {"info/global_step": 4676, "train_info/time_within_train_step": 2.6506991386413574, "step": 4676} {"train_info/time_between_train_steps": 0.003259420394897461, "step": 4676} {"info/global_step": 4677, "train_info/time_within_train_step": 2.661370038986206, "step": 4677} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 4677} {"info/global_step": 4678, "train_info/time_within_train_step": 2.6499056816101074, "step": 4678} {"train_info/time_between_train_steps": 0.0032558441162109375, "step": 4678} {"info/global_step": 4679, "train_info/time_within_train_step": 2.669002056121826, "step": 4679} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 4679} {"info/global_step": 4680, "train_info/time_within_train_step": 2.727748155593872, "step": 4680} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 4680} {"info/global_step": 4681, "train_info/time_within_train_step": 2.669004440307617, "step": 4681} {"train_info/time_between_train_steps": 0.003263235092163086, "step": 4681} {"info/global_step": 4682, "train_info/time_within_train_step": 2.642573356628418, "step": 4682} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 4682} {"info/global_step": 4683, "train_info/time_within_train_step": 2.646176338195801, "step": 4683} {"train_info/time_between_train_steps": 0.0033071041107177734, "step": 4683} {"info/global_step": 4684, "train_info/time_within_train_step": 2.6577467918395996, "step": 4684} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 4684} {"info/global_step": 4685, "train_info/time_within_train_step": 2.654669761657715, "step": 4685} {"train_info/time_between_train_steps": 0.0032460689544677734, "step": 4685} {"info/global_step": 4686, "train_info/time_within_train_step": 2.6450722217559814, "step": 4686} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 4686} {"info/global_step": 4687, "train_info/time_within_train_step": 2.648346185684204, "step": 4687} {"train_info/time_between_train_steps": 0.0032758712768554688, "step": 4687} {"info/global_step": 4688, "train_info/time_within_train_step": 2.661565065383911, "step": 4688} {"train_info/time_between_train_steps": 0.0032880306243896484, "step": 4688} {"info/global_step": 4689, "train_info/time_within_train_step": 2.667471170425415, "step": 4689} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 4689} {"info/global_step": 4690, "train_info/time_within_train_step": 2.7002031803131104, "step": 4690} {"train_info/time_between_train_steps": 0.1289067268371582, "step": 4690} {"info/global_step": 4691, "train_info/time_within_train_step": 2.67215633392334, "step": 4691} {"train_info/time_between_train_steps": 0.003297090530395508, "step": 4691} {"info/global_step": 4692, "train_info/time_within_train_step": 2.687762975692749, "step": 4692} {"train_info/time_between_train_steps": 0.003255605697631836, "step": 4692} {"info/global_step": 4693, "train_info/time_within_train_step": 2.6523549556732178, "step": 4693} {"train_info/time_between_train_steps": 0.003204345703125, "step": 4693} {"info/global_step": 4694, "train_info/time_within_train_step": 2.641308546066284, "step": 4694} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 4694} {"info/global_step": 4695, "train_info/time_within_train_step": 2.660071849822998, "step": 4695} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 4695} {"info/global_step": 4696, "train_info/time_within_train_step": 2.6541473865509033, "step": 4696} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 4696} {"info/global_step": 4697, "train_info/time_within_train_step": 2.64449405670166, "step": 4697} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 4697} {"info/global_step": 4698, "train_info/time_within_train_step": 2.645052194595337, "step": 4698} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 4698} {"info/global_step": 4699, "train_info/time_within_train_step": 2.6547393798828125, "step": 4699} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 4699} {"info/global_step": 4700, "train_info/time_within_train_step": 2.6717612743377686, "step": 4700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746910632, "_runtime": 13230}, "step": 4700} {"logs": {"train/loss": 3.6631, "train/learning_rate": 0.0003533333333333333, "train/epoch": 5.04, "_timestamp": 1746910632, "_runtime": 13230}, "step": 4700} {"train_info/time_between_train_steps": 0.04967045783996582, "step": 4700} {"info/global_step": 4701, "train_info/time_within_train_step": 2.6684212684631348, "step": 4701} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 4701} {"info/global_step": 4702, "train_info/time_within_train_step": 2.694775342941284, "step": 4702} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 4702} {"info/global_step": 4703, "train_info/time_within_train_step": 2.65338397026062, "step": 4703} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 4703} {"info/global_step": 4704, "train_info/time_within_train_step": 2.674039125442505, "step": 4704} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 4704} {"info/global_step": 4705, "train_info/time_within_train_step": 2.661707639694214, "step": 4705} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 4705} {"info/global_step": 4706, "train_info/time_within_train_step": 2.650634288787842, "step": 4706} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 4706} {"info/global_step": 4707, "train_info/time_within_train_step": 2.647374153137207, "step": 4707} {"train_info/time_between_train_steps": 0.003275156021118164, "step": 4707} {"info/global_step": 4708, "train_info/time_within_train_step": 2.649942398071289, "step": 4708} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 4708} {"info/global_step": 4709, "train_info/time_within_train_step": 2.651179075241089, "step": 4709} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 4709} {"info/global_step": 4710, "train_info/time_within_train_step": 2.646547317504883, "step": 4710} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 4710} {"info/global_step": 4711, "train_info/time_within_train_step": 2.655804395675659, "step": 4711} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 4711} {"info/global_step": 4712, "train_info/time_within_train_step": 2.6728832721710205, "step": 4712} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 4712} {"info/global_step": 4713, "train_info/time_within_train_step": 2.67939829826355, "step": 4713} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 4713} {"info/global_step": 4714, "train_info/time_within_train_step": 2.7315895557403564, "step": 4714} {"train_info/time_between_train_steps": 0.003671884536743164, "step": 4714} {"info/global_step": 4715, "train_info/time_within_train_step": 2.660405397415161, "step": 4715} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 4715} {"info/global_step": 4716, "train_info/time_within_train_step": 2.642524003982544, "step": 4716} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 4716} {"info/global_step": 4717, "train_info/time_within_train_step": 2.654561758041382, "step": 4717} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 4717} {"info/global_step": 4718, "train_info/time_within_train_step": 2.648139715194702, "step": 4718} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 4718} {"info/global_step": 4719, "train_info/time_within_train_step": 2.650576591491699, "step": 4719} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 4719} {"info/global_step": 4720, "train_info/time_within_train_step": 2.646742582321167, "step": 4720} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 4720} {"info/global_step": 4721, "train_info/time_within_train_step": 2.643378734588623, "step": 4721} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 4721} {"info/global_step": 4722, "train_info/time_within_train_step": 2.6684165000915527, "step": 4722} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 4722} {"info/global_step": 4723, "train_info/time_within_train_step": 2.664095640182495, "step": 4723} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 4723} {"info/global_step": 4724, "train_info/time_within_train_step": 2.6489830017089844, "step": 4724} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 4724} {"info/global_step": 4725, "train_info/time_within_train_step": 2.6577203273773193, "step": 4725} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 4725} {"info/global_step": 4726, "train_info/time_within_train_step": 2.649420976638794, "step": 4726} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 4726} {"info/global_step": 4727, "train_info/time_within_train_step": 2.644489288330078, "step": 4727} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 4727} {"info/global_step": 4728, "train_info/time_within_train_step": 2.928555727005005, "step": 4728} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 4728} {"info/global_step": 4729, "train_info/time_within_train_step": 2.654938220977783, "step": 4729} {"train_info/time_between_train_steps": 0.0033435821533203125, "step": 4729} {"info/global_step": 4730, "train_info/time_within_train_step": 2.6443772315979004, "step": 4730} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 4730} {"info/global_step": 4731, "train_info/time_within_train_step": 2.6472864151000977, "step": 4731} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 4731} {"info/global_step": 4732, "train_info/time_within_train_step": 2.671816110610962, "step": 4732} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 4732} {"info/global_step": 4733, "train_info/time_within_train_step": 2.6661481857299805, "step": 4733} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 4733} {"info/global_step": 4734, "train_info/time_within_train_step": 2.695390224456787, "step": 4734} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 4734} {"info/global_step": 4735, "train_info/time_within_train_step": 2.6572515964508057, "step": 4735} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 4735} {"info/global_step": 4736, "train_info/time_within_train_step": 2.641881227493286, "step": 4736} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 4736} {"info/global_step": 4737, "train_info/time_within_train_step": 2.6557023525238037, "step": 4737} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 4737} {"info/global_step": 4738, "train_info/time_within_train_step": 2.657243013381958, "step": 4738} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 4738} {"info/global_step": 4739, "train_info/time_within_train_step": 2.6442031860351562, "step": 4739} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 4739} {"info/global_step": 4740, "train_info/time_within_train_step": 2.6623263359069824, "step": 4740} {"train_info/time_between_train_steps": 0.003255605697631836, "step": 4740} {"info/global_step": 4741, "train_info/time_within_train_step": 2.6668691635131836, "step": 4741} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 4741} {"info/global_step": 4742, "train_info/time_within_train_step": 2.66170334815979, "step": 4742} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 4742} {"info/global_step": 4743, "train_info/time_within_train_step": 2.704383373260498, "step": 4743} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 4743} {"info/global_step": 4744, "train_info/time_within_train_step": 2.641505241394043, "step": 4744} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 4744} {"info/global_step": 4745, "train_info/time_within_train_step": 2.6470258235931396, "step": 4745} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 4745} {"info/global_step": 4746, "train_info/time_within_train_step": 2.666119337081909, "step": 4746} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 4746} {"info/global_step": 4747, "train_info/time_within_train_step": 2.6476378440856934, "step": 4747} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 4747} {"info/global_step": 4748, "train_info/time_within_train_step": 2.6431338787078857, "step": 4748} {"train_info/time_between_train_steps": 0.003253459930419922, "step": 4748} {"info/global_step": 4749, "train_info/time_within_train_step": 3.243964910507202, "step": 4749} {"train_info/time_between_train_steps": 0.006720304489135742, "step": 4749} {"info/global_step": 4750, "train_info/time_within_train_step": 2.663917303085327, "step": 4750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746910767, "_runtime": 13365}, "step": 4750} {"logs": {"train/loss": 3.6689, "train/learning_rate": 0.00035, "train/epoch": 5.04, "_timestamp": 1746910767, "_runtime": 13365}, "step": 4750} {"train_info/time_between_train_steps": 0.029322385787963867, "step": 4750} {"info/global_step": 4751, "train_info/time_within_train_step": 2.6702940464019775, "step": 4751} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 4751} {"info/global_step": 4752, "train_info/time_within_train_step": 2.6708106994628906, "step": 4752} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 4752} {"info/global_step": 4753, "train_info/time_within_train_step": 2.786174774169922, "step": 4753} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 4753} {"info/global_step": 4754, "train_info/time_within_train_step": 2.674143075942993, "step": 4754} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 4754} {"info/global_step": 4755, "train_info/time_within_train_step": 2.6473217010498047, "step": 4755} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 4755} {"info/global_step": 4756, "train_info/time_within_train_step": 2.6612532138824463, "step": 4756} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 4756} {"info/global_step": 4757, "train_info/time_within_train_step": 2.6440951824188232, "step": 4757} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 4757} {"info/global_step": 4758, "train_info/time_within_train_step": 2.6445462703704834, "step": 4758} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 4758} {"info/global_step": 4759, "train_info/time_within_train_step": 2.659088611602783, "step": 4759} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 4759} {"info/global_step": 4760, "train_info/time_within_train_step": 2.6534435749053955, "step": 4760} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 4760} {"info/global_step": 4761, "train_info/time_within_train_step": 2.6599535942077637, "step": 4761} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 4761} {"info/global_step": 4762, "train_info/time_within_train_step": 2.703857421875, "step": 4762} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 4762} {"info/global_step": 4763, "train_info/time_within_train_step": 2.697862386703491, "step": 4763} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 4763} {"info/global_step": 4764, "train_info/time_within_train_step": 2.6409759521484375, "step": 4764} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 4764} {"info/global_step": 4765, "train_info/time_within_train_step": 2.6423373222351074, "step": 4765} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 4765} {"info/global_step": 4766, "train_info/time_within_train_step": 2.656526565551758, "step": 4766} {"train_info/time_between_train_steps": 0.0033905506134033203, "step": 4766} {"info/global_step": 4767, "train_info/time_within_train_step": 2.652569532394409, "step": 4767} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 4767} {"info/global_step": 4768, "train_info/time_within_train_step": 2.643465518951416, "step": 4768} {"train_info/time_between_train_steps": 0.0032575130462646484, "step": 4768} {"info/global_step": 4769, "train_info/time_within_train_step": 2.6533255577087402, "step": 4769} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 4769} {"info/global_step": 4770, "train_info/time_within_train_step": 2.6479580402374268, "step": 4770} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 4770} {"info/global_step": 4771, "train_info/time_within_train_step": 2.6691009998321533, "step": 4771} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 4771} {"info/global_step": 4772, "train_info/time_within_train_step": 2.7088377475738525, "step": 4772} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 4772} {"info/global_step": 4773, "train_info/time_within_train_step": 2.641879081726074, "step": 4773} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 4773} {"info/global_step": 4774, "train_info/time_within_train_step": 2.6537084579467773, "step": 4774} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 4774} {"info/global_step": 4775, "train_info/time_within_train_step": 2.648483991622925, "step": 4775} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 4775} {"info/global_step": 4776, "train_info/time_within_train_step": 2.647237539291382, "step": 4776} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 4776} {"info/global_step": 4777, "train_info/time_within_train_step": 2.6543197631835938, "step": 4777} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 4777} {"info/global_step": 4778, "train_info/time_within_train_step": 2.643284797668457, "step": 4778} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 4778} {"info/global_step": 4779, "train_info/time_within_train_step": 2.6651265621185303, "step": 4779} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 4779} {"info/global_step": 4780, "train_info/time_within_train_step": 2.668855667114258, "step": 4780} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 4780} {"info/global_step": 4781, "train_info/time_within_train_step": 2.6672451496124268, "step": 4781} {"train_info/time_between_train_steps": 0.0032701492309570312, "step": 4781} {"info/global_step": 4782, "train_info/time_within_train_step": 2.666692018508911, "step": 4782} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 4782} {"info/global_step": 4783, "train_info/time_within_train_step": 2.6474874019622803, "step": 4783} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 4783} {"info/global_step": 4784, "train_info/time_within_train_step": 2.647723436355591, "step": 4784} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 4784} {"info/global_step": 4785, "train_info/time_within_train_step": 2.647350788116455, "step": 4785} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 4785} {"info/global_step": 4786, "train_info/time_within_train_step": 2.663623094558716, "step": 4786} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 4786} {"info/global_step": 4787, "train_info/time_within_train_step": 2.9184746742248535, "step": 4787} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 4787} {"info/global_step": 4788, "train_info/time_within_train_step": 2.6445393562316895, "step": 4788} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 4788} {"info/global_step": 4789, "train_info/time_within_train_step": 2.654059410095215, "step": 4789} {"train_info/time_between_train_steps": 0.0035157203674316406, "step": 4789} {"info/global_step": 4790, "train_info/time_within_train_step": 2.6616315841674805, "step": 4790} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 4790} {"info/global_step": 4791, "train_info/time_within_train_step": 2.6728742122650146, "step": 4791} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 4791} {"info/global_step": 4792, "train_info/time_within_train_step": 2.6639351844787598, "step": 4792} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 4792} {"info/global_step": 4793, "train_info/time_within_train_step": 2.709390878677368, "step": 4793} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 4793} {"info/global_step": 4794, "train_info/time_within_train_step": 2.643301486968994, "step": 4794} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 4794} {"info/global_step": 4795, "train_info/time_within_train_step": 2.6487209796905518, "step": 4795} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 4795} {"info/global_step": 4796, "train_info/time_within_train_step": 2.659196138381958, "step": 4796} {"train_info/time_between_train_steps": 0.0032274723052978516, "step": 4796} {"info/global_step": 4797, "train_info/time_within_train_step": 2.642990827560425, "step": 4797} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 4797} {"info/global_step": 4798, "train_info/time_within_train_step": 2.646634817123413, "step": 4798} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 4798} {"info/global_step": 4799, "train_info/time_within_train_step": 2.649980306625366, "step": 4799} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 4799} {"info/global_step": 4800, "train_info/time_within_train_step": 2.651674270629883, "step": 4800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746910901, "_runtime": 13499}, "step": 4800} {"logs": {"train/loss": 3.6553, "train/learning_rate": 0.0003466666666666666, "train/epoch": 5.05, "_timestamp": 1746910901, "_runtime": 13499}, "step": 4800} {"train_info/time_between_train_steps": 13.474765300750732, "step": 4800} {"info/global_step": 4801, "train_info/time_within_train_step": 2.4441890716552734, "step": 4801} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 4801} {"info/global_step": 4802, "train_info/time_within_train_step": 2.4359731674194336, "step": 4802} {"train_info/time_between_train_steps": 0.0033173561096191406, "step": 4802} {"info/global_step": 4803, "train_info/time_within_train_step": 2.5940401554107666, "step": 4803} {"train_info/time_between_train_steps": 0.0034995079040527344, "step": 4803} {"info/global_step": 4804, "train_info/time_within_train_step": 2.640090227127075, "step": 4804} {"train_info/time_between_train_steps": 0.0034236907958984375, "step": 4804} {"info/global_step": 4805, "train_info/time_within_train_step": 2.6422207355499268, "step": 4805} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 4805} {"info/global_step": 4806, "train_info/time_within_train_step": 2.6484639644622803, "step": 4806} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 4806} {"info/global_step": 4807, "train_info/time_within_train_step": 2.642718553543091, "step": 4807} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 4807} {"info/global_step": 4808, "train_info/time_within_train_step": 2.6518566608428955, "step": 4808} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 4808} {"info/global_step": 4809, "train_info/time_within_train_step": 2.64074444770813, "step": 4809} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 4809} {"info/global_step": 4810, "train_info/time_within_train_step": 2.6763033866882324, "step": 4810} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 4810} {"info/global_step": 4811, "train_info/time_within_train_step": 2.669208288192749, "step": 4811} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 4811} {"info/global_step": 4812, "train_info/time_within_train_step": 2.7287681102752686, "step": 4812} {"train_info/time_between_train_steps": 0.0031366348266601562, "step": 4812} {"info/global_step": 4813, "train_info/time_within_train_step": 2.698409080505371, "step": 4813} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 4813} {"info/global_step": 4814, "train_info/time_within_train_step": 2.6431515216827393, "step": 4814} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 4814} {"info/global_step": 4815, "train_info/time_within_train_step": 2.6408307552337646, "step": 4815} {"train_info/time_between_train_steps": 0.10750079154968262, "step": 4815} {"info/global_step": 4816, "train_info/time_within_train_step": 2.6425247192382812, "step": 4816} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 4816} {"info/global_step": 4817, "train_info/time_within_train_step": 2.6581993103027344, "step": 4817} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 4817} {"info/global_step": 4818, "train_info/time_within_train_step": 2.6510183811187744, "step": 4818} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 4818} {"info/global_step": 4819, "train_info/time_within_train_step": 2.6500749588012695, "step": 4819} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 4819} {"info/global_step": 4820, "train_info/time_within_train_step": 2.6538166999816895, "step": 4820} {"train_info/time_between_train_steps": 0.003263711929321289, "step": 4820} {"info/global_step": 4821, "train_info/time_within_train_step": 2.646019697189331, "step": 4821} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 4821} {"info/global_step": 4822, "train_info/time_within_train_step": 2.6689999103546143, "step": 4822} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 4822} {"info/global_step": 4823, "train_info/time_within_train_step": 2.6728198528289795, "step": 4823} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 4823} {"info/global_step": 4824, "train_info/time_within_train_step": 2.688849449157715, "step": 4824} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 4824} {"info/global_step": 4825, "train_info/time_within_train_step": 2.6550066471099854, "step": 4825} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 4825} {"info/global_step": 4826, "train_info/time_within_train_step": 2.64436674118042, "step": 4826} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 4826} {"info/global_step": 4827, "train_info/time_within_train_step": 2.6613454818725586, "step": 4827} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 4827} {"info/global_step": 4828, "train_info/time_within_train_step": 2.6564714908599854, "step": 4828} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 4828} {"info/global_step": 4829, "train_info/time_within_train_step": 2.6613144874572754, "step": 4829} {"train_info/time_between_train_steps": 0.0038480758666992188, "step": 4829} {"info/global_step": 4830, "train_info/time_within_train_step": 2.646486759185791, "step": 4830} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 4830} {"info/global_step": 4831, "train_info/time_within_train_step": 2.6533100605010986, "step": 4831} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 4831} {"info/global_step": 4832, "train_info/time_within_train_step": 2.6729114055633545, "step": 4832} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 4832} {"info/global_step": 4833, "train_info/time_within_train_step": 2.678900718688965, "step": 4833} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 4833} {"info/global_step": 4834, "train_info/time_within_train_step": 2.6871933937072754, "step": 4834} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 4834} {"info/global_step": 4835, "train_info/time_within_train_step": 2.6613595485687256, "step": 4835} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 4835} {"info/global_step": 4836, "train_info/time_within_train_step": 2.6665427684783936, "step": 4836} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 4836} {"info/global_step": 4837, "train_info/time_within_train_step": 2.6465706825256348, "step": 4837} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 4837} {"info/global_step": 4838, "train_info/time_within_train_step": 2.6461164951324463, "step": 4838} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 4838} {"info/global_step": 4839, "train_info/time_within_train_step": 2.660233974456787, "step": 4839} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 4839} {"info/global_step": 4840, "train_info/time_within_train_step": 2.64979887008667, "step": 4840} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 4840} {"info/global_step": 4841, "train_info/time_within_train_step": 2.917888641357422, "step": 4841} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 4841} {"info/global_step": 4842, "train_info/time_within_train_step": 2.651000499725342, "step": 4842} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 4842} {"info/global_step": 4843, "train_info/time_within_train_step": 2.6456005573272705, "step": 4843} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 4843} {"info/global_step": 4844, "train_info/time_within_train_step": 2.6496055126190186, "step": 4844} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 4844} {"info/global_step": 4845, "train_info/time_within_train_step": 2.6493163108825684, "step": 4845} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 4845} {"info/global_step": 4846, "train_info/time_within_train_step": 2.6645610332489014, "step": 4846} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 4846} {"info/global_step": 4847, "train_info/time_within_train_step": 2.662858009338379, "step": 4847} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 4847} {"info/global_step": 4848, "train_info/time_within_train_step": 2.657956600189209, "step": 4848} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 4848} {"info/global_step": 4849, "train_info/time_within_train_step": 2.6433215141296387, "step": 4849} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 4849} {"info/global_step": 4850, "train_info/time_within_train_step": 2.6484663486480713, "step": 4850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911050, "_runtime": 13648}, "step": 4850} {"logs": {"train/loss": 3.6411, "train/learning_rate": 0.0003433333333333333, "train/epoch": 5.05, "_timestamp": 1746911050, "_runtime": 13648}, "step": 4850} {"train_info/time_between_train_steps": 0.024637699127197266, "step": 4850} {"info/global_step": 4851, "train_info/time_within_train_step": 2.646246910095215, "step": 4851} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 4851} {"info/global_step": 4852, "train_info/time_within_train_step": 2.6600615978240967, "step": 4852} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 4852} {"info/global_step": 4853, "train_info/time_within_train_step": 2.6591930389404297, "step": 4853} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 4853} {"info/global_step": 4854, "train_info/time_within_train_step": 2.662085771560669, "step": 4854} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 4854} {"info/global_step": 4855, "train_info/time_within_train_step": 2.7158308029174805, "step": 4855} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 4855} {"info/global_step": 4856, "train_info/time_within_train_step": 2.681680202484131, "step": 4856} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 4856} {"info/global_step": 4857, "train_info/time_within_train_step": 2.6420936584472656, "step": 4857} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 4857} {"info/global_step": 4858, "train_info/time_within_train_step": 2.656500816345215, "step": 4858} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 4858} {"info/global_step": 4859, "train_info/time_within_train_step": 2.6508629322052, "step": 4859} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 4859} {"info/global_step": 4860, "train_info/time_within_train_step": 2.6498610973358154, "step": 4860} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 4860} {"info/global_step": 4861, "train_info/time_within_train_step": 2.6491687297821045, "step": 4861} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 4861} {"info/global_step": 4862, "train_info/time_within_train_step": 2.6457316875457764, "step": 4862} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 4862} {"info/global_step": 4863, "train_info/time_within_train_step": 2.6783342361450195, "step": 4863} {"train_info/time_between_train_steps": 0.0032892227172851562, "step": 4863} {"info/global_step": 4864, "train_info/time_within_train_step": 2.6940979957580566, "step": 4864} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 4864} {"info/global_step": 4865, "train_info/time_within_train_step": 2.6672892570495605, "step": 4865} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 4865} {"info/global_step": 4866, "train_info/time_within_train_step": 2.6797568798065186, "step": 4866} {"train_info/time_between_train_steps": 0.0028839111328125, "step": 4866} {"info/global_step": 4867, "train_info/time_within_train_step": 2.641150951385498, "step": 4867} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 4867} {"info/global_step": 4868, "train_info/time_within_train_step": 2.650542736053467, "step": 4868} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 4868} {"info/global_step": 4869, "train_info/time_within_train_step": 2.642916202545166, "step": 4869} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 4869} {"info/global_step": 4870, "train_info/time_within_train_step": 2.6454617977142334, "step": 4870} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 4870} {"info/global_step": 4871, "train_info/time_within_train_step": 2.6701176166534424, "step": 4871} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 4871} {"info/global_step": 4872, "train_info/time_within_train_step": 2.667978286743164, "step": 4872} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 4872} {"info/global_step": 4873, "train_info/time_within_train_step": 2.6598622798919678, "step": 4873} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 4873} {"info/global_step": 4874, "train_info/time_within_train_step": 2.6823601722717285, "step": 4874} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 4874} {"info/global_step": 4875, "train_info/time_within_train_step": 2.641240119934082, "step": 4875} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 4875} {"info/global_step": 4876, "train_info/time_within_train_step": 2.6505091190338135, "step": 4876} {"train_info/time_between_train_steps": 0.0028612613677978516, "step": 4876} {"info/global_step": 4877, "train_info/time_within_train_step": 2.6614577770233154, "step": 4877} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 4877} {"info/global_step": 4878, "train_info/time_within_train_step": 2.6423590183258057, "step": 4878} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 4878} {"info/global_step": 4879, "train_info/time_within_train_step": 2.6424808502197266, "step": 4879} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 4879} {"info/global_step": 4880, "train_info/time_within_train_step": 2.6602232456207275, "step": 4880} {"train_info/time_between_train_steps": 0.0030989646911621094, "step": 4880} {"info/global_step": 4881, "train_info/time_within_train_step": 2.660689353942871, "step": 4881} {"train_info/time_between_train_steps": 0.0029222965240478516, "step": 4881} {"info/global_step": 4882, "train_info/time_within_train_step": 2.671414375305176, "step": 4882} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 4882} {"info/global_step": 4883, "train_info/time_within_train_step": 2.6751198768615723, "step": 4883} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 4883} {"info/global_step": 4884, "train_info/time_within_train_step": 2.6664834022521973, "step": 4884} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 4884} {"info/global_step": 4885, "train_info/time_within_train_step": 2.8675763607025146, "step": 4885} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 4885} {"info/global_step": 4886, "train_info/time_within_train_step": 2.6655287742614746, "step": 4886} {"train_info/time_between_train_steps": 0.0029747486114501953, "step": 4886} {"info/global_step": 4887, "train_info/time_within_train_step": 2.694075107574463, "step": 4887} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 4887} {"info/global_step": 4888, "train_info/time_within_train_step": 2.6406071186065674, "step": 4888} {"train_info/time_between_train_steps": 0.0029668807983398438, "step": 4888} {"info/global_step": 4889, "train_info/time_within_train_step": 2.6413230895996094, "step": 4889} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 4889} {"info/global_step": 4890, "train_info/time_within_train_step": 2.656083583831787, "step": 4890} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 4890} {"info/global_step": 4891, "train_info/time_within_train_step": 2.6531386375427246, "step": 4891} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 4891} {"info/global_step": 4892, "train_info/time_within_train_step": 2.6432878971099854, "step": 4892} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 4892} {"info/global_step": 4893, "train_info/time_within_train_step": 2.654465913772583, "step": 4893} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 4893} {"info/global_step": 4894, "train_info/time_within_train_step": 2.65486741065979, "step": 4894} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 4894} {"info/global_step": 4895, "train_info/time_within_train_step": 2.67299485206604, "step": 4895} {"train_info/time_between_train_steps": 0.002897500991821289, "step": 4895} {"info/global_step": 4896, "train_info/time_within_train_step": 2.739677906036377, "step": 4896} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 4896} {"info/global_step": 4897, "train_info/time_within_train_step": 2.674222469329834, "step": 4897} {"train_info/time_between_train_steps": 0.0029458999633789062, "step": 4897} {"info/global_step": 4898, "train_info/time_within_train_step": 2.6397039890289307, "step": 4898} {"train_info/time_between_train_steps": 0.0028734207153320312, "step": 4898} {"info/global_step": 4899, "train_info/time_within_train_step": 2.649258852005005, "step": 4899} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 4899} {"info/global_step": 4900, "train_info/time_within_train_step": 2.651557207107544, "step": 4900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911184, "_runtime": 13782}, "step": 4900} {"logs": {"train/loss": 3.6362, "train/learning_rate": 0.00033999999999999997, "train/epoch": 5.06, "_timestamp": 1746911184, "_runtime": 13782}, "step": 4900} {"train_info/time_between_train_steps": 0.02432703971862793, "step": 4900} {"info/global_step": 4901, "train_info/time_within_train_step": 2.655393362045288, "step": 4901} {"train_info/time_between_train_steps": 0.002882719039916992, "step": 4901} {"info/global_step": 4902, "train_info/time_within_train_step": 2.6431281566619873, "step": 4902} {"train_info/time_between_train_steps": 0.002863645553588867, "step": 4902} {"info/global_step": 4903, "train_info/time_within_train_step": 2.649580717086792, "step": 4903} {"train_info/time_between_train_steps": 0.002936124801635742, "step": 4903} {"info/global_step": 4904, "train_info/time_within_train_step": 2.654735565185547, "step": 4904} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 4904} {"info/global_step": 4905, "train_info/time_within_train_step": 2.6656334400177, "step": 4905} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 4905} {"info/global_step": 4906, "train_info/time_within_train_step": 2.6939640045166016, "step": 4906} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 4906} {"info/global_step": 4907, "train_info/time_within_train_step": 2.656738519668579, "step": 4907} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 4907} {"info/global_step": 4908, "train_info/time_within_train_step": 2.6436312198638916, "step": 4908} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 4908} {"info/global_step": 4909, "train_info/time_within_train_step": 2.6480369567871094, "step": 4909} {"train_info/time_between_train_steps": 0.002889871597290039, "step": 4909} {"info/global_step": 4910, "train_info/time_within_train_step": 2.6710407733917236, "step": 4910} {"train_info/time_between_train_steps": 0.002956867218017578, "step": 4910} {"info/global_step": 4911, "train_info/time_within_train_step": 2.6725053787231445, "step": 4911} {"train_info/time_between_train_steps": 0.00296783447265625, "step": 4911} {"info/global_step": 4912, "train_info/time_within_train_step": 2.655177593231201, "step": 4912} {"train_info/time_between_train_steps": 0.0029458999633789062, "step": 4912} {"info/global_step": 4913, "train_info/time_within_train_step": 2.686293363571167, "step": 4913} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 4913} {"info/global_step": 4914, "train_info/time_within_train_step": 2.6434834003448486, "step": 4914} {"train_info/time_between_train_steps": 0.0030536651611328125, "step": 4914} {"info/global_step": 4915, "train_info/time_within_train_step": 2.6517174243927, "step": 4915} {"train_info/time_between_train_steps": 0.002927064895629883, "step": 4915} {"info/global_step": 4916, "train_info/time_within_train_step": 2.658190965652466, "step": 4916} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 4916} {"info/global_step": 4917, "train_info/time_within_train_step": 2.6482057571411133, "step": 4917} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 4917} {"info/global_step": 4918, "train_info/time_within_train_step": 2.6430141925811768, "step": 4918} {"train_info/time_between_train_steps": 0.0028960704803466797, "step": 4918} {"info/global_step": 4919, "train_info/time_within_train_step": 2.6649086475372314, "step": 4919} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 4919} {"info/global_step": 4920, "train_info/time_within_train_step": 2.661087989807129, "step": 4920} {"train_info/time_between_train_steps": 0.002955913543701172, "step": 4920} {"info/global_step": 4921, "train_info/time_within_train_step": 2.6566994190216064, "step": 4921} {"train_info/time_between_train_steps": 0.0029714107513427734, "step": 4921} {"info/global_step": 4922, "train_info/time_within_train_step": 2.703416109085083, "step": 4922} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 4922} {"info/global_step": 4923, "train_info/time_within_train_step": 2.652381658554077, "step": 4923} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 4923} {"info/global_step": 4924, "train_info/time_within_train_step": 2.6474575996398926, "step": 4924} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 4924} {"info/global_step": 4925, "train_info/time_within_train_step": 2.6557281017303467, "step": 4925} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 4925} {"info/global_step": 4926, "train_info/time_within_train_step": 2.6422109603881836, "step": 4926} {"train_info/time_between_train_steps": 0.0028944015502929688, "step": 4926} {"info/global_step": 4927, "train_info/time_within_train_step": 2.645265817642212, "step": 4927} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 4927} {"info/global_step": 4928, "train_info/time_within_train_step": 2.6488356590270996, "step": 4928} {"train_info/time_between_train_steps": 0.002889871597290039, "step": 4928} {"info/global_step": 4929, "train_info/time_within_train_step": 2.65206241607666, "step": 4929} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 4929} {"info/global_step": 4930, "train_info/time_within_train_step": 2.6603758335113525, "step": 4930} {"train_info/time_between_train_steps": 0.00296783447265625, "step": 4930} {"info/global_step": 4931, "train_info/time_within_train_step": 2.6785666942596436, "step": 4931} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 4931} {"info/global_step": 4932, "train_info/time_within_train_step": 2.697237253189087, "step": 4932} {"train_info/time_between_train_steps": 0.002939939498901367, "step": 4932} {"info/global_step": 4933, "train_info/time_within_train_step": 2.641982078552246, "step": 4933} {"train_info/time_between_train_steps": 0.002938985824584961, "step": 4933} {"info/global_step": 4934, "train_info/time_within_train_step": 2.640981912612915, "step": 4934} {"train_info/time_between_train_steps": 0.002953767776489258, "step": 4934} {"info/global_step": 4935, "train_info/time_within_train_step": 2.6570677757263184, "step": 4935} {"train_info/time_between_train_steps": 0.0029387474060058594, "step": 4935} {"info/global_step": 4936, "train_info/time_within_train_step": 2.6520299911499023, "step": 4936} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 4936} {"info/global_step": 4937, "train_info/time_within_train_step": 2.6438674926757812, "step": 4937} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 4937} {"info/global_step": 4938, "train_info/time_within_train_step": 2.652970314025879, "step": 4938} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 4938} {"info/global_step": 4939, "train_info/time_within_train_step": 2.646641254425049, "step": 4939} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 4939} {"info/global_step": 4940, "train_info/time_within_train_step": 2.6692466735839844, "step": 4940} {"train_info/time_between_train_steps": 0.0029449462890625, "step": 4940} {"info/global_step": 4941, "train_info/time_within_train_step": 2.6880152225494385, "step": 4941} {"train_info/time_between_train_steps": 0.002874135971069336, "step": 4941} {"info/global_step": 4942, "train_info/time_within_train_step": 2.6677870750427246, "step": 4942} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 4942} {"info/global_step": 4943, "train_info/time_within_train_step": 2.656097888946533, "step": 4943} {"train_info/time_between_train_steps": 0.002948760986328125, "step": 4943} {"info/global_step": 4944, "train_info/time_within_train_step": 2.640542984008789, "step": 4944} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 4944} {"info/global_step": 4945, "train_info/time_within_train_step": 2.653688907623291, "step": 4945} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 4945} {"info/global_step": 4946, "train_info/time_within_train_step": 2.6550958156585693, "step": 4946} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 4946} {"info/global_step": 4947, "train_info/time_within_train_step": 2.643139123916626, "step": 4947} {"train_info/time_between_train_steps": 0.0029060840606689453, "step": 4947} {"info/global_step": 4948, "train_info/time_within_train_step": 2.643015146255493, "step": 4948} {"train_info/time_between_train_steps": 0.0029103755950927734, "step": 4948} {"info/global_step": 4949, "train_info/time_within_train_step": 2.6582818031311035, "step": 4949} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 4949} {"info/global_step": 4950, "train_info/time_within_train_step": 2.6696300506591797, "step": 4950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911318, "_runtime": 13916}, "step": 4950} {"logs": {"train/loss": 3.6204, "train/learning_rate": 0.00033666666666666665, "train/epoch": 5.06, "_timestamp": 1746911318, "_runtime": 13916}, "step": 4950} {"train_info/time_between_train_steps": 0.02462601661682129, "step": 4950} {"info/global_step": 4951, "train_info/time_within_train_step": 2.666166067123413, "step": 4951} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 4951} {"info/global_step": 4952, "train_info/time_within_train_step": 2.6628832817077637, "step": 4952} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 4952} {"info/global_step": 4953, "train_info/time_within_train_step": 2.6833035945892334, "step": 4953} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 4953} {"info/global_step": 4954, "train_info/time_within_train_step": 2.643037796020508, "step": 4954} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 4954} {"info/global_step": 4955, "train_info/time_within_train_step": 2.6451408863067627, "step": 4955} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 4955} {"info/global_step": 4956, "train_info/time_within_train_step": 2.6517624855041504, "step": 4956} {"train_info/time_between_train_steps": 0.0029387474060058594, "step": 4956} {"info/global_step": 4957, "train_info/time_within_train_step": 2.65946102142334, "step": 4957} {"train_info/time_between_train_steps": 0.0029184818267822266, "step": 4957} {"info/global_step": 4958, "train_info/time_within_train_step": 2.6691782474517822, "step": 4958} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 4958} {"info/global_step": 4959, "train_info/time_within_train_step": 2.662848949432373, "step": 4959} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 4959} {"info/global_step": 4960, "train_info/time_within_train_step": 2.701326370239258, "step": 4960} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 4960} {"info/global_step": 4961, "train_info/time_within_train_step": 2.697038173675537, "step": 4961} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 4961} {"info/global_step": 4962, "train_info/time_within_train_step": 2.639970541000366, "step": 4962} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 4962} {"info/global_step": 4963, "train_info/time_within_train_step": 2.641080141067505, "step": 4963} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 4963} {"info/global_step": 4964, "train_info/time_within_train_step": 2.658505439758301, "step": 4964} {"train_info/time_between_train_steps": 0.0029554367065429688, "step": 4964} {"info/global_step": 4965, "train_info/time_within_train_step": 2.652775526046753, "step": 4965} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 4965} {"info/global_step": 4966, "train_info/time_within_train_step": 2.6438426971435547, "step": 4966} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 4966} {"info/global_step": 4967, "train_info/time_within_train_step": 2.6502418518066406, "step": 4967} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 4967} {"info/global_step": 4968, "train_info/time_within_train_step": 2.6531262397766113, "step": 4968} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 4968} {"info/global_step": 4969, "train_info/time_within_train_step": 2.668882369995117, "step": 4969} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 4969} {"info/global_step": 4970, "train_info/time_within_train_step": 2.7098138332366943, "step": 4970} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 4970} {"info/global_step": 4971, "train_info/time_within_train_step": 2.6431620121002197, "step": 4971} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 4971} {"info/global_step": 4972, "train_info/time_within_train_step": 2.6559503078460693, "step": 4972} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 4972} {"info/global_step": 4973, "train_info/time_within_train_step": 2.6481287479400635, "step": 4973} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 4973} {"info/global_step": 4974, "train_info/time_within_train_step": 2.6479504108428955, "step": 4974} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 4974} {"info/global_step": 4975, "train_info/time_within_train_step": 2.6567234992980957, "step": 4975} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 4975} {"info/global_step": 4976, "train_info/time_within_train_step": 2.643385648727417, "step": 4976} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 4976} {"info/global_step": 4977, "train_info/time_within_train_step": 2.644813060760498, "step": 4977} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 4977} {"info/global_step": 4978, "train_info/time_within_train_step": 2.6722216606140137, "step": 4978} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 4978} {"info/global_step": 4979, "train_info/time_within_train_step": 2.667048454284668, "step": 4979} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 4979} {"info/global_step": 4980, "train_info/time_within_train_step": 2.666393995285034, "step": 4980} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 4980} {"info/global_step": 4981, "train_info/time_within_train_step": 2.6754462718963623, "step": 4981} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 4981} {"info/global_step": 4982, "train_info/time_within_train_step": 2.6439948081970215, "step": 4982} {"train_info/time_between_train_steps": 0.0028629302978515625, "step": 4982} {"info/global_step": 4983, "train_info/time_within_train_step": 2.6550395488739014, "step": 4983} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 4983} {"info/global_step": 4984, "train_info/time_within_train_step": 2.6508281230926514, "step": 4984} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 4984} {"info/global_step": 4985, "train_info/time_within_train_step": 2.6453518867492676, "step": 4985} {"train_info/time_between_train_steps": 0.0028841495513916016, "step": 4985} {"info/global_step": 4986, "train_info/time_within_train_step": 2.645707130432129, "step": 4986} {"train_info/time_between_train_steps": 0.0028727054595947266, "step": 4986} {"info/global_step": 4987, "train_info/time_within_train_step": 2.6513049602508545, "step": 4987} {"train_info/time_between_train_steps": 0.0029687881469726562, "step": 4987} {"info/global_step": 4988, "train_info/time_within_train_step": 2.660365104675293, "step": 4988} {"train_info/time_between_train_steps": 0.002962827682495117, "step": 4988} {"info/global_step": 4989, "train_info/time_within_train_step": 2.66874361038208, "step": 4989} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 4989} {"info/global_step": 4990, "train_info/time_within_train_step": 2.66178560256958, "step": 4990} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 4990} {"info/global_step": 4991, "train_info/time_within_train_step": 2.703467607498169, "step": 4991} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 4991} {"info/global_step": 4992, "train_info/time_within_train_step": 2.6411328315734863, "step": 4992} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 4992} {"info/global_step": 4993, "train_info/time_within_train_step": 2.640399694442749, "step": 4993} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 4993} {"info/global_step": 4994, "train_info/time_within_train_step": 2.6653521060943604, "step": 4994} {"train_info/time_between_train_steps": 0.002993345260620117, "step": 4994} {"info/global_step": 4995, "train_info/time_within_train_step": 2.6507863998413086, "step": 4995} {"train_info/time_between_train_steps": 0.002880573272705078, "step": 4995} {"info/global_step": 4996, "train_info/time_within_train_step": 2.6444144248962402, "step": 4996} {"train_info/time_between_train_steps": 0.0029108524322509766, "step": 4996} {"info/global_step": 4997, "train_info/time_within_train_step": 2.66162109375, "step": 4997} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 4997} {"info/global_step": 4998, "train_info/time_within_train_step": 2.664423704147339, "step": 4998} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 4998} {"info/global_step": 4999, "train_info/time_within_train_step": 3.2722508907318115, "step": 4999} {"train_info/time_between_train_steps": 0.005226612091064453, "step": 4999} {"info/global_step": 5000, "train_info/time_within_train_step": 2.6403868198394775, "step": 5000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911453, "_runtime": 14051}, "step": 5000} {"logs": {"train/loss": 3.6177, "train/learning_rate": 0.0003333333333333333, "train/epoch": 5.07, "_timestamp": 1746911453, "_runtime": 14051}, "step": 5000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911458, "_runtime": 14056}, "step": 5000} {"logs": {"eval/loss": 4.606800079345703, "eval/runtime": 5.1765, "eval/samples_per_second": 37.091, "eval/steps_per_second": 1.159, "train/epoch": 5.07, "_timestamp": 1746911458, "_runtime": 14056}, "step": 5000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911458, "_runtime": 14056}, "step": 5000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.606800079345703, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 100.1631222355734, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1765, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.091, "train/epoch": 5.07, "_timestamp": 1746911458, "_runtime": 14056}, "step": 5000} {"train_info/time_between_train_steps": 22.28702211380005, "step": 5000} {"info/global_step": 5001, "train_info/time_within_train_step": 2.6118640899658203, "step": 5001} {"train_info/time_between_train_steps": 0.002954244613647461, "step": 5001} {"info/global_step": 5002, "train_info/time_within_train_step": 2.429368495941162, "step": 5002} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 5002} {"info/global_step": 5003, "train_info/time_within_train_step": 2.5480830669403076, "step": 5003} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 5003} {"info/global_step": 5004, "train_info/time_within_train_step": 2.640108108520508, "step": 5004} {"train_info/time_between_train_steps": 0.0030214786529541016, "step": 5004} {"info/global_step": 5005, "train_info/time_within_train_step": 2.643697500228882, "step": 5005} {"train_info/time_between_train_steps": 0.0030066967010498047, "step": 5005} {"info/global_step": 5006, "train_info/time_within_train_step": 2.644317150115967, "step": 5006} {"train_info/time_between_train_steps": 0.0029952526092529297, "step": 5006} {"info/global_step": 5007, "train_info/time_within_train_step": 2.6450865268707275, "step": 5007} {"train_info/time_between_train_steps": 0.0030813217163085938, "step": 5007} {"info/global_step": 5008, "train_info/time_within_train_step": 2.643515110015869, "step": 5008} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 5008} {"info/global_step": 5009, "train_info/time_within_train_step": 2.6917192935943604, "step": 5009} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 5009} {"info/global_step": 5010, "train_info/time_within_train_step": 2.64365291595459, "step": 5010} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 5010} {"info/global_step": 5011, "train_info/time_within_train_step": 2.657412528991699, "step": 5011} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 5011} {"info/global_step": 5012, "train_info/time_within_train_step": 2.648674488067627, "step": 5012} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 5012} {"info/global_step": 5013, "train_info/time_within_train_step": 2.6456522941589355, "step": 5013} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 5013} {"info/global_step": 5014, "train_info/time_within_train_step": 2.662200689315796, "step": 5014} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 5014} {"info/global_step": 5015, "train_info/time_within_train_step": 2.654547929763794, "step": 5015} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 5015} {"info/global_step": 5016, "train_info/time_within_train_step": 2.643618106842041, "step": 5016} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 5016} {"info/global_step": 5017, "train_info/time_within_train_step": 2.6622729301452637, "step": 5017} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 5017} {"info/global_step": 5018, "train_info/time_within_train_step": 2.6524899005889893, "step": 5018} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 5018} {"info/global_step": 5019, "train_info/time_within_train_step": 2.660601854324341, "step": 5019} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 5019} {"info/global_step": 5020, "train_info/time_within_train_step": 2.7195849418640137, "step": 5020} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 5020} {"info/global_step": 5021, "train_info/time_within_train_step": 2.6825103759765625, "step": 5021} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 5021} {"info/global_step": 5022, "train_info/time_within_train_step": 2.6406829357147217, "step": 5022} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 5022} {"info/global_step": 5023, "train_info/time_within_train_step": 2.6521167755126953, "step": 5023} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 5023} {"info/global_step": 5024, "train_info/time_within_train_step": 2.648495674133301, "step": 5024} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 5024} {"info/global_step": 5025, "train_info/time_within_train_step": 2.6498825550079346, "step": 5025} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 5025} {"info/global_step": 5026, "train_info/time_within_train_step": 2.6473822593688965, "step": 5026} {"train_info/time_between_train_steps": 0.0029184818267822266, "step": 5026} {"info/global_step": 5027, "train_info/time_within_train_step": 2.645953893661499, "step": 5027} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 5027} {"info/global_step": 5028, "train_info/time_within_train_step": 2.6667120456695557, "step": 5028} {"train_info/time_between_train_steps": 0.0029718875885009766, "step": 5028} {"info/global_step": 5029, "train_info/time_within_train_step": 2.670196533203125, "step": 5029} {"train_info/time_between_train_steps": 0.0028734207153320312, "step": 5029} {"info/global_step": 5030, "train_info/time_within_train_step": 2.6747732162475586, "step": 5030} {"train_info/time_between_train_steps": 0.0029642581939697266, "step": 5030} {"info/global_step": 5031, "train_info/time_within_train_step": 2.6514811515808105, "step": 5031} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 5031} {"info/global_step": 5032, "train_info/time_within_train_step": 2.648714303970337, "step": 5032} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 5032} {"info/global_step": 5033, "train_info/time_within_train_step": 2.643209457397461, "step": 5033} {"train_info/time_between_train_steps": 0.002902984619140625, "step": 5033} {"info/global_step": 5034, "train_info/time_within_train_step": 2.6829934120178223, "step": 5034} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 5034} {"info/global_step": 5035, "train_info/time_within_train_step": 2.6665048599243164, "step": 5035} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 5035} {"info/global_step": 5036, "train_info/time_within_train_step": 2.6658620834350586, "step": 5036} {"train_info/time_between_train_steps": 0.002934694290161133, "step": 5036} {"info/global_step": 5037, "train_info/time_within_train_step": 2.6888082027435303, "step": 5037} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 5037} {"info/global_step": 5038, "train_info/time_within_train_step": 2.6568188667297363, "step": 5038} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 5038} {"info/global_step": 5039, "train_info/time_within_train_step": 2.6588451862335205, "step": 5039} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 5039} {"info/global_step": 5040, "train_info/time_within_train_step": 2.6480135917663574, "step": 5040} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 5040} {"info/global_step": 5041, "train_info/time_within_train_step": 2.646556854248047, "step": 5041} {"train_info/time_between_train_steps": 0.0029616355895996094, "step": 5041} {"info/global_step": 5042, "train_info/time_within_train_step": 2.6534032821655273, "step": 5042} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 5042} {"info/global_step": 5043, "train_info/time_within_train_step": 2.649799108505249, "step": 5043} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 5043} {"info/global_step": 5044, "train_info/time_within_train_step": 2.7765841484069824, "step": 5044} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 5044} {"info/global_step": 5045, "train_info/time_within_train_step": 2.6479387283325195, "step": 5045} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 5045} {"info/global_step": 5046, "train_info/time_within_train_step": 2.646775245666504, "step": 5046} {"train_info/time_between_train_steps": 0.0029077529907226562, "step": 5046} {"info/global_step": 5047, "train_info/time_within_train_step": 2.6666009426116943, "step": 5047} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 5047} {"info/global_step": 5048, "train_info/time_within_train_step": 2.6644248962402344, "step": 5048} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 5048} {"info/global_step": 5049, "train_info/time_within_train_step": 2.6544852256774902, "step": 5049} {"train_info/time_between_train_steps": 0.0029528141021728516, "step": 5049} {"info/global_step": 5050, "train_info/time_within_train_step": 2.7065320014953613, "step": 5050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911610, "_runtime": 14208}, "step": 5050} {"logs": {"train/loss": 3.6075, "train/learning_rate": 0.00033, "train/epoch": 5.07, "_timestamp": 1746911610, "_runtime": 14208}, "step": 5050} {"train_info/time_between_train_steps": 0.024430513381958008, "step": 5050} {"info/global_step": 5051, "train_info/time_within_train_step": 2.706742763519287, "step": 5051} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 5051} {"info/global_step": 5052, "train_info/time_within_train_step": 2.6416711807250977, "step": 5052} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 5052} {"info/global_step": 5053, "train_info/time_within_train_step": 2.6498677730560303, "step": 5053} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 5053} {"info/global_step": 5054, "train_info/time_within_train_step": 2.6640846729278564, "step": 5054} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 5054} {"info/global_step": 5055, "train_info/time_within_train_step": 2.6436378955841064, "step": 5055} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 5055} {"info/global_step": 5056, "train_info/time_within_train_step": 2.6454076766967773, "step": 5056} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 5056} {"info/global_step": 5057, "train_info/time_within_train_step": 2.658277750015259, "step": 5057} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 5057} {"info/global_step": 5058, "train_info/time_within_train_step": 2.6605026721954346, "step": 5058} {"train_info/time_between_train_steps": 0.0029168128967285156, "step": 5058} {"info/global_step": 5059, "train_info/time_within_train_step": 2.659374952316284, "step": 5059} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 5059} {"info/global_step": 5060, "train_info/time_within_train_step": 2.7286055088043213, "step": 5060} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 5060} {"info/global_step": 5061, "train_info/time_within_train_step": 2.6690728664398193, "step": 5061} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 5061} {"info/global_step": 5062, "train_info/time_within_train_step": 2.6402273178100586, "step": 5062} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 5062} {"info/global_step": 5063, "train_info/time_within_train_step": 2.641519784927368, "step": 5063} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 5063} {"info/global_step": 5064, "train_info/time_within_train_step": 2.655035972595215, "step": 5064} {"train_info/time_between_train_steps": 0.002938985824584961, "step": 5064} {"info/global_step": 5065, "train_info/time_within_train_step": 2.6548073291778564, "step": 5065} {"train_info/time_between_train_steps": 0.002977132797241211, "step": 5065} {"info/global_step": 5066, "train_info/time_within_train_step": 2.6431992053985596, "step": 5066} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 5066} {"info/global_step": 5067, "train_info/time_within_train_step": 2.649566650390625, "step": 5067} {"train_info/time_between_train_steps": 0.002977132797241211, "step": 5067} {"info/global_step": 5068, "train_info/time_within_train_step": 2.6544501781463623, "step": 5068} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 5068} {"info/global_step": 5069, "train_info/time_within_train_step": 2.664201259613037, "step": 5069} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 5069} {"info/global_step": 5070, "train_info/time_within_train_step": 2.693826198577881, "step": 5070} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 5070} {"info/global_step": 5071, "train_info/time_within_train_step": 2.6493003368377686, "step": 5071} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 5071} {"info/global_step": 5072, "train_info/time_within_train_step": 2.640315055847168, "step": 5072} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 5072} {"info/global_step": 5073, "train_info/time_within_train_step": 2.658862829208374, "step": 5073} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 5073} {"info/global_step": 5074, "train_info/time_within_train_step": 2.6538240909576416, "step": 5074} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 5074} {"info/global_step": 5075, "train_info/time_within_train_step": 2.6430580615997314, "step": 5075} {"train_info/time_between_train_steps": 0.002945423126220703, "step": 5075} {"info/global_step": 5076, "train_info/time_within_train_step": 2.6422159671783447, "step": 5076} {"train_info/time_between_train_steps": 0.0029163360595703125, "step": 5076} {"info/global_step": 5077, "train_info/time_within_train_step": 2.6586265563964844, "step": 5077} {"train_info/time_between_train_steps": 0.0029554367065429688, "step": 5077} {"info/global_step": 5078, "train_info/time_within_train_step": 2.6666600704193115, "step": 5078} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 5078} {"info/global_step": 5079, "train_info/time_within_train_step": 2.686584949493408, "step": 5079} {"train_info/time_between_train_steps": 0.0028886795043945312, "step": 5079} {"info/global_step": 5080, "train_info/time_within_train_step": 2.6509222984313965, "step": 5080} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 5080} {"info/global_step": 5081, "train_info/time_within_train_step": 2.6704752445220947, "step": 5081} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 5081} {"info/global_step": 5082, "train_info/time_within_train_step": 2.645188570022583, "step": 5082} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 5082} {"info/global_step": 5083, "train_info/time_within_train_step": 2.6443374156951904, "step": 5083} {"train_info/time_between_train_steps": 0.0028645992279052734, "step": 5083} {"info/global_step": 5084, "train_info/time_within_train_step": 2.6510984897613525, "step": 5084} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 5084} {"info/global_step": 5085, "train_info/time_within_train_step": 2.6473894119262695, "step": 5085} {"train_info/time_between_train_steps": 0.0028755664825439453, "step": 5085} {"info/global_step": 5086, "train_info/time_within_train_step": 2.646369218826294, "step": 5086} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 5086} {"info/global_step": 5087, "train_info/time_within_train_step": 2.6598644256591797, "step": 5087} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 5087} {"info/global_step": 5088, "train_info/time_within_train_step": 2.668160915374756, "step": 5088} {"train_info/time_between_train_steps": 0.003026723861694336, "step": 5088} {"info/global_step": 5089, "train_info/time_within_train_step": 2.6727473735809326, "step": 5089} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 5089} {"info/global_step": 5090, "train_info/time_within_train_step": 2.7028260231018066, "step": 5090} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 5090} {"info/global_step": 5091, "train_info/time_within_train_step": 2.652477502822876, "step": 5091} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 5091} {"info/global_step": 5092, "train_info/time_within_train_step": 2.6475186347961426, "step": 5092} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 5092} {"info/global_step": 5093, "train_info/time_within_train_step": 2.6490705013275146, "step": 5093} {"train_info/time_between_train_steps": 0.003045797348022461, "step": 5093} {"info/global_step": 5094, "train_info/time_within_train_step": 2.6484644412994385, "step": 5094} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 5094} {"info/global_step": 5095, "train_info/time_within_train_step": 2.6527562141418457, "step": 5095} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 5095} {"info/global_step": 5096, "train_info/time_within_train_step": 2.645336151123047, "step": 5096} {"train_info/time_between_train_steps": 0.002895355224609375, "step": 5096} {"info/global_step": 5097, "train_info/time_within_train_step": 2.652334451675415, "step": 5097} {"train_info/time_between_train_steps": 0.002908468246459961, "step": 5097} {"info/global_step": 5098, "train_info/time_within_train_step": 2.6591498851776123, "step": 5098} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 5098} {"info/global_step": 5099, "train_info/time_within_train_step": 2.6774959564208984, "step": 5099} {"train_info/time_between_train_steps": 0.003322124481201172, "step": 5099} {"info/global_step": 5100, "train_info/time_within_train_step": 2.726870059967041, "step": 5100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911744, "_runtime": 14342}, "step": 5100} {"logs": {"train/loss": 3.5966, "train/learning_rate": 0.0003266666666666666, "train/epoch": 5.08, "_timestamp": 1746911744, "_runtime": 14342}, "step": 5100} {"train_info/time_between_train_steps": 0.024053096771240234, "step": 5100} {"info/global_step": 5101, "train_info/time_within_train_step": 2.7265493869781494, "step": 5101} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 5101} {"info/global_step": 5102, "train_info/time_within_train_step": 2.6636831760406494, "step": 5102} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 5102} {"info/global_step": 5103, "train_info/time_within_train_step": 2.6400716304779053, "step": 5103} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 5103} {"info/global_step": 5104, "train_info/time_within_train_step": 2.6530964374542236, "step": 5104} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 5104} {"info/global_step": 5105, "train_info/time_within_train_step": 2.6475696563720703, "step": 5105} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 5105} {"info/global_step": 5106, "train_info/time_within_train_step": 2.648549795150757, "step": 5106} {"train_info/time_between_train_steps": 0.002896547317504883, "step": 5106} {"info/global_step": 5107, "train_info/time_within_train_step": 2.645721912384033, "step": 5107} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 5107} {"info/global_step": 5108, "train_info/time_within_train_step": 2.6445600986480713, "step": 5108} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 5108} {"info/global_step": 5109, "train_info/time_within_train_step": 2.6662838459014893, "step": 5109} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 5109} {"info/global_step": 5110, "train_info/time_within_train_step": 2.668649911880493, "step": 5110} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 5110} {"info/global_step": 5111, "train_info/time_within_train_step": 2.646494150161743, "step": 5111} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 5111} {"info/global_step": 5112, "train_info/time_within_train_step": 2.6569716930389404, "step": 5112} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 5112} {"info/global_step": 5113, "train_info/time_within_train_step": 2.6523241996765137, "step": 5113} {"train_info/time_between_train_steps": 0.0033681392669677734, "step": 5113} {"info/global_step": 5114, "train_info/time_within_train_step": 2.6497278213500977, "step": 5114} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 5114} {"info/global_step": 5115, "train_info/time_within_train_step": 2.6615664958953857, "step": 5115} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 5115} {"info/global_step": 5116, "train_info/time_within_train_step": 2.6435887813568115, "step": 5116} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 5116} {"info/global_step": 5117, "train_info/time_within_train_step": 2.6444242000579834, "step": 5117} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 5117} {"info/global_step": 5118, "train_info/time_within_train_step": 2.668712854385376, "step": 5118} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 5118} {"info/global_step": 5119, "train_info/time_within_train_step": 2.6636481285095215, "step": 5119} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 5119} {"info/global_step": 5120, "train_info/time_within_train_step": 2.6855287551879883, "step": 5120} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 5120} {"info/global_step": 5121, "train_info/time_within_train_step": 2.6585206985473633, "step": 5121} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 5121} {"info/global_step": 5122, "train_info/time_within_train_step": 2.6533493995666504, "step": 5122} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 5122} {"info/global_step": 5123, "train_info/time_within_train_step": 2.6505987644195557, "step": 5123} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 5123} {"info/global_step": 5124, "train_info/time_within_train_step": 2.648447036743164, "step": 5124} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 5124} {"info/global_step": 5125, "train_info/time_within_train_step": 2.6472973823547363, "step": 5125} {"train_info/time_between_train_steps": 0.0031037330627441406, "step": 5125} {"info/global_step": 5126, "train_info/time_within_train_step": 2.648993968963623, "step": 5126} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 5126} {"info/global_step": 5127, "train_info/time_within_train_step": 2.6483941078186035, "step": 5127} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 5127} {"info/global_step": 5128, "train_info/time_within_train_step": 2.663743734359741, "step": 5128} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 5128} {"info/global_step": 5129, "train_info/time_within_train_step": 2.665541172027588, "step": 5129} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 5129} {"info/global_step": 5130, "train_info/time_within_train_step": 2.657104969024658, "step": 5130} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 5130} {"info/global_step": 5131, "train_info/time_within_train_step": 2.7110774517059326, "step": 5131} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 5131} {"info/global_step": 5132, "train_info/time_within_train_step": 2.6428825855255127, "step": 5132} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 5132} {"info/global_step": 5133, "train_info/time_within_train_step": 2.647397041320801, "step": 5133} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 5133} {"info/global_step": 5134, "train_info/time_within_train_step": 2.65567684173584, "step": 5134} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 5134} {"info/global_step": 5135, "train_info/time_within_train_step": 2.6446752548217773, "step": 5135} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 5135} {"info/global_step": 5136, "train_info/time_within_train_step": 2.647578239440918, "step": 5136} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 5136} {"info/global_step": 5137, "train_info/time_within_train_step": 2.648369550704956, "step": 5137} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 5137} {"info/global_step": 5138, "train_info/time_within_train_step": 2.66762638092041, "step": 5138} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 5138} {"info/global_step": 5139, "train_info/time_within_train_step": 2.688920259475708, "step": 5139} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 5139} {"info/global_step": 5140, "train_info/time_within_train_step": 2.7197093963623047, "step": 5140} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 5140} {"info/global_step": 5141, "train_info/time_within_train_step": 2.6422512531280518, "step": 5141} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 5141} {"info/global_step": 5142, "train_info/time_within_train_step": 2.642286539077759, "step": 5142} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 5142} {"info/global_step": 5143, "train_info/time_within_train_step": 2.6643216609954834, "step": 5143} {"train_info/time_between_train_steps": 0.0030698776245117188, "step": 5143} {"info/global_step": 5144, "train_info/time_within_train_step": 2.6504478454589844, "step": 5144} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 5144} {"info/global_step": 5145, "train_info/time_within_train_step": 2.6456525325775146, "step": 5145} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 5145} {"info/global_step": 5146, "train_info/time_within_train_step": 2.651455879211426, "step": 5146} {"train_info/time_between_train_steps": 0.003098726272583008, "step": 5146} {"info/global_step": 5147, "train_info/time_within_train_step": 2.645988702774048, "step": 5147} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 5147} {"info/global_step": 5148, "train_info/time_within_train_step": 2.671095132827759, "step": 5148} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 5148} {"info/global_step": 5149, "train_info/time_within_train_step": 2.6914901733398438, "step": 5149} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 5149} {"info/global_step": 5150, "train_info/time_within_train_step": 2.667729616165161, "step": 5150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746911878, "_runtime": 14476}, "step": 5150} {"logs": {"train/loss": 3.5875, "train/learning_rate": 0.0003233333333333333, "train/epoch": 5.08, "_timestamp": 1746911878, "_runtime": 14476}, "step": 5150} {"train_info/time_between_train_steps": 0.024339914321899414, "step": 5150} {"info/global_step": 5151, "train_info/time_within_train_step": 2.6423187255859375, "step": 5151} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 5151} {"info/global_step": 5152, "train_info/time_within_train_step": 2.6546401977539062, "step": 5152} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 5152} {"info/global_step": 5153, "train_info/time_within_train_step": 2.64725399017334, "step": 5153} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 5153} {"info/global_step": 5154, "train_info/time_within_train_step": 2.7269015312194824, "step": 5154} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 5154} {"info/global_step": 5155, "train_info/time_within_train_step": 2.652587413787842, "step": 5155} {"train_info/time_between_train_steps": 0.0030083656311035156, "step": 5155} {"info/global_step": 5156, "train_info/time_within_train_step": 2.6593005657196045, "step": 5156} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 5156} {"info/global_step": 5157, "train_info/time_within_train_step": 2.64363431930542, "step": 5157} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 5157} {"info/global_step": 5158, "train_info/time_within_train_step": 2.6437857151031494, "step": 5158} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 5158} {"info/global_step": 5159, "train_info/time_within_train_step": 2.6707491874694824, "step": 5159} {"train_info/time_between_train_steps": 0.0030853748321533203, "step": 5159} {"info/global_step": 5160, "train_info/time_within_train_step": 2.66615629196167, "step": 5160} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 5160} {"info/global_step": 5161, "train_info/time_within_train_step": 2.6735992431640625, "step": 5161} {"train_info/time_between_train_steps": 0.003526926040649414, "step": 5161} {"info/global_step": 5162, "train_info/time_within_train_step": 2.672856330871582, "step": 5162} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 5162} {"info/global_step": 5163, "train_info/time_within_train_step": 2.641170024871826, "step": 5163} {"train_info/time_between_train_steps": 0.0030922889709472656, "step": 5163} {"info/global_step": 5164, "train_info/time_within_train_step": 2.642582416534424, "step": 5164} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 5164} {"info/global_step": 5165, "train_info/time_within_train_step": 2.6631603240966797, "step": 5165} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 5165} {"info/global_step": 5166, "train_info/time_within_train_step": 2.649430990219116, "step": 5166} {"train_info/time_between_train_steps": 0.0030603408813476562, "step": 5166} {"info/global_step": 5167, "train_info/time_within_train_step": 2.6451003551483154, "step": 5167} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 5167} {"info/global_step": 5168, "train_info/time_within_train_step": 2.6665329933166504, "step": 5168} {"train_info/time_between_train_steps": 0.003268718719482422, "step": 5168} {"info/global_step": 5169, "train_info/time_within_train_step": 2.67952299118042, "step": 5169} {"train_info/time_between_train_steps": 0.0034182071685791016, "step": 5169} {"info/global_step": 5170, "train_info/time_within_train_step": 2.6752233505249023, "step": 5170} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 5170} {"info/global_step": 5171, "train_info/time_within_train_step": 2.6645138263702393, "step": 5171} {"train_info/time_between_train_steps": 0.0034322738647460938, "step": 5171} {"info/global_step": 5172, "train_info/time_within_train_step": 2.704232931137085, "step": 5172} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 5172} {"info/global_step": 5173, "train_info/time_within_train_step": 2.6426804065704346, "step": 5173} {"train_info/time_between_train_steps": 0.003535032272338867, "step": 5173} {"info/global_step": 5174, "train_info/time_within_train_step": 2.6510512828826904, "step": 5174} {"train_info/time_between_train_steps": 0.0037643909454345703, "step": 5174} {"info/global_step": 5175, "train_info/time_within_train_step": 2.665864944458008, "step": 5175} {"train_info/time_between_train_steps": 0.003518342971801758, "step": 5175} {"info/global_step": 5176, "train_info/time_within_train_step": 2.6436119079589844, "step": 5176} {"train_info/time_between_train_steps": 0.0037488937377929688, "step": 5176} {"info/global_step": 5177, "train_info/time_within_train_step": 2.6481502056121826, "step": 5177} {"train_info/time_between_train_steps": 0.004178762435913086, "step": 5177} {"info/global_step": 5178, "train_info/time_within_train_step": 2.6481833457946777, "step": 5178} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 5178} {"train_info/time_between_train_steps": 2.584491729736328, "step": 5178} {"info/global_step": 5179, "train_info/time_within_train_step": 2.659062147140503, "step": 5179} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 5179} {"info/global_step": 5180, "train_info/time_within_train_step": 2.6454732418060303, "step": 5180} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 5180} {"info/global_step": 5181, "train_info/time_within_train_step": 2.6417086124420166, "step": 5181} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 5181} {"info/global_step": 5182, "train_info/time_within_train_step": 2.659778118133545, "step": 5182} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 5182} {"info/global_step": 5183, "train_info/time_within_train_step": 2.6470730304718018, "step": 5183} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 5183} {"info/global_step": 5184, "train_info/time_within_train_step": 2.646270990371704, "step": 5184} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 5184} {"info/global_step": 5185, "train_info/time_within_train_step": 2.6494150161743164, "step": 5185} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 5185} {"info/global_step": 5186, "train_info/time_within_train_step": 2.6454310417175293, "step": 5186} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 5186} {"info/global_step": 5187, "train_info/time_within_train_step": 2.6703996658325195, "step": 5187} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 5187} {"info/global_step": 5188, "train_info/time_within_train_step": 2.684098243713379, "step": 5188} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 5188} {"info/global_step": 5189, "train_info/time_within_train_step": 2.6868045330047607, "step": 5189} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 5189} {"info/global_step": 5190, "train_info/time_within_train_step": 2.6530520915985107, "step": 5190} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 5190} {"info/global_step": 5191, "train_info/time_within_train_step": 2.6410868167877197, "step": 5191} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 5191} {"info/global_step": 5192, "train_info/time_within_train_step": 2.660005807876587, "step": 5192} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 5192} {"info/global_step": 5193, "train_info/time_within_train_step": 2.652935266494751, "step": 5193} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 5193} {"info/global_step": 5194, "train_info/time_within_train_step": 2.6466662883758545, "step": 5194} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 5194} {"info/global_step": 5195, "train_info/time_within_train_step": 2.645618200302124, "step": 5195} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 5195} {"info/global_step": 5196, "train_info/time_within_train_step": 2.6546108722686768, "step": 5196} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 5196} {"info/global_step": 5197, "train_info/time_within_train_step": 2.6852545738220215, "step": 5197} {"train_info/time_between_train_steps": 0.003467082977294922, "step": 5197} {"info/global_step": 5198, "train_info/time_within_train_step": 2.667785406112671, "step": 5198} {"train_info/time_between_train_steps": 0.0035355091094970703, "step": 5198} {"info/global_step": 5199, "train_info/time_within_train_step": 2.677098274230957, "step": 5199} {"train_info/time_between_train_steps": 0.003420114517211914, "step": 5199} {"info/global_step": 5200, "train_info/time_within_train_step": 2.662271022796631, "step": 5200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746912015, "_runtime": 14613}, "step": 5200} {"logs": {"train/loss": 3.6075, "train/learning_rate": 0.00031999999999999997, "train/epoch": 6.0, "_timestamp": 1746912015, "_runtime": 14613}, "step": 5200} {"train_info/time_between_train_steps": 28.12844157218933, "step": 5200} {"info/global_step": 5201, "train_info/time_within_train_step": 2.4426612854003906, "step": 5201} {"train_info/time_between_train_steps": 0.0035331249237060547, "step": 5201} {"info/global_step": 5202, "train_info/time_within_train_step": 2.4533908367156982, "step": 5202} {"train_info/time_between_train_steps": 0.003457307815551758, "step": 5202} {"info/global_step": 5203, "train_info/time_within_train_step": 2.597768545150757, "step": 5203} {"train_info/time_between_train_steps": 0.003484010696411133, "step": 5203} {"info/global_step": 5204, "train_info/time_within_train_step": 2.6463372707366943, "step": 5204} {"train_info/time_between_train_steps": 0.0034494400024414062, "step": 5204} {"info/global_step": 5205, "train_info/time_within_train_step": 2.638225793838501, "step": 5205} {"train_info/time_between_train_steps": 0.0034830570220947266, "step": 5205} {"info/global_step": 5206, "train_info/time_within_train_step": 2.642082452774048, "step": 5206} {"train_info/time_between_train_steps": 0.0036249160766601562, "step": 5206} {"info/global_step": 5207, "train_info/time_within_train_step": 2.6426994800567627, "step": 5207} {"train_info/time_between_train_steps": 0.0036253929138183594, "step": 5207} {"info/global_step": 5208, "train_info/time_within_train_step": 2.642704725265503, "step": 5208} {"train_info/time_between_train_steps": 0.0036611557006835938, "step": 5208} {"info/global_step": 5209, "train_info/time_within_train_step": 2.643796443939209, "step": 5209} {"train_info/time_between_train_steps": 0.0036509037017822266, "step": 5209} {"info/global_step": 5210, "train_info/time_within_train_step": 2.6507225036621094, "step": 5210} {"train_info/time_between_train_steps": 0.0037097930908203125, "step": 5210} {"info/global_step": 5211, "train_info/time_within_train_step": 2.658332347869873, "step": 5211} {"train_info/time_between_train_steps": 0.0036118030548095703, "step": 5211} {"info/global_step": 5212, "train_info/time_within_train_step": 2.644533634185791, "step": 5212} {"train_info/time_between_train_steps": 0.003634929656982422, "step": 5212} {"info/global_step": 5213, "train_info/time_within_train_step": 2.6442623138427734, "step": 5213} {"train_info/time_between_train_steps": 0.003528594970703125, "step": 5213} {"info/global_step": 5214, "train_info/time_within_train_step": 2.645240068435669, "step": 5214} {"train_info/time_between_train_steps": 0.0035524368286132812, "step": 5214} {"info/global_step": 5215, "train_info/time_within_train_step": 2.644432306289673, "step": 5215} {"train_info/time_between_train_steps": 0.0036830902099609375, "step": 5215} {"info/global_step": 5216, "train_info/time_within_train_step": 2.682204246520996, "step": 5216} {"train_info/time_between_train_steps": 0.0035059452056884766, "step": 5216} {"info/global_step": 5217, "train_info/time_within_train_step": 2.646820545196533, "step": 5217} {"train_info/time_between_train_steps": 0.0034360885620117188, "step": 5217} {"info/global_step": 5218, "train_info/time_within_train_step": 2.662783145904541, "step": 5218} {"train_info/time_between_train_steps": 0.003482818603515625, "step": 5218} {"info/global_step": 5219, "train_info/time_within_train_step": 2.6447811126708984, "step": 5219} {"train_info/time_between_train_steps": 0.0034499168395996094, "step": 5219} {"info/global_step": 5220, "train_info/time_within_train_step": 2.678945541381836, "step": 5220} {"train_info/time_between_train_steps": 0.003493785858154297, "step": 5220} {"info/global_step": 5221, "train_info/time_within_train_step": 2.686732530593872, "step": 5221} {"train_info/time_between_train_steps": 0.003527402877807617, "step": 5221} {"info/global_step": 5222, "train_info/time_within_train_step": 2.733351469039917, "step": 5222} {"train_info/time_between_train_steps": 0.0034623146057128906, "step": 5222} {"info/global_step": 5223, "train_info/time_within_train_step": 2.663301944732666, "step": 5223} {"train_info/time_between_train_steps": 0.0034635066986083984, "step": 5223} {"info/global_step": 5224, "train_info/time_within_train_step": 2.641453742980957, "step": 5224} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 5224} {"info/global_step": 5225, "train_info/time_within_train_step": 2.654618263244629, "step": 5225} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 5225} {"info/global_step": 5226, "train_info/time_within_train_step": 2.649675130844116, "step": 5226} {"train_info/time_between_train_steps": 0.003468036651611328, "step": 5226} {"info/global_step": 5227, "train_info/time_within_train_step": 2.652369499206543, "step": 5227} {"train_info/time_between_train_steps": 0.003440380096435547, "step": 5227} {"info/global_step": 5228, "train_info/time_within_train_step": 2.6474249362945557, "step": 5228} {"train_info/time_between_train_steps": 0.0034627914428710938, "step": 5228} {"info/global_step": 5229, "train_info/time_within_train_step": 2.6504693031311035, "step": 5229} {"train_info/time_between_train_steps": 0.003500223159790039, "step": 5229} {"info/global_step": 5230, "train_info/time_within_train_step": 2.6642906665802, "step": 5230} {"train_info/time_between_train_steps": 0.0036618709564208984, "step": 5230} {"info/global_step": 5231, "train_info/time_within_train_step": 2.6701667308807373, "step": 5231} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 5231} {"info/global_step": 5232, "train_info/time_within_train_step": 3.0121583938598633, "step": 5232} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 5232} {"info/global_step": 5233, "train_info/time_within_train_step": 2.643613338470459, "step": 5233} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 5233} {"info/global_step": 5234, "train_info/time_within_train_step": 2.653996229171753, "step": 5234} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 5234} {"info/global_step": 5235, "train_info/time_within_train_step": 2.6519389152526855, "step": 5235} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 5235} {"info/global_step": 5236, "train_info/time_within_train_step": 2.654510736465454, "step": 5236} {"train_info/time_between_train_steps": 0.003448009490966797, "step": 5236} {"info/global_step": 5237, "train_info/time_within_train_step": 2.6452393531799316, "step": 5237} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 5237} {"info/global_step": 5238, "train_info/time_within_train_step": 2.6446430683135986, "step": 5238} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 5238} {"info/global_step": 5239, "train_info/time_within_train_step": 2.6545205116271973, "step": 5239} {"train_info/time_between_train_steps": 0.0034360885620117188, "step": 5239} {"info/global_step": 5240, "train_info/time_within_train_step": 2.6521406173706055, "step": 5240} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 5240} {"info/global_step": 5241, "train_info/time_within_train_step": 2.8055405616760254, "step": 5241} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 5241} {"info/global_step": 5242, "train_info/time_within_train_step": 2.651630401611328, "step": 5242} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 5242} {"info/global_step": 5243, "train_info/time_within_train_step": 2.662574529647827, "step": 5243} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 5243} {"info/global_step": 5244, "train_info/time_within_train_step": 2.682713270187378, "step": 5244} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 5244} {"info/global_step": 5245, "train_info/time_within_train_step": 2.7296414375305176, "step": 5245} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 5245} {"info/global_step": 5246, "train_info/time_within_train_step": 2.653407573699951, "step": 5246} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 5246} {"info/global_step": 5247, "train_info/time_within_train_step": 2.641928195953369, "step": 5247} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 5247} {"info/global_step": 5248, "train_info/time_within_train_step": 2.6565444469451904, "step": 5248} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 5248} {"info/global_step": 5249, "train_info/time_within_train_step": 3.2749383449554443, "step": 5249} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 5249} {"info/global_step": 5250, "train_info/time_within_train_step": 2.6458451747894287, "step": 5250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746912182, "_runtime": 14780}, "step": 5250} {"logs": {"train/loss": 3.5692, "train/learning_rate": 0.00031666666666666665, "train/epoch": 6.01, "_timestamp": 1746912182, "_runtime": 14780}, "step": 5250} {"train_info/time_between_train_steps": 0.023722171783447266, "step": 5250} {"info/global_step": 5251, "train_info/time_within_train_step": 2.657454013824463, "step": 5251} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 5251} {"info/global_step": 5252, "train_info/time_within_train_step": 2.6519577503204346, "step": 5252} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 5252} {"info/global_step": 5253, "train_info/time_within_train_step": 2.6595451831817627, "step": 5253} {"train_info/time_between_train_steps": 0.003292083740234375, "step": 5253} {"info/global_step": 5254, "train_info/time_within_train_step": 2.6972382068634033, "step": 5254} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 5254} {"info/global_step": 5255, "train_info/time_within_train_step": 2.718838691711426, "step": 5255} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 5255} {"info/global_step": 5256, "train_info/time_within_train_step": 2.6432714462280273, "step": 5256} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 5256} {"info/global_step": 5257, "train_info/time_within_train_step": 2.6412088871002197, "step": 5257} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 5257} {"info/global_step": 5258, "train_info/time_within_train_step": 2.6603150367736816, "step": 5258} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 5258} {"info/global_step": 5259, "train_info/time_within_train_step": 2.6490306854248047, "step": 5259} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 5259} {"info/global_step": 5260, "train_info/time_within_train_step": 2.6443984508514404, "step": 5260} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 5260} {"info/global_step": 5261, "train_info/time_within_train_step": 2.6518142223358154, "step": 5261} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 5261} {"info/global_step": 5262, "train_info/time_within_train_step": 2.6451711654663086, "step": 5262} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 5262} {"info/global_step": 5263, "train_info/time_within_train_step": 2.6706619262695312, "step": 5263} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 5263} {"info/global_step": 5264, "train_info/time_within_train_step": 2.693721294403076, "step": 5264} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 5264} {"info/global_step": 5265, "train_info/time_within_train_step": 2.667738199234009, "step": 5265} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 5265} {"info/global_step": 5266, "train_info/time_within_train_step": 2.6629245281219482, "step": 5266} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 5266} {"info/global_step": 5267, "train_info/time_within_train_step": 2.650219678878784, "step": 5267} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 5267} {"info/global_step": 5268, "train_info/time_within_train_step": 2.6470494270324707, "step": 5268} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 5268} {"info/global_step": 5269, "train_info/time_within_train_step": 2.6597976684570312, "step": 5269} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 5269} {"info/global_step": 5270, "train_info/time_within_train_step": 2.6448252201080322, "step": 5270} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 5270} {"info/global_step": 5271, "train_info/time_within_train_step": 2.645892858505249, "step": 5271} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 5271} {"info/global_step": 5272, "train_info/time_within_train_step": 2.6701831817626953, "step": 5272} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 5272} {"info/global_step": 5273, "train_info/time_within_train_step": 2.679356813430786, "step": 5273} {"train_info/time_between_train_steps": 0.003629446029663086, "step": 5273} {"info/global_step": 5274, "train_info/time_within_train_step": 2.6565492153167725, "step": 5274} {"train_info/time_between_train_steps": 0.0032851696014404297, "step": 5274} {"info/global_step": 5275, "train_info/time_within_train_step": 2.6885986328125, "step": 5275} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 5275} {"info/global_step": 5276, "train_info/time_within_train_step": 2.6417829990386963, "step": 5276} {"train_info/time_between_train_steps": 0.0032820701599121094, "step": 5276} {"info/global_step": 5277, "train_info/time_within_train_step": 2.649019479751587, "step": 5277} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 5277} {"info/global_step": 5278, "train_info/time_within_train_step": 2.6622157096862793, "step": 5278} {"train_info/time_between_train_steps": 0.0032820701599121094, "step": 5278} {"info/global_step": 5279, "train_info/time_within_train_step": 2.6470437049865723, "step": 5279} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 5279} {"info/global_step": 5280, "train_info/time_within_train_step": 2.6465063095092773, "step": 5280} {"train_info/time_between_train_steps": 0.0034635066986083984, "step": 5280} {"info/global_step": 5281, "train_info/time_within_train_step": 2.662161111831665, "step": 5281} {"train_info/time_between_train_steps": 0.003445148468017578, "step": 5281} {"info/global_step": 5282, "train_info/time_within_train_step": 2.6617746353149414, "step": 5282} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 5282} {"info/global_step": 5283, "train_info/time_within_train_step": 2.677849054336548, "step": 5283} {"train_info/time_between_train_steps": 0.0035104751586914062, "step": 5283} {"info/global_step": 5284, "train_info/time_within_train_step": 2.666982412338257, "step": 5284} {"train_info/time_between_train_steps": 0.0035326480865478516, "step": 5284} {"info/global_step": 5285, "train_info/time_within_train_step": 2.703235387802124, "step": 5285} {"train_info/time_between_train_steps": 0.0035085678100585938, "step": 5285} {"info/global_step": 5286, "train_info/time_within_train_step": 2.6440606117248535, "step": 5286} {"train_info/time_between_train_steps": 0.0034673213958740234, "step": 5286} {"info/global_step": 5287, "train_info/time_within_train_step": 2.6492693424224854, "step": 5287} {"train_info/time_between_train_steps": 0.0034873485565185547, "step": 5287} {"info/global_step": 5288, "train_info/time_within_train_step": 2.6661627292633057, "step": 5288} {"train_info/time_between_train_steps": 0.0034592151641845703, "step": 5288} {"info/global_step": 5289, "train_info/time_within_train_step": 2.644577980041504, "step": 5289} {"train_info/time_between_train_steps": 0.0034821033477783203, "step": 5289} {"info/global_step": 5290, "train_info/time_within_train_step": 2.6786704063415527, "step": 5290} {"train_info/time_between_train_steps": 0.0035080909729003906, "step": 5290} {"info/global_step": 5291, "train_info/time_within_train_step": 2.645996332168579, "step": 5291} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 5291} {"info/global_step": 5292, "train_info/time_within_train_step": 2.662301540374756, "step": 5292} {"train_info/time_between_train_steps": 0.0034596920013427734, "step": 5292} {"info/global_step": 5293, "train_info/time_within_train_step": 2.653311252593994, "step": 5293} {"train_info/time_between_train_steps": 0.003540515899658203, "step": 5293} {"info/global_step": 5294, "train_info/time_within_train_step": 2.6613059043884277, "step": 5294} {"train_info/time_between_train_steps": 0.0034914016723632812, "step": 5294} {"info/global_step": 5295, "train_info/time_within_train_step": 2.717024087905884, "step": 5295} {"train_info/time_between_train_steps": 0.003443479537963867, "step": 5295} {"info/global_step": 5296, "train_info/time_within_train_step": 2.6430304050445557, "step": 5296} {"train_info/time_between_train_steps": 0.003509044647216797, "step": 5296} {"info/global_step": 5297, "train_info/time_within_train_step": 2.645282030105591, "step": 5297} {"train_info/time_between_train_steps": 0.003464221954345703, "step": 5297} {"info/global_step": 5298, "train_info/time_within_train_step": 2.6507813930511475, "step": 5298} {"train_info/time_between_train_steps": 0.0034618377685546875, "step": 5298} {"info/global_step": 5299, "train_info/time_within_train_step": 2.6469531059265137, "step": 5299} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 5299} {"info/global_step": 5300, "train_info/time_within_train_step": 2.6562976837158203, "step": 5300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746912317, "_runtime": 14915}, "step": 5300} {"logs": {"train/loss": 3.564, "train/learning_rate": 0.0003133333333333333, "train/epoch": 6.01, "_timestamp": 1746912317, "_runtime": 14915}, "step": 5300} {"train_info/time_between_train_steps": 0.024840116500854492, "step": 5300} {"info/global_step": 5301, "train_info/time_within_train_step": 2.6521573066711426, "step": 5301} {"train_info/time_between_train_steps": 0.003408670425415039, "step": 5301} {"info/global_step": 5302, "train_info/time_within_train_step": 2.66508412361145, "step": 5302} {"train_info/time_between_train_steps": 0.0034325122833251953, "step": 5302} {"info/global_step": 5303, "train_info/time_within_train_step": 2.6423873901367188, "step": 5303} {"train_info/time_between_train_steps": 0.16079068183898926, "step": 5303} {"info/global_step": 5304, "train_info/time_within_train_step": 2.660073757171631, "step": 5304} {"train_info/time_between_train_steps": 0.0032639503479003906, "step": 5304} {"info/global_step": 5305, "train_info/time_within_train_step": 2.6428627967834473, "step": 5305} {"train_info/time_between_train_steps": 0.0033533573150634766, "step": 5305} {"info/global_step": 5306, "train_info/time_within_train_step": 2.6610419750213623, "step": 5306} {"train_info/time_between_train_steps": 0.0034780502319335938, "step": 5306} {"info/global_step": 5307, "train_info/time_within_train_step": 2.65364146232605, "step": 5307} {"train_info/time_between_train_steps": 0.0034301280975341797, "step": 5307} {"info/global_step": 5308, "train_info/time_within_train_step": 2.646083116531372, "step": 5308} {"train_info/time_between_train_steps": 0.0033044815063476562, "step": 5308} {"info/global_step": 5309, "train_info/time_within_train_step": 2.6441490650177, "step": 5309} {"train_info/time_between_train_steps": 0.0033473968505859375, "step": 5309} {"info/global_step": 5310, "train_info/time_within_train_step": 2.6517741680145264, "step": 5310} {"train_info/time_between_train_steps": 0.003509998321533203, "step": 5310} {"info/global_step": 5311, "train_info/time_within_train_step": 2.671497344970703, "step": 5311} {"train_info/time_between_train_steps": 0.0035572052001953125, "step": 5311} {"info/global_step": 5312, "train_info/time_within_train_step": 2.671884775161743, "step": 5312} {"train_info/time_between_train_steps": 0.0035910606384277344, "step": 5312} {"info/global_step": 5313, "train_info/time_within_train_step": 2.656888246536255, "step": 5313} {"train_info/time_between_train_steps": 0.0035424232482910156, "step": 5313} {"info/global_step": 5314, "train_info/time_within_train_step": 2.6878931522369385, "step": 5314} {"train_info/time_between_train_steps": 0.0035076141357421875, "step": 5314} {"info/global_step": 5315, "train_info/time_within_train_step": 2.6443397998809814, "step": 5315} {"train_info/time_between_train_steps": 0.0034787654876708984, "step": 5315} {"info/global_step": 5316, "train_info/time_within_train_step": 2.6560800075531006, "step": 5316} {"train_info/time_between_train_steps": 0.003493785858154297, "step": 5316} {"info/global_step": 5317, "train_info/time_within_train_step": 2.6585891246795654, "step": 5317} {"train_info/time_between_train_steps": 0.003520488739013672, "step": 5317} {"info/global_step": 5318, "train_info/time_within_train_step": 2.6453914642333984, "step": 5318} {"train_info/time_between_train_steps": 0.0035309791564941406, "step": 5318} {"info/global_step": 5319, "train_info/time_within_train_step": 2.6460201740264893, "step": 5319} {"train_info/time_between_train_steps": 0.0034914016723632812, "step": 5319} {"info/global_step": 5320, "train_info/time_within_train_step": 2.6675100326538086, "step": 5320} {"train_info/time_between_train_steps": 0.0035843849182128906, "step": 5320} {"info/global_step": 5321, "train_info/time_within_train_step": 2.659616470336914, "step": 5321} {"train_info/time_between_train_steps": 0.003582000732421875, "step": 5321} {"info/global_step": 5322, "train_info/time_within_train_step": 2.6715688705444336, "step": 5322} {"train_info/time_between_train_steps": 0.0034830570220947266, "step": 5322} {"info/global_step": 5323, "train_info/time_within_train_step": 2.677426815032959, "step": 5323} {"train_info/time_between_train_steps": 0.00351715087890625, "step": 5323} {"info/global_step": 5324, "train_info/time_within_train_step": 2.682068347930908, "step": 5324} {"train_info/time_between_train_steps": 0.003496408462524414, "step": 5324} {"info/global_step": 5325, "train_info/time_within_train_step": 2.642839193344116, "step": 5325} {"train_info/time_between_train_steps": 0.0035283565521240234, "step": 5325} {"info/global_step": 5326, "train_info/time_within_train_step": 2.642371892929077, "step": 5326} {"train_info/time_between_train_steps": 0.003553628921508789, "step": 5326} {"info/global_step": 5327, "train_info/time_within_train_step": 2.667611837387085, "step": 5327} {"train_info/time_between_train_steps": 0.0035181045532226562, "step": 5327} {"info/global_step": 5328, "train_info/time_within_train_step": 2.65322208404541, "step": 5328} {"train_info/time_between_train_steps": 0.0034945011138916016, "step": 5328} {"info/global_step": 5329, "train_info/time_within_train_step": 2.6458404064178467, "step": 5329} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 5329} {"info/global_step": 5330, "train_info/time_within_train_step": 2.9879071712493896, "step": 5330} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 5330} {"info/global_step": 5331, "train_info/time_within_train_step": 2.6423373222351074, "step": 5331} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 5331} {"info/global_step": 5332, "train_info/time_within_train_step": 2.6575026512145996, "step": 5332} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 5332} {"info/global_step": 5333, "train_info/time_within_train_step": 2.6541242599487305, "step": 5333} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 5333} {"info/global_step": 5334, "train_info/time_within_train_step": 2.644775629043579, "step": 5334} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 5334} {"info/global_step": 5335, "train_info/time_within_train_step": 2.6698851585388184, "step": 5335} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 5335} {"info/global_step": 5336, "train_info/time_within_train_step": 2.6589176654815674, "step": 5336} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 5336} {"info/global_step": 5337, "train_info/time_within_train_step": 2.670335054397583, "step": 5337} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 5337} {"info/global_step": 5338, "train_info/time_within_train_step": 2.7298507690429688, "step": 5338} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 5338} {"info/global_step": 5339, "train_info/time_within_train_step": 2.6691503524780273, "step": 5339} {"train_info/time_between_train_steps": 0.003304719924926758, "step": 5339} {"info/global_step": 5340, "train_info/time_within_train_step": 2.6421985626220703, "step": 5340} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 5340} {"info/global_step": 5341, "train_info/time_within_train_step": 2.644770860671997, "step": 5341} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 5341} {"info/global_step": 5342, "train_info/time_within_train_step": 2.6560049057006836, "step": 5342} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 5342} {"info/global_step": 5343, "train_info/time_within_train_step": 2.6544413566589355, "step": 5343} {"train_info/time_between_train_steps": 0.0032546520233154297, "step": 5343} {"info/global_step": 5344, "train_info/time_within_train_step": 2.6440980434417725, "step": 5344} {"train_info/time_between_train_steps": 0.003204345703125, "step": 5344} {"info/global_step": 5345, "train_info/time_within_train_step": 2.6490979194641113, "step": 5345} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 5345} {"info/global_step": 5346, "train_info/time_within_train_step": 2.6589267253875732, "step": 5346} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 5346} {"info/global_step": 5347, "train_info/time_within_train_step": 2.6671764850616455, "step": 5347} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 5347} {"info/global_step": 5348, "train_info/time_within_train_step": 2.7093002796173096, "step": 5348} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 5348} {"info/global_step": 5349, "train_info/time_within_train_step": 2.6434123516082764, "step": 5349} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 5349} {"info/global_step": 5350, "train_info/time_within_train_step": 2.654862880706787, "step": 5350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746912451, "_runtime": 15049}, "step": 5350} {"logs": {"train/loss": 3.5549, "train/learning_rate": 0.00031, "train/epoch": 6.02, "_timestamp": 1746912451, "_runtime": 15049}, "step": 5350} {"train_info/time_between_train_steps": 0.024719715118408203, "step": 5350} {"info/global_step": 5351, "train_info/time_within_train_step": 2.6402010917663574, "step": 5351} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 5351} {"info/global_step": 5352, "train_info/time_within_train_step": 2.6556615829467773, "step": 5352} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 5352} {"info/global_step": 5353, "train_info/time_within_train_step": 2.658390760421753, "step": 5353} {"train_info/time_between_train_steps": 0.003302335739135742, "step": 5353} {"info/global_step": 5354, "train_info/time_within_train_step": 2.645491600036621, "step": 5354} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 5354} {"info/global_step": 5355, "train_info/time_within_train_step": 2.6442344188690186, "step": 5355} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 5355} {"info/global_step": 5356, "train_info/time_within_train_step": 2.6431448459625244, "step": 5356} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 5356} {"info/global_step": 5357, "train_info/time_within_train_step": 2.643047332763672, "step": 5357} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 5357} {"info/global_step": 5358, "train_info/time_within_train_step": 2.654165744781494, "step": 5358} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 5358} {"info/global_step": 5359, "train_info/time_within_train_step": 2.6637747287750244, "step": 5359} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 5359} {"info/global_step": 5360, "train_info/time_within_train_step": 2.6458215713500977, "step": 5360} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 5360} {"info/global_step": 5361, "train_info/time_within_train_step": 2.6446421146392822, "step": 5361} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 5361} {"info/global_step": 5362, "train_info/time_within_train_step": 2.6548359394073486, "step": 5362} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 5362} {"info/global_step": 5363, "train_info/time_within_train_step": 2.6628074645996094, "step": 5363} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 5363} {"info/global_step": 5364, "train_info/time_within_train_step": 2.6524276733398438, "step": 5364} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 5364} {"info/global_step": 5365, "train_info/time_within_train_step": 2.6440927982330322, "step": 5365} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 5365} {"info/global_step": 5366, "train_info/time_within_train_step": 2.823498487472534, "step": 5366} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 5366} {"info/global_step": 5367, "train_info/time_within_train_step": 2.650930643081665, "step": 5367} {"train_info/time_between_train_steps": 0.003556489944458008, "step": 5367} {"info/global_step": 5368, "train_info/time_within_train_step": 2.6504905223846436, "step": 5368} {"train_info/time_between_train_steps": 0.003545045852661133, "step": 5368} {"info/global_step": 5369, "train_info/time_within_train_step": 2.6547093391418457, "step": 5369} {"train_info/time_between_train_steps": 0.0035479068756103516, "step": 5369} {"info/global_step": 5370, "train_info/time_within_train_step": 2.6509571075439453, "step": 5370} {"train_info/time_between_train_steps": 0.0035691261291503906, "step": 5370} {"info/global_step": 5371, "train_info/time_within_train_step": 2.645814895629883, "step": 5371} {"train_info/time_between_train_steps": 0.0034494400024414062, "step": 5371} {"info/global_step": 5372, "train_info/time_within_train_step": 2.657790184020996, "step": 5372} {"train_info/time_between_train_steps": 0.003454446792602539, "step": 5372} {"info/global_step": 5373, "train_info/time_within_train_step": 2.6551501750946045, "step": 5373} {"train_info/time_between_train_steps": 0.0035729408264160156, "step": 5373} {"info/global_step": 5374, "train_info/time_within_train_step": 2.6612203121185303, "step": 5374} {"train_info/time_between_train_steps": 0.00354766845703125, "step": 5374} {"info/global_step": 5375, "train_info/time_within_train_step": 2.706660270690918, "step": 5375} {"train_info/time_between_train_steps": 0.0036559104919433594, "step": 5375} {"info/global_step": 5376, "train_info/time_within_train_step": 2.694220542907715, "step": 5376} {"train_info/time_between_train_steps": 0.003519296646118164, "step": 5376} {"info/global_step": 5377, "train_info/time_within_train_step": 2.6448538303375244, "step": 5377} {"train_info/time_between_train_steps": 0.003464221954345703, "step": 5377} {"info/global_step": 5378, "train_info/time_within_train_step": 2.643531084060669, "step": 5378} {"train_info/time_between_train_steps": 0.003412961959838867, "step": 5378} {"info/global_step": 5379, "train_info/time_within_train_step": 2.6598236560821533, "step": 5379} {"train_info/time_between_train_steps": 0.0034677982330322266, "step": 5379} {"info/global_step": 5380, "train_info/time_within_train_step": 2.6548776626586914, "step": 5380} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 5380} {"info/global_step": 5381, "train_info/time_within_train_step": 2.6453113555908203, "step": 5381} {"train_info/time_between_train_steps": 0.003472566604614258, "step": 5381} {"info/global_step": 5382, "train_info/time_within_train_step": 2.6536505222320557, "step": 5382} {"train_info/time_between_train_steps": 0.0034580230712890625, "step": 5382} {"info/global_step": 5383, "train_info/time_within_train_step": 2.6480603218078613, "step": 5383} {"train_info/time_between_train_steps": 0.003547191619873047, "step": 5383} {"info/global_step": 5384, "train_info/time_within_train_step": 2.670520067214966, "step": 5384} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 5384} {"info/global_step": 5385, "train_info/time_within_train_step": 2.689072847366333, "step": 5385} {"train_info/time_between_train_steps": 0.003490447998046875, "step": 5385} {"info/global_step": 5386, "train_info/time_within_train_step": 2.6732900142669678, "step": 5386} {"train_info/time_between_train_steps": 0.0035021305084228516, "step": 5386} {"info/global_step": 5387, "train_info/time_within_train_step": 2.660144805908203, "step": 5387} {"train_info/time_between_train_steps": 0.0035872459411621094, "step": 5387} {"info/global_step": 5388, "train_info/time_within_train_step": 2.644818067550659, "step": 5388} {"train_info/time_between_train_steps": 0.0034685134887695312, "step": 5388} {"info/global_step": 5389, "train_info/time_within_train_step": 3.0035457611083984, "step": 5389} {"train_info/time_between_train_steps": 0.003493070602416992, "step": 5389} {"info/global_step": 5390, "train_info/time_within_train_step": 2.667224168777466, "step": 5390} {"train_info/time_between_train_steps": 0.0033249855041503906, "step": 5390} {"info/global_step": 5391, "train_info/time_within_train_step": 2.702669620513916, "step": 5391} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 5391} {"info/global_step": 5392, "train_info/time_within_train_step": 2.644918918609619, "step": 5392} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 5392} {"info/global_step": 5393, "train_info/time_within_train_step": 2.651090145111084, "step": 5393} {"train_info/time_between_train_steps": 0.0032625198364257812, "step": 5393} {"info/global_step": 5394, "train_info/time_within_train_step": 2.6507561206817627, "step": 5394} {"train_info/time_between_train_steps": 0.0032749176025390625, "step": 5394} {"info/global_step": 5395, "train_info/time_within_train_step": 2.6477677822113037, "step": 5395} {"train_info/time_between_train_steps": 0.003378152847290039, "step": 5395} {"info/global_step": 5396, "train_info/time_within_train_step": 2.6562557220458984, "step": 5396} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 5396} {"info/global_step": 5397, "train_info/time_within_train_step": 2.6445181369781494, "step": 5397} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 5397} {"info/global_step": 5398, "train_info/time_within_train_step": 2.6472713947296143, "step": 5398} {"train_info/time_between_train_steps": 0.0033195018768310547, "step": 5398} {"info/global_step": 5399, "train_info/time_within_train_step": 2.6669602394104004, "step": 5399} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 5399} {"info/global_step": 5400, "train_info/time_within_train_step": 2.654397487640381, "step": 5400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746912586, "_runtime": 15184}, "step": 5400} {"logs": {"train/loss": 3.5369, "train/learning_rate": 0.0003066666666666666, "train/epoch": 6.02, "_timestamp": 1746912586, "_runtime": 15184}, "step": 5400} {"train_info/time_between_train_steps": 13.706395149230957, "step": 5400} {"info/global_step": 5401, "train_info/time_within_train_step": 2.4539310932159424, "step": 5401} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 5401} {"info/global_step": 5402, "train_info/time_within_train_step": 2.4390807151794434, "step": 5402} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 5402} {"info/global_step": 5403, "train_info/time_within_train_step": 2.58767032623291, "step": 5403} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 5403} {"info/global_step": 5404, "train_info/time_within_train_step": 2.6432299613952637, "step": 5404} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 5404} {"info/global_step": 5405, "train_info/time_within_train_step": 2.648252487182617, "step": 5405} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 5405} {"info/global_step": 5406, "train_info/time_within_train_step": 2.6434686183929443, "step": 5406} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 5406} {"info/global_step": 5407, "train_info/time_within_train_step": 2.669133186340332, "step": 5407} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 5407} {"info/global_step": 5408, "train_info/time_within_train_step": 2.683687686920166, "step": 5408} {"train_info/time_between_train_steps": 0.0032532215118408203, "step": 5408} {"info/global_step": 5409, "train_info/time_within_train_step": 2.667273998260498, "step": 5409} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 5409} {"info/global_step": 5410, "train_info/time_within_train_step": 2.662569522857666, "step": 5410} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 5410} {"info/global_step": 5411, "train_info/time_within_train_step": 2.642754316329956, "step": 5411} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 5411} {"info/global_step": 5412, "train_info/time_within_train_step": 2.65568208694458, "step": 5412} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 5412} {"info/global_step": 5413, "train_info/time_within_train_step": 2.6631882190704346, "step": 5413} {"train_info/time_between_train_steps": 0.003252267837524414, "step": 5413} {"info/global_step": 5414, "train_info/time_within_train_step": 2.64630126953125, "step": 5414} {"train_info/time_between_train_steps": 0.003294706344604492, "step": 5414} {"info/global_step": 5415, "train_info/time_within_train_step": 2.6461422443389893, "step": 5415} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 5415} {"info/global_step": 5416, "train_info/time_within_train_step": 2.650317668914795, "step": 5416} {"train_info/time_between_train_steps": 0.003827810287475586, "step": 5416} {"info/global_step": 5417, "train_info/time_within_train_step": 2.652031660079956, "step": 5417} {"train_info/time_between_train_steps": 0.003877878189086914, "step": 5417} {"info/global_step": 5418, "train_info/time_within_train_step": 2.6527099609375, "step": 5418} {"train_info/time_between_train_steps": 0.0038421154022216797, "step": 5418} {"info/global_step": 5419, "train_info/time_within_train_step": 2.64947772026062, "step": 5419} {"train_info/time_between_train_steps": 0.0035812854766845703, "step": 5419} {"info/global_step": 5420, "train_info/time_within_train_step": 4.188014507293701, "step": 5420} {"train_info/time_between_train_steps": 0.003604888916015625, "step": 5420} {"info/global_step": 5421, "train_info/time_within_train_step": 2.6459710597991943, "step": 5421} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 5421} {"info/global_step": 5422, "train_info/time_within_train_step": 2.654017686843872, "step": 5422} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 5422} {"info/global_step": 5423, "train_info/time_within_train_step": 2.64864444732666, "step": 5423} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 5423} {"info/global_step": 5424, "train_info/time_within_train_step": 2.6745007038116455, "step": 5424} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 5424} {"info/global_step": 5425, "train_info/time_within_train_step": 2.6665377616882324, "step": 5425} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 5425} {"info/global_step": 5426, "train_info/time_within_train_step": 2.6531829833984375, "step": 5426} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 5426} {"info/global_step": 5427, "train_info/time_within_train_step": 2.652879238128662, "step": 5427} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 5427} {"info/global_step": 5428, "train_info/time_within_train_step": 2.6608781814575195, "step": 5428} {"train_info/time_between_train_steps": 0.13199400901794434, "step": 5428} {"info/global_step": 5429, "train_info/time_within_train_step": 2.6790692806243896, "step": 5429} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 5429} {"info/global_step": 5430, "train_info/time_within_train_step": 2.715932846069336, "step": 5430} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 5430} {"info/global_step": 5431, "train_info/time_within_train_step": 2.642174482345581, "step": 5431} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 5431} {"info/global_step": 5432, "train_info/time_within_train_step": 2.6416702270507812, "step": 5432} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 5432} {"info/global_step": 5433, "train_info/time_within_train_step": 2.6615562438964844, "step": 5433} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 5433} {"info/global_step": 5434, "train_info/time_within_train_step": 2.6529924869537354, "step": 5434} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 5434} {"info/global_step": 5435, "train_info/time_within_train_step": 2.645256757736206, "step": 5435} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 5435} {"info/global_step": 5436, "train_info/time_within_train_step": 2.653111696243286, "step": 5436} {"train_info/time_between_train_steps": 0.0032355785369873047, "step": 5436} {"info/global_step": 5437, "train_info/time_within_train_step": 2.6499722003936768, "step": 5437} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 5437} {"info/global_step": 5438, "train_info/time_within_train_step": 2.6676695346832275, "step": 5438} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 5438} {"info/global_step": 5439, "train_info/time_within_train_step": 2.7083516120910645, "step": 5439} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 5439} {"info/global_step": 5440, "train_info/time_within_train_step": 2.640773057937622, "step": 5440} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 5440} {"info/global_step": 5441, "train_info/time_within_train_step": 2.6519596576690674, "step": 5441} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 5441} {"info/global_step": 5442, "train_info/time_within_train_step": 2.6523125171661377, "step": 5442} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 5442} {"info/global_step": 5443, "train_info/time_within_train_step": 2.6496875286102295, "step": 5443} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 5443} {"info/global_step": 5444, "train_info/time_within_train_step": 2.9055395126342773, "step": 5444} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 5444} {"info/global_step": 5445, "train_info/time_within_train_step": 2.642031669616699, "step": 5445} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 5445} {"info/global_step": 5446, "train_info/time_within_train_step": 2.650115728378296, "step": 5446} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 5446} {"info/global_step": 5447, "train_info/time_within_train_step": 2.6625874042510986, "step": 5447} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 5447} {"info/global_step": 5448, "train_info/time_within_train_step": 2.6443264484405518, "step": 5448} {"train_info/time_between_train_steps": 0.0032520294189453125, "step": 5448} {"info/global_step": 5449, "train_info/time_within_train_step": 2.643998146057129, "step": 5449} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 5449} {"info/global_step": 5450, "train_info/time_within_train_step": 2.666990280151367, "step": 5450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746912737, "_runtime": 15335}, "step": 5450} {"logs": {"train/loss": 3.5354, "train/learning_rate": 0.0003033333333333333, "train/epoch": 6.03, "_timestamp": 1746912737, "_runtime": 15335}, "step": 5450} {"train_info/time_between_train_steps": 0.024534225463867188, "step": 5450} {"info/global_step": 5451, "train_info/time_within_train_step": 2.671435832977295, "step": 5451} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 5451} {"info/global_step": 5452, "train_info/time_within_train_step": 2.670382022857666, "step": 5452} {"train_info/time_between_train_steps": 0.0032806396484375, "step": 5452} {"info/global_step": 5453, "train_info/time_within_train_step": 2.658179998397827, "step": 5453} {"train_info/time_between_train_steps": 0.003327608108520508, "step": 5453} {"info/global_step": 5454, "train_info/time_within_train_step": 2.6871039867401123, "step": 5454} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 5454} {"info/global_step": 5455, "train_info/time_within_train_step": 2.6455459594726562, "step": 5455} {"train_info/time_between_train_steps": 0.003416299819946289, "step": 5455} {"info/global_step": 5456, "train_info/time_within_train_step": 2.645491123199463, "step": 5456} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 5456} {"info/global_step": 5457, "train_info/time_within_train_step": 2.669282913208008, "step": 5457} {"train_info/time_between_train_steps": 0.0035071372985839844, "step": 5457} {"info/global_step": 5458, "train_info/time_within_train_step": 2.660330057144165, "step": 5458} {"train_info/time_between_train_steps": 0.004134654998779297, "step": 5458} {"info/global_step": 5459, "train_info/time_within_train_step": 2.6718411445617676, "step": 5459} {"train_info/time_between_train_steps": 0.003518819808959961, "step": 5459} {"info/global_step": 5460, "train_info/time_within_train_step": 2.680795669555664, "step": 5460} {"train_info/time_between_train_steps": 0.0034477710723876953, "step": 5460} {"info/global_step": 5461, "train_info/time_within_train_step": 2.6799659729003906, "step": 5461} {"train_info/time_between_train_steps": 0.003553628921508789, "step": 5461} {"info/global_step": 5462, "train_info/time_within_train_step": 2.6437573432922363, "step": 5462} {"train_info/time_between_train_steps": 0.0035376548767089844, "step": 5462} {"info/global_step": 5463, "train_info/time_within_train_step": 2.6433305740356445, "step": 5463} {"train_info/time_between_train_steps": 0.0034818649291992188, "step": 5463} {"info/global_step": 5464, "train_info/time_within_train_step": 2.6656856536865234, "step": 5464} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 5464} {"info/global_step": 5465, "train_info/time_within_train_step": 2.6543545722961426, "step": 5465} {"train_info/time_between_train_steps": 0.003496408462524414, "step": 5465} {"info/global_step": 5466, "train_info/time_within_train_step": 2.6468849182128906, "step": 5466} {"train_info/time_between_train_steps": 0.003521442413330078, "step": 5466} {"info/global_step": 5467, "train_info/time_within_train_step": 2.6616592407226562, "step": 5467} {"train_info/time_between_train_steps": 0.0034933090209960938, "step": 5467} {"info/global_step": 5468, "train_info/time_within_train_step": 2.6553382873535156, "step": 5468} {"train_info/time_between_train_steps": 0.0035102367401123047, "step": 5468} {"info/global_step": 5469, "train_info/time_within_train_step": 2.660912275314331, "step": 5469} {"train_info/time_between_train_steps": 0.0034809112548828125, "step": 5469} {"info/global_step": 5470, "train_info/time_within_train_step": 2.705399990081787, "step": 5470} {"train_info/time_between_train_steps": 0.0035142898559570312, "step": 5470} {"info/global_step": 5471, "train_info/time_within_train_step": 2.7092676162719727, "step": 5471} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 5471} {"info/global_step": 5472, "train_info/time_within_train_step": 2.6439363956451416, "step": 5472} {"train_info/time_between_train_steps": 0.0035080909729003906, "step": 5472} {"info/global_step": 5473, "train_info/time_within_train_step": 2.642764091491699, "step": 5473} {"train_info/time_between_train_steps": 0.003420114517211914, "step": 5473} {"info/global_step": 5474, "train_info/time_within_train_step": 2.6448700428009033, "step": 5474} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 5474} {"info/global_step": 5475, "train_info/time_within_train_step": 2.656526565551758, "step": 5475} {"train_info/time_between_train_steps": 0.003489971160888672, "step": 5475} {"info/global_step": 5476, "train_info/time_within_train_step": 2.6595864295959473, "step": 5476} {"train_info/time_between_train_steps": 0.003425121307373047, "step": 5476} {"info/global_step": 5477, "train_info/time_within_train_step": 2.6601271629333496, "step": 5477} {"train_info/time_between_train_steps": 0.003462076187133789, "step": 5477} {"info/global_step": 5478, "train_info/time_within_train_step": 2.6460440158843994, "step": 5478} {"train_info/time_between_train_steps": 0.0034644603729248047, "step": 5478} {"info/global_step": 5479, "train_info/time_within_train_step": 2.6517395973205566, "step": 5479} {"train_info/time_between_train_steps": 0.0034766197204589844, "step": 5479} {"info/global_step": 5480, "train_info/time_within_train_step": 2.6730473041534424, "step": 5480} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 5480} {"info/global_step": 5481, "train_info/time_within_train_step": 2.6743059158325195, "step": 5481} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 5481} {"info/global_step": 5482, "train_info/time_within_train_step": 2.65754771232605, "step": 5482} {"train_info/time_between_train_steps": 0.0033981800079345703, "step": 5482} {"info/global_step": 5483, "train_info/time_within_train_step": 2.688830852508545, "step": 5483} {"train_info/time_between_train_steps": 0.0034732818603515625, "step": 5483} {"info/global_step": 5484, "train_info/time_within_train_step": 2.6426520347595215, "step": 5484} {"train_info/time_between_train_steps": 0.0034296512603759766, "step": 5484} {"info/global_step": 5485, "train_info/time_within_train_step": 2.6564621925354004, "step": 5485} {"train_info/time_between_train_steps": 0.00347137451171875, "step": 5485} {"info/global_step": 5486, "train_info/time_within_train_step": 2.6668145656585693, "step": 5486} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 5486} {"info/global_step": 5487, "train_info/time_within_train_step": 2.9790022373199463, "step": 5487} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 5487} {"info/global_step": 5488, "train_info/time_within_train_step": 2.6890552043914795, "step": 5488} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 5488} {"info/global_step": 5489, "train_info/time_within_train_step": 2.643765687942505, "step": 5489} {"train_info/time_between_train_steps": 0.0033919811248779297, "step": 5489} {"info/global_step": 5490, "train_info/time_within_train_step": 2.652501106262207, "step": 5490} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 5490} {"info/global_step": 5491, "train_info/time_within_train_step": 2.790225028991699, "step": 5491} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 5491} {"info/global_step": 5492, "train_info/time_within_train_step": 2.649381399154663, "step": 5492} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 5492} {"info/global_step": 5493, "train_info/time_within_train_step": 2.6525938510894775, "step": 5493} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 5493} {"info/global_step": 5494, "train_info/time_within_train_step": 2.6535322666168213, "step": 5494} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 5494} {"info/global_step": 5495, "train_info/time_within_train_step": 2.661336898803711, "step": 5495} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 5495} {"info/global_step": 5496, "train_info/time_within_train_step": 2.674476385116577, "step": 5496} {"train_info/time_between_train_steps": 0.003268718719482422, "step": 5496} {"info/global_step": 5497, "train_info/time_within_train_step": 2.6680004596710205, "step": 5497} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 5497} {"info/global_step": 5498, "train_info/time_within_train_step": 2.68721604347229, "step": 5498} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 5498} {"info/global_step": 5499, "train_info/time_within_train_step": 3.256078004837036, "step": 5499} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 5499} {"info/global_step": 5500, "train_info/time_within_train_step": 2.6628754138946533, "step": 5500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746912872, "_runtime": 15470}, "step": 5500} {"logs": {"train/loss": 3.5322, "train/learning_rate": 0.0003, "train/epoch": 6.03, "_timestamp": 1746912872, "_runtime": 15470}, "step": 5500} {"train_info/time_between_train_steps": 0.024703025817871094, "step": 5500} {"info/global_step": 5501, "train_info/time_within_train_step": 2.6557016372680664, "step": 5501} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 5501} {"info/global_step": 5502, "train_info/time_within_train_step": 2.6495790481567383, "step": 5502} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 5502} {"info/global_step": 5503, "train_info/time_within_train_step": 2.643955945968628, "step": 5503} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 5503} {"info/global_step": 5504, "train_info/time_within_train_step": 2.6679749488830566, "step": 5504} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 5504} {"info/global_step": 5505, "train_info/time_within_train_step": 2.6584746837615967, "step": 5505} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 5505} {"info/global_step": 5506, "train_info/time_within_train_step": 2.661332607269287, "step": 5506} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 5506} {"info/global_step": 5507, "train_info/time_within_train_step": 2.700836181640625, "step": 5507} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 5507} {"info/global_step": 5508, "train_info/time_within_train_step": 2.6553354263305664, "step": 5508} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 5508} {"info/global_step": 5509, "train_info/time_within_train_step": 2.643493890762329, "step": 5509} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 5509} {"info/global_step": 5510, "train_info/time_within_train_step": 2.6649816036224365, "step": 5510} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 5510} {"info/global_step": 5511, "train_info/time_within_train_step": 2.6491684913635254, "step": 5511} {"train_info/time_between_train_steps": 0.003246784210205078, "step": 5511} {"info/global_step": 5512, "train_info/time_within_train_step": 2.644437313079834, "step": 5512} {"train_info/time_between_train_steps": 0.0032501220703125, "step": 5512} {"info/global_step": 5513, "train_info/time_within_train_step": 2.660775661468506, "step": 5513} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 5513} {"info/global_step": 5514, "train_info/time_within_train_step": 2.6551222801208496, "step": 5514} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 5514} {"info/global_step": 5515, "train_info/time_within_train_step": 2.661090135574341, "step": 5515} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 5515} {"info/global_step": 5516, "train_info/time_within_train_step": 2.7054827213287354, "step": 5516} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 5516} {"info/global_step": 5517, "train_info/time_within_train_step": 2.6980936527252197, "step": 5517} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 5517} {"info/global_step": 5518, "train_info/time_within_train_step": 2.6423327922821045, "step": 5518} {"train_info/time_between_train_steps": 0.003323078155517578, "step": 5518} {"info/global_step": 5519, "train_info/time_within_train_step": 2.642608404159546, "step": 5519} {"train_info/time_between_train_steps": 0.003255605697631836, "step": 5519} {"info/global_step": 5520, "train_info/time_within_train_step": 2.660745143890381, "step": 5520} {"train_info/time_between_train_steps": 0.00323486328125, "step": 5520} {"info/global_step": 5521, "train_info/time_within_train_step": 2.6526896953582764, "step": 5521} {"train_info/time_between_train_steps": 0.0032949447631835938, "step": 5521} {"info/global_step": 5522, "train_info/time_within_train_step": 2.6454243659973145, "step": 5522} {"train_info/time_between_train_steps": 0.0032520294189453125, "step": 5522} {"info/global_step": 5523, "train_info/time_within_train_step": 2.645934581756592, "step": 5523} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 5523} {"info/global_step": 5524, "train_info/time_within_train_step": 2.667788028717041, "step": 5524} {"train_info/time_between_train_steps": 0.0035543441772460938, "step": 5524} {"info/global_step": 5525, "train_info/time_within_train_step": 2.6675374507904053, "step": 5525} {"train_info/time_between_train_steps": 0.0034494400024414062, "step": 5525} {"info/global_step": 5526, "train_info/time_within_train_step": 2.7108283042907715, "step": 5526} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 5526} {"info/global_step": 5527, "train_info/time_within_train_step": 2.6447596549987793, "step": 5527} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 5527} {"info/global_step": 5528, "train_info/time_within_train_step": 2.65910267829895, "step": 5528} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 5528} {"info/global_step": 5529, "train_info/time_within_train_step": 2.6444151401519775, "step": 5529} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 5529} {"info/global_step": 5530, "train_info/time_within_train_step": 2.6486756801605225, "step": 5530} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 5530} {"info/global_step": 5531, "train_info/time_within_train_step": 2.6601171493530273, "step": 5531} {"train_info/time_between_train_steps": 0.0032677650451660156, "step": 5531} {"info/global_step": 5532, "train_info/time_within_train_step": 2.642948627471924, "step": 5532} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 5532} {"info/global_step": 5533, "train_info/time_within_train_step": 2.644395351409912, "step": 5533} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 5533} {"info/global_step": 5534, "train_info/time_within_train_step": 2.669152021408081, "step": 5534} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 5534} {"info/global_step": 5535, "train_info/time_within_train_step": 2.6690423488616943, "step": 5535} {"train_info/time_between_train_steps": 0.0032465457916259766, "step": 5535} {"info/global_step": 5536, "train_info/time_within_train_step": 2.656062364578247, "step": 5536} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 5536} {"info/global_step": 5537, "train_info/time_within_train_step": 2.6847169399261475, "step": 5537} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 5537} {"info/global_step": 5538, "train_info/time_within_train_step": 2.641190767288208, "step": 5538} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 5538} {"info/global_step": 5539, "train_info/time_within_train_step": 2.6538712978363037, "step": 5539} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 5539} {"info/global_step": 5540, "train_info/time_within_train_step": 2.676046133041382, "step": 5540} {"train_info/time_between_train_steps": 0.0033419132232666016, "step": 5540} {"info/global_step": 5541, "train_info/time_within_train_step": 2.6441988945007324, "step": 5541} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 5541} {"info/global_step": 5542, "train_info/time_within_train_step": 2.644850969314575, "step": 5542} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 5542} {"info/global_step": 5543, "train_info/time_within_train_step": 2.651911735534668, "step": 5543} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 5543} {"info/global_step": 5544, "train_info/time_within_train_step": 2.6597113609313965, "step": 5544} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 5544} {"info/global_step": 5545, "train_info/time_within_train_step": 2.670337677001953, "step": 5545} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 5545} {"info/global_step": 5546, "train_info/time_within_train_step": 2.6622133255004883, "step": 5546} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 5546} {"info/global_step": 5547, "train_info/time_within_train_step": 2.7067317962646484, "step": 5547} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 5547} {"info/global_step": 5548, "train_info/time_within_train_step": 2.641477108001709, "step": 5548} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 5548} {"info/global_step": 5549, "train_info/time_within_train_step": 2.6457297801971436, "step": 5549} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 5549} {"info/global_step": 5550, "train_info/time_within_train_step": 2.664978504180908, "step": 5550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746913007, "_runtime": 15605}, "step": 5550} {"logs": {"train/loss": 3.5111, "train/learning_rate": 0.00029666666666666665, "train/epoch": 6.04, "_timestamp": 1746913007, "_runtime": 15605}, "step": 5550} {"train_info/time_between_train_steps": 0.024668455123901367, "step": 5550} {"info/global_step": 5551, "train_info/time_within_train_step": 2.6504266262054443, "step": 5551} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 5551} {"info/global_step": 5552, "train_info/time_within_train_step": 2.6687779426574707, "step": 5552} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 5552} {"info/global_step": 5553, "train_info/time_within_train_step": 2.7273361682891846, "step": 5553} {"train_info/time_between_train_steps": 0.13300275802612305, "step": 5553} {"info/global_step": 5554, "train_info/time_within_train_step": 2.6607844829559326, "step": 5554} {"train_info/time_between_train_steps": 0.003248929977416992, "step": 5554} {"info/global_step": 5555, "train_info/time_within_train_step": 2.7113535404205322, "step": 5555} {"train_info/time_between_train_steps": 0.0032389163970947266, "step": 5555} {"info/global_step": 5556, "train_info/time_within_train_step": 2.699012517929077, "step": 5556} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 5556} {"info/global_step": 5557, "train_info/time_within_train_step": 2.661986827850342, "step": 5557} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 5557} {"info/global_step": 5558, "train_info/time_within_train_step": 2.6497254371643066, "step": 5558} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 5558} {"info/global_step": 5559, "train_info/time_within_train_step": 2.65085768699646, "step": 5559} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 5559} {"info/global_step": 5560, "train_info/time_within_train_step": 2.647198438644409, "step": 5560} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 5560} {"info/global_step": 5561, "train_info/time_within_train_step": 2.643653392791748, "step": 5561} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 5561} {"info/global_step": 5562, "train_info/time_within_train_step": 2.6666955947875977, "step": 5562} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 5562} {"info/global_step": 5563, "train_info/time_within_train_step": 2.670631170272827, "step": 5563} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 5563} {"info/global_step": 5564, "train_info/time_within_train_step": 2.6949782371520996, "step": 5564} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 5564} {"info/global_step": 5565, "train_info/time_within_train_step": 2.6493799686431885, "step": 5565} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 5565} {"info/global_step": 5566, "train_info/time_within_train_step": 2.6453857421875, "step": 5566} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 5566} {"info/global_step": 5567, "train_info/time_within_train_step": 2.6607823371887207, "step": 5567} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 5567} {"info/global_step": 5568, "train_info/time_within_train_step": 2.655273675918579, "step": 5568} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 5568} {"info/global_step": 5569, "train_info/time_within_train_step": 2.6438064575195312, "step": 5569} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 5569} {"info/global_step": 5570, "train_info/time_within_train_step": 2.6438918113708496, "step": 5570} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 5570} {"info/global_step": 5571, "train_info/time_within_train_step": 2.653898239135742, "step": 5571} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 5571} {"info/global_step": 5572, "train_info/time_within_train_step": 2.6693055629730225, "step": 5572} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 5572} {"info/global_step": 5573, "train_info/time_within_train_step": 2.6802453994750977, "step": 5573} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 5573} {"info/global_step": 5574, "train_info/time_within_train_step": 2.651327133178711, "step": 5574} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 5574} {"info/global_step": 5575, "train_info/time_within_train_step": 2.686026096343994, "step": 5575} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 5575} {"info/global_step": 5576, "train_info/time_within_train_step": 2.648705244064331, "step": 5576} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 5576} {"info/global_step": 5577, "train_info/time_within_train_step": 2.6453752517700195, "step": 5577} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 5577} {"info/global_step": 5578, "train_info/time_within_train_step": 2.6556224822998047, "step": 5578} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 5578} {"info/global_step": 5579, "train_info/time_within_train_step": 2.6491646766662598, "step": 5579} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 5579} {"info/global_step": 5580, "train_info/time_within_train_step": 2.6450114250183105, "step": 5580} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 5580} {"info/global_step": 5581, "train_info/time_within_train_step": 2.6659467220306396, "step": 5581} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 5581} {"info/global_step": 5582, "train_info/time_within_train_step": 2.6581544876098633, "step": 5582} {"train_info/time_between_train_steps": 0.003239870071411133, "step": 5582} {"info/global_step": 5583, "train_info/time_within_train_step": 2.6610543727874756, "step": 5583} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 5583} {"info/global_step": 5584, "train_info/time_within_train_step": 2.7011399269104004, "step": 5584} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 5584} {"info/global_step": 5585, "train_info/time_within_train_step": 2.93792986869812, "step": 5585} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 5585} {"info/global_step": 5586, "train_info/time_within_train_step": 2.6586997509002686, "step": 5586} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 5586} {"info/global_step": 5587, "train_info/time_within_train_step": 2.665632724761963, "step": 5587} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 5587} {"info/global_step": 5588, "train_info/time_within_train_step": 2.685406446456909, "step": 5588} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 5588} {"info/global_step": 5589, "train_info/time_within_train_step": 2.6605684757232666, "step": 5589} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 5589} {"info/global_step": 5590, "train_info/time_within_train_step": 2.648320436477661, "step": 5590} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 5590} {"info/global_step": 5591, "train_info/time_within_train_step": 2.6477019786834717, "step": 5591} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 5591} {"info/global_step": 5592, "train_info/time_within_train_step": 2.6507773399353027, "step": 5592} {"train_info/time_between_train_steps": 0.003347635269165039, "step": 5592} {"info/global_step": 5593, "train_info/time_within_train_step": 2.6502397060394287, "step": 5593} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 5593} {"info/global_step": 5594, "train_info/time_within_train_step": 2.646381378173828, "step": 5594} {"train_info/time_between_train_steps": 0.003302335739135742, "step": 5594} {"info/global_step": 5595, "train_info/time_within_train_step": 2.6522440910339355, "step": 5595} {"train_info/time_between_train_steps": 0.0033426284790039062, "step": 5595} {"info/global_step": 5596, "train_info/time_within_train_step": 2.65787672996521, "step": 5596} {"train_info/time_between_train_steps": 0.003298044204711914, "step": 5596} {"info/global_step": 5597, "train_info/time_within_train_step": 2.7121880054473877, "step": 5597} {"train_info/time_between_train_steps": 0.003378152847290039, "step": 5597} {"info/global_step": 5598, "train_info/time_within_train_step": 2.7203896045684814, "step": 5598} {"train_info/time_between_train_steps": 0.0034029483795166016, "step": 5598} {"info/global_step": 5599, "train_info/time_within_train_step": 2.6777255535125732, "step": 5599} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 5599} {"info/global_step": 5600, "train_info/time_within_train_step": 2.6401326656341553, "step": 5600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746913141, "_runtime": 15739}, "step": 5600} {"logs": {"train/loss": 3.508, "train/learning_rate": 0.00029333333333333327, "train/epoch": 6.04, "_timestamp": 1746913141, "_runtime": 15739}, "step": 5600} {"train_info/time_between_train_steps": 13.487494230270386, "step": 5600} {"info/global_step": 5601, "train_info/time_within_train_step": 2.4626095294952393, "step": 5601} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 5601} {"info/global_step": 5602, "train_info/time_within_train_step": 2.456843852996826, "step": 5602} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 5602} {"info/global_step": 5603, "train_info/time_within_train_step": 2.591991424560547, "step": 5603} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 5603} {"info/global_step": 5604, "train_info/time_within_train_step": 2.647054433822632, "step": 5604} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 5604} {"info/global_step": 5605, "train_info/time_within_train_step": 2.6571195125579834, "step": 5605} {"train_info/time_between_train_steps": 0.0036516189575195312, "step": 5605} {"info/global_step": 5606, "train_info/time_within_train_step": 2.6728408336639404, "step": 5606} {"train_info/time_between_train_steps": 0.003403902053833008, "step": 5606} {"info/global_step": 5607, "train_info/time_within_train_step": 2.656125783920288, "step": 5607} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 5607} {"info/global_step": 5608, "train_info/time_within_train_step": 2.6516828536987305, "step": 5608} {"train_info/time_between_train_steps": 0.0033426284790039062, "step": 5608} {"info/global_step": 5609, "train_info/time_within_train_step": 2.6432676315307617, "step": 5609} {"train_info/time_between_train_steps": 0.0032613277435302734, "step": 5609} {"info/global_step": 5610, "train_info/time_within_train_step": 2.6586201190948486, "step": 5610} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 5610} {"info/global_step": 5611, "train_info/time_within_train_step": 2.652907609939575, "step": 5611} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 5611} {"info/global_step": 5612, "train_info/time_within_train_step": 2.668461561203003, "step": 5612} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 5612} {"info/global_step": 5613, "train_info/time_within_train_step": 2.7254433631896973, "step": 5613} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 5613} {"info/global_step": 5614, "train_info/time_within_train_step": 2.666595220565796, "step": 5614} {"train_info/time_between_train_steps": 0.0032913684844970703, "step": 5614} {"info/global_step": 5615, "train_info/time_within_train_step": 2.642226219177246, "step": 5615} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 5615} {"info/global_step": 5616, "train_info/time_within_train_step": 2.7749123573303223, "step": 5616} {"train_info/time_between_train_steps": 0.003497600555419922, "step": 5616} {"info/global_step": 5617, "train_info/time_within_train_step": 2.654991626739502, "step": 5617} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 5617} {"info/global_step": 5618, "train_info/time_within_train_step": 2.6557533740997314, "step": 5618} {"train_info/time_between_train_steps": 0.0034928321838378906, "step": 5618} {"info/global_step": 5619, "train_info/time_within_train_step": 2.6448512077331543, "step": 5619} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 5619} {"info/global_step": 5620, "train_info/time_within_train_step": 2.6506049633026123, "step": 5620} {"train_info/time_between_train_steps": 0.00337982177734375, "step": 5620} {"info/global_step": 5621, "train_info/time_within_train_step": 2.658409833908081, "step": 5621} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 5621} {"info/global_step": 5622, "train_info/time_within_train_step": 2.6495590209960938, "step": 5622} {"train_info/time_between_train_steps": 0.003644227981567383, "step": 5622} {"info/global_step": 5623, "train_info/time_within_train_step": 2.652149200439453, "step": 5623} {"train_info/time_between_train_steps": 0.003815889358520508, "step": 5623} {"info/global_step": 5624, "train_info/time_within_train_step": 2.650536060333252, "step": 5624} {"train_info/time_between_train_steps": 0.0038971900939941406, "step": 5624} {"info/global_step": 5625, "train_info/time_within_train_step": 2.653059959411621, "step": 5625} {"train_info/time_between_train_steps": 0.003961801528930664, "step": 5625} {"info/global_step": 5626, "train_info/time_within_train_step": 2.647608757019043, "step": 5626} {"train_info/time_between_train_steps": 0.003271341323852539, "step": 5626} {"info/global_step": 5627, "train_info/time_within_train_step": 2.649005889892578, "step": 5627} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 5627} {"info/global_step": 5628, "train_info/time_within_train_step": 2.705345869064331, "step": 5628} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 5628} {"info/global_step": 5629, "train_info/time_within_train_step": 2.6430108547210693, "step": 5629} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 5629} {"info/global_step": 5630, "train_info/time_within_train_step": 2.6567137241363525, "step": 5630} {"train_info/time_between_train_steps": 0.003267526626586914, "step": 5630} {"info/global_step": 5631, "train_info/time_within_train_step": 2.6431946754455566, "step": 5631} {"train_info/time_between_train_steps": 0.003252267837524414, "step": 5631} {"info/global_step": 5632, "train_info/time_within_train_step": 2.645231246948242, "step": 5632} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 5632} {"info/global_step": 5633, "train_info/time_within_train_step": 2.6541690826416016, "step": 5633} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 5633} {"info/global_step": 5634, "train_info/time_within_train_step": 2.6528353691101074, "step": 5634} {"train_info/time_between_train_steps": 0.0032761096954345703, "step": 5634} {"info/global_step": 5635, "train_info/time_within_train_step": 2.6607139110565186, "step": 5635} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 5635} {"info/global_step": 5636, "train_info/time_within_train_step": 2.6919500827789307, "step": 5636} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 5636} {"info/global_step": 5637, "train_info/time_within_train_step": 2.7229859828948975, "step": 5637} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 5637} {"info/global_step": 5638, "train_info/time_within_train_step": 2.6478519439697266, "step": 5638} {"train_info/time_between_train_steps": 0.003304004669189453, "step": 5638} {"info/global_step": 5639, "train_info/time_within_train_step": 2.6414897441864014, "step": 5639} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 5639} {"info/global_step": 5640, "train_info/time_within_train_step": 2.6617231369018555, "step": 5640} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 5640} {"info/global_step": 5641, "train_info/time_within_train_step": 2.647183418273926, "step": 5641} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 5641} {"info/global_step": 5642, "train_info/time_within_train_step": 2.6447458267211914, "step": 5642} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 5642} {"info/global_step": 5643, "train_info/time_within_train_step": 2.65051007270813, "step": 5643} {"train_info/time_between_train_steps": 0.0032532215118408203, "step": 5643} {"info/global_step": 5644, "train_info/time_within_train_step": 2.6456120014190674, "step": 5644} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 5644} {"info/global_step": 5645, "train_info/time_within_train_step": 2.6698572635650635, "step": 5645} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 5645} {"info/global_step": 5646, "train_info/time_within_train_step": 2.691218137741089, "step": 5646} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 5646} {"info/global_step": 5647, "train_info/time_within_train_step": 2.665196180343628, "step": 5647} {"train_info/time_between_train_steps": 0.0032532215118408203, "step": 5647} {"info/global_step": 5648, "train_info/time_within_train_step": 2.664254665374756, "step": 5648} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 5648} {"info/global_step": 5649, "train_info/time_within_train_step": 2.6417572498321533, "step": 5649} {"train_info/time_between_train_steps": 0.0032775402069091797, "step": 5649} {"info/global_step": 5650, "train_info/time_within_train_step": 2.6549549102783203, "step": 5650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746913290, "_runtime": 15888}, "step": 5650} {"logs": {"train/loss": 3.5061, "train/learning_rate": 0.00029, "train/epoch": 6.05, "_timestamp": 1746913290, "_runtime": 15888}, "step": 5650} {"train_info/time_between_train_steps": 0.024724483489990234, "step": 5650} {"info/global_step": 5651, "train_info/time_within_train_step": 2.65063214302063, "step": 5651} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 5651} {"info/global_step": 5652, "train_info/time_within_train_step": 2.655986785888672, "step": 5652} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 5652} {"info/global_step": 5653, "train_info/time_within_train_step": 2.6453890800476074, "step": 5653} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 5653} {"info/global_step": 5654, "train_info/time_within_train_step": 2.6476073265075684, "step": 5654} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 5654} {"info/global_step": 5655, "train_info/time_within_train_step": 2.6725716590881348, "step": 5655} {"train_info/time_between_train_steps": 0.003204345703125, "step": 5655} {"info/global_step": 5656, "train_info/time_within_train_step": 2.667621374130249, "step": 5656} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 5656} {"info/global_step": 5657, "train_info/time_within_train_step": 2.6585943698883057, "step": 5657} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 5657} {"info/global_step": 5658, "train_info/time_within_train_step": 2.684077739715576, "step": 5658} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 5658} {"info/global_step": 5659, "train_info/time_within_train_step": 2.6738808155059814, "step": 5659} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 5659} {"info/global_step": 5660, "train_info/time_within_train_step": 2.6489169597625732, "step": 5660} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 5660} {"info/global_step": 5661, "train_info/time_within_train_step": 2.650692939758301, "step": 5661} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 5661} {"info/global_step": 5662, "train_info/time_within_train_step": 2.6533150672912598, "step": 5662} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 5662} {"info/global_step": 5663, "train_info/time_within_train_step": 2.6507699489593506, "step": 5663} {"train_info/time_between_train_steps": 0.0033445358276367188, "step": 5663} {"info/global_step": 5664, "train_info/time_within_train_step": 2.646521806716919, "step": 5664} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 5664} {"info/global_step": 5665, "train_info/time_within_train_step": 2.653212547302246, "step": 5665} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 5665} {"info/global_step": 5666, "train_info/time_within_train_step": 2.6493992805480957, "step": 5666} {"train_info/time_between_train_steps": 0.003263235092163086, "step": 5666} {"info/global_step": 5667, "train_info/time_within_train_step": 2.6594455242156982, "step": 5667} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 5667} {"info/global_step": 5668, "train_info/time_within_train_step": 2.645606279373169, "step": 5668} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 5668} {"info/global_step": 5669, "train_info/time_within_train_step": 2.6490683555603027, "step": 5669} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 5669} {"info/global_step": 5670, "train_info/time_within_train_step": 2.6517844200134277, "step": 5670} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 5670} {"info/global_step": 5671, "train_info/time_within_train_step": 2.6572930812835693, "step": 5671} {"train_info/time_between_train_steps": 0.00333404541015625, "step": 5671} {"info/global_step": 5672, "train_info/time_within_train_step": 2.6633760929107666, "step": 5672} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 5672} {"info/global_step": 5673, "train_info/time_within_train_step": 2.9281508922576904, "step": 5673} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 5673} {"info/global_step": 5674, "train_info/time_within_train_step": 2.6613876819610596, "step": 5674} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 5674} {"info/global_step": 5675, "train_info/time_within_train_step": 2.661144256591797, "step": 5675} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 5675} {"info/global_step": 5676, "train_info/time_within_train_step": 2.6680591106414795, "step": 5676} {"train_info/time_between_train_steps": 0.003477334976196289, "step": 5676} {"info/global_step": 5677, "train_info/time_within_train_step": 2.7123799324035645, "step": 5677} {"train_info/time_between_train_steps": 0.0032830238342285156, "step": 5677} {"info/global_step": 5678, "train_info/time_within_train_step": 2.651413917541504, "step": 5678} {"train_info/time_between_train_steps": 0.11149334907531738, "step": 5678} {"info/global_step": 5679, "train_info/time_within_train_step": 2.731782913208008, "step": 5679} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 5679} {"info/global_step": 5680, "train_info/time_within_train_step": 2.6570708751678467, "step": 5680} {"train_info/time_between_train_steps": 0.0033850669860839844, "step": 5680} {"info/global_step": 5681, "train_info/time_within_train_step": 2.6440491676330566, "step": 5681} {"train_info/time_between_train_steps": 0.006589651107788086, "step": 5681} {"info/global_step": 5682, "train_info/time_within_train_step": 2.6526238918304443, "step": 5682} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 5682} {"info/global_step": 5683, "train_info/time_within_train_step": 2.6554412841796875, "step": 5683} {"train_info/time_between_train_steps": 0.0066378116607666016, "step": 5683} {"info/global_step": 5684, "train_info/time_within_train_step": 2.656895399093628, "step": 5684} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 5684} {"info/global_step": 5685, "train_info/time_within_train_step": 2.6524548530578613, "step": 5685} {"train_info/time_between_train_steps": 0.00666356086730957, "step": 5685} {"info/global_step": 5686, "train_info/time_within_train_step": 2.6709866523742676, "step": 5686} {"train_info/time_between_train_steps": 0.003383159637451172, "step": 5686} {"info/global_step": 5687, "train_info/time_within_train_step": 2.6980230808258057, "step": 5687} {"train_info/time_between_train_steps": 0.0032558441162109375, "step": 5687} {"info/global_step": 5688, "train_info/time_within_train_step": 2.664659023284912, "step": 5688} {"train_info/time_between_train_steps": 0.006597280502319336, "step": 5688} {"info/global_step": 5689, "train_info/time_within_train_step": 2.661478042602539, "step": 5689} {"train_info/time_between_train_steps": 0.006560802459716797, "step": 5689} {"info/global_step": 5690, "train_info/time_within_train_step": 2.6418819427490234, "step": 5690} {"train_info/time_between_train_steps": 0.006662607192993164, "step": 5690} {"info/global_step": 5691, "train_info/time_within_train_step": 2.6533637046813965, "step": 5691} {"train_info/time_between_train_steps": 0.0065250396728515625, "step": 5691} {"info/global_step": 5692, "train_info/time_within_train_step": 2.66343092918396, "step": 5692} {"train_info/time_between_train_steps": 0.006537914276123047, "step": 5692} {"info/global_step": 5693, "train_info/time_within_train_step": 2.6443324089050293, "step": 5693} {"train_info/time_between_train_steps": 0.006680011749267578, "step": 5693} {"info/global_step": 5694, "train_info/time_within_train_step": 2.644070863723755, "step": 5694} {"train_info/time_between_train_steps": 0.006588459014892578, "step": 5694} {"info/global_step": 5695, "train_info/time_within_train_step": 2.670037031173706, "step": 5695} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 5695} {"info/global_step": 5696, "train_info/time_within_train_step": 2.6764214038848877, "step": 5696} {"train_info/time_between_train_steps": 0.006667613983154297, "step": 5696} {"info/global_step": 5697, "train_info/time_within_train_step": 2.666567802429199, "step": 5697} {"train_info/time_between_train_steps": 0.006632328033447266, "step": 5697} {"info/global_step": 5698, "train_info/time_within_train_step": 2.6747353076934814, "step": 5698} {"train_info/time_between_train_steps": 0.006554365158081055, "step": 5698} {"info/global_step": 5699, "train_info/time_within_train_step": 2.66261887550354, "step": 5699} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 5699} {"info/global_step": 5700, "train_info/time_within_train_step": 2.647150993347168, "step": 5700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746913424, "_runtime": 16022}, "step": 5700} {"logs": {"train/loss": 3.4894, "train/learning_rate": 0.0002866666666666667, "train/epoch": 6.05, "_timestamp": 1746913424, "_runtime": 16022}, "step": 5700} {"train_info/time_between_train_steps": 0.02498030662536621, "step": 5700} {"info/global_step": 5701, "train_info/time_within_train_step": 2.641549825668335, "step": 5701} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 5701} {"info/global_step": 5702, "train_info/time_within_train_step": 2.6434569358825684, "step": 5702} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 5702} {"info/global_step": 5703, "train_info/time_within_train_step": 2.6655757427215576, "step": 5703} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 5703} {"info/global_step": 5704, "train_info/time_within_train_step": 2.652698516845703, "step": 5704} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 5704} {"info/global_step": 5705, "train_info/time_within_train_step": 2.649588108062744, "step": 5705} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 5705} {"info/global_step": 5706, "train_info/time_within_train_step": 2.6588470935821533, "step": 5706} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 5706} {"info/global_step": 5707, "train_info/time_within_train_step": 2.660567045211792, "step": 5707} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 5707} {"info/global_step": 5708, "train_info/time_within_train_step": 2.6744139194488525, "step": 5708} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 5708} {"info/global_step": 5709, "train_info/time_within_train_step": 2.670078992843628, "step": 5709} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 5709} {"info/global_step": 5710, "train_info/time_within_train_step": 2.693596124649048, "step": 5710} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 5710} {"info/global_step": 5711, "train_info/time_within_train_step": 2.6464591026306152, "step": 5711} {"train_info/time_between_train_steps": 0.003277301788330078, "step": 5711} {"info/global_step": 5712, "train_info/time_within_train_step": 2.6439106464385986, "step": 5712} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 5712} {"info/global_step": 5713, "train_info/time_within_train_step": 2.6656007766723633, "step": 5713} {"train_info/time_between_train_steps": 0.0032651424407958984, "step": 5713} {"info/global_step": 5714, "train_info/time_within_train_step": 2.6558592319488525, "step": 5714} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 5714} {"info/global_step": 5715, "train_info/time_within_train_step": 2.6452574729919434, "step": 5715} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 5715} {"info/global_step": 5716, "train_info/time_within_train_step": 2.6606998443603516, "step": 5716} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 5716} {"info/global_step": 5717, "train_info/time_within_train_step": 2.658947706222534, "step": 5717} {"train_info/time_between_train_steps": 0.003354787826538086, "step": 5717} {"info/global_step": 5718, "train_info/time_within_train_step": 2.661048412322998, "step": 5718} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 5718} {"info/global_step": 5719, "train_info/time_within_train_step": 2.706418991088867, "step": 5719} {"train_info/time_between_train_steps": 0.003263235092163086, "step": 5719} {"info/global_step": 5720, "train_info/time_within_train_step": 2.72528076171875, "step": 5720} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 5720} {"info/global_step": 5721, "train_info/time_within_train_step": 2.6484885215759277, "step": 5721} {"train_info/time_between_train_steps": 0.006612539291381836, "step": 5721} {"info/global_step": 5722, "train_info/time_within_train_step": 2.6424319744110107, "step": 5722} {"train_info/time_between_train_steps": 0.0067064762115478516, "step": 5722} {"info/global_step": 5723, "train_info/time_within_train_step": 2.6591908931732178, "step": 5723} {"train_info/time_between_train_steps": 0.006628513336181641, "step": 5723} {"info/global_step": 5724, "train_info/time_within_train_step": 2.6504805088043213, "step": 5724} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 5724} {"info/global_step": 5725, "train_info/time_within_train_step": 2.649070978164673, "step": 5725} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 5725} {"info/global_step": 5726, "train_info/time_within_train_step": 2.701167583465576, "step": 5726} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 5726} {"info/global_step": 5727, "train_info/time_within_train_step": 2.6440625190734863, "step": 5727} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 5727} {"info/global_step": 5728, "train_info/time_within_train_step": 2.646080255508423, "step": 5728} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 5728} {"info/global_step": 5729, "train_info/time_within_train_step": 2.659346103668213, "step": 5729} {"train_info/time_between_train_steps": 0.002897500991821289, "step": 5729} {"info/global_step": 5730, "train_info/time_within_train_step": 2.6475462913513184, "step": 5730} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 5730} {"info/global_step": 5731, "train_info/time_within_train_step": 2.6612894535064697, "step": 5731} {"train_info/time_between_train_steps": 0.0028846263885498047, "step": 5731} {"info/global_step": 5732, "train_info/time_within_train_step": 2.6432971954345703, "step": 5732} {"train_info/time_between_train_steps": 0.003049612045288086, "step": 5732} {"info/global_step": 5733, "train_info/time_within_train_step": 2.8876073360443115, "step": 5733} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 5733} {"info/global_step": 5734, "train_info/time_within_train_step": 2.652653217315674, "step": 5734} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 5734} {"info/global_step": 5735, "train_info/time_within_train_step": 2.6426637172698975, "step": 5735} {"train_info/time_between_train_steps": 0.003061532974243164, "step": 5735} {"info/global_step": 5736, "train_info/time_within_train_step": 2.6444764137268066, "step": 5736} {"train_info/time_between_train_steps": 0.003087759017944336, "step": 5736} {"info/global_step": 5737, "train_info/time_within_train_step": 2.6489102840423584, "step": 5737} {"train_info/time_between_train_steps": 0.0030853748321533203, "step": 5737} {"info/global_step": 5738, "train_info/time_within_train_step": 2.660524845123291, "step": 5738} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 5738} {"info/global_step": 5739, "train_info/time_within_train_step": 2.6705212593078613, "step": 5739} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 5739} {"info/global_step": 5740, "train_info/time_within_train_step": 2.6631476879119873, "step": 5740} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 5740} {"info/global_step": 5741, "train_info/time_within_train_step": 2.6951191425323486, "step": 5741} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 5741} {"info/global_step": 5742, "train_info/time_within_train_step": 2.6406664848327637, "step": 5742} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 5742} {"info/global_step": 5743, "train_info/time_within_train_step": 2.6386375427246094, "step": 5743} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 5743} {"info/global_step": 5744, "train_info/time_within_train_step": 2.6668336391448975, "step": 5744} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 5744} {"info/global_step": 5745, "train_info/time_within_train_step": 2.6488654613494873, "step": 5745} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 5745} {"info/global_step": 5746, "train_info/time_within_train_step": 2.6432056427001953, "step": 5746} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 5746} {"info/global_step": 5747, "train_info/time_within_train_step": 2.659552574157715, "step": 5747} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 5747} {"info/global_step": 5748, "train_info/time_within_train_step": 2.6503493785858154, "step": 5748} {"train_info/time_between_train_steps": 0.0030052661895751953, "step": 5748} {"info/global_step": 5749, "train_info/time_within_train_step": 3.282363176345825, "step": 5749} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 5749} {"info/global_step": 5750, "train_info/time_within_train_step": 2.6392934322357178, "step": 5750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746913559, "_runtime": 16157}, "step": 5750} {"logs": {"train/loss": 3.4833, "train/learning_rate": 0.0002833333333333333, "train/epoch": 6.06, "_timestamp": 1746913559, "_runtime": 16157}, "step": 5750} {"train_info/time_between_train_steps": 0.02443528175354004, "step": 5750} {"info/global_step": 5751, "train_info/time_within_train_step": 2.657315969467163, "step": 5751} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 5751} {"info/global_step": 5752, "train_info/time_within_train_step": 2.6414566040039062, "step": 5752} {"train_info/time_between_train_steps": 0.002933502197265625, "step": 5752} {"info/global_step": 5753, "train_info/time_within_train_step": 2.644545078277588, "step": 5753} {"train_info/time_between_train_steps": 0.0029337406158447266, "step": 5753} {"info/global_step": 5754, "train_info/time_within_train_step": 2.651066303253174, "step": 5754} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 5754} {"info/global_step": 5755, "train_info/time_within_train_step": 2.651031017303467, "step": 5755} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 5755} {"info/global_step": 5756, "train_info/time_within_train_step": 2.6606647968292236, "step": 5756} {"train_info/time_between_train_steps": 0.0029795169830322266, "step": 5756} {"info/global_step": 5757, "train_info/time_within_train_step": 2.68873929977417, "step": 5757} {"train_info/time_between_train_steps": 0.00614476203918457, "step": 5757} {"info/global_step": 5758, "train_info/time_within_train_step": 2.724881410598755, "step": 5758} {"train_info/time_between_train_steps": 0.0041239261627197266, "step": 5758} {"info/global_step": 5759, "train_info/time_within_train_step": 2.654935359954834, "step": 5759} {"train_info/time_between_train_steps": 0.002927064895629883, "step": 5759} {"info/global_step": 5760, "train_info/time_within_train_step": 2.640502452850342, "step": 5760} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 5760} {"info/global_step": 5761, "train_info/time_within_train_step": 2.656728506088257, "step": 5761} {"train_info/time_between_train_steps": 0.0029730796813964844, "step": 5761} {"info/global_step": 5762, "train_info/time_within_train_step": 2.649155616760254, "step": 5762} {"train_info/time_between_train_steps": 0.0061342716217041016, "step": 5762} {"info/global_step": 5763, "train_info/time_within_train_step": 2.648834466934204, "step": 5763} {"train_info/time_between_train_steps": 0.006092548370361328, "step": 5763} {"info/global_step": 5764, "train_info/time_within_train_step": 2.645526647567749, "step": 5764} {"train_info/time_between_train_steps": 0.006100177764892578, "step": 5764} {"info/global_step": 5765, "train_info/time_within_train_step": 2.645613431930542, "step": 5765} {"train_info/time_between_train_steps": 0.006096363067626953, "step": 5765} {"info/global_step": 5766, "train_info/time_within_train_step": 2.661717414855957, "step": 5766} {"train_info/time_between_train_steps": 0.003069639205932617, "step": 5766} {"info/global_step": 5767, "train_info/time_within_train_step": 2.6640305519104004, "step": 5767} {"train_info/time_between_train_steps": 0.006135702133178711, "step": 5767} {"info/global_step": 5768, "train_info/time_within_train_step": 2.7093896865844727, "step": 5768} {"train_info/time_between_train_steps": 0.006119966506958008, "step": 5768} {"info/global_step": 5769, "train_info/time_within_train_step": 2.6435325145721436, "step": 5769} {"train_info/time_between_train_steps": 0.006159305572509766, "step": 5769} {"info/global_step": 5770, "train_info/time_within_train_step": 2.6579465866088867, "step": 5770} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 5770} {"info/global_step": 5771, "train_info/time_within_train_step": 2.6468088626861572, "step": 5771} {"train_info/time_between_train_steps": 0.002954721450805664, "step": 5771} {"info/global_step": 5772, "train_info/time_within_train_step": 2.645991086959839, "step": 5772} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 5772} {"info/global_step": 5773, "train_info/time_within_train_step": 2.661243200302124, "step": 5773} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 5773} {"info/global_step": 5774, "train_info/time_within_train_step": 2.643394708633423, "step": 5774} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 5774} {"info/global_step": 5775, "train_info/time_within_train_step": 2.6445841789245605, "step": 5775} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 5775} {"info/global_step": 5776, "train_info/time_within_train_step": 2.6697089672088623, "step": 5776} {"train_info/time_between_train_steps": 0.0029060840606689453, "step": 5776} {"info/global_step": 5777, "train_info/time_within_train_step": 2.6674108505249023, "step": 5777} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 5777} {"info/global_step": 5778, "train_info/time_within_train_step": 2.6567046642303467, "step": 5778} {"train_info/time_between_train_steps": 0.003323078155517578, "step": 5778} {"info/global_step": 5779, "train_info/time_within_train_step": 2.912032127380371, "step": 5779} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 5779} {"info/global_step": 5780, "train_info/time_within_train_step": 2.6700267791748047, "step": 5780} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 5780} {"info/global_step": 5781, "train_info/time_within_train_step": 2.6554651260375977, "step": 5781} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 5781} {"info/global_step": 5782, "train_info/time_within_train_step": 2.685148000717163, "step": 5782} {"train_info/time_between_train_steps": 0.0030007362365722656, "step": 5782} {"info/global_step": 5783, "train_info/time_within_train_step": 2.642226219177246, "step": 5783} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 5783} {"info/global_step": 5784, "train_info/time_within_train_step": 2.650181531906128, "step": 5784} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 5784} {"info/global_step": 5785, "train_info/time_within_train_step": 2.6644322872161865, "step": 5785} {"train_info/time_between_train_steps": 0.0030045509338378906, "step": 5785} {"info/global_step": 5786, "train_info/time_within_train_step": 2.6651837825775146, "step": 5786} {"train_info/time_between_train_steps": 0.0029642581939697266, "step": 5786} {"info/global_step": 5787, "train_info/time_within_train_step": 2.6651270389556885, "step": 5787} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 5787} {"info/global_step": 5788, "train_info/time_within_train_step": 2.694499969482422, "step": 5788} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 5788} {"info/global_step": 5789, "train_info/time_within_train_step": 2.6408374309539795, "step": 5789} {"train_info/time_between_train_steps": 0.0029458999633789062, "step": 5789} {"info/global_step": 5790, "train_info/time_within_train_step": 2.641975164413452, "step": 5790} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 5790} {"info/global_step": 5791, "train_info/time_within_train_step": 2.6653428077697754, "step": 5791} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 5791} {"info/global_step": 5792, "train_info/time_within_train_step": 2.6470329761505127, "step": 5792} {"train_info/time_between_train_steps": 0.0029325485229492188, "step": 5792} {"info/global_step": 5793, "train_info/time_within_train_step": 2.690391778945923, "step": 5793} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 5793} {"info/global_step": 5794, "train_info/time_within_train_step": 2.6451334953308105, "step": 5794} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 5794} {"info/global_step": 5795, "train_info/time_within_train_step": 2.6546826362609863, "step": 5795} {"train_info/time_between_train_steps": 0.0029184818267822266, "step": 5795} {"info/global_step": 5796, "train_info/time_within_train_step": 2.6550934314727783, "step": 5796} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 5796} {"info/global_step": 5797, "train_info/time_within_train_step": 2.668238401412964, "step": 5797} {"train_info/time_between_train_steps": 0.0029649734497070312, "step": 5797} {"info/global_step": 5798, "train_info/time_within_train_step": 2.7016561031341553, "step": 5798} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 5798} {"info/global_step": 5799, "train_info/time_within_train_step": 2.6406409740448, "step": 5799} {"train_info/time_between_train_steps": 0.002981424331665039, "step": 5799} {"info/global_step": 5800, "train_info/time_within_train_step": 2.639730930328369, "step": 5800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746913694, "_runtime": 16292}, "step": 5800} {"logs": {"train/loss": 3.469, "train/learning_rate": 0.00028, "train/epoch": 6.06, "_timestamp": 1746913694, "_runtime": 16292}, "step": 5800} {"train_info/time_between_train_steps": 14.177459716796875, "step": 5800} {"info/global_step": 5801, "train_info/time_within_train_step": 2.456160545349121, "step": 5801} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 5801} {"info/global_step": 5802, "train_info/time_within_train_step": 2.440659761428833, "step": 5802} {"train_info/time_between_train_steps": 0.0029296875, "step": 5802} {"info/global_step": 5803, "train_info/time_within_train_step": 2.5728609561920166, "step": 5803} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 5803} {"info/global_step": 5804, "train_info/time_within_train_step": 2.663419008255005, "step": 5804} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 5804} {"info/global_step": 5805, "train_info/time_within_train_step": 2.6865062713623047, "step": 5805} {"train_info/time_between_train_steps": 0.0029604434967041016, "step": 5805} {"info/global_step": 5806, "train_info/time_within_train_step": 2.652064800262451, "step": 5806} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 5806} {"info/global_step": 5807, "train_info/time_within_train_step": 2.661878824234009, "step": 5807} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 5807} {"info/global_step": 5808, "train_info/time_within_train_step": 2.6468560695648193, "step": 5808} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 5808} {"info/global_step": 5809, "train_info/time_within_train_step": 2.6454968452453613, "step": 5809} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 5809} {"info/global_step": 5810, "train_info/time_within_train_step": 2.653390407562256, "step": 5810} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 5810} {"info/global_step": 5811, "train_info/time_within_train_step": 2.6495485305786133, "step": 5811} {"train_info/time_between_train_steps": 0.003070831298828125, "step": 5811} {"info/global_step": 5812, "train_info/time_within_train_step": 2.6440861225128174, "step": 5812} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 5812} {"info/global_step": 5813, "train_info/time_within_train_step": 2.6675798892974854, "step": 5813} {"train_info/time_between_train_steps": 0.0029773712158203125, "step": 5813} {"info/global_step": 5814, "train_info/time_within_train_step": 2.658928155899048, "step": 5814} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 5814} {"info/global_step": 5815, "train_info/time_within_train_step": 2.662262439727783, "step": 5815} {"train_info/time_between_train_steps": 0.0029783248901367188, "step": 5815} {"info/global_step": 5816, "train_info/time_within_train_step": 2.699963331222534, "step": 5816} {"train_info/time_between_train_steps": 0.002912282943725586, "step": 5816} {"info/global_step": 5817, "train_info/time_within_train_step": 2.6633801460266113, "step": 5817} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 5817} {"info/global_step": 5818, "train_info/time_within_train_step": 2.649153232574463, "step": 5818} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 5818} {"info/global_step": 5819, "train_info/time_within_train_step": 2.645358085632324, "step": 5819} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 5819} {"info/global_step": 5820, "train_info/time_within_train_step": 2.654818058013916, "step": 5820} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 5820} {"info/global_step": 5821, "train_info/time_within_train_step": 2.654576063156128, "step": 5821} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 5821} {"info/global_step": 5822, "train_info/time_within_train_step": 2.645730972290039, "step": 5822} {"train_info/time_between_train_steps": 0.002919912338256836, "step": 5822} {"info/global_step": 5823, "train_info/time_within_train_step": 2.661273717880249, "step": 5823} {"train_info/time_between_train_steps": 0.0029528141021728516, "step": 5823} {"info/global_step": 5824, "train_info/time_within_train_step": 2.654430866241455, "step": 5824} {"train_info/time_between_train_steps": 0.003090381622314453, "step": 5824} {"info/global_step": 5825, "train_info/time_within_train_step": 2.667025089263916, "step": 5825} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 5825} {"info/global_step": 5826, "train_info/time_within_train_step": 2.7110421657562256, "step": 5826} {"train_info/time_between_train_steps": 0.003069639205932617, "step": 5826} {"info/global_step": 5827, "train_info/time_within_train_step": 2.6461305618286133, "step": 5827} {"train_info/time_between_train_steps": 0.0030388832092285156, "step": 5827} {"info/global_step": 5828, "train_info/time_within_train_step": 2.644728660583496, "step": 5828} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 5828} {"info/global_step": 5829, "train_info/time_within_train_step": 2.6467208862304688, "step": 5829} {"train_info/time_between_train_steps": 0.0030002593994140625, "step": 5829} {"info/global_step": 5830, "train_info/time_within_train_step": 2.64652419090271, "step": 5830} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 5830} {"info/global_step": 5831, "train_info/time_within_train_step": 2.647718906402588, "step": 5831} {"train_info/time_between_train_steps": 0.002886533737182617, "step": 5831} {"info/global_step": 5832, "train_info/time_within_train_step": 2.67141056060791, "step": 5832} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 5832} {"info/global_step": 5833, "train_info/time_within_train_step": 2.663182497024536, "step": 5833} {"train_info/time_between_train_steps": 0.0029768943786621094, "step": 5833} {"info/global_step": 5834, "train_info/time_within_train_step": 2.645686149597168, "step": 5834} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 5834} {"info/global_step": 5835, "train_info/time_within_train_step": 2.66318678855896, "step": 5835} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 5835} {"info/global_step": 5836, "train_info/time_within_train_step": 2.645681381225586, "step": 5836} {"train_info/time_between_train_steps": 0.0029222965240478516, "step": 5836} {"info/global_step": 5837, "train_info/time_within_train_step": 2.6440463066101074, "step": 5837} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 5837} {"info/global_step": 5838, "train_info/time_within_train_step": 2.655484437942505, "step": 5838} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 5838} {"info/global_step": 5839, "train_info/time_within_train_step": 2.6690421104431152, "step": 5839} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 5839} {"info/global_step": 5840, "train_info/time_within_train_step": 2.6800665855407715, "step": 5840} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 5840} {"info/global_step": 5841, "train_info/time_within_train_step": 2.6505420207977295, "step": 5841} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 5841} {"info/global_step": 5842, "train_info/time_within_train_step": 2.684462547302246, "step": 5842} {"train_info/time_between_train_steps": 0.002926349639892578, "step": 5842} {"info/global_step": 5843, "train_info/time_within_train_step": 2.641911029815674, "step": 5843} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 5843} {"info/global_step": 5844, "train_info/time_within_train_step": 2.648228406906128, "step": 5844} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 5844} {"info/global_step": 5845, "train_info/time_within_train_step": 2.660231828689575, "step": 5845} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 5845} {"info/global_step": 5846, "train_info/time_within_train_step": 2.657835006713867, "step": 5846} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 5846} {"info/global_step": 5847, "train_info/time_within_train_step": 2.6451468467712402, "step": 5847} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 5847} {"info/global_step": 5848, "train_info/time_within_train_step": 2.647775411605835, "step": 5848} {"train_info/time_between_train_steps": 0.002912282943725586, "step": 5848} {"info/global_step": 5849, "train_info/time_within_train_step": 2.662684202194214, "step": 5849} {"train_info/time_between_train_steps": 0.0030031204223632812, "step": 5849} {"info/global_step": 5850, "train_info/time_within_train_step": 2.666879415512085, "step": 5850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746913842, "_runtime": 16440}, "step": 5850} {"logs": {"train/loss": 3.4658, "train/learning_rate": 0.00027666666666666665, "train/epoch": 6.07, "_timestamp": 1746913842, "_runtime": 16440}, "step": 5850} {"train_info/time_between_train_steps": 0.02445244789123535, "step": 5850} {"info/global_step": 5851, "train_info/time_within_train_step": 2.6745080947875977, "step": 5851} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 5851} {"info/global_step": 5852, "train_info/time_within_train_step": 2.672032594680786, "step": 5852} {"train_info/time_between_train_steps": 0.002945423126220703, "step": 5852} {"info/global_step": 5853, "train_info/time_within_train_step": 2.685706377029419, "step": 5853} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 5853} {"info/global_step": 5854, "train_info/time_within_train_step": 2.6412172317504883, "step": 5854} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 5854} {"info/global_step": 5855, "train_info/time_within_train_step": 2.6416265964508057, "step": 5855} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 5855} {"info/global_step": 5856, "train_info/time_within_train_step": 2.6661477088928223, "step": 5856} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 5856} {"info/global_step": 5857, "train_info/time_within_train_step": 2.6504902839660645, "step": 5857} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 5857} {"info/global_step": 5858, "train_info/time_within_train_step": 2.6426198482513428, "step": 5858} {"train_info/time_between_train_steps": 0.0030808448791503906, "step": 5858} {"info/global_step": 5859, "train_info/time_within_train_step": 2.6588587760925293, "step": 5859} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 5859} {"info/global_step": 5860, "train_info/time_within_train_step": 2.6539647579193115, "step": 5860} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 5860} {"info/global_step": 5861, "train_info/time_within_train_step": 2.6608188152313232, "step": 5861} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 5861} {"info/global_step": 5862, "train_info/time_within_train_step": 2.7049975395202637, "step": 5862} {"train_info/time_between_train_steps": 0.002919912338256836, "step": 5862} {"info/global_step": 5863, "train_info/time_within_train_step": 2.7041499614715576, "step": 5863} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 5863} {"info/global_step": 5864, "train_info/time_within_train_step": 2.6421730518341064, "step": 5864} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 5864} {"info/global_step": 5865, "train_info/time_within_train_step": 2.6428213119506836, "step": 5865} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 5865} {"info/global_step": 5866, "train_info/time_within_train_step": 2.6515305042266846, "step": 5866} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 5866} {"info/global_step": 5867, "train_info/time_within_train_step": 2.6522958278656006, "step": 5867} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 5867} {"info/global_step": 5868, "train_info/time_within_train_step": 2.669659376144409, "step": 5868} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 5868} {"info/global_step": 5869, "train_info/time_within_train_step": 2.710608720779419, "step": 5869} {"train_info/time_between_train_steps": 0.0030770301818847656, "step": 5869} {"info/global_step": 5870, "train_info/time_within_train_step": 2.646104335784912, "step": 5870} {"train_info/time_between_train_steps": 0.0029296875, "step": 5870} {"info/global_step": 5871, "train_info/time_within_train_step": 2.658214807510376, "step": 5871} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 5871} {"info/global_step": 5872, "train_info/time_within_train_step": 2.646479606628418, "step": 5872} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 5872} {"info/global_step": 5873, "train_info/time_within_train_step": 2.648733139038086, "step": 5873} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 5873} {"info/global_step": 5874, "train_info/time_within_train_step": 2.662062168121338, "step": 5874} {"train_info/time_between_train_steps": 0.002895355224609375, "step": 5874} {"info/global_step": 5875, "train_info/time_within_train_step": 2.645663022994995, "step": 5875} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 5875} {"info/global_step": 5876, "train_info/time_within_train_step": 2.6430206298828125, "step": 5876} {"train_info/time_between_train_steps": 0.002918720245361328, "step": 5876} {"info/global_step": 5877, "train_info/time_within_train_step": 2.6654884815216064, "step": 5877} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 5877} {"info/global_step": 5878, "train_info/time_within_train_step": 2.669041633605957, "step": 5878} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 5878} {"info/global_step": 5879, "train_info/time_within_train_step": 2.688905954360962, "step": 5879} {"train_info/time_between_train_steps": 0.0030012130737304688, "step": 5879} {"info/global_step": 5880, "train_info/time_within_train_step": 2.653141498565674, "step": 5880} {"train_info/time_between_train_steps": 0.0028944015502929688, "step": 5880} {"info/global_step": 5881, "train_info/time_within_train_step": 2.667152166366577, "step": 5881} {"train_info/time_between_train_steps": 0.002931833267211914, "step": 5881} {"info/global_step": 5882, "train_info/time_within_train_step": 2.6539366245269775, "step": 5882} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 5882} {"info/global_step": 5883, "train_info/time_within_train_step": 2.6518778800964355, "step": 5883} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 5883} {"info/global_step": 5884, "train_info/time_within_train_step": 2.6431634426116943, "step": 5884} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 5884} {"info/global_step": 5885, "train_info/time_within_train_step": 2.656059503555298, "step": 5885} {"train_info/time_between_train_steps": 0.0029468536376953125, "step": 5885} {"info/global_step": 5886, "train_info/time_within_train_step": 2.6457064151763916, "step": 5886} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 5886} {"info/global_step": 5887, "train_info/time_within_train_step": 2.668022632598877, "step": 5887} {"train_info/time_between_train_steps": 0.0029039382934570312, "step": 5887} {"info/global_step": 5888, "train_info/time_within_train_step": 2.665515661239624, "step": 5888} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 5888} {"info/global_step": 5889, "train_info/time_within_train_step": 2.660634994506836, "step": 5889} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 5889} {"info/global_step": 5890, "train_info/time_within_train_step": 2.698917865753174, "step": 5890} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 5890} {"info/global_step": 5891, "train_info/time_within_train_step": 2.6577682495117188, "step": 5891} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 5891} {"info/global_step": 5892, "train_info/time_within_train_step": 2.6484999656677246, "step": 5892} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 5892} {"info/global_step": 5893, "train_info/time_within_train_step": 2.647145986557007, "step": 5893} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 5893} {"info/global_step": 5894, "train_info/time_within_train_step": 2.6495606899261475, "step": 5894} {"train_info/time_between_train_steps": 0.003066539764404297, "step": 5894} {"info/global_step": 5895, "train_info/time_within_train_step": 2.653380870819092, "step": 5895} {"train_info/time_between_train_steps": 0.0028765201568603516, "step": 5895} {"info/global_step": 5896, "train_info/time_within_train_step": 2.7803289890289307, "step": 5896} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 5896} {"info/global_step": 5897, "train_info/time_within_train_step": 2.651169538497925, "step": 5897} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 5897} {"info/global_step": 5898, "train_info/time_within_train_step": 2.6427865028381348, "step": 5898} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 5898} {"info/global_step": 5899, "train_info/time_within_train_step": 2.6569042205810547, "step": 5899} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 5899} {"info/global_step": 5900, "train_info/time_within_train_step": 2.6529459953308105, "step": 5900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746913977, "_runtime": 16575}, "step": 5900} {"logs": {"train/loss": 3.458, "train/learning_rate": 0.00027333333333333333, "train/epoch": 6.07, "_timestamp": 1746913977, "_runtime": 16575}, "step": 5900} {"train_info/time_between_train_steps": 0.024523258209228516, "step": 5900} {"info/global_step": 5901, "train_info/time_within_train_step": 2.6654486656188965, "step": 5901} {"train_info/time_between_train_steps": 0.002969980239868164, "step": 5901} {"info/global_step": 5902, "train_info/time_within_train_step": 2.687690258026123, "step": 5902} {"train_info/time_between_train_steps": 0.002949237823486328, "step": 5902} {"info/global_step": 5903, "train_info/time_within_train_step": 2.7247254848480225, "step": 5903} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 5903} {"info/global_step": 5904, "train_info/time_within_train_step": 2.6501431465148926, "step": 5904} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 5904} {"info/global_step": 5905, "train_info/time_within_train_step": 2.6412603855133057, "step": 5905} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 5905} {"info/global_step": 5906, "train_info/time_within_train_step": 2.6602859497070312, "step": 5906} {"train_info/time_between_train_steps": 0.002899169921875, "step": 5906} {"info/global_step": 5907, "train_info/time_within_train_step": 2.648557186126709, "step": 5907} {"train_info/time_between_train_steps": 0.0030663013458251953, "step": 5907} {"info/global_step": 5908, "train_info/time_within_train_step": 2.6491236686706543, "step": 5908} {"train_info/time_between_train_steps": 0.0029969215393066406, "step": 5908} {"info/global_step": 5909, "train_info/time_within_train_step": 2.6463286876678467, "step": 5909} {"train_info/time_between_train_steps": 0.0030732154846191406, "step": 5909} {"info/global_step": 5910, "train_info/time_within_train_step": 2.6454532146453857, "step": 5910} {"train_info/time_between_train_steps": 0.003069639205932617, "step": 5910} {"info/global_step": 5911, "train_info/time_within_train_step": 2.666276216506958, "step": 5911} {"train_info/time_between_train_steps": 0.0034389495849609375, "step": 5911} {"info/global_step": 5912, "train_info/time_within_train_step": 2.6679890155792236, "step": 5912} {"train_info/time_between_train_steps": 0.003120899200439453, "step": 5912} {"info/global_step": 5913, "train_info/time_within_train_step": 2.7125980854034424, "step": 5913} {"train_info/time_between_train_steps": 0.0030775070190429688, "step": 5913} {"info/global_step": 5914, "train_info/time_within_train_step": 2.645176887512207, "step": 5914} {"train_info/time_between_train_steps": 0.003063201904296875, "step": 5914} {"info/global_step": 5915, "train_info/time_within_train_step": 2.6587822437286377, "step": 5915} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 5915} {"info/global_step": 5916, "train_info/time_within_train_step": 2.6445364952087402, "step": 5916} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 5916} {"info/global_step": 5917, "train_info/time_within_train_step": 2.6488564014434814, "step": 5917} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 5917} {"info/global_step": 5918, "train_info/time_within_train_step": 2.662942409515381, "step": 5918} {"train_info/time_between_train_steps": 0.0030412673950195312, "step": 5918} {"info/global_step": 5919, "train_info/time_within_train_step": 2.6452083587646484, "step": 5919} {"train_info/time_between_train_steps": 0.003073453903198242, "step": 5919} {"info/global_step": 5920, "train_info/time_within_train_step": 2.643483877182007, "step": 5920} {"train_info/time_between_train_steps": 0.0030870437622070312, "step": 5920} {"info/global_step": 5921, "train_info/time_within_train_step": 2.6678028106689453, "step": 5921} {"train_info/time_between_train_steps": 0.0030548572540283203, "step": 5921} {"info/global_step": 5922, "train_info/time_within_train_step": 2.713653087615967, "step": 5922} {"train_info/time_between_train_steps": 0.0031015872955322266, "step": 5922} {"info/global_step": 5923, "train_info/time_within_train_step": 2.6695735454559326, "step": 5923} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 5923} {"info/global_step": 5924, "train_info/time_within_train_step": 2.6578762531280518, "step": 5924} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 5924} {"info/global_step": 5925, "train_info/time_within_train_step": 2.6834893226623535, "step": 5925} {"train_info/time_between_train_steps": 0.0030794143676757812, "step": 5925} {"info/global_step": 5926, "train_info/time_within_train_step": 2.643359422683716, "step": 5926} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 5926} {"info/global_step": 5927, "train_info/time_within_train_step": 2.6544129848480225, "step": 5927} {"train_info/time_between_train_steps": 0.003040790557861328, "step": 5927} {"info/global_step": 5928, "train_info/time_within_train_step": 2.6548328399658203, "step": 5928} {"train_info/time_between_train_steps": 0.0030317306518554688, "step": 5928} {"info/global_step": 5929, "train_info/time_within_train_step": 2.642764091491699, "step": 5929} {"train_info/time_between_train_steps": 0.0030989646911621094, "step": 5929} {"info/global_step": 5930, "train_info/time_within_train_step": 2.6567134857177734, "step": 5930} {"train_info/time_between_train_steps": 0.003070354461669922, "step": 5930} {"info/global_step": 5931, "train_info/time_within_train_step": 2.667224168777466, "step": 5931} {"train_info/time_between_train_steps": 0.003013134002685547, "step": 5931} {"info/global_step": 5932, "train_info/time_within_train_step": 2.686345338821411, "step": 5932} {"train_info/time_between_train_steps": 0.0030460357666015625, "step": 5932} {"info/global_step": 5933, "train_info/time_within_train_step": 2.6692469120025635, "step": 5933} {"train_info/time_between_train_steps": 0.0030813217163085938, "step": 5933} {"info/global_step": 5934, "train_info/time_within_train_step": 2.6482462882995605, "step": 5934} {"train_info/time_between_train_steps": 0.003050565719604492, "step": 5934} {"info/global_step": 5935, "train_info/time_within_train_step": 2.646857261657715, "step": 5935} {"train_info/time_between_train_steps": 0.003069162368774414, "step": 5935} {"info/global_step": 5936, "train_info/time_within_train_step": 2.6511924266815186, "step": 5936} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 5936} {"info/global_step": 5937, "train_info/time_within_train_step": 2.6543967723846436, "step": 5937} {"train_info/time_between_train_steps": 0.003023862838745117, "step": 5937} {"info/global_step": 5938, "train_info/time_within_train_step": 2.644927740097046, "step": 5938} {"train_info/time_between_train_steps": 0.003022432327270508, "step": 5938} {"info/global_step": 5939, "train_info/time_within_train_step": 2.659968852996826, "step": 5939} {"train_info/time_between_train_steps": 0.003110647201538086, "step": 5939} {"info/global_step": 5940, "train_info/time_within_train_step": 2.6515073776245117, "step": 5940} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 5940} {"info/global_step": 5941, "train_info/time_within_train_step": 2.663095235824585, "step": 5941} {"train_info/time_between_train_steps": 0.003269672393798828, "step": 5941} {"info/global_step": 5942, "train_info/time_within_train_step": 2.7195417881011963, "step": 5942} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 5942} {"info/global_step": 5943, "train_info/time_within_train_step": 2.689445734024048, "step": 5943} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 5943} {"info/global_step": 5944, "train_info/time_within_train_step": 2.6408045291900635, "step": 5944} {"train_info/time_between_train_steps": 0.003062009811401367, "step": 5944} {"info/global_step": 5945, "train_info/time_within_train_step": 2.642787456512451, "step": 5945} {"train_info/time_between_train_steps": 0.0031163692474365234, "step": 5945} {"info/global_step": 5946, "train_info/time_within_train_step": 2.6614034175872803, "step": 5946} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 5946} {"info/global_step": 5947, "train_info/time_within_train_step": 2.654891014099121, "step": 5947} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 5947} {"info/global_step": 5948, "train_info/time_within_train_step": 2.644613742828369, "step": 5948} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 5948} {"info/global_step": 5949, "train_info/time_within_train_step": 2.650266170501709, "step": 5949} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 5949} {"info/global_step": 5950, "train_info/time_within_train_step": 2.6452462673187256, "step": 5950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914111, "_runtime": 16709}, "step": 5950} {"logs": {"train/loss": 3.4457, "train/learning_rate": 0.00027, "train/epoch": 6.08, "_timestamp": 1746914111, "_runtime": 16709}, "step": 5950} {"train_info/time_between_train_steps": 0.02437877655029297, "step": 5950} {"info/global_step": 5951, "train_info/time_within_train_step": 2.6631224155426025, "step": 5951} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 5951} {"info/global_step": 5952, "train_info/time_within_train_step": 2.6678860187530518, "step": 5952} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 5952} {"info/global_step": 5953, "train_info/time_within_train_step": 2.711043357849121, "step": 5953} {"train_info/time_between_train_steps": 0.00307464599609375, "step": 5953} {"info/global_step": 5954, "train_info/time_within_train_step": 2.6475563049316406, "step": 5954} {"train_info/time_between_train_steps": 0.0031113624572753906, "step": 5954} {"info/global_step": 5955, "train_info/time_within_train_step": 2.66403865814209, "step": 5955} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 5955} {"info/global_step": 5956, "train_info/time_within_train_step": 2.648101568222046, "step": 5956} {"train_info/time_between_train_steps": 0.003096342086791992, "step": 5956} {"info/global_step": 5957, "train_info/time_within_train_step": 2.6474437713623047, "step": 5957} {"train_info/time_between_train_steps": 0.0030307769775390625, "step": 5957} {"info/global_step": 5958, "train_info/time_within_train_step": 2.788741111755371, "step": 5958} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 5958} {"info/global_step": 5959, "train_info/time_within_train_step": 2.6499102115631104, "step": 5959} {"train_info/time_between_train_steps": 0.0030660629272460938, "step": 5959} {"info/global_step": 5960, "train_info/time_within_train_step": 2.6514365673065186, "step": 5960} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 5960} {"info/global_step": 5961, "train_info/time_within_train_step": 2.6426875591278076, "step": 5961} {"train_info/time_between_train_steps": 0.002934694290161133, "step": 5961} {"info/global_step": 5962, "train_info/time_within_train_step": 2.645623207092285, "step": 5962} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 5962} {"info/global_step": 5963, "train_info/time_within_train_step": 2.669490098953247, "step": 5963} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 5963} {"info/global_step": 5964, "train_info/time_within_train_step": 2.6664111614227295, "step": 5964} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 5964} {"info/global_step": 5965, "train_info/time_within_train_step": 2.67197322845459, "step": 5965} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 5965} {"info/global_step": 5966, "train_info/time_within_train_step": 2.671858549118042, "step": 5966} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 5966} {"info/global_step": 5967, "train_info/time_within_train_step": 2.649657964706421, "step": 5967} {"train_info/time_between_train_steps": 0.0030667781829833984, "step": 5967} {"info/global_step": 5968, "train_info/time_within_train_step": 2.6500351428985596, "step": 5968} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 5968} {"info/global_step": 5969, "train_info/time_within_train_step": 2.6466281414031982, "step": 5969} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 5969} {"info/global_step": 5970, "train_info/time_within_train_step": 2.6483943462371826, "step": 5970} {"train_info/time_between_train_steps": 0.0029573440551757812, "step": 5970} {"info/global_step": 5971, "train_info/time_within_train_step": 2.6484246253967285, "step": 5971} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 5971} {"info/global_step": 5972, "train_info/time_within_train_step": 2.646040201187134, "step": 5972} {"train_info/time_between_train_steps": 0.002894163131713867, "step": 5972} {"info/global_step": 5973, "train_info/time_within_train_step": 2.6662001609802246, "step": 5973} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 5973} {"info/global_step": 5974, "train_info/time_within_train_step": 2.650036573410034, "step": 5974} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 5974} {"info/global_step": 5975, "train_info/time_within_train_step": 2.64194917678833, "step": 5975} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 5975} {"info/global_step": 5976, "train_info/time_within_train_step": 2.647408962249756, "step": 5976} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 5976} {"info/global_step": 5977, "train_info/time_within_train_step": 2.6614830493927, "step": 5977} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 5977} {"info/global_step": 5978, "train_info/time_within_train_step": 2.6428165435791016, "step": 5978} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 5978} {"info/global_step": 5979, "train_info/time_within_train_step": 2.6443827152252197, "step": 5979} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 5979} {"info/global_step": 5980, "train_info/time_within_train_step": 2.6478819847106934, "step": 5980} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 5980} {"info/global_step": 5981, "train_info/time_within_train_step": 2.653303384780884, "step": 5981} {"train_info/time_between_train_steps": 0.0029163360595703125, "step": 5981} {"info/global_step": 5982, "train_info/time_within_train_step": 2.6587700843811035, "step": 5982} {"train_info/time_between_train_steps": 0.0030829906463623047, "step": 5982} {"info/global_step": 5983, "train_info/time_within_train_step": 2.669752597808838, "step": 5983} {"train_info/time_between_train_steps": 0.0029172897338867188, "step": 5983} {"info/global_step": 5984, "train_info/time_within_train_step": 2.727328300476074, "step": 5984} {"train_info/time_between_train_steps": 0.00293731689453125, "step": 5984} {"info/global_step": 5985, "train_info/time_within_train_step": 2.711366891860962, "step": 5985} {"train_info/time_between_train_steps": 0.003006458282470703, "step": 5985} {"info/global_step": 5986, "train_info/time_within_train_step": 2.6467065811157227, "step": 5986} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 5986} {"info/global_step": 5987, "train_info/time_within_train_step": 2.659426212310791, "step": 5987} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 5987} {"info/global_step": 5988, "train_info/time_within_train_step": 2.6438755989074707, "step": 5988} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 5988} {"info/global_step": 5989, "train_info/time_within_train_step": 2.6488919258117676, "step": 5989} {"train_info/time_between_train_steps": 0.002995014190673828, "step": 5989} {"info/global_step": 5990, "train_info/time_within_train_step": 2.6511034965515137, "step": 5990} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 5990} {"info/global_step": 5991, "train_info/time_within_train_step": 2.6440861225128174, "step": 5991} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 5991} {"info/global_step": 5992, "train_info/time_within_train_step": 2.6479976177215576, "step": 5992} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 5992} {"info/global_step": 5993, "train_info/time_within_train_step": 2.6688103675842285, "step": 5993} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 5993} {"info/global_step": 5994, "train_info/time_within_train_step": 2.671880006790161, "step": 5994} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 5994} {"info/global_step": 5995, "train_info/time_within_train_step": 2.6576106548309326, "step": 5995} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 5995} {"info/global_step": 5996, "train_info/time_within_train_step": 2.6861236095428467, "step": 5996} {"train_info/time_between_train_steps": 0.0030362606048583984, "step": 5996} {"info/global_step": 5997, "train_info/time_within_train_step": 2.6422572135925293, "step": 5997} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 5997} {"info/global_step": 5998, "train_info/time_within_train_step": 2.655531167984009, "step": 5998} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 5998} {"info/global_step": 5999, "train_info/time_within_train_step": 3.267571449279785, "step": 5999} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 5999} {"info/global_step": 6000, "train_info/time_within_train_step": 2.7228505611419678, "step": 6000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914246, "_runtime": 16844}, "step": 6000} {"logs": {"train/loss": 3.4373, "train/learning_rate": 0.0002666666666666666, "train/epoch": 6.08, "_timestamp": 1746914246, "_runtime": 16844}, "step": 6000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914251, "_runtime": 16849}, "step": 6000} {"logs": {"eval/loss": 4.644469738006592, "eval/runtime": 5.1651, "eval/samples_per_second": 37.173, "eval/steps_per_second": 1.162, "train/epoch": 6.08, "_timestamp": 1746914251, "_runtime": 16849}, "step": 6000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914251, "_runtime": 16849}, "step": 6000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.644469738006592, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 104.00819956520075, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1651, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.173, "train/epoch": 6.08, "_timestamp": 1746914251, "_runtime": 16849}, "step": 6000} {"train_info/time_between_train_steps": 18.74245810508728, "step": 6000} {"info/global_step": 6001, "train_info/time_within_train_step": 2.4563446044921875, "step": 6001} {"train_info/time_between_train_steps": 0.0060994625091552734, "step": 6001} {"info/global_step": 6002, "train_info/time_within_train_step": 2.4471499919891357, "step": 6002} {"train_info/time_between_train_steps": 0.0061185359954833984, "step": 6002} {"info/global_step": 6003, "train_info/time_within_train_step": 2.603646755218506, "step": 6003} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 6003} {"info/global_step": 6004, "train_info/time_within_train_step": 2.6427595615386963, "step": 6004} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 6004} {"info/global_step": 6005, "train_info/time_within_train_step": 2.647071123123169, "step": 6005} {"train_info/time_between_train_steps": 0.0030243396759033203, "step": 6005} {"info/global_step": 6006, "train_info/time_within_train_step": 2.6458003520965576, "step": 6006} {"train_info/time_between_train_steps": 0.0030727386474609375, "step": 6006} {"info/global_step": 6007, "train_info/time_within_train_step": 2.642678737640381, "step": 6007} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 6007} {"info/global_step": 6008, "train_info/time_within_train_step": 2.6672301292419434, "step": 6008} {"train_info/time_between_train_steps": 0.0030546188354492188, "step": 6008} {"info/global_step": 6009, "train_info/time_within_train_step": 2.6704161167144775, "step": 6009} {"train_info/time_between_train_steps": 0.002963542938232422, "step": 6009} {"info/global_step": 6010, "train_info/time_within_train_step": 2.6860344409942627, "step": 6010} {"train_info/time_between_train_steps": 0.006287097930908203, "step": 6010} {"info/global_step": 6011, "train_info/time_within_train_step": 2.650175094604492, "step": 6011} {"train_info/time_between_train_steps": 0.006155490875244141, "step": 6011} {"info/global_step": 6012, "train_info/time_within_train_step": 2.6499979496002197, "step": 6012} {"train_info/time_between_train_steps": 0.006177663803100586, "step": 6012} {"info/global_step": 6013, "train_info/time_within_train_step": 2.664212703704834, "step": 6013} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 6013} {"info/global_step": 6014, "train_info/time_within_train_step": 2.644446611404419, "step": 6014} {"train_info/time_between_train_steps": 0.0030388832092285156, "step": 6014} {"info/global_step": 6015, "train_info/time_within_train_step": 2.6446259021759033, "step": 6015} {"train_info/time_between_train_steps": 0.0030171871185302734, "step": 6015} {"info/global_step": 6016, "train_info/time_within_train_step": 2.669294834136963, "step": 6016} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 6016} {"info/global_step": 6017, "train_info/time_within_train_step": 2.6660945415496826, "step": 6017} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 6017} {"info/global_step": 6018, "train_info/time_within_train_step": 2.6876165866851807, "step": 6018} {"train_info/time_between_train_steps": 0.0030219554901123047, "step": 6018} {"info/global_step": 6019, "train_info/time_within_train_step": 2.6577656269073486, "step": 6019} {"train_info/time_between_train_steps": 0.003087759017944336, "step": 6019} {"info/global_step": 6020, "train_info/time_within_train_step": 2.652019500732422, "step": 6020} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 6020} {"info/global_step": 6021, "train_info/time_within_train_step": 2.6516785621643066, "step": 6021} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 6021} {"info/global_step": 6022, "train_info/time_within_train_step": 2.648038625717163, "step": 6022} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 6022} {"info/global_step": 6023, "train_info/time_within_train_step": 2.651956796646118, "step": 6023} {"train_info/time_between_train_steps": 0.006170988082885742, "step": 6023} {"info/global_step": 6024, "train_info/time_within_train_step": 2.6498615741729736, "step": 6024} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 6024} {"info/global_step": 6025, "train_info/time_within_train_step": 2.6463418006896973, "step": 6025} {"train_info/time_between_train_steps": 0.0030443668365478516, "step": 6025} {"info/global_step": 6026, "train_info/time_within_train_step": 2.6667981147766113, "step": 6026} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 6026} {"info/global_step": 6027, "train_info/time_within_train_step": 2.709935188293457, "step": 6027} {"train_info/time_between_train_steps": 0.0030698776245117188, "step": 6027} {"info/global_step": 6028, "train_info/time_within_train_step": 2.66461181640625, "step": 6028} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 6028} {"info/global_step": 6029, "train_info/time_within_train_step": 2.6576900482177734, "step": 6029} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 6029} {"info/global_step": 6030, "train_info/time_within_train_step": 2.6474568843841553, "step": 6030} {"train_info/time_between_train_steps": 0.0035665035247802734, "step": 6030} {"info/global_step": 6031, "train_info/time_within_train_step": 2.646831750869751, "step": 6031} {"train_info/time_between_train_steps": 0.0032873153686523438, "step": 6031} {"info/global_step": 6032, "train_info/time_within_train_step": 2.6475911140441895, "step": 6032} {"train_info/time_between_train_steps": 0.0034990310668945312, "step": 6032} {"info/global_step": 6033, "train_info/time_within_train_step": 2.6466777324676514, "step": 6033} {"train_info/time_between_train_steps": 0.0035657882690429688, "step": 6033} {"info/global_step": 6034, "train_info/time_within_train_step": 2.650758743286133, "step": 6034} {"train_info/time_between_train_steps": 0.0035448074340820312, "step": 6034} {"info/global_step": 6035, "train_info/time_within_train_step": 2.6492974758148193, "step": 6035} {"train_info/time_between_train_steps": 0.0035495758056640625, "step": 6035} {"info/global_step": 6036, "train_info/time_within_train_step": 2.6804614067077637, "step": 6036} {"train_info/time_between_train_steps": 0.0035784244537353516, "step": 6036} {"info/global_step": 6037, "train_info/time_within_train_step": 2.6744370460510254, "step": 6037} {"train_info/time_between_train_steps": 0.003676891326904297, "step": 6037} {"info/global_step": 6038, "train_info/time_within_train_step": 2.649836778640747, "step": 6038} {"train_info/time_between_train_steps": 0.003412485122680664, "step": 6038} {"info/global_step": 6039, "train_info/time_within_train_step": 2.662482261657715, "step": 6039} {"train_info/time_between_train_steps": 0.003982067108154297, "step": 6039} {"info/global_step": 6040, "train_info/time_within_train_step": 2.6709914207458496, "step": 6040} {"train_info/time_between_train_steps": 0.004033088684082031, "step": 6040} {"info/global_step": 6041, "train_info/time_within_train_step": 2.7142441272735596, "step": 6041} {"train_info/time_between_train_steps": 0.003498077392578125, "step": 6041} {"train_info/time_between_train_steps": 2.542550563812256, "step": 6041} {"info/global_step": 6042, "train_info/time_within_train_step": 2.610980749130249, "step": 6042} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 6042} {"info/global_step": 6043, "train_info/time_within_train_step": 2.644545316696167, "step": 6043} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 6043} {"info/global_step": 6044, "train_info/time_within_train_step": 2.6453046798706055, "step": 6044} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 6044} {"info/global_step": 6045, "train_info/time_within_train_step": 2.6519525051116943, "step": 6045} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 6045} {"info/global_step": 6046, "train_info/time_within_train_step": 2.6716742515563965, "step": 6046} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 6046} {"info/global_step": 6047, "train_info/time_within_train_step": 2.6740736961364746, "step": 6047} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 6047} {"info/global_step": 6048, "train_info/time_within_train_step": 2.656372308731079, "step": 6048} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 6048} {"info/global_step": 6049, "train_info/time_within_train_step": 2.6880064010620117, "step": 6049} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 6049} {"info/global_step": 6050, "train_info/time_within_train_step": 2.6431219577789307, "step": 6050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914402, "_runtime": 17000}, "step": 6050} {"logs": {"train/loss": 3.4499, "train/learning_rate": 0.0002633333333333333, "train/epoch": 7.0, "_timestamp": 1746914402, "_runtime": 17000}, "step": 6050} {"train_info/time_between_train_steps": 0.024322509765625, "step": 6050} {"info/global_step": 6051, "train_info/time_within_train_step": 2.6440072059631348, "step": 6051} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 6051} {"info/global_step": 6052, "train_info/time_within_train_step": 2.64353609085083, "step": 6052} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 6052} {"info/global_step": 6053, "train_info/time_within_train_step": 2.6632726192474365, "step": 6053} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 6053} {"info/global_step": 6054, "train_info/time_within_train_step": 2.6512279510498047, "step": 6054} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 6054} {"info/global_step": 6055, "train_info/time_within_train_step": 2.644174098968506, "step": 6055} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 6055} {"info/global_step": 6056, "train_info/time_within_train_step": 2.666560173034668, "step": 6056} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 6056} {"info/global_step": 6057, "train_info/time_within_train_step": 2.6595399379730225, "step": 6057} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 6057} {"info/global_step": 6058, "train_info/time_within_train_step": 2.666940212249756, "step": 6058} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 6058} {"info/global_step": 6059, "train_info/time_within_train_step": 2.685459852218628, "step": 6059} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 6059} {"info/global_step": 6060, "train_info/time_within_train_step": 2.6680908203125, "step": 6060} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 6060} {"info/global_step": 6061, "train_info/time_within_train_step": 2.6435587406158447, "step": 6061} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 6061} {"info/global_step": 6062, "train_info/time_within_train_step": 2.6434497833251953, "step": 6062} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 6062} {"info/global_step": 6063, "train_info/time_within_train_step": 2.659741163253784, "step": 6063} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 6063} {"info/global_step": 6064, "train_info/time_within_train_step": 2.6562912464141846, "step": 6064} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 6064} {"info/global_step": 6065, "train_info/time_within_train_step": 2.64597225189209, "step": 6065} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 6065} {"info/global_step": 6066, "train_info/time_within_train_step": 2.6608400344848633, "step": 6066} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 6066} {"info/global_step": 6067, "train_info/time_within_train_step": 2.64833402633667, "step": 6067} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 6067} {"info/global_step": 6068, "train_info/time_within_train_step": 2.7032742500305176, "step": 6068} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 6068} {"info/global_step": 6069, "train_info/time_within_train_step": 2.7180309295654297, "step": 6069} {"train_info/time_between_train_steps": 0.0065250396728515625, "step": 6069} {"info/global_step": 6070, "train_info/time_within_train_step": 2.6466102600097656, "step": 6070} {"train_info/time_between_train_steps": 0.006507396697998047, "step": 6070} {"info/global_step": 6071, "train_info/time_within_train_step": 2.644176721572876, "step": 6071} {"train_info/time_between_train_steps": 0.006547212600708008, "step": 6071} {"info/global_step": 6072, "train_info/time_within_train_step": 2.6586461067199707, "step": 6072} {"train_info/time_between_train_steps": 0.00643157958984375, "step": 6072} {"info/global_step": 6073, "train_info/time_within_train_step": 2.651946544647217, "step": 6073} {"train_info/time_between_train_steps": 0.006407260894775391, "step": 6073} {"info/global_step": 6074, "train_info/time_within_train_step": 2.6562061309814453, "step": 6074} {"train_info/time_between_train_steps": 0.006491422653198242, "step": 6074} {"info/global_step": 6075, "train_info/time_within_train_step": 2.644678831100464, "step": 6075} {"train_info/time_between_train_steps": 0.006583452224731445, "step": 6075} {"info/global_step": 6076, "train_info/time_within_train_step": 2.6521565914154053, "step": 6076} {"train_info/time_between_train_steps": 0.006656169891357422, "step": 6076} {"info/global_step": 6077, "train_info/time_within_train_step": 2.652780532836914, "step": 6077} {"train_info/time_between_train_steps": 0.0065648555755615234, "step": 6077} {"info/global_step": 6078, "train_info/time_within_train_step": 2.6714324951171875, "step": 6078} {"train_info/time_between_train_steps": 0.006723165512084961, "step": 6078} {"info/global_step": 6079, "train_info/time_within_train_step": 2.6944310665130615, "step": 6079} {"train_info/time_between_train_steps": 0.0068743228912353516, "step": 6079} {"info/global_step": 6080, "train_info/time_within_train_step": 2.6927692890167236, "step": 6080} {"train_info/time_between_train_steps": 0.0067479610443115234, "step": 6080} {"info/global_step": 6081, "train_info/time_within_train_step": 2.649840831756592, "step": 6081} {"train_info/time_between_train_steps": 0.006835222244262695, "step": 6081} {"info/global_step": 6082, "train_info/time_within_train_step": 2.6502633094787598, "step": 6082} {"train_info/time_between_train_steps": 0.006932497024536133, "step": 6082} {"info/global_step": 6083, "train_info/time_within_train_step": 2.6548891067504883, "step": 6083} {"train_info/time_between_train_steps": 0.0068166255950927734, "step": 6083} {"info/global_step": 6084, "train_info/time_within_train_step": 2.6555259227752686, "step": 6084} {"train_info/time_between_train_steps": 0.006882190704345703, "step": 6084} {"info/global_step": 6085, "train_info/time_within_train_step": 2.655388116836548, "step": 6085} {"train_info/time_between_train_steps": 0.006896257400512695, "step": 6085} {"info/global_step": 6086, "train_info/time_within_train_step": 2.646911859512329, "step": 6086} {"train_info/time_between_train_steps": 0.0034551620483398438, "step": 6086} {"info/global_step": 6087, "train_info/time_within_train_step": 2.6482491493225098, "step": 6087} {"train_info/time_between_train_steps": 0.003463268280029297, "step": 6087} {"info/global_step": 6088, "train_info/time_within_train_step": 2.6739137172698975, "step": 6088} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 6088} {"info/global_step": 6089, "train_info/time_within_train_step": 2.667923927307129, "step": 6089} {"train_info/time_between_train_steps": 0.003542661666870117, "step": 6089} {"info/global_step": 6090, "train_info/time_within_train_step": 2.689141273498535, "step": 6090} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 6090} {"info/global_step": 6091, "train_info/time_within_train_step": 2.6589834690093994, "step": 6091} {"train_info/time_between_train_steps": 0.0062143802642822266, "step": 6091} {"info/global_step": 6092, "train_info/time_within_train_step": 2.674473762512207, "step": 6092} {"train_info/time_between_train_steps": 0.006865739822387695, "step": 6092} {"info/global_step": 6093, "train_info/time_within_train_step": 2.645401954650879, "step": 6093} {"train_info/time_between_train_steps": 0.006894111633300781, "step": 6093} {"info/global_step": 6094, "train_info/time_within_train_step": 2.651808738708496, "step": 6094} {"train_info/time_between_train_steps": 0.006967067718505859, "step": 6094} {"info/global_step": 6095, "train_info/time_within_train_step": 2.665804862976074, "step": 6095} {"train_info/time_between_train_steps": 0.006827831268310547, "step": 6095} {"info/global_step": 6096, "train_info/time_within_train_step": 2.6456613540649414, "step": 6096} {"train_info/time_between_train_steps": 0.006861209869384766, "step": 6096} {"info/global_step": 6097, "train_info/time_within_train_step": 2.6458752155303955, "step": 6097} {"train_info/time_between_train_steps": 0.0034401416778564453, "step": 6097} {"info/global_step": 6098, "train_info/time_within_train_step": 2.6505672931671143, "step": 6098} {"train_info/time_between_train_steps": 0.0036177635192871094, "step": 6098} {"info/global_step": 6099, "train_info/time_within_train_step": 2.6662585735321045, "step": 6099} {"train_info/time_between_train_steps": 0.0036754608154296875, "step": 6099} {"info/global_step": 6100, "train_info/time_within_train_step": 2.6647520065307617, "step": 6100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914536, "_runtime": 17134}, "step": 6100} {"logs": {"train/loss": 3.4226, "train/learning_rate": 0.00026, "train/epoch": 7.01, "_timestamp": 1746914536, "_runtime": 17134}, "step": 6100} {"train_info/time_between_train_steps": 0.025425434112548828, "step": 6100} {"info/global_step": 6101, "train_info/time_within_train_step": 2.6767399311065674, "step": 6101} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 6101} {"info/global_step": 6102, "train_info/time_within_train_step": 2.6670384407043457, "step": 6102} {"train_info/time_between_train_steps": 0.003632068634033203, "step": 6102} {"info/global_step": 6103, "train_info/time_within_train_step": 2.7076022624969482, "step": 6103} {"train_info/time_between_train_steps": 0.003421783447265625, "step": 6103} {"info/global_step": 6104, "train_info/time_within_train_step": 3.091132402420044, "step": 6104} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 6104} {"info/global_step": 6105, "train_info/time_within_train_step": 2.6464831829071045, "step": 6105} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 6105} {"info/global_step": 6106, "train_info/time_within_train_step": 2.660707712173462, "step": 6106} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 6106} {"info/global_step": 6107, "train_info/time_within_train_step": 2.660041332244873, "step": 6107} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 6107} {"info/global_step": 6108, "train_info/time_within_train_step": 2.6741647720336914, "step": 6108} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 6108} {"info/global_step": 6109, "train_info/time_within_train_step": 2.6733596324920654, "step": 6109} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 6109} {"info/global_step": 6110, "train_info/time_within_train_step": 2.6847825050354004, "step": 6110} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 6110} {"info/global_step": 6111, "train_info/time_within_train_step": 2.6435201168060303, "step": 6111} {"train_info/time_between_train_steps": 0.003292083740234375, "step": 6111} {"info/global_step": 6112, "train_info/time_within_train_step": 2.6429898738861084, "step": 6112} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 6112} {"info/global_step": 6113, "train_info/time_within_train_step": 2.659231185913086, "step": 6113} {"train_info/time_between_train_steps": 0.0065953731536865234, "step": 6113} {"info/global_step": 6114, "train_info/time_within_train_step": 2.6503350734710693, "step": 6114} {"train_info/time_between_train_steps": 0.003401517868041992, "step": 6114} {"info/global_step": 6115, "train_info/time_within_train_step": 2.6476681232452393, "step": 6115} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 6115} {"info/global_step": 6116, "train_info/time_within_train_step": 2.6423370838165283, "step": 6116} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 6116} {"info/global_step": 6117, "train_info/time_within_train_step": 2.655316114425659, "step": 6117} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 6117} {"info/global_step": 6118, "train_info/time_within_train_step": 2.661329984664917, "step": 6118} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 6118} {"info/global_step": 6119, "train_info/time_within_train_step": 2.6449902057647705, "step": 6119} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 6119} {"info/global_step": 6120, "train_info/time_within_train_step": 2.645646810531616, "step": 6120} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 6120} {"info/global_step": 6121, "train_info/time_within_train_step": 2.6578354835510254, "step": 6121} {"train_info/time_between_train_steps": 0.006548404693603516, "step": 6121} {"info/global_step": 6122, "train_info/time_within_train_step": 2.6621921062469482, "step": 6122} {"train_info/time_between_train_steps": 0.003424406051635742, "step": 6122} {"info/global_step": 6123, "train_info/time_within_train_step": 2.676129102706909, "step": 6123} {"train_info/time_between_train_steps": 0.006749868392944336, "step": 6123} {"info/global_step": 6124, "train_info/time_within_train_step": 2.66217303276062, "step": 6124} {"train_info/time_between_train_steps": 0.0065882205963134766, "step": 6124} {"info/global_step": 6125, "train_info/time_within_train_step": 2.7120745182037354, "step": 6125} {"train_info/time_between_train_steps": 0.006514072418212891, "step": 6125} {"info/global_step": 6126, "train_info/time_within_train_step": 2.6568689346313477, "step": 6126} {"train_info/time_between_train_steps": 0.006494998931884766, "step": 6126} {"info/global_step": 6127, "train_info/time_within_train_step": 2.648500442504883, "step": 6127} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 6127} {"info/global_step": 6128, "train_info/time_within_train_step": 2.6450774669647217, "step": 6128} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 6128} {"info/global_step": 6129, "train_info/time_within_train_step": 2.6571693420410156, "step": 6129} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 6129} {"info/global_step": 6130, "train_info/time_within_train_step": 2.6559906005859375, "step": 6130} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 6130} {"info/global_step": 6131, "train_info/time_within_train_step": 2.64609432220459, "step": 6131} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 6131} {"info/global_step": 6132, "train_info/time_within_train_step": 2.664655923843384, "step": 6132} {"train_info/time_between_train_steps": 0.006671428680419922, "step": 6132} {"info/global_step": 6133, "train_info/time_within_train_step": 2.6546335220336914, "step": 6133} {"train_info/time_between_train_steps": 0.00645136833190918, "step": 6133} {"info/global_step": 6134, "train_info/time_within_train_step": 2.6605000495910645, "step": 6134} {"train_info/time_between_train_steps": 0.006574392318725586, "step": 6134} {"info/global_step": 6135, "train_info/time_within_train_step": 2.6919851303100586, "step": 6135} {"train_info/time_between_train_steps": 0.0068645477294921875, "step": 6135} {"info/global_step": 6136, "train_info/time_within_train_step": 2.6560521125793457, "step": 6136} {"train_info/time_between_train_steps": 0.006513118743896484, "step": 6136} {"info/global_step": 6137, "train_info/time_within_train_step": 2.6429481506347656, "step": 6137} {"train_info/time_between_train_steps": 0.0065042972564697266, "step": 6137} {"info/global_step": 6138, "train_info/time_within_train_step": 2.6509952545166016, "step": 6138} {"train_info/time_between_train_steps": 0.00324249267578125, "step": 6138} {"info/global_step": 6139, "train_info/time_within_train_step": 2.6597249507904053, "step": 6139} {"train_info/time_between_train_steps": 0.0034134387969970703, "step": 6139} {"info/global_step": 6140, "train_info/time_within_train_step": 2.6576552391052246, "step": 6140} {"train_info/time_between_train_steps": 0.006536245346069336, "step": 6140} {"info/global_step": 6141, "train_info/time_within_train_step": 2.6457455158233643, "step": 6141} {"train_info/time_between_train_steps": 0.0032761096954345703, "step": 6141} {"info/global_step": 6142, "train_info/time_within_train_step": 2.6532604694366455, "step": 6142} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 6142} {"info/global_step": 6143, "train_info/time_within_train_step": 2.652632713317871, "step": 6143} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 6143} {"info/global_step": 6144, "train_info/time_within_train_step": 2.6708340644836426, "step": 6144} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 6144} {"info/global_step": 6145, "train_info/time_within_train_step": 2.713263750076294, "step": 6145} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 6145} {"info/global_step": 6146, "train_info/time_within_train_step": 2.642728567123413, "step": 6146} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 6146} {"info/global_step": 6147, "train_info/time_within_train_step": 2.6497695446014404, "step": 6147} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 6147} {"info/global_step": 6148, "train_info/time_within_train_step": 2.657257080078125, "step": 6148} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 6148} {"info/global_step": 6149, "train_info/time_within_train_step": 2.6491189002990723, "step": 6149} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 6149} {"info/global_step": 6150, "train_info/time_within_train_step": 2.6596765518188477, "step": 6150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914671, "_runtime": 17269}, "step": 6150} {"logs": {"train/loss": 3.4138, "train/learning_rate": 0.00025666666666666665, "train/epoch": 7.01, "_timestamp": 1746914671, "_runtime": 17269}, "step": 6150} {"train_info/time_between_train_steps": 0.02433466911315918, "step": 6150} {"info/global_step": 6151, "train_info/time_within_train_step": 2.64741849899292, "step": 6151} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 6151} {"info/global_step": 6152, "train_info/time_within_train_step": 2.6454155445098877, "step": 6152} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 6152} {"info/global_step": 6153, "train_info/time_within_train_step": 2.6604549884796143, "step": 6153} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 6153} {"info/global_step": 6154, "train_info/time_within_train_step": 2.650883913040161, "step": 6154} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 6154} {"info/global_step": 6155, "train_info/time_within_train_step": 2.653846502304077, "step": 6155} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 6155} {"info/global_step": 6156, "train_info/time_within_train_step": 2.648735284805298, "step": 6156} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 6156} {"info/global_step": 6157, "train_info/time_within_train_step": 2.652299165725708, "step": 6157} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 6157} {"info/global_step": 6158, "train_info/time_within_train_step": 2.6507627964019775, "step": 6158} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 6158} {"info/global_step": 6159, "train_info/time_within_train_step": 2.646087169647217, "step": 6159} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 6159} {"info/global_step": 6160, "train_info/time_within_train_step": 2.719655990600586, "step": 6160} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 6160} {"info/global_step": 6161, "train_info/time_within_train_step": 2.6661159992218018, "step": 6161} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 6161} {"info/global_step": 6162, "train_info/time_within_train_step": 2.663363218307495, "step": 6162} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 6162} {"info/global_step": 6163, "train_info/time_within_train_step": 2.6569457054138184, "step": 6163} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 6163} {"info/global_step": 6164, "train_info/time_within_train_step": 2.9361324310302734, "step": 6164} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 6164} {"info/global_step": 6165, "train_info/time_within_train_step": 2.663700819015503, "step": 6165} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 6165} {"info/global_step": 6166, "train_info/time_within_train_step": 2.665450096130371, "step": 6166} {"train_info/time_between_train_steps": 0.12824797630310059, "step": 6166} {"info/global_step": 6167, "train_info/time_within_train_step": 2.663515567779541, "step": 6167} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 6167} {"info/global_step": 6168, "train_info/time_within_train_step": 2.671727180480957, "step": 6168} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 6168} {"info/global_step": 6169, "train_info/time_within_train_step": 2.665632724761963, "step": 6169} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 6169} {"info/global_step": 6170, "train_info/time_within_train_step": 2.7072525024414062, "step": 6170} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 6170} {"info/global_step": 6171, "train_info/time_within_train_step": 2.6440234184265137, "step": 6171} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 6171} {"info/global_step": 6172, "train_info/time_within_train_step": 2.65012788772583, "step": 6172} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 6172} {"info/global_step": 6173, "train_info/time_within_train_step": 2.660867214202881, "step": 6173} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 6173} {"info/global_step": 6174, "train_info/time_within_train_step": 2.644476890563965, "step": 6174} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 6174} {"info/global_step": 6175, "train_info/time_within_train_step": 2.6486525535583496, "step": 6175} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 6175} {"info/global_step": 6176, "train_info/time_within_train_step": 2.6488945484161377, "step": 6176} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 6176} {"info/global_step": 6177, "train_info/time_within_train_step": 2.6557817459106445, "step": 6177} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 6177} {"info/global_step": 6178, "train_info/time_within_train_step": 2.659255266189575, "step": 6178} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 6178} {"info/global_step": 6179, "train_info/time_within_train_step": 2.6492087841033936, "step": 6179} {"train_info/time_between_train_steps": 0.006576061248779297, "step": 6179} {"info/global_step": 6180, "train_info/time_within_train_step": 2.6437385082244873, "step": 6180} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 6180} {"info/global_step": 6181, "train_info/time_within_train_step": 2.6600265502929688, "step": 6181} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 6181} {"info/global_step": 6182, "train_info/time_within_train_step": 2.650804281234741, "step": 6182} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 6182} {"info/global_step": 6183, "train_info/time_within_train_step": 2.6512296199798584, "step": 6183} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 6183} {"info/global_step": 6184, "train_info/time_within_train_step": 2.648942470550537, "step": 6184} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 6184} {"info/global_step": 6185, "train_info/time_within_train_step": 2.648165702819824, "step": 6185} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 6185} {"info/global_step": 6186, "train_info/time_within_train_step": 2.665966749191284, "step": 6186} {"train_info/time_between_train_steps": 0.003436565399169922, "step": 6186} {"info/global_step": 6187, "train_info/time_within_train_step": 2.683211326599121, "step": 6187} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 6187} {"info/global_step": 6188, "train_info/time_within_train_step": 2.6894166469573975, "step": 6188} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 6188} {"info/global_step": 6189, "train_info/time_within_train_step": 2.653407573699951, "step": 6189} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 6189} {"info/global_step": 6190, "train_info/time_within_train_step": 2.6425118446350098, "step": 6190} {"train_info/time_between_train_steps": 0.003438711166381836, "step": 6190} {"info/global_step": 6191, "train_info/time_within_train_step": 2.6565001010894775, "step": 6191} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 6191} {"info/global_step": 6192, "train_info/time_within_train_step": 2.657150983810425, "step": 6192} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 6192} {"info/global_step": 6193, "train_info/time_within_train_step": 2.6454784870147705, "step": 6193} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 6193} {"info/global_step": 6194, "train_info/time_within_train_step": 2.6450507640838623, "step": 6194} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 6194} {"info/global_step": 6195, "train_info/time_within_train_step": 2.6551384925842285, "step": 6195} {"train_info/time_between_train_steps": 0.0032987594604492188, "step": 6195} {"info/global_step": 6196, "train_info/time_within_train_step": 2.680682420730591, "step": 6196} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 6196} {"info/global_step": 6197, "train_info/time_within_train_step": 2.6731061935424805, "step": 6197} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 6197} {"info/global_step": 6198, "train_info/time_within_train_step": 2.6571218967437744, "step": 6198} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 6198} {"info/global_step": 6199, "train_info/time_within_train_step": 2.691114664077759, "step": 6199} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 6199} {"info/global_step": 6200, "train_info/time_within_train_step": 2.6452345848083496, "step": 6200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914805, "_runtime": 17403}, "step": 6200} {"logs": {"train/loss": 3.4076, "train/learning_rate": 0.00025333333333333333, "train/epoch": 7.02, "_timestamp": 1746914805, "_runtime": 17403}, "step": 6200} {"train_info/time_between_train_steps": 13.550623893737793, "step": 6200} {"info/global_step": 6201, "train_info/time_within_train_step": 2.436908006668091, "step": 6201} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 6201} {"info/global_step": 6202, "train_info/time_within_train_step": 2.4354004859924316, "step": 6202} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 6202} {"info/global_step": 6203, "train_info/time_within_train_step": 2.56197452545166, "step": 6203} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 6203} {"info/global_step": 6204, "train_info/time_within_train_step": 2.637302875518799, "step": 6204} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 6204} {"info/global_step": 6205, "train_info/time_within_train_step": 2.650961399078369, "step": 6205} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 6205} {"info/global_step": 6206, "train_info/time_within_train_step": 2.6539039611816406, "step": 6206} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 6206} {"info/global_step": 6207, "train_info/time_within_train_step": 2.6424636840820312, "step": 6207} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 6207} {"info/global_step": 6208, "train_info/time_within_train_step": 2.642404556274414, "step": 6208} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 6208} {"info/global_step": 6209, "train_info/time_within_train_step": 2.8928167819976807, "step": 6209} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 6209} {"info/global_step": 6210, "train_info/time_within_train_step": 2.649336576461792, "step": 6210} {"train_info/time_between_train_steps": 0.003216266632080078, "step": 6210} {"info/global_step": 6211, "train_info/time_within_train_step": 2.6432671546936035, "step": 6211} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 6211} {"info/global_step": 6212, "train_info/time_within_train_step": 2.648907423019409, "step": 6212} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 6212} {"info/global_step": 6213, "train_info/time_within_train_step": 2.6717114448547363, "step": 6213} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 6213} {"info/global_step": 6214, "train_info/time_within_train_step": 2.6701953411102295, "step": 6214} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 6214} {"info/global_step": 6215, "train_info/time_within_train_step": 2.6565585136413574, "step": 6215} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 6215} {"info/global_step": 6216, "train_info/time_within_train_step": 2.6867501735687256, "step": 6216} {"train_info/time_between_train_steps": 0.003173828125, "step": 6216} {"info/global_step": 6217, "train_info/time_within_train_step": 2.6413931846618652, "step": 6217} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 6217} {"info/global_step": 6218, "train_info/time_within_train_step": 2.6544888019561768, "step": 6218} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 6218} {"info/global_step": 6219, "train_info/time_within_train_step": 2.66023588180542, "step": 6219} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 6219} {"info/global_step": 6220, "train_info/time_within_train_step": 2.6439855098724365, "step": 6220} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 6220} {"info/global_step": 6221, "train_info/time_within_train_step": 2.644624948501587, "step": 6221} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 6221} {"info/global_step": 6222, "train_info/time_within_train_step": 2.654799461364746, "step": 6222} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 6222} {"info/global_step": 6223, "train_info/time_within_train_step": 2.661585569381714, "step": 6223} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 6223} {"info/global_step": 6224, "train_info/time_within_train_step": 2.6734137535095215, "step": 6224} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 6224} {"info/global_step": 6225, "train_info/time_within_train_step": 2.6656036376953125, "step": 6225} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 6225} {"info/global_step": 6226, "train_info/time_within_train_step": 2.7021141052246094, "step": 6226} {"train_info/time_between_train_steps": 0.00344085693359375, "step": 6226} {"info/global_step": 6227, "train_info/time_within_train_step": 2.6432549953460693, "step": 6227} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 6227} {"info/global_step": 6228, "train_info/time_within_train_step": 2.644181966781616, "step": 6228} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 6228} {"info/global_step": 6229, "train_info/time_within_train_step": 2.773709774017334, "step": 6229} {"train_info/time_between_train_steps": 0.003216266632080078, "step": 6229} {"info/global_step": 6230, "train_info/time_within_train_step": 2.642181396484375, "step": 6230} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 6230} {"info/global_step": 6231, "train_info/time_within_train_step": 2.657545566558838, "step": 6231} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 6231} {"info/global_step": 6232, "train_info/time_within_train_step": 2.6539089679718018, "step": 6232} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 6232} {"info/global_step": 6233, "train_info/time_within_train_step": 2.6509485244750977, "step": 6233} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 6233} {"info/global_step": 6234, "train_info/time_within_train_step": 2.642629861831665, "step": 6234} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 6234} {"info/global_step": 6235, "train_info/time_within_train_step": 2.6529898643493652, "step": 6235} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 6235} {"info/global_step": 6236, "train_info/time_within_train_step": 2.730717420578003, "step": 6236} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 6236} {"info/global_step": 6237, "train_info/time_within_train_step": 2.644929885864258, "step": 6237} {"train_info/time_between_train_steps": 0.0033206939697265625, "step": 6237} {"info/global_step": 6238, "train_info/time_within_train_step": 2.6457433700561523, "step": 6238} {"train_info/time_between_train_steps": 0.0033681392669677734, "step": 6238} {"info/global_step": 6239, "train_info/time_within_train_step": 2.648369789123535, "step": 6239} {"train_info/time_between_train_steps": 0.0034945011138916016, "step": 6239} {"info/global_step": 6240, "train_info/time_within_train_step": 2.6443004608154297, "step": 6240} {"train_info/time_between_train_steps": 0.0033829212188720703, "step": 6240} {"info/global_step": 6241, "train_info/time_within_train_step": 2.671562910079956, "step": 6241} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 6241} {"info/global_step": 6242, "train_info/time_within_train_step": 2.6448700428009033, "step": 6242} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 6242} {"info/global_step": 6243, "train_info/time_within_train_step": 2.6538851261138916, "step": 6243} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 6243} {"info/global_step": 6244, "train_info/time_within_train_step": 2.6404926776885986, "step": 6244} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 6244} {"info/global_step": 6245, "train_info/time_within_train_step": 2.642503023147583, "step": 6245} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 6245} {"info/global_step": 6246, "train_info/time_within_train_step": 2.6557178497314453, "step": 6246} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 6246} {"info/global_step": 6247, "train_info/time_within_train_step": 2.7179434299468994, "step": 6247} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 6247} {"info/global_step": 6248, "train_info/time_within_train_step": 2.685500383377075, "step": 6248} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 6248} {"info/global_step": 6249, "train_info/time_within_train_step": 3.2212231159210205, "step": 6249} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 6249} {"info/global_step": 6250, "train_info/time_within_train_step": 2.6550140380859375, "step": 6250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746914954, "_runtime": 17552}, "step": 6250} {"logs": {"train/loss": 3.3888, "train/learning_rate": 0.00025, "train/epoch": 7.02, "_timestamp": 1746914954, "_runtime": 17552}, "step": 6250} {"train_info/time_between_train_steps": 0.024470090866088867, "step": 6250} {"info/global_step": 6251, "train_info/time_within_train_step": 2.6430442333221436, "step": 6251} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 6251} {"info/global_step": 6252, "train_info/time_within_train_step": 2.896069288253784, "step": 6252} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 6252} {"info/global_step": 6253, "train_info/time_within_train_step": 2.645099401473999, "step": 6253} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 6253} {"info/global_step": 6254, "train_info/time_within_train_step": 2.6470820903778076, "step": 6254} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 6254} {"info/global_step": 6255, "train_info/time_within_train_step": 2.650413990020752, "step": 6255} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 6255} {"info/global_step": 6256, "train_info/time_within_train_step": 2.645872116088867, "step": 6256} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 6256} {"info/global_step": 6257, "train_info/time_within_train_step": 2.6542305946350098, "step": 6257} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 6257} {"info/global_step": 6258, "train_info/time_within_train_step": 2.6568307876586914, "step": 6258} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 6258} {"info/global_step": 6259, "train_info/time_within_train_step": 2.6753525733947754, "step": 6259} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 6259} {"info/global_step": 6260, "train_info/time_within_train_step": 2.7280678749084473, "step": 6260} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 6260} {"info/global_step": 6261, "train_info/time_within_train_step": 2.658088207244873, "step": 6261} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 6261} {"info/global_step": 6262, "train_info/time_within_train_step": 2.641334295272827, "step": 6262} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 6262} {"info/global_step": 6263, "train_info/time_within_train_step": 2.654484748840332, "step": 6263} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 6263} {"info/global_step": 6264, "train_info/time_within_train_step": 2.649841070175171, "step": 6264} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 6264} {"info/global_step": 6265, "train_info/time_within_train_step": 2.6494946479797363, "step": 6265} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 6265} {"info/global_step": 6266, "train_info/time_within_train_step": 2.6483123302459717, "step": 6266} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 6266} {"info/global_step": 6267, "train_info/time_within_train_step": 2.6442062854766846, "step": 6267} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 6267} {"info/global_step": 6268, "train_info/time_within_train_step": 2.6658339500427246, "step": 6268} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 6268} {"info/global_step": 6269, "train_info/time_within_train_step": 2.666609525680542, "step": 6269} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 6269} {"info/global_step": 6270, "train_info/time_within_train_step": 2.688943386077881, "step": 6270} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 6270} {"info/global_step": 6271, "train_info/time_within_train_step": 2.6486942768096924, "step": 6271} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 6271} {"info/global_step": 6272, "train_info/time_within_train_step": 2.6420538425445557, "step": 6272} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 6272} {"info/global_step": 6273, "train_info/time_within_train_step": 2.656680107116699, "step": 6273} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 6273} {"info/global_step": 6274, "train_info/time_within_train_step": 2.652043104171753, "step": 6274} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 6274} {"info/global_step": 6275, "train_info/time_within_train_step": 2.644817352294922, "step": 6275} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 6275} {"info/global_step": 6276, "train_info/time_within_train_step": 2.643897294998169, "step": 6276} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 6276} {"info/global_step": 6277, "train_info/time_within_train_step": 2.651639223098755, "step": 6277} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 6277} {"info/global_step": 6278, "train_info/time_within_train_step": 2.6697723865509033, "step": 6278} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 6278} {"info/global_step": 6279, "train_info/time_within_train_step": 2.6879658699035645, "step": 6279} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 6279} {"info/global_step": 6280, "train_info/time_within_train_step": 2.6490426063537598, "step": 6280} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 6280} {"info/global_step": 6281, "train_info/time_within_train_step": 2.6834263801574707, "step": 6281} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 6281} {"info/global_step": 6282, "train_info/time_within_train_step": 2.6467678546905518, "step": 6282} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 6282} {"info/global_step": 6283, "train_info/time_within_train_step": 2.6470394134521484, "step": 6283} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 6283} {"info/global_step": 6284, "train_info/time_within_train_step": 2.6690728664398193, "step": 6284} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 6284} {"info/global_step": 6285, "train_info/time_within_train_step": 2.6461055278778076, "step": 6285} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 6285} {"info/global_step": 6286, "train_info/time_within_train_step": 2.6446568965911865, "step": 6286} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 6286} {"info/global_step": 6287, "train_info/time_within_train_step": 2.6622865200042725, "step": 6287} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 6287} {"info/global_step": 6288, "train_info/time_within_train_step": 2.66007661819458, "step": 6288} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 6288} {"info/global_step": 6289, "train_info/time_within_train_step": 2.6533315181732178, "step": 6289} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 6289} {"info/global_step": 6290, "train_info/time_within_train_step": 2.661311626434326, "step": 6290} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 6290} {"info/global_step": 6291, "train_info/time_within_train_step": 2.65264892578125, "step": 6291} {"train_info/time_between_train_steps": 0.12988972663879395, "step": 6291} {"info/global_step": 6292, "train_info/time_within_train_step": 2.6462695598602295, "step": 6292} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 6292} {"info/global_step": 6293, "train_info/time_within_train_step": 2.6458187103271484, "step": 6293} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 6293} {"info/global_step": 6294, "train_info/time_within_train_step": 2.6525652408599854, "step": 6294} {"train_info/time_between_train_steps": 0.003311634063720703, "step": 6294} {"info/global_step": 6295, "train_info/time_within_train_step": 2.653456449508667, "step": 6295} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 6295} {"info/global_step": 6296, "train_info/time_within_train_step": 2.6622164249420166, "step": 6296} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 6296} {"info/global_step": 6297, "train_info/time_within_train_step": 2.6817574501037598, "step": 6297} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 6297} {"info/global_step": 6298, "train_info/time_within_train_step": 2.7271082401275635, "step": 6298} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 6298} {"info/global_step": 6299, "train_info/time_within_train_step": 2.650520086288452, "step": 6299} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 6299} {"info/global_step": 6300, "train_info/time_within_train_step": 2.640742540359497, "step": 6300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746915088, "_runtime": 17686}, "step": 6300} {"logs": {"train/loss": 3.3865, "train/learning_rate": 0.0002466666666666666, "train/epoch": 7.03, "_timestamp": 1746915088, "_runtime": 17686}, "step": 6300} {"train_info/time_between_train_steps": 0.024497270584106445, "step": 6300} {"info/global_step": 6301, "train_info/time_within_train_step": 2.6414294242858887, "step": 6301} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 6301} {"info/global_step": 6302, "train_info/time_within_train_step": 2.6550559997558594, "step": 6302} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 6302} {"info/global_step": 6303, "train_info/time_within_train_step": 2.6605381965637207, "step": 6303} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 6303} {"info/global_step": 6304, "train_info/time_within_train_step": 2.6444501876831055, "step": 6304} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 6304} {"info/global_step": 6305, "train_info/time_within_train_step": 2.6526331901550293, "step": 6305} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 6305} {"info/global_step": 6306, "train_info/time_within_train_step": 2.65144419670105, "step": 6306} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 6306} {"info/global_step": 6307, "train_info/time_within_train_step": 2.6689612865448, "step": 6307} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 6307} {"info/global_step": 6308, "train_info/time_within_train_step": 2.710176467895508, "step": 6308} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 6308} {"info/global_step": 6309, "train_info/time_within_train_step": 2.6428630352020264, "step": 6309} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 6309} {"info/global_step": 6310, "train_info/time_within_train_step": 2.6474642753601074, "step": 6310} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 6310} {"info/global_step": 6311, "train_info/time_within_train_step": 2.6598172187805176, "step": 6311} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 6311} {"info/global_step": 6312, "train_info/time_within_train_step": 2.6432979106903076, "step": 6312} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 6312} {"info/global_step": 6313, "train_info/time_within_train_step": 2.6445889472961426, "step": 6313} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 6313} {"info/global_step": 6314, "train_info/time_within_train_step": 2.666822910308838, "step": 6314} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 6314} {"info/global_step": 6315, "train_info/time_within_train_step": 2.6659786701202393, "step": 6315} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 6315} {"info/global_step": 6316, "train_info/time_within_train_step": 2.6873271465301514, "step": 6316} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 6316} {"info/global_step": 6317, "train_info/time_within_train_step": 2.655942440032959, "step": 6317} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 6317} {"info/global_step": 6318, "train_info/time_within_train_step": 2.6650872230529785, "step": 6318} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 6318} {"info/global_step": 6319, "train_info/time_within_train_step": 2.6464366912841797, "step": 6319} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 6319} {"info/global_step": 6320, "train_info/time_within_train_step": 2.6434617042541504, "step": 6320} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 6320} {"info/global_step": 6321, "train_info/time_within_train_step": 2.657650947570801, "step": 6321} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 6321} {"info/global_step": 6322, "train_info/time_within_train_step": 2.6617746353149414, "step": 6322} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 6322} {"info/global_step": 6323, "train_info/time_within_train_step": 2.6433956623077393, "step": 6323} {"train_info/time_between_train_steps": 0.003247976303100586, "step": 6323} {"info/global_step": 6324, "train_info/time_within_train_step": 2.663675546646118, "step": 6324} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 6324} {"info/global_step": 6325, "train_info/time_within_train_step": 2.661104917526245, "step": 6325} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 6325} {"info/global_step": 6326, "train_info/time_within_train_step": 2.673938512802124, "step": 6326} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 6326} {"info/global_step": 6327, "train_info/time_within_train_step": 2.673574447631836, "step": 6327} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 6327} {"info/global_step": 6328, "train_info/time_within_train_step": 2.676471471786499, "step": 6328} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 6328} {"info/global_step": 6329, "train_info/time_within_train_step": 2.641679286956787, "step": 6329} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 6329} {"info/global_step": 6330, "train_info/time_within_train_step": 2.6410775184631348, "step": 6330} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 6330} {"info/global_step": 6331, "train_info/time_within_train_step": 2.657012939453125, "step": 6331} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 6331} {"info/global_step": 6332, "train_info/time_within_train_step": 2.6531758308410645, "step": 6332} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 6332} {"info/global_step": 6333, "train_info/time_within_train_step": 2.645580768585205, "step": 6333} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 6333} {"info/global_step": 6334, "train_info/time_within_train_step": 2.662193775177002, "step": 6334} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 6334} {"info/global_step": 6335, "train_info/time_within_train_step": 2.658581495285034, "step": 6335} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 6335} {"info/global_step": 6336, "train_info/time_within_train_step": 2.660360336303711, "step": 6336} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 6336} {"info/global_step": 6337, "train_info/time_within_train_step": 2.70424222946167, "step": 6337} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 6337} {"info/global_step": 6338, "train_info/time_within_train_step": 2.706256628036499, "step": 6338} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 6338} {"info/global_step": 6339, "train_info/time_within_train_step": 2.641671657562256, "step": 6339} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 6339} {"info/global_step": 6340, "train_info/time_within_train_step": 2.6412582397460938, "step": 6340} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 6340} {"info/global_step": 6341, "train_info/time_within_train_step": 2.662276268005371, "step": 6341} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 6341} {"info/global_step": 6342, "train_info/time_within_train_step": 2.6513495445251465, "step": 6342} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 6342} {"info/global_step": 6343, "train_info/time_within_train_step": 2.6452858448028564, "step": 6343} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 6343} {"info/global_step": 6344, "train_info/time_within_train_step": 2.649273157119751, "step": 6344} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 6344} {"info/global_step": 6345, "train_info/time_within_train_step": 2.6591691970825195, "step": 6345} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 6345} {"info/global_step": 6346, "train_info/time_within_train_step": 2.66622257232666, "step": 6346} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 6346} {"info/global_step": 6347, "train_info/time_within_train_step": 2.6923365592956543, "step": 6347} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 6347} {"info/global_step": 6348, "train_info/time_within_train_step": 2.6493079662323, "step": 6348} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 6348} {"info/global_step": 6349, "train_info/time_within_train_step": 2.641421318054199, "step": 6349} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 6349} {"info/global_step": 6350, "train_info/time_within_train_step": 2.6568353176116943, "step": 6350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746915223, "_runtime": 17821}, "step": 6350} {"logs": {"train/loss": 3.3772, "train/learning_rate": 0.0002433333333333333, "train/epoch": 7.03, "_timestamp": 1746915223, "_runtime": 17821}, "step": 6350} {"train_info/time_between_train_steps": 0.024462223052978516, "step": 6350} {"info/global_step": 6351, "train_info/time_within_train_step": 2.947370767593384, "step": 6351} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 6351} {"info/global_step": 6352, "train_info/time_within_train_step": 2.6528208255767822, "step": 6352} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 6352} {"info/global_step": 6353, "train_info/time_within_train_step": 2.664860486984253, "step": 6353} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 6353} {"info/global_step": 6354, "train_info/time_within_train_step": 2.7737069129943848, "step": 6354} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 6354} {"info/global_step": 6355, "train_info/time_within_train_step": 2.663850784301758, "step": 6355} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 6355} {"info/global_step": 6356, "train_info/time_within_train_step": 2.6413986682891846, "step": 6356} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 6356} {"info/global_step": 6357, "train_info/time_within_train_step": 2.655176877975464, "step": 6357} {"train_info/time_between_train_steps": 0.003264904022216797, "step": 6357} {"info/global_step": 6358, "train_info/time_within_train_step": 2.6442644596099854, "step": 6358} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 6358} {"info/global_step": 6359, "train_info/time_within_train_step": 2.6456093788146973, "step": 6359} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 6359} {"info/global_step": 6360, "train_info/time_within_train_step": 2.654240131378174, "step": 6360} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 6360} {"info/global_step": 6361, "train_info/time_within_train_step": 2.670351028442383, "step": 6361} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 6361} {"info/global_step": 6362, "train_info/time_within_train_step": 2.6778323650360107, "step": 6362} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 6362} {"info/global_step": 6363, "train_info/time_within_train_step": 2.6530168056488037, "step": 6363} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 6363} {"info/global_step": 6364, "train_info/time_within_train_step": 2.6853888034820557, "step": 6364} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 6364} {"info/global_step": 6365, "train_info/time_within_train_step": 2.6419029235839844, "step": 6365} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 6365} {"info/global_step": 6366, "train_info/time_within_train_step": 2.648019552230835, "step": 6366} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 6366} {"info/global_step": 6367, "train_info/time_within_train_step": 2.6640193462371826, "step": 6367} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 6367} {"info/global_step": 6368, "train_info/time_within_train_step": 2.645296573638916, "step": 6368} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 6368} {"info/global_step": 6369, "train_info/time_within_train_step": 2.6455488204956055, "step": 6369} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 6369} {"info/global_step": 6370, "train_info/time_within_train_step": 2.6574692726135254, "step": 6370} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 6370} {"info/global_step": 6371, "train_info/time_within_train_step": 2.658820629119873, "step": 6371} {"train_info/time_between_train_steps": 0.0033342838287353516, "step": 6371} {"info/global_step": 6372, "train_info/time_within_train_step": 2.675201177597046, "step": 6372} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 6372} {"info/global_step": 6373, "train_info/time_within_train_step": 2.6742935180664062, "step": 6373} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 6373} {"info/global_step": 6374, "train_info/time_within_train_step": 2.641040325164795, "step": 6374} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 6374} {"info/global_step": 6375, "train_info/time_within_train_step": 2.665830373764038, "step": 6375} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 6375} {"info/global_step": 6376, "train_info/time_within_train_step": 2.650728702545166, "step": 6376} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 6376} {"info/global_step": 6377, "train_info/time_within_train_step": 2.6445112228393555, "step": 6377} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 6377} {"info/global_step": 6378, "train_info/time_within_train_step": 2.6611149311065674, "step": 6378} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 6378} {"info/global_step": 6379, "train_info/time_within_train_step": 2.6534602642059326, "step": 6379} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 6379} {"info/global_step": 6380, "train_info/time_within_train_step": 2.6615545749664307, "step": 6380} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 6380} {"info/global_step": 6381, "train_info/time_within_train_step": 2.7094788551330566, "step": 6381} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 6381} {"info/global_step": 6382, "train_info/time_within_train_step": 2.697197437286377, "step": 6382} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 6382} {"info/global_step": 6383, "train_info/time_within_train_step": 2.6414308547973633, "step": 6383} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 6383} {"info/global_step": 6384, "train_info/time_within_train_step": 2.640444040298462, "step": 6384} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 6384} {"info/global_step": 6385, "train_info/time_within_train_step": 2.6545932292938232, "step": 6385} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 6385} {"info/global_step": 6386, "train_info/time_within_train_step": 2.670889377593994, "step": 6386} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 6386} {"info/global_step": 6387, "train_info/time_within_train_step": 2.665235757827759, "step": 6387} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 6387} {"info/global_step": 6388, "train_info/time_within_train_step": 2.651517391204834, "step": 6388} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 6388} {"info/global_step": 6389, "train_info/time_within_train_step": 2.6772549152374268, "step": 6389} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 6389} {"info/global_step": 6390, "train_info/time_within_train_step": 2.6428399085998535, "step": 6390} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 6390} {"info/global_step": 6391, "train_info/time_within_train_step": 2.6539485454559326, "step": 6391} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 6391} {"info/global_step": 6392, "train_info/time_within_train_step": 2.6544852256774902, "step": 6392} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 6392} {"info/global_step": 6393, "train_info/time_within_train_step": 2.6502087116241455, "step": 6393} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 6393} {"info/global_step": 6394, "train_info/time_within_train_step": 2.646334648132324, "step": 6394} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 6394} {"info/global_step": 6395, "train_info/time_within_train_step": 2.670217990875244, "step": 6395} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 6395} {"info/global_step": 6396, "train_info/time_within_train_step": 2.66615891456604, "step": 6396} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 6396} {"info/global_step": 6397, "train_info/time_within_train_step": 2.662311315536499, "step": 6397} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 6397} {"info/global_step": 6398, "train_info/time_within_train_step": 2.6784327030181885, "step": 6398} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 6398} {"info/global_step": 6399, "train_info/time_within_train_step": 2.6421802043914795, "step": 6399} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 6399} {"info/global_step": 6400, "train_info/time_within_train_step": 2.6541497707366943, "step": 6400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746915357, "_runtime": 17955}, "step": 6400} {"logs": {"train/loss": 3.3719, "train/learning_rate": 0.00023999999999999998, "train/epoch": 7.04, "_timestamp": 1746915357, "_runtime": 17955}, "step": 6400} {"train_info/time_between_train_steps": 44.18488907814026, "step": 6400} {"info/global_step": 6401, "train_info/time_within_train_step": 2.4568209648132324, "step": 6401} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 6401} {"info/global_step": 6402, "train_info/time_within_train_step": 2.427816152572632, "step": 6402} {"train_info/time_between_train_steps": 0.003271341323852539, "step": 6402} {"info/global_step": 6403, "train_info/time_within_train_step": 2.490893602371216, "step": 6403} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 6403} {"info/global_step": 6404, "train_info/time_within_train_step": 2.617072343826294, "step": 6404} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 6404} {"info/global_step": 6405, "train_info/time_within_train_step": 2.6352133750915527, "step": 6405} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 6405} {"info/global_step": 6406, "train_info/time_within_train_step": 2.6434755325317383, "step": 6406} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 6406} {"info/global_step": 6407, "train_info/time_within_train_step": 2.6588706970214844, "step": 6407} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 6407} {"info/global_step": 6408, "train_info/time_within_train_step": 2.6428043842315674, "step": 6408} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 6408} {"info/global_step": 6409, "train_info/time_within_train_step": 2.643495559692383, "step": 6409} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 6409} {"info/global_step": 6410, "train_info/time_within_train_step": 2.6689887046813965, "step": 6410} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 6410} {"info/global_step": 6411, "train_info/time_within_train_step": 2.667550802230835, "step": 6411} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 6411} {"info/global_step": 6412, "train_info/time_within_train_step": 2.690563917160034, "step": 6412} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 6412} {"info/global_step": 6413, "train_info/time_within_train_step": 2.654423713684082, "step": 6413} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 6413} {"info/global_step": 6414, "train_info/time_within_train_step": 2.6703763008117676, "step": 6414} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 6414} {"info/global_step": 6415, "train_info/time_within_train_step": 2.643588066101074, "step": 6415} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 6415} {"info/global_step": 6416, "train_info/time_within_train_step": 2.641493797302246, "step": 6416} {"train_info/time_between_train_steps": 0.13425946235656738, "step": 6416} {"info/global_step": 6417, "train_info/time_within_train_step": 2.9728786945343018, "step": 6417} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 6417} {"info/global_step": 6418, "train_info/time_within_train_step": 2.667694330215454, "step": 6418} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 6418} {"info/global_step": 6419, "train_info/time_within_train_step": 2.66330885887146, "step": 6419} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 6419} {"info/global_step": 6420, "train_info/time_within_train_step": 2.6812691688537598, "step": 6420} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 6420} {"info/global_step": 6421, "train_info/time_within_train_step": 2.650444269180298, "step": 6421} {"train_info/time_between_train_steps": 0.006576061248779297, "step": 6421} {"info/global_step": 6422, "train_info/time_within_train_step": 2.654369592666626, "step": 6422} {"train_info/time_between_train_steps": 0.006497621536254883, "step": 6422} {"info/global_step": 6423, "train_info/time_within_train_step": 2.6508285999298096, "step": 6423} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 6423} {"info/global_step": 6424, "train_info/time_within_train_step": 2.647557020187378, "step": 6424} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 6424} {"info/global_step": 6425, "train_info/time_within_train_step": 2.667572498321533, "step": 6425} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 6425} {"info/global_step": 6426, "train_info/time_within_train_step": 2.662341356277466, "step": 6426} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 6426} {"info/global_step": 6427, "train_info/time_within_train_step": 2.657259941101074, "step": 6427} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 6427} {"info/global_step": 6428, "train_info/time_within_train_step": 2.710066556930542, "step": 6428} {"train_info/time_between_train_steps": 0.003263235092163086, "step": 6428} {"info/global_step": 6429, "train_info/time_within_train_step": 2.648254632949829, "step": 6429} {"train_info/time_between_train_steps": 0.003173828125, "step": 6429} {"info/global_step": 6430, "train_info/time_within_train_step": 2.641488790512085, "step": 6430} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 6430} {"info/global_step": 6431, "train_info/time_within_train_step": 2.6563808917999268, "step": 6431} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 6431} {"info/global_step": 6432, "train_info/time_within_train_step": 2.6529958248138428, "step": 6432} {"train_info/time_between_train_steps": 0.003431081771850586, "step": 6432} {"info/global_step": 6433, "train_info/time_within_train_step": 2.6398258209228516, "step": 6433} {"train_info/time_between_train_steps": 0.003504037857055664, "step": 6433} {"info/global_step": 6434, "train_info/time_within_train_step": 2.6428885459899902, "step": 6434} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 6434} {"info/global_step": 6435, "train_info/time_within_train_step": 2.6429619789123535, "step": 6435} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 6435} {"info/global_step": 6436, "train_info/time_within_train_step": 2.641068935394287, "step": 6436} {"train_info/time_between_train_steps": 0.0034928321838378906, "step": 6436} {"info/global_step": 6437, "train_info/time_within_train_step": 2.645070791244507, "step": 6437} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 6437} {"info/global_step": 6438, "train_info/time_within_train_step": 2.639681816101074, "step": 6438} {"train_info/time_between_train_steps": 0.0035316944122314453, "step": 6438} {"info/global_step": 6439, "train_info/time_within_train_step": 2.5965065956115723, "step": 6439} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 6439} {"info/global_step": 6440, "train_info/time_within_train_step": 2.5911927223205566, "step": 6440} {"train_info/time_between_train_steps": 0.003509521484375, "step": 6440} {"info/global_step": 6441, "train_info/time_within_train_step": 3.2491488456726074, "step": 6441} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 6441} {"info/global_step": 6442, "train_info/time_within_train_step": 2.5923407077789307, "step": 6442} {"train_info/time_between_train_steps": 0.003323793411254883, "step": 6442} {"info/global_step": 6443, "train_info/time_within_train_step": 2.5858840942382812, "step": 6443} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 6443} {"info/global_step": 6444, "train_info/time_within_train_step": 2.6268725395202637, "step": 6444} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 6444} {"info/global_step": 6445, "train_info/time_within_train_step": 2.631504535675049, "step": 6445} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 6445} {"info/global_step": 6446, "train_info/time_within_train_step": 2.623378276824951, "step": 6446} {"train_info/time_between_train_steps": 0.0032749176025390625, "step": 6446} {"info/global_step": 6447, "train_info/time_within_train_step": 2.6911442279815674, "step": 6447} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 6447} {"info/global_step": 6448, "train_info/time_within_train_step": 2.649026393890381, "step": 6448} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 6448} {"info/global_step": 6449, "train_info/time_within_train_step": 2.6519405841827393, "step": 6449} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 6449} {"info/global_step": 6450, "train_info/time_within_train_step": 2.639261245727539, "step": 6450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746915547, "_runtime": 18145}, "step": 6450} {"logs": {"train/loss": 3.3564, "train/learning_rate": 0.00023666666666666663, "train/epoch": 7.04, "_timestamp": 1746915547, "_runtime": 18145}, "step": 6450} {"train_info/time_between_train_steps": 0.02496170997619629, "step": 6450} {"info/global_step": 6451, "train_info/time_within_train_step": 2.706394672393799, "step": 6451} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 6451} {"info/global_step": 6452, "train_info/time_within_train_step": 2.684007406234741, "step": 6452} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 6452} {"info/global_step": 6453, "train_info/time_within_train_step": 2.6508214473724365, "step": 6453} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 6453} {"info/global_step": 6454, "train_info/time_within_train_step": 2.671996593475342, "step": 6454} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 6454} {"info/global_step": 6455, "train_info/time_within_train_step": 2.6408205032348633, "step": 6455} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 6455} {"info/global_step": 6456, "train_info/time_within_train_step": 2.6439080238342285, "step": 6456} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 6456} {"info/global_step": 6457, "train_info/time_within_train_step": 2.6607534885406494, "step": 6457} {"train_info/time_between_train_steps": 0.003288745880126953, "step": 6457} {"info/global_step": 6458, "train_info/time_within_train_step": 2.647536277770996, "step": 6458} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 6458} {"info/global_step": 6459, "train_info/time_within_train_step": 2.646575689315796, "step": 6459} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 6459} {"info/global_step": 6460, "train_info/time_within_train_step": 2.6642539501190186, "step": 6460} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 6460} {"info/global_step": 6461, "train_info/time_within_train_step": 2.6629927158355713, "step": 6461} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 6461} {"info/global_step": 6462, "train_info/time_within_train_step": 2.6594901084899902, "step": 6462} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 6462} {"info/global_step": 6463, "train_info/time_within_train_step": 2.7069926261901855, "step": 6463} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 6463} {"info/global_step": 6464, "train_info/time_within_train_step": 2.6444666385650635, "step": 6464} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 6464} {"info/global_step": 6465, "train_info/time_within_train_step": 2.6476588249206543, "step": 6465} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 6465} {"info/global_step": 6466, "train_info/time_within_train_step": 2.6610267162323, "step": 6466} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 6466} {"info/global_step": 6467, "train_info/time_within_train_step": 2.6450066566467285, "step": 6467} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 6467} {"info/global_step": 6468, "train_info/time_within_train_step": 2.644766092300415, "step": 6468} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 6468} {"info/global_step": 6469, "train_info/time_within_train_step": 2.6529266834259033, "step": 6469} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 6469} {"info/global_step": 6470, "train_info/time_within_train_step": 2.6536619663238525, "step": 6470} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 6470} {"info/global_step": 6471, "train_info/time_within_train_step": 2.661065101623535, "step": 6471} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 6471} {"info/global_step": 6472, "train_info/time_within_train_step": 2.6916239261627197, "step": 6472} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 6472} {"info/global_step": 6473, "train_info/time_within_train_step": 2.716783285140991, "step": 6473} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 6473} {"info/global_step": 6474, "train_info/time_within_train_step": 2.642849922180176, "step": 6474} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 6474} {"info/global_step": 6475, "train_info/time_within_train_step": 2.6423983573913574, "step": 6475} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 6475} {"info/global_step": 6476, "train_info/time_within_train_step": 2.6645474433898926, "step": 6476} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 6476} {"info/global_step": 6477, "train_info/time_within_train_step": 2.9768142700195312, "step": 6477} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 6477} {"info/global_step": 6478, "train_info/time_within_train_step": 2.6504950523376465, "step": 6478} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 6478} {"info/global_step": 6479, "train_info/time_within_train_step": 2.8258113861083984, "step": 6479} {"train_info/time_between_train_steps": 0.003239870071411133, "step": 6479} {"info/global_step": 6480, "train_info/time_within_train_step": 2.691787004470825, "step": 6480} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 6480} {"info/global_step": 6481, "train_info/time_within_train_step": 2.641613483428955, "step": 6481} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 6481} {"info/global_step": 6482, "train_info/time_within_train_step": 2.6435391902923584, "step": 6482} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 6482} {"info/global_step": 6483, "train_info/time_within_train_step": 2.656214714050293, "step": 6483} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 6483} {"info/global_step": 6484, "train_info/time_within_train_step": 2.657627582550049, "step": 6484} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 6484} {"info/global_step": 6485, "train_info/time_within_train_step": 2.6456735134124756, "step": 6485} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 6485} {"info/global_step": 6486, "train_info/time_within_train_step": 2.651762008666992, "step": 6486} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 6486} {"info/global_step": 6487, "train_info/time_within_train_step": 2.658032178878784, "step": 6487} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 6487} {"info/global_step": 6488, "train_info/time_within_train_step": 2.6653151512145996, "step": 6488} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 6488} {"info/global_step": 6489, "train_info/time_within_train_step": 2.6485090255737305, "step": 6489} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 6489} {"info/global_step": 6490, "train_info/time_within_train_step": 2.6590843200683594, "step": 6490} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 6490} {"info/global_step": 6491, "train_info/time_within_train_step": 2.645064115524292, "step": 6491} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 6491} {"info/global_step": 6492, "train_info/time_within_train_step": 2.6484012603759766, "step": 6492} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 6492} {"info/global_step": 6493, "train_info/time_within_train_step": 2.6734275817871094, "step": 6493} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 6493} {"info/global_step": 6494, "train_info/time_within_train_step": 2.668017625808716, "step": 6494} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 6494} {"info/global_step": 6495, "train_info/time_within_train_step": 2.6772854328155518, "step": 6495} {"train_info/time_between_train_steps": 0.0034630298614501953, "step": 6495} {"info/global_step": 6496, "train_info/time_within_train_step": 2.670508861541748, "step": 6496} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 6496} {"info/global_step": 6497, "train_info/time_within_train_step": 2.6543846130371094, "step": 6497} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 6497} {"info/global_step": 6498, "train_info/time_within_train_step": 2.712019443511963, "step": 6498} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 6498} {"info/global_step": 6499, "train_info/time_within_train_step": 3.277315855026245, "step": 6499} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 6499} {"info/global_step": 6500, "train_info/time_within_train_step": 2.645211935043335, "step": 6500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746915682, "_runtime": 18280}, "step": 6500} {"logs": {"train/loss": 3.3563, "train/learning_rate": 0.0002333333333333333, "train/epoch": 7.05, "_timestamp": 1746915682, "_runtime": 18280}, "step": 6500} {"train_info/time_between_train_steps": 0.024391889572143555, "step": 6500} {"info/global_step": 6501, "train_info/time_within_train_step": 2.6502859592437744, "step": 6501} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 6501} {"info/global_step": 6502, "train_info/time_within_train_step": 2.652010202407837, "step": 6502} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 6502} {"info/global_step": 6503, "train_info/time_within_train_step": 2.681504726409912, "step": 6503} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 6503} {"info/global_step": 6504, "train_info/time_within_train_step": 2.65766978263855, "step": 6504} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 6504} {"info/global_step": 6505, "train_info/time_within_train_step": 2.6647517681121826, "step": 6505} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 6505} {"info/global_step": 6506, "train_info/time_within_train_step": 2.7011256217956543, "step": 6506} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 6506} {"info/global_step": 6507, "train_info/time_within_train_step": 2.6811447143554688, "step": 6507} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 6507} {"info/global_step": 6508, "train_info/time_within_train_step": 2.6433141231536865, "step": 6508} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 6508} {"info/global_step": 6509, "train_info/time_within_train_step": 2.643176794052124, "step": 6509} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 6509} {"info/global_step": 6510, "train_info/time_within_train_step": 2.66097354888916, "step": 6510} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 6510} {"info/global_step": 6511, "train_info/time_within_train_step": 2.6555349826812744, "step": 6511} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 6511} {"info/global_step": 6512, "train_info/time_within_train_step": 2.645632028579712, "step": 6512} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 6512} {"info/global_step": 6513, "train_info/time_within_train_step": 2.6602799892425537, "step": 6513} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 6513} {"info/global_step": 6514, "train_info/time_within_train_step": 2.657689332962036, "step": 6514} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 6514} {"info/global_step": 6515, "train_info/time_within_train_step": 2.66275954246521, "step": 6515} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 6515} {"info/global_step": 6516, "train_info/time_within_train_step": 2.6658027172088623, "step": 6516} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 6516} {"info/global_step": 6517, "train_info/time_within_train_step": 2.6457602977752686, "step": 6517} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 6517} {"info/global_step": 6518, "train_info/time_within_train_step": 2.650942325592041, "step": 6518} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 6518} {"info/global_step": 6519, "train_info/time_within_train_step": 2.654496669769287, "step": 6519} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 6519} {"info/global_step": 6520, "train_info/time_within_train_step": 2.9194540977478027, "step": 6520} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 6520} {"info/global_step": 6521, "train_info/time_within_train_step": 2.643171548843384, "step": 6521} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 6521} {"info/global_step": 6522, "train_info/time_within_train_step": 2.657184362411499, "step": 6522} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 6522} {"info/global_step": 6523, "train_info/time_within_train_step": 2.651907205581665, "step": 6523} {"train_info/time_between_train_steps": 0.006243705749511719, "step": 6523} {"info/global_step": 6524, "train_info/time_within_train_step": 2.6552011966705322, "step": 6524} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 6524} {"info/global_step": 6525, "train_info/time_within_train_step": 2.646481990814209, "step": 6525} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 6525} {"info/global_step": 6526, "train_info/time_within_train_step": 2.6485037803649902, "step": 6526} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 6526} {"info/global_step": 6527, "train_info/time_within_train_step": 2.665417432785034, "step": 6527} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 6527} {"info/global_step": 6528, "train_info/time_within_train_step": 2.666625499725342, "step": 6528} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 6528} {"info/global_step": 6529, "train_info/time_within_train_step": 2.681652784347534, "step": 6529} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 6529} {"info/global_step": 6530, "train_info/time_within_train_step": 2.6569175720214844, "step": 6530} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 6530} {"info/global_step": 6531, "train_info/time_within_train_step": 2.6409530639648438, "step": 6531} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 6531} {"info/global_step": 6532, "train_info/time_within_train_step": 2.660734176635742, "step": 6532} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 6532} {"info/global_step": 6533, "train_info/time_within_train_step": 2.655005931854248, "step": 6533} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 6533} {"info/global_step": 6534, "train_info/time_within_train_step": 2.648716688156128, "step": 6534} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 6534} {"info/global_step": 6535, "train_info/time_within_train_step": 2.6458709239959717, "step": 6535} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 6535} {"info/global_step": 6536, "train_info/time_within_train_step": 2.64943790435791, "step": 6536} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 6536} {"info/global_step": 6537, "train_info/time_within_train_step": 2.6731293201446533, "step": 6537} {"train_info/time_between_train_steps": 0.00324249267578125, "step": 6537} {"info/global_step": 6538, "train_info/time_within_train_step": 2.6680335998535156, "step": 6538} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 6538} {"info/global_step": 6539, "train_info/time_within_train_step": 2.663494348526001, "step": 6539} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 6539} {"info/global_step": 6540, "train_info/time_within_train_step": 2.682063102722168, "step": 6540} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 6540} {"info/global_step": 6541, "train_info/time_within_train_step": 2.6440036296844482, "step": 6541} {"train_info/time_between_train_steps": 0.11495637893676758, "step": 6541} {"info/global_step": 6542, "train_info/time_within_train_step": 2.689366102218628, "step": 6542} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 6542} {"info/global_step": 6543, "train_info/time_within_train_step": 2.6421687602996826, "step": 6543} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 6543} {"info/global_step": 6544, "train_info/time_within_train_step": 2.6526665687561035, "step": 6544} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 6544} {"info/global_step": 6545, "train_info/time_within_train_step": 2.6638295650482178, "step": 6545} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 6545} {"info/global_step": 6546, "train_info/time_within_train_step": 2.6466562747955322, "step": 6546} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 6546} {"info/global_step": 6547, "train_info/time_within_train_step": 2.645160675048828, "step": 6547} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 6547} {"info/global_step": 6548, "train_info/time_within_train_step": 2.662631034851074, "step": 6548} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 6548} {"info/global_step": 6549, "train_info/time_within_train_step": 2.669553518295288, "step": 6549} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 6549} {"info/global_step": 6550, "train_info/time_within_train_step": 2.6615896224975586, "step": 6550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746915816, "_runtime": 18414}, "step": 6550} {"logs": {"train/loss": 3.3405, "train/learning_rate": 0.00023, "train/epoch": 7.05, "_timestamp": 1746915816, "_runtime": 18414}, "step": 6550} {"train_info/time_between_train_steps": 0.024750232696533203, "step": 6550} {"info/global_step": 6551, "train_info/time_within_train_step": 2.679696559906006, "step": 6551} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 6551} {"info/global_step": 6552, "train_info/time_within_train_step": 2.692119836807251, "step": 6552} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 6552} {"info/global_step": 6553, "train_info/time_within_train_step": 2.644120216369629, "step": 6553} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 6553} {"info/global_step": 6554, "train_info/time_within_train_step": 2.642622947692871, "step": 6554} {"train_info/time_between_train_steps": 0.003264904022216797, "step": 6554} {"info/global_step": 6555, "train_info/time_within_train_step": 2.667149305343628, "step": 6555} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 6555} {"info/global_step": 6556, "train_info/time_within_train_step": 2.6489384174346924, "step": 6556} {"train_info/time_between_train_steps": 0.003247976303100586, "step": 6556} {"info/global_step": 6557, "train_info/time_within_train_step": 2.6457009315490723, "step": 6557} {"train_info/time_between_train_steps": 0.0036139488220214844, "step": 6557} {"info/global_step": 6558, "train_info/time_within_train_step": 2.660409927368164, "step": 6558} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 6558} {"info/global_step": 6559, "train_info/time_within_train_step": 2.654050827026367, "step": 6559} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 6559} {"info/global_step": 6560, "train_info/time_within_train_step": 2.661543846130371, "step": 6560} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 6560} {"info/global_step": 6561, "train_info/time_within_train_step": 2.7032904624938965, "step": 6561} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 6561} {"info/global_step": 6562, "train_info/time_within_train_step": 2.7146987915039062, "step": 6562} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 6562} {"info/global_step": 6563, "train_info/time_within_train_step": 2.642733097076416, "step": 6563} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 6563} {"info/global_step": 6564, "train_info/time_within_train_step": 2.6408040523529053, "step": 6564} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 6564} {"info/global_step": 6565, "train_info/time_within_train_step": 2.6627748012542725, "step": 6565} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 6565} {"info/global_step": 6566, "train_info/time_within_train_step": 2.6499576568603516, "step": 6566} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 6566} {"info/global_step": 6567, "train_info/time_within_train_step": 2.6443467140197754, "step": 6567} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 6567} {"info/global_step": 6568, "train_info/time_within_train_step": 2.666611909866333, "step": 6568} {"train_info/time_between_train_steps": 0.003384113311767578, "step": 6568} {"info/global_step": 6569, "train_info/time_within_train_step": 2.6721198558807373, "step": 6569} {"train_info/time_between_train_steps": 0.0033147335052490234, "step": 6569} {"info/global_step": 6570, "train_info/time_within_train_step": 2.69415283203125, "step": 6570} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 6570} {"info/global_step": 6571, "train_info/time_within_train_step": 2.670182228088379, "step": 6571} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 6571} {"info/global_step": 6572, "train_info/time_within_train_step": 2.660555124282837, "step": 6572} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 6572} {"info/global_step": 6573, "train_info/time_within_train_step": 2.641503095626831, "step": 6573} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 6573} {"info/global_step": 6574, "train_info/time_within_train_step": 2.6549296379089355, "step": 6574} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 6574} {"info/global_step": 6575, "train_info/time_within_train_step": 2.657106399536133, "step": 6575} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 6575} {"info/global_step": 6576, "train_info/time_within_train_step": 2.6458194255828857, "step": 6576} {"train_info/time_between_train_steps": 0.0033059120178222656, "step": 6576} {"info/global_step": 6577, "train_info/time_within_train_step": 2.646897315979004, "step": 6577} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 6577} {"info/global_step": 6578, "train_info/time_within_train_step": 2.65691876411438, "step": 6578} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 6578} {"info/global_step": 6579, "train_info/time_within_train_step": 2.67036509513855, "step": 6579} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 6579} {"info/global_step": 6580, "train_info/time_within_train_step": 2.6782426834106445, "step": 6580} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 6580} {"info/global_step": 6581, "train_info/time_within_train_step": 2.653791666030884, "step": 6581} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 6581} {"info/global_step": 6582, "train_info/time_within_train_step": 2.687819480895996, "step": 6582} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 6582} {"info/global_step": 6583, "train_info/time_within_train_step": 2.6419451236724854, "step": 6583} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 6583} {"info/global_step": 6584, "train_info/time_within_train_step": 2.649585008621216, "step": 6584} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 6584} {"info/global_step": 6585, "train_info/time_within_train_step": 2.66186261177063, "step": 6585} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 6585} {"info/global_step": 6586, "train_info/time_within_train_step": 2.6704750061035156, "step": 6586} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 6586} {"info/global_step": 6587, "train_info/time_within_train_step": 2.677227258682251, "step": 6587} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 6587} {"info/global_step": 6588, "train_info/time_within_train_step": 2.669099807739258, "step": 6588} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 6588} {"info/global_step": 6589, "train_info/time_within_train_step": 2.6450531482696533, "step": 6589} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 6589} {"info/global_step": 6590, "train_info/time_within_train_step": 2.6438043117523193, "step": 6590} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 6590} {"info/global_step": 6591, "train_info/time_within_train_step": 2.656266450881958, "step": 6591} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 6591} {"info/global_step": 6592, "train_info/time_within_train_step": 2.678978204727173, "step": 6592} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 6592} {"info/global_step": 6593, "train_info/time_within_train_step": 2.6452016830444336, "step": 6593} {"train_info/time_between_train_steps": 0.002992391586303711, "step": 6593} {"info/global_step": 6594, "train_info/time_within_train_step": 2.657877206802368, "step": 6594} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 6594} {"info/global_step": 6595, "train_info/time_within_train_step": 2.651115894317627, "step": 6595} {"train_info/time_between_train_steps": 0.0029654502868652344, "step": 6595} {"info/global_step": 6596, "train_info/time_within_train_step": 2.660043954849243, "step": 6596} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 6596} {"info/global_step": 6597, "train_info/time_within_train_step": 2.7062714099884033, "step": 6597} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 6597} {"info/global_step": 6598, "train_info/time_within_train_step": 2.6957590579986572, "step": 6598} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 6598} {"info/global_step": 6599, "train_info/time_within_train_step": 2.6413090229034424, "step": 6599} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 6599} {"info/global_step": 6600, "train_info/time_within_train_step": 2.6568892002105713, "step": 6600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746915951, "_runtime": 18549}, "step": 6600} {"logs": {"train/loss": 3.3352, "train/learning_rate": 0.00022666666666666663, "train/epoch": 7.06, "_timestamp": 1746915951, "_runtime": 18549}, "step": 6600} {"train_info/time_between_train_steps": 19.09940505027771, "step": 6600} {"info/global_step": 6601, "train_info/time_within_train_step": 2.441505193710327, "step": 6601} {"train_info/time_between_train_steps": 0.0028917789459228516, "step": 6601} {"info/global_step": 6602, "train_info/time_within_train_step": 2.424328327178955, "step": 6602} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 6602} {"info/global_step": 6603, "train_info/time_within_train_step": 2.562040090560913, "step": 6603} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 6603} {"info/global_step": 6604, "train_info/time_within_train_step": 2.635901689529419, "step": 6604} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 6604} {"info/global_step": 6605, "train_info/time_within_train_step": 2.6533029079437256, "step": 6605} {"train_info/time_between_train_steps": 0.0028829574584960938, "step": 6605} {"info/global_step": 6606, "train_info/time_within_train_step": 2.654303550720215, "step": 6606} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 6606} {"info/global_step": 6607, "train_info/time_within_train_step": 2.6435112953186035, "step": 6607} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 6607} {"info/global_step": 6608, "train_info/time_within_train_step": 2.6562886238098145, "step": 6608} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 6608} {"info/global_step": 6609, "train_info/time_within_train_step": 2.6534557342529297, "step": 6609} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 6609} {"info/global_step": 6610, "train_info/time_within_train_step": 2.6714723110198975, "step": 6610} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 6610} {"info/global_step": 6611, "train_info/time_within_train_step": 2.6743075847625732, "step": 6611} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 6611} {"info/global_step": 6612, "train_info/time_within_train_step": 2.6495747566223145, "step": 6612} {"train_info/time_between_train_steps": 0.00287628173828125, "step": 6612} {"info/global_step": 6613, "train_info/time_within_train_step": 2.68807053565979, "step": 6613} {"train_info/time_between_train_steps": 0.0032951831817626953, "step": 6613} {"info/global_step": 6614, "train_info/time_within_train_step": 2.642470121383667, "step": 6614} {"train_info/time_between_train_steps": 0.002908468246459961, "step": 6614} {"info/global_step": 6615, "train_info/time_within_train_step": 2.6506829261779785, "step": 6615} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 6615} {"info/global_step": 6616, "train_info/time_within_train_step": 2.6635284423828125, "step": 6616} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 6616} {"info/global_step": 6617, "train_info/time_within_train_step": 2.643734931945801, "step": 6617} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 6617} {"info/global_step": 6618, "train_info/time_within_train_step": 2.6442513465881348, "step": 6618} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 6618} {"info/global_step": 6619, "train_info/time_within_train_step": 2.6586639881134033, "step": 6619} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 6619} {"info/global_step": 6620, "train_info/time_within_train_step": 2.672088146209717, "step": 6620} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 6620} {"info/global_step": 6621, "train_info/time_within_train_step": 2.67345929145813, "step": 6621} {"train_info/time_between_train_steps": 0.002902984619140625, "step": 6621} {"info/global_step": 6622, "train_info/time_within_train_step": 2.6644740104675293, "step": 6622} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 6622} {"info/global_step": 6623, "train_info/time_within_train_step": 2.7077224254608154, "step": 6623} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 6623} {"info/global_step": 6624, "train_info/time_within_train_step": 2.8819339275360107, "step": 6624} {"train_info/time_between_train_steps": 0.002911806106567383, "step": 6624} {"info/global_step": 6625, "train_info/time_within_train_step": 2.7006773948669434, "step": 6625} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 6625} {"info/global_step": 6626, "train_info/time_within_train_step": 2.655710458755493, "step": 6626} {"train_info/time_between_train_steps": 0.0029604434967041016, "step": 6626} {"info/global_step": 6627, "train_info/time_within_train_step": 2.6473567485809326, "step": 6627} {"train_info/time_between_train_steps": 0.0028638839721679688, "step": 6627} {"info/global_step": 6628, "train_info/time_within_train_step": 2.648581027984619, "step": 6628} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 6628} {"info/global_step": 6629, "train_info/time_within_train_step": 2.650338649749756, "step": 6629} {"train_info/time_between_train_steps": 0.002893686294555664, "step": 6629} {"info/global_step": 6630, "train_info/time_within_train_step": 2.650482654571533, "step": 6630} {"train_info/time_between_train_steps": 0.0028693675994873047, "step": 6630} {"info/global_step": 6631, "train_info/time_within_train_step": 2.6469099521636963, "step": 6631} {"train_info/time_between_train_steps": 0.0028769969940185547, "step": 6631} {"info/global_step": 6632, "train_info/time_within_train_step": 2.6555440425872803, "step": 6632} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 6632} {"info/global_step": 6633, "train_info/time_within_train_step": 2.658179759979248, "step": 6633} {"train_info/time_between_train_steps": 0.002926349639892578, "step": 6633} {"info/global_step": 6634, "train_info/time_within_train_step": 2.672300100326538, "step": 6634} {"train_info/time_between_train_steps": 0.002870798110961914, "step": 6634} {"info/global_step": 6635, "train_info/time_within_train_step": 2.7279744148254395, "step": 6635} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 6635} {"info/global_step": 6636, "train_info/time_within_train_step": 2.661343812942505, "step": 6636} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 6636} {"info/global_step": 6637, "train_info/time_within_train_step": 2.6408145427703857, "step": 6637} {"train_info/time_between_train_steps": 0.0028781890869140625, "step": 6637} {"info/global_step": 6638, "train_info/time_within_train_step": 2.650139331817627, "step": 6638} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 6638} {"info/global_step": 6639, "train_info/time_within_train_step": 2.6565089225769043, "step": 6639} {"train_info/time_between_train_steps": 0.00293731689453125, "step": 6639} {"info/global_step": 6640, "train_info/time_within_train_step": 2.666574001312256, "step": 6640} {"train_info/time_between_train_steps": 0.0029032230377197266, "step": 6640} {"info/global_step": 6641, "train_info/time_within_train_step": 2.7021334171295166, "step": 6641} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 6641} {"info/global_step": 6642, "train_info/time_within_train_step": 2.645871639251709, "step": 6642} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 6642} {"info/global_step": 6643, "train_info/time_within_train_step": 2.6490252017974854, "step": 6643} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 6643} {"info/global_step": 6644, "train_info/time_within_train_step": 2.653879165649414, "step": 6644} {"train_info/time_between_train_steps": 0.002878904342651367, "step": 6644} {"info/global_step": 6645, "train_info/time_within_train_step": 2.6464173793792725, "step": 6645} {"train_info/time_between_train_steps": 0.003084897994995117, "step": 6645} {"info/global_step": 6646, "train_info/time_within_train_step": 2.6452672481536865, "step": 6646} {"train_info/time_between_train_steps": 0.0030181407928466797, "step": 6646} {"info/global_step": 6647, "train_info/time_within_train_step": 2.64546275138855, "step": 6647} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 6647} {"info/global_step": 6648, "train_info/time_within_train_step": 2.646036148071289, "step": 6648} {"train_info/time_between_train_steps": 0.003056764602661133, "step": 6648} {"info/global_step": 6649, "train_info/time_within_train_step": 2.6445090770721436, "step": 6649} {"train_info/time_between_train_steps": 0.002962350845336914, "step": 6649} {"info/global_step": 6650, "train_info/time_within_train_step": 2.6503045558929443, "step": 6650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746916104, "_runtime": 18702}, "step": 6650} {"logs": {"train/loss": 3.3217, "train/learning_rate": 0.00022333333333333333, "train/epoch": 7.06, "_timestamp": 1746916104, "_runtime": 18702}, "step": 6650} {"train_info/time_between_train_steps": 0.023930072784423828, "step": 6650} {"info/global_step": 6651, "train_info/time_within_train_step": 2.6482431888580322, "step": 6651} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 6651} {"info/global_step": 6652, "train_info/time_within_train_step": 2.679647922515869, "step": 6652} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 6652} {"info/global_step": 6653, "train_info/time_within_train_step": 2.673945665359497, "step": 6653} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 6653} {"info/global_step": 6654, "train_info/time_within_train_step": 2.653432607650757, "step": 6654} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 6654} {"info/global_step": 6655, "train_info/time_within_train_step": 2.6604957580566406, "step": 6655} {"train_info/time_between_train_steps": 0.0029540061950683594, "step": 6655} {"info/global_step": 6656, "train_info/time_within_train_step": 2.7131948471069336, "step": 6656} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 6656} {"info/global_step": 6657, "train_info/time_within_train_step": 2.6624624729156494, "step": 6657} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 6657} {"info/global_step": 6658, "train_info/time_within_train_step": 2.640108108520508, "step": 6658} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 6658} {"info/global_step": 6659, "train_info/time_within_train_step": 2.6510074138641357, "step": 6659} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 6659} {"info/global_step": 6660, "train_info/time_within_train_step": 2.647312879562378, "step": 6660} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 6660} {"info/global_step": 6661, "train_info/time_within_train_step": 2.6517317295074463, "step": 6661} {"train_info/time_between_train_steps": 0.002926349639892578, "step": 6661} {"info/global_step": 6662, "train_info/time_within_train_step": 2.645035743713379, "step": 6662} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 6662} {"info/global_step": 6663, "train_info/time_within_train_step": 2.6447267532348633, "step": 6663} {"train_info/time_between_train_steps": 0.002910614013671875, "step": 6663} {"info/global_step": 6664, "train_info/time_within_train_step": 2.6646220684051514, "step": 6664} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 6664} {"info/global_step": 6665, "train_info/time_within_train_step": 2.6641035079956055, "step": 6665} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 6665} {"info/global_step": 6666, "train_info/time_within_train_step": 2.690497636795044, "step": 6666} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 6666} {"info/global_step": 6667, "train_info/time_within_train_step": 2.6492714881896973, "step": 6667} {"train_info/time_between_train_steps": 0.002896547317504883, "step": 6667} {"info/global_step": 6668, "train_info/time_within_train_step": 2.640472650527954, "step": 6668} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 6668} {"info/global_step": 6669, "train_info/time_within_train_step": 2.657742738723755, "step": 6669} {"train_info/time_between_train_steps": 0.0029115676879882812, "step": 6669} {"info/global_step": 6670, "train_info/time_within_train_step": 2.654128313064575, "step": 6670} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 6670} {"info/global_step": 6671, "train_info/time_within_train_step": 2.643437623977661, "step": 6671} {"train_info/time_between_train_steps": 0.0029296875, "step": 6671} {"info/global_step": 6672, "train_info/time_within_train_step": 2.6436777114868164, "step": 6672} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 6672} {"info/global_step": 6673, "train_info/time_within_train_step": 2.658299207687378, "step": 6673} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 6673} {"info/global_step": 6674, "train_info/time_within_train_step": 2.6684372425079346, "step": 6674} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 6674} {"info/global_step": 6675, "train_info/time_within_train_step": 2.6997170448303223, "step": 6675} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 6675} {"info/global_step": 6676, "train_info/time_within_train_step": 2.6532411575317383, "step": 6676} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 6676} {"info/global_step": 6677, "train_info/time_within_train_step": 2.6869044303894043, "step": 6677} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 6677} {"info/global_step": 6678, "train_info/time_within_train_step": 2.641500473022461, "step": 6678} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 6678} {"info/global_step": 6679, "train_info/time_within_train_step": 2.643355131149292, "step": 6679} {"train_info/time_between_train_steps": 0.0028765201568603516, "step": 6679} {"info/global_step": 6680, "train_info/time_within_train_step": 2.664268732070923, "step": 6680} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 6680} {"info/global_step": 6681, "train_info/time_within_train_step": 2.6534347534179688, "step": 6681} {"train_info/time_between_train_steps": 0.002959728240966797, "step": 6681} {"info/global_step": 6682, "train_info/time_within_train_step": 2.642946720123291, "step": 6682} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 6682} {"info/global_step": 6683, "train_info/time_within_train_step": 2.6653919219970703, "step": 6683} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 6683} {"info/global_step": 6684, "train_info/time_within_train_step": 2.659599542617798, "step": 6684} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 6684} {"info/global_step": 6685, "train_info/time_within_train_step": 2.6679465770721436, "step": 6685} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 6685} {"info/global_step": 6686, "train_info/time_within_train_step": 2.6809215545654297, "step": 6686} {"train_info/time_between_train_steps": 0.003093719482421875, "step": 6686} {"info/global_step": 6687, "train_info/time_within_train_step": 2.7069668769836426, "step": 6687} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 6687} {"info/global_step": 6688, "train_info/time_within_train_step": 2.641993522644043, "step": 6688} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 6688} {"info/global_step": 6689, "train_info/time_within_train_step": 2.647414207458496, "step": 6689} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 6689} {"info/global_step": 6690, "train_info/time_within_train_step": 2.8712551593780518, "step": 6690} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 6690} {"info/global_step": 6691, "train_info/time_within_train_step": 2.639808416366577, "step": 6691} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 6691} {"info/global_step": 6692, "train_info/time_within_train_step": 2.6465210914611816, "step": 6692} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 6692} {"info/global_step": 6693, "train_info/time_within_train_step": 2.6634747982025146, "step": 6693} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 6693} {"info/global_step": 6694, "train_info/time_within_train_step": 2.646991014480591, "step": 6694} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 6694} {"info/global_step": 6695, "train_info/time_within_train_step": 2.6443352699279785, "step": 6695} {"train_info/time_between_train_steps": 0.002902984619140625, "step": 6695} {"info/global_step": 6696, "train_info/time_within_train_step": 2.6562068462371826, "step": 6696} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 6696} {"info/global_step": 6697, "train_info/time_within_train_step": 2.6529414653778076, "step": 6697} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 6697} {"info/global_step": 6698, "train_info/time_within_train_step": 2.6599044799804688, "step": 6698} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 6698} {"info/global_step": 6699, "train_info/time_within_train_step": 2.6938953399658203, "step": 6699} {"train_info/time_between_train_steps": 0.0029060840606689453, "step": 6699} {"info/global_step": 6700, "train_info/time_within_train_step": 2.7157230377197266, "step": 6700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746916239, "_runtime": 18837}, "step": 6700} {"logs": {"train/loss": 3.3158, "train/learning_rate": 0.00021999999999999995, "train/epoch": 7.07, "_timestamp": 1746916239, "_runtime": 18837}, "step": 6700} {"train_info/time_between_train_steps": 0.024203062057495117, "step": 6700} {"info/global_step": 6701, "train_info/time_within_train_step": 2.641080856323242, "step": 6701} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 6701} {"info/global_step": 6702, "train_info/time_within_train_step": 2.640378952026367, "step": 6702} {"train_info/time_between_train_steps": 0.002912282943725586, "step": 6702} {"info/global_step": 6703, "train_info/time_within_train_step": 2.6588518619537354, "step": 6703} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 6703} {"info/global_step": 6704, "train_info/time_within_train_step": 2.6562132835388184, "step": 6704} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 6704} {"info/global_step": 6705, "train_info/time_within_train_step": 2.6449928283691406, "step": 6705} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 6705} {"info/global_step": 6706, "train_info/time_within_train_step": 2.6525068283081055, "step": 6706} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 6706} {"info/global_step": 6707, "train_info/time_within_train_step": 2.647310972213745, "step": 6707} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 6707} {"info/global_step": 6708, "train_info/time_within_train_step": 2.668292284011841, "step": 6708} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 6708} {"info/global_step": 6709, "train_info/time_within_train_step": 2.694885492324829, "step": 6709} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 6709} {"info/global_step": 6710, "train_info/time_within_train_step": 2.6630523204803467, "step": 6710} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 6710} {"info/global_step": 6711, "train_info/time_within_train_step": 2.663543939590454, "step": 6711} {"train_info/time_between_train_steps": 0.0029468536376953125, "step": 6711} {"info/global_step": 6712, "train_info/time_within_train_step": 2.640944004058838, "step": 6712} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 6712} {"info/global_step": 6713, "train_info/time_within_train_step": 2.653446674346924, "step": 6713} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 6713} {"info/global_step": 6714, "train_info/time_within_train_step": 2.657299518585205, "step": 6714} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 6714} {"info/global_step": 6715, "train_info/time_within_train_step": 2.6427648067474365, "step": 6715} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 6715} {"info/global_step": 6716, "train_info/time_within_train_step": 2.644246816635132, "step": 6716} {"train_info/time_between_train_steps": 0.0029113292694091797, "step": 6716} {"info/global_step": 6717, "train_info/time_within_train_step": 2.6608386039733887, "step": 6717} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 6717} {"info/global_step": 6718, "train_info/time_within_train_step": 2.66921067237854, "step": 6718} {"train_info/time_between_train_steps": 0.0029227733612060547, "step": 6718} {"info/global_step": 6719, "train_info/time_within_train_step": 2.686321258544922, "step": 6719} {"train_info/time_between_train_steps": 0.002890348434448242, "step": 6719} {"info/global_step": 6720, "train_info/time_within_train_step": 2.6505513191223145, "step": 6720} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 6720} {"info/global_step": 6721, "train_info/time_within_train_step": 2.683148145675659, "step": 6721} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 6721} {"info/global_step": 6722, "train_info/time_within_train_step": 2.6417977809906006, "step": 6722} {"train_info/time_between_train_steps": 0.0029103755950927734, "step": 6722} {"info/global_step": 6723, "train_info/time_within_train_step": 2.657043695449829, "step": 6723} {"train_info/time_between_train_steps": 0.002882719039916992, "step": 6723} {"info/global_step": 6724, "train_info/time_within_train_step": 2.6624608039855957, "step": 6724} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 6724} {"info/global_step": 6725, "train_info/time_within_train_step": 2.642932415008545, "step": 6725} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 6725} {"info/global_step": 6726, "train_info/time_within_train_step": 2.6442673206329346, "step": 6726} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 6726} {"info/global_step": 6727, "train_info/time_within_train_step": 2.654940605163574, "step": 6727} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 6727} {"info/global_step": 6728, "train_info/time_within_train_step": 2.6606335639953613, "step": 6728} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 6728} {"info/global_step": 6729, "train_info/time_within_train_step": 2.6755480766296387, "step": 6729} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 6729} {"info/global_step": 6730, "train_info/time_within_train_step": 2.6664836406707764, "step": 6730} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 6730} {"info/global_step": 6731, "train_info/time_within_train_step": 2.7006869316101074, "step": 6731} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 6731} {"info/global_step": 6732, "train_info/time_within_train_step": 2.641936779022217, "step": 6732} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 6732} {"info/global_step": 6733, "train_info/time_within_train_step": 2.6406619548797607, "step": 6733} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 6733} {"info/global_step": 6734, "train_info/time_within_train_step": 2.6655526161193848, "step": 6734} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 6734} {"info/global_step": 6735, "train_info/time_within_train_step": 2.8050243854522705, "step": 6735} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 6735} {"info/global_step": 6736, "train_info/time_within_train_step": 2.665008068084717, "step": 6736} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 6736} {"info/global_step": 6737, "train_info/time_within_train_step": 2.646864652633667, "step": 6737} {"train_info/time_between_train_steps": 0.0029954910278320312, "step": 6737} {"info/global_step": 6738, "train_info/time_within_train_step": 2.644796371459961, "step": 6738} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 6738} {"info/global_step": 6739, "train_info/time_within_train_step": 2.6546056270599365, "step": 6739} {"train_info/time_between_train_steps": 0.0029458999633789062, "step": 6739} {"info/global_step": 6740, "train_info/time_within_train_step": 2.6523818969726562, "step": 6740} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 6740} {"info/global_step": 6741, "train_info/time_within_train_step": 2.6606853008270264, "step": 6741} {"train_info/time_between_train_steps": 0.002931833267211914, "step": 6741} {"info/global_step": 6742, "train_info/time_within_train_step": 2.6462247371673584, "step": 6742} {"train_info/time_between_train_steps": 0.002927064895629883, "step": 6742} {"info/global_step": 6743, "train_info/time_within_train_step": 2.6550464630126953, "step": 6743} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 6743} {"info/global_step": 6744, "train_info/time_within_train_step": 2.656029224395752, "step": 6744} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 6744} {"info/global_step": 6745, "train_info/time_within_train_step": 2.643226385116577, "step": 6745} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 6745} {"info/global_step": 6746, "train_info/time_within_train_step": 2.6501336097717285, "step": 6746} {"train_info/time_between_train_steps": 0.0028867721557617188, "step": 6746} {"info/global_step": 6747, "train_info/time_within_train_step": 2.6532163619995117, "step": 6747} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 6747} {"info/global_step": 6748, "train_info/time_within_train_step": 2.669048309326172, "step": 6748} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 6748} {"info/global_step": 6749, "train_info/time_within_train_step": 3.2592430114746094, "step": 6749} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 6749} {"info/global_step": 6750, "train_info/time_within_train_step": 2.639559745788574, "step": 6750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746916374, "_runtime": 18972}, "step": 6750} {"logs": {"train/loss": 3.3136, "train/learning_rate": 0.00021666666666666666, "train/epoch": 7.07, "_timestamp": 1746916374, "_runtime": 18972}, "step": 6750} {"train_info/time_between_train_steps": 0.024318456649780273, "step": 6750} {"info/global_step": 6751, "train_info/time_within_train_step": 2.6408917903900146, "step": 6751} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 6751} {"info/global_step": 6752, "train_info/time_within_train_step": 2.646273612976074, "step": 6752} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 6752} {"info/global_step": 6753, "train_info/time_within_train_step": 2.6461997032165527, "step": 6753} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 6753} {"info/global_step": 6754, "train_info/time_within_train_step": 2.6982336044311523, "step": 6754} {"train_info/time_between_train_steps": 0.002921581268310547, "step": 6754} {"info/global_step": 6755, "train_info/time_within_train_step": 2.6449105739593506, "step": 6755} {"train_info/time_between_train_steps": 0.002880573272705078, "step": 6755} {"info/global_step": 6756, "train_info/time_within_train_step": 2.644878625869751, "step": 6756} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 6756} {"info/global_step": 6757, "train_info/time_within_train_step": 2.6513640880584717, "step": 6757} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 6757} {"info/global_step": 6758, "train_info/time_within_train_step": 2.6701414585113525, "step": 6758} {"train_info/time_between_train_steps": 0.002890348434448242, "step": 6758} {"info/global_step": 6759, "train_info/time_within_train_step": 2.6727640628814697, "step": 6759} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 6759} {"info/global_step": 6760, "train_info/time_within_train_step": 2.653214454650879, "step": 6760} {"train_info/time_between_train_steps": 0.002949237823486328, "step": 6760} {"info/global_step": 6761, "train_info/time_within_train_step": 2.6865177154541016, "step": 6761} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 6761} {"info/global_step": 6762, "train_info/time_within_train_step": 2.6395745277404785, "step": 6762} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 6762} {"info/global_step": 6763, "train_info/time_within_train_step": 2.6487526893615723, "step": 6763} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 6763} {"info/global_step": 6764, "train_info/time_within_train_step": 2.6626482009887695, "step": 6764} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 6764} {"info/global_step": 6765, "train_info/time_within_train_step": 2.642503023147583, "step": 6765} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 6765} {"info/global_step": 6766, "train_info/time_within_train_step": 2.6433777809143066, "step": 6766} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 6766} {"info/global_step": 6767, "train_info/time_within_train_step": 2.660932779312134, "step": 6767} {"train_info/time_between_train_steps": 0.002896547317504883, "step": 6767} {"info/global_step": 6768, "train_info/time_within_train_step": 2.6585850715637207, "step": 6768} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 6768} {"info/global_step": 6769, "train_info/time_within_train_step": 2.670093059539795, "step": 6769} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 6769} {"info/global_step": 6770, "train_info/time_within_train_step": 2.6706409454345703, "step": 6770} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 6770} {"info/global_step": 6771, "train_info/time_within_train_step": 2.678335428237915, "step": 6771} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 6771} {"info/global_step": 6772, "train_info/time_within_train_step": 2.640611410140991, "step": 6772} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 6772} {"info/global_step": 6773, "train_info/time_within_train_step": 2.6398355960845947, "step": 6773} {"train_info/time_between_train_steps": 0.002979755401611328, "step": 6773} {"info/global_step": 6774, "train_info/time_within_train_step": 2.6576740741729736, "step": 6774} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 6774} {"info/global_step": 6775, "train_info/time_within_train_step": 2.65285325050354, "step": 6775} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 6775} {"info/global_step": 6776, "train_info/time_within_train_step": 2.6435928344726562, "step": 6776} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 6776} {"info/global_step": 6777, "train_info/time_within_train_step": 2.6599104404449463, "step": 6777} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 6777} {"info/global_step": 6778, "train_info/time_within_train_step": 2.6527349948883057, "step": 6778} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 6778} {"info/global_step": 6779, "train_info/time_within_train_step": 2.6601696014404297, "step": 6779} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 6779} {"info/global_step": 6780, "train_info/time_within_train_step": 2.7054038047790527, "step": 6780} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 6780} {"info/global_step": 6781, "train_info/time_within_train_step": 2.702165126800537, "step": 6781} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 6781} {"info/global_step": 6782, "train_info/time_within_train_step": 2.641596555709839, "step": 6782} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 6782} {"info/global_step": 6783, "train_info/time_within_train_step": 2.640122652053833, "step": 6783} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 6783} {"info/global_step": 6784, "train_info/time_within_train_step": 2.657825469970703, "step": 6784} {"train_info/time_between_train_steps": 0.0029370784759521484, "step": 6784} {"info/global_step": 6785, "train_info/time_within_train_step": 2.6523196697235107, "step": 6785} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 6785} {"info/global_step": 6786, "train_info/time_within_train_step": 2.644270181655884, "step": 6786} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 6786} {"info/global_step": 6787, "train_info/time_within_train_step": 2.652829885482788, "step": 6787} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 6787} {"info/global_step": 6788, "train_info/time_within_train_step": 2.646786689758301, "step": 6788} {"train_info/time_between_train_steps": 0.0030007362365722656, "step": 6788} {"info/global_step": 6789, "train_info/time_within_train_step": 2.6694860458374023, "step": 6789} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 6789} {"info/global_step": 6790, "train_info/time_within_train_step": 2.7027032375335693, "step": 6790} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 6790} {"info/global_step": 6791, "train_info/time_within_train_step": 2.6837387084960938, "step": 6791} {"train_info/time_between_train_steps": 0.002972841262817383, "step": 6791} {"info/global_step": 6792, "train_info/time_within_train_step": 2.652834177017212, "step": 6792} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 6792} {"info/global_step": 6793, "train_info/time_within_train_step": 2.640852212905884, "step": 6793} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 6793} {"info/global_step": 6794, "train_info/time_within_train_step": 2.658552885055542, "step": 6794} {"train_info/time_between_train_steps": 0.003042459487915039, "step": 6794} {"info/global_step": 6795, "train_info/time_within_train_step": 2.654277801513672, "step": 6795} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 6795} {"info/global_step": 6796, "train_info/time_within_train_step": 2.6430606842041016, "step": 6796} {"train_info/time_between_train_steps": 0.0029687881469726562, "step": 6796} {"info/global_step": 6797, "train_info/time_within_train_step": 2.644014358520508, "step": 6797} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 6797} {"info/global_step": 6798, "train_info/time_within_train_step": 2.652773141860962, "step": 6798} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 6798} {"info/global_step": 6799, "train_info/time_within_train_step": 2.709489583969116, "step": 6799} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 6799} {"info/global_step": 6800, "train_info/time_within_train_step": 2.665764570236206, "step": 6800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746916508, "_runtime": 19106}, "step": 6800} {"logs": {"train/loss": 3.2924, "train/learning_rate": 0.00021333333333333333, "train/epoch": 7.08, "_timestamp": 1746916508, "_runtime": 19106}, "step": 6800} {"train_info/time_between_train_steps": 13.679494619369507, "step": 6800} {"info/global_step": 6801, "train_info/time_within_train_step": 2.4497547149658203, "step": 6801} {"train_info/time_between_train_steps": 0.0029113292694091797, "step": 6801} {"info/global_step": 6802, "train_info/time_within_train_step": 2.441774368286133, "step": 6802} {"train_info/time_between_train_steps": 0.0029566287994384766, "step": 6802} {"info/global_step": 6803, "train_info/time_within_train_step": 2.5683984756469727, "step": 6803} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 6803} {"info/global_step": 6804, "train_info/time_within_train_step": 2.67136549949646, "step": 6804} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 6804} {"info/global_step": 6805, "train_info/time_within_train_step": 2.6546525955200195, "step": 6805} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 6805} {"info/global_step": 6806, "train_info/time_within_train_step": 2.639221429824829, "step": 6806} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 6806} {"info/global_step": 6807, "train_info/time_within_train_step": 2.652383327484131, "step": 6807} {"train_info/time_between_train_steps": 0.002886533737182617, "step": 6807} {"info/global_step": 6808, "train_info/time_within_train_step": 2.654810667037964, "step": 6808} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 6808} {"info/global_step": 6809, "train_info/time_within_train_step": 2.644273042678833, "step": 6809} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 6809} {"info/global_step": 6810, "train_info/time_within_train_step": 2.6446754932403564, "step": 6810} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 6810} {"info/global_step": 6811, "train_info/time_within_train_step": 2.6577861309051514, "step": 6811} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 6811} {"info/global_step": 6812, "train_info/time_within_train_step": 2.6686129570007324, "step": 6812} {"train_info/time_between_train_steps": 0.002954721450805664, "step": 6812} {"info/global_step": 6813, "train_info/time_within_train_step": 2.6822309494018555, "step": 6813} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 6813} {"info/global_step": 6814, "train_info/time_within_train_step": 2.6508710384368896, "step": 6814} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 6814} {"info/global_step": 6815, "train_info/time_within_train_step": 2.6849632263183594, "step": 6815} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 6815} {"info/global_step": 6816, "train_info/time_within_train_step": 2.6423094272613525, "step": 6816} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 6816} {"info/global_step": 6817, "train_info/time_within_train_step": 2.6488778591156006, "step": 6817} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 6817} {"info/global_step": 6818, "train_info/time_within_train_step": 2.6658084392547607, "step": 6818} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 6818} {"info/global_step": 6819, "train_info/time_within_train_step": 2.6463329792022705, "step": 6819} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 6819} {"info/global_step": 6820, "train_info/time_within_train_step": 2.6467888355255127, "step": 6820} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 6820} {"info/global_step": 6821, "train_info/time_within_train_step": 2.6561200618743896, "step": 6821} {"train_info/time_between_train_steps": 0.002908468246459961, "step": 6821} {"info/global_step": 6822, "train_info/time_within_train_step": 2.6613404750823975, "step": 6822} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 6822} {"info/global_step": 6823, "train_info/time_within_train_step": 2.6745059490203857, "step": 6823} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 6823} {"info/global_step": 6824, "train_info/time_within_train_step": 2.6619961261749268, "step": 6824} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 6824} {"info/global_step": 6825, "train_info/time_within_train_step": 2.7024011611938477, "step": 6825} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 6825} {"info/global_step": 6826, "train_info/time_within_train_step": 2.6459245681762695, "step": 6826} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 6826} {"info/global_step": 6827, "train_info/time_within_train_step": 2.6442315578460693, "step": 6827} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 6827} {"info/global_step": 6828, "train_info/time_within_train_step": 2.664088487625122, "step": 6828} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 6828} {"info/global_step": 6829, "train_info/time_within_train_step": 2.648150682449341, "step": 6829} {"train_info/time_between_train_steps": 0.006148338317871094, "step": 6829} {"info/global_step": 6830, "train_info/time_within_train_step": 2.653985023498535, "step": 6830} {"train_info/time_between_train_steps": 0.0060536861419677734, "step": 6830} {"info/global_step": 6831, "train_info/time_within_train_step": 2.648165225982666, "step": 6831} {"train_info/time_between_train_steps": 0.006132602691650391, "step": 6831} {"info/global_step": 6832, "train_info/time_within_train_step": 2.655550241470337, "step": 6832} {"train_info/time_between_train_steps": 0.0061187744140625, "step": 6832} {"info/global_step": 6833, "train_info/time_within_train_step": 2.6560356616973877, "step": 6833} {"train_info/time_between_train_steps": 0.0061969757080078125, "step": 6833} {"info/global_step": 6834, "train_info/time_within_train_step": 2.66880464553833, "step": 6834} {"train_info/time_between_train_steps": 0.006090641021728516, "step": 6834} {"info/global_step": 6835, "train_info/time_within_train_step": 2.7251014709472656, "step": 6835} {"train_info/time_between_train_steps": 0.006081581115722656, "step": 6835} {"info/global_step": 6836, "train_info/time_within_train_step": 2.7070908546447754, "step": 6836} {"train_info/time_between_train_steps": 0.006084442138671875, "step": 6836} {"info/global_step": 6837, "train_info/time_within_train_step": 2.64190673828125, "step": 6837} {"train_info/time_between_train_steps": 0.00611567497253418, "step": 6837} {"info/global_step": 6838, "train_info/time_within_train_step": 2.641058921813965, "step": 6838} {"train_info/time_between_train_steps": 0.0061855316162109375, "step": 6838} {"info/global_step": 6839, "train_info/time_within_train_step": 2.6577248573303223, "step": 6839} {"train_info/time_between_train_steps": 0.00607609748840332, "step": 6839} {"info/global_step": 6840, "train_info/time_within_train_step": 2.6536688804626465, "step": 6840} {"train_info/time_between_train_steps": 0.006155967712402344, "step": 6840} {"info/global_step": 6841, "train_info/time_within_train_step": 2.6439592838287354, "step": 6841} {"train_info/time_between_train_steps": 0.006106853485107422, "step": 6841} {"info/global_step": 6842, "train_info/time_within_train_step": 2.651073694229126, "step": 6842} {"train_info/time_between_train_steps": 0.006085395812988281, "step": 6842} {"info/global_step": 6843, "train_info/time_within_train_step": 2.644916534423828, "step": 6843} {"train_info/time_between_train_steps": 0.006064891815185547, "step": 6843} {"info/global_step": 6844, "train_info/time_within_train_step": 2.66981840133667, "step": 6844} {"train_info/time_between_train_steps": 0.006187915802001953, "step": 6844} {"info/global_step": 6845, "train_info/time_within_train_step": 2.672414541244507, "step": 6845} {"train_info/time_between_train_steps": 0.006123781204223633, "step": 6845} {"info/global_step": 6846, "train_info/time_within_train_step": 2.6778266429901123, "step": 6846} {"train_info/time_between_train_steps": 0.0060498714447021484, "step": 6846} {"info/global_step": 6847, "train_info/time_within_train_step": 2.725261688232422, "step": 6847} {"train_info/time_between_train_steps": 0.0060405731201171875, "step": 6847} {"info/global_step": 6848, "train_info/time_within_train_step": 2.6502983570098877, "step": 6848} {"train_info/time_between_train_steps": 0.006125450134277344, "step": 6848} {"info/global_step": 6849, "train_info/time_within_train_step": 2.6464247703552246, "step": 6849} {"train_info/time_between_train_steps": 0.006064891815185547, "step": 6849} {"info/global_step": 6850, "train_info/time_within_train_step": 2.659022808074951, "step": 6850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746916655, "_runtime": 19253}, "step": 6850} {"logs": {"train/loss": 3.2899, "train/learning_rate": 0.00020999999999999998, "train/epoch": 7.08, "_timestamp": 1746916655, "_runtime": 19253}, "step": 6850} {"train_info/time_between_train_steps": 0.2044823169708252, "step": 6850} {"info/global_step": 6851, "train_info/time_within_train_step": 2.646397829055786, "step": 6851} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 6851} {"info/global_step": 6852, "train_info/time_within_train_step": 2.6455368995666504, "step": 6852} {"train_info/time_between_train_steps": 0.003038644790649414, "step": 6852} {"info/global_step": 6853, "train_info/time_within_train_step": 2.646298408508301, "step": 6853} {"train_info/time_between_train_steps": 0.0030670166015625, "step": 6853} {"info/global_step": 6854, "train_info/time_within_train_step": 2.6429574489593506, "step": 6854} {"train_info/time_between_train_steps": 0.006078004837036133, "step": 6854} {"info/global_step": 6855, "train_info/time_within_train_step": 2.6817729473114014, "step": 6855} {"train_info/time_between_train_steps": 0.006157398223876953, "step": 6855} {"info/global_step": 6856, "train_info/time_within_train_step": 2.6434402465820312, "step": 6856} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 6856} {"info/global_step": 6857, "train_info/time_within_train_step": 2.655125379562378, "step": 6857} {"train_info/time_between_train_steps": 0.0030090808868408203, "step": 6857} {"info/global_step": 6858, "train_info/time_within_train_step": 2.640033006668091, "step": 6858} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 6858} {"info/global_step": 6859, "train_info/time_within_train_step": 2.645559787750244, "step": 6859} {"train_info/time_between_train_steps": 0.002931833267211914, "step": 6859} {"info/global_step": 6860, "train_info/time_within_train_step": 2.663936138153076, "step": 6860} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 6860} {"info/global_step": 6861, "train_info/time_within_train_step": 2.683138370513916, "step": 6861} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 6861} {"info/global_step": 6862, "train_info/time_within_train_step": 2.652050018310547, "step": 6862} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 6862} {"info/global_step": 6863, "train_info/time_within_train_step": 2.643477201461792, "step": 6863} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 6863} {"info/global_step": 6864, "train_info/time_within_train_step": 2.6584415435791016, "step": 6864} {"train_info/time_between_train_steps": 0.0029828548431396484, "step": 6864} {"info/global_step": 6865, "train_info/time_within_train_step": 2.650801181793213, "step": 6865} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 6865} {"info/global_step": 6866, "train_info/time_within_train_step": 2.6613850593566895, "step": 6866} {"train_info/time_between_train_steps": 0.0030412673950195312, "step": 6866} {"info/global_step": 6867, "train_info/time_within_train_step": 2.7199625968933105, "step": 6867} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 6867} {"info/global_step": 6868, "train_info/time_within_train_step": 2.676743268966675, "step": 6868} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 6868} {"info/global_step": 6869, "train_info/time_within_train_step": 2.64009428024292, "step": 6869} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 6869} {"info/global_step": 6870, "train_info/time_within_train_step": 2.6431164741516113, "step": 6870} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 6870} {"info/global_step": 6871, "train_info/time_within_train_step": 2.652683734893799, "step": 6871} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 6871} {"info/global_step": 6872, "train_info/time_within_train_step": 2.6530251502990723, "step": 6872} {"train_info/time_between_train_steps": 0.003023862838745117, "step": 6872} {"info/global_step": 6873, "train_info/time_within_train_step": 2.642939329147339, "step": 6873} {"train_info/time_between_train_steps": 0.0030143260955810547, "step": 6873} {"info/global_step": 6874, "train_info/time_within_train_step": 2.646709680557251, "step": 6874} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 6874} {"info/global_step": 6875, "train_info/time_within_train_step": 2.663069725036621, "step": 6875} {"train_info/time_between_train_steps": 0.003039121627807617, "step": 6875} {"info/global_step": 6876, "train_info/time_within_train_step": 2.6628949642181396, "step": 6876} {"train_info/time_between_train_steps": 0.0030088424682617188, "step": 6876} {"info/global_step": 6877, "train_info/time_within_train_step": 2.680373191833496, "step": 6877} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 6877} {"info/global_step": 6878, "train_info/time_within_train_step": 2.654878854751587, "step": 6878} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 6878} {"info/global_step": 6879, "train_info/time_within_train_step": 2.6407179832458496, "step": 6879} {"train_info/time_between_train_steps": 0.003072977066040039, "step": 6879} {"info/global_step": 6880, "train_info/time_within_train_step": 2.6570942401885986, "step": 6880} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 6880} {"info/global_step": 6881, "train_info/time_within_train_step": 2.6546473503112793, "step": 6881} {"train_info/time_between_train_steps": 0.0030138492584228516, "step": 6881} {"info/global_step": 6882, "train_info/time_within_train_step": 2.643829822540283, "step": 6882} {"train_info/time_between_train_steps": 0.003027200698852539, "step": 6882} {"info/global_step": 6883, "train_info/time_within_train_step": 2.643571376800537, "step": 6883} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 6883} {"info/global_step": 6884, "train_info/time_within_train_step": 2.661198854446411, "step": 6884} {"train_info/time_between_train_steps": 0.0030879974365234375, "step": 6884} {"info/global_step": 6885, "train_info/time_within_train_step": 2.667731761932373, "step": 6885} {"train_info/time_between_train_steps": 0.0030269622802734375, "step": 6885} {"info/global_step": 6886, "train_info/time_within_train_step": 2.6879537105560303, "step": 6886} {"train_info/time_between_train_steps": 0.003043651580810547, "step": 6886} {"info/global_step": 6887, "train_info/time_within_train_step": 2.6529910564422607, "step": 6887} {"train_info/time_between_train_steps": 0.003039836883544922, "step": 6887} {"info/global_step": 6888, "train_info/time_within_train_step": 2.6654629707336426, "step": 6888} {"train_info/time_between_train_steps": 0.003046751022338867, "step": 6888} {"info/global_step": 6889, "train_info/time_within_train_step": 2.6459972858428955, "step": 6889} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 6889} {"info/global_step": 6890, "train_info/time_within_train_step": 2.6428184509277344, "step": 6890} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 6890} {"info/global_step": 6891, "train_info/time_within_train_step": 2.6598715782165527, "step": 6891} {"train_info/time_between_train_steps": 0.0032608509063720703, "step": 6891} {"info/global_step": 6892, "train_info/time_within_train_step": 2.648294687271118, "step": 6892} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 6892} {"info/global_step": 6893, "train_info/time_within_train_step": 2.6441657543182373, "step": 6893} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 6893} {"info/global_step": 6894, "train_info/time_within_train_step": 2.6654229164123535, "step": 6894} {"train_info/time_between_train_steps": 0.0030672550201416016, "step": 6894} {"info/global_step": 6895, "train_info/time_within_train_step": 2.6568617820739746, "step": 6895} {"train_info/time_between_train_steps": 0.003356456756591797, "step": 6895} {"info/global_step": 6896, "train_info/time_within_train_step": 2.679673433303833, "step": 6896} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 6896} {"info/global_step": 6897, "train_info/time_within_train_step": 2.6508374214172363, "step": 6897} {"train_info/time_between_train_steps": 0.003304004669189453, "step": 6897} {"info/global_step": 6898, "train_info/time_within_train_step": 2.6411538124084473, "step": 6898} {"train_info/time_between_train_steps": 0.003657817840576172, "step": 6898} {"info/global_step": 6899, "train_info/time_within_train_step": 2.6656665802001953, "step": 6899} {"train_info/time_between_train_steps": 0.0034923553466796875, "step": 6899} {"info/global_step": 6900, "train_info/time_within_train_step": 2.649623394012451, "step": 6900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746916790, "_runtime": 19388}, "step": 6900} {"logs": {"train/loss": 3.2904, "train/learning_rate": 0.00020666666666666666, "train/epoch": 7.09, "_timestamp": 1746916790, "_runtime": 19388}, "step": 6900} {"train_info/time_between_train_steps": 0.02486395835876465, "step": 6900} {"info/global_step": 6901, "train_info/time_within_train_step": 2.652125835418701, "step": 6901} {"train_info/time_between_train_steps": 0.007355213165283203, "step": 6901} {"info/global_step": 6902, "train_info/time_within_train_step": 2.64585018157959, "step": 6902} {"train_info/time_between_train_steps": 0.003620624542236328, "step": 6902} {"info/global_step": 6903, "train_info/time_within_train_step": 2.659895896911621, "step": 6903} {"train_info/time_between_train_steps": 0.008298397064208984, "step": 6903} {"info/global_step": 6904, "train_info/time_within_train_step": 2.655149459838867, "step": 6904} {"train_info/time_between_train_steps": 0.0063800811767578125, "step": 6904} {"train_info/time_between_train_steps": 2.4596292972564697, "step": 6904} {"info/global_step": 6905, "train_info/time_within_train_step": 2.6101412773132324, "step": 6905} {"train_info/time_between_train_steps": 0.006632328033447266, "step": 6905} {"info/global_step": 6906, "train_info/time_within_train_step": 2.641557455062866, "step": 6906} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 6906} {"info/global_step": 6907, "train_info/time_within_train_step": 2.652306079864502, "step": 6907} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 6907} {"info/global_step": 6908, "train_info/time_within_train_step": 2.647336721420288, "step": 6908} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 6908} {"info/global_step": 6909, "train_info/time_within_train_step": 2.665884017944336, "step": 6909} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 6909} {"info/global_step": 6910, "train_info/time_within_train_step": 2.695188045501709, "step": 6910} {"train_info/time_between_train_steps": 0.0033435821533203125, "step": 6910} {"info/global_step": 6911, "train_info/time_within_train_step": 2.6580088138580322, "step": 6911} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 6911} {"info/global_step": 6912, "train_info/time_within_train_step": 2.6628482341766357, "step": 6912} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 6912} {"info/global_step": 6913, "train_info/time_within_train_step": 2.6404950618743896, "step": 6913} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 6913} {"info/global_step": 6914, "train_info/time_within_train_step": 2.651062488555908, "step": 6914} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 6914} {"info/global_step": 6915, "train_info/time_within_train_step": 2.6615583896636963, "step": 6915} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 6915} {"info/global_step": 6916, "train_info/time_within_train_step": 2.643867015838623, "step": 6916} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 6916} {"info/global_step": 6917, "train_info/time_within_train_step": 2.6425130367279053, "step": 6917} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 6917} {"info/global_step": 6918, "train_info/time_within_train_step": 2.6644866466522217, "step": 6918} {"train_info/time_between_train_steps": 0.003110170364379883, "step": 6918} {"info/global_step": 6919, "train_info/time_within_train_step": 2.6656389236450195, "step": 6919} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 6919} {"info/global_step": 6920, "train_info/time_within_train_step": 2.687592029571533, "step": 6920} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 6920} {"info/global_step": 6921, "train_info/time_within_train_step": 2.653982639312744, "step": 6921} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 6921} {"info/global_step": 6922, "train_info/time_within_train_step": 2.66084361076355, "step": 6922} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 6922} {"info/global_step": 6923, "train_info/time_within_train_step": 2.647212028503418, "step": 6923} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 6923} {"info/global_step": 6924, "train_info/time_within_train_step": 2.642530679702759, "step": 6924} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 6924} {"info/global_step": 6925, "train_info/time_within_train_step": 2.6601004600524902, "step": 6925} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 6925} {"info/global_step": 6926, "train_info/time_within_train_step": 2.6483020782470703, "step": 6926} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 6926} {"info/global_step": 6927, "train_info/time_within_train_step": 2.645034074783325, "step": 6927} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 6927} {"info/global_step": 6928, "train_info/time_within_train_step": 2.6660220623016357, "step": 6928} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 6928} {"info/global_step": 6929, "train_info/time_within_train_step": 2.65640926361084, "step": 6929} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 6929} {"info/global_step": 6930, "train_info/time_within_train_step": 2.665842294692993, "step": 6930} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 6930} {"info/global_step": 6931, "train_info/time_within_train_step": 2.682413101196289, "step": 6931} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 6931} {"info/global_step": 6932, "train_info/time_within_train_step": 2.6652753353118896, "step": 6932} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 6932} {"info/global_step": 6933, "train_info/time_within_train_step": 2.6452291011810303, "step": 6933} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 6933} {"info/global_step": 6934, "train_info/time_within_train_step": 2.6417860984802246, "step": 6934} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 6934} {"info/global_step": 6935, "train_info/time_within_train_step": 2.6534852981567383, "step": 6935} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 6935} {"info/global_step": 6936, "train_info/time_within_train_step": 2.6550114154815674, "step": 6936} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 6936} {"info/global_step": 6937, "train_info/time_within_train_step": 2.6446163654327393, "step": 6937} {"train_info/time_between_train_steps": 0.0031080245971679688, "step": 6937} {"info/global_step": 6938, "train_info/time_within_train_step": 2.658670663833618, "step": 6938} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 6938} {"info/global_step": 6939, "train_info/time_within_train_step": 2.6545417308807373, "step": 6939} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 6939} {"info/global_step": 6940, "train_info/time_within_train_step": 2.6667492389678955, "step": 6940} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 6940} {"info/global_step": 6941, "train_info/time_within_train_step": 2.7340540885925293, "step": 6941} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 6941} {"info/global_step": 6942, "train_info/time_within_train_step": 2.913630723953247, "step": 6942} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 6942} {"info/global_step": 6943, "train_info/time_within_train_step": 2.653463363647461, "step": 6943} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 6943} {"info/global_step": 6944, "train_info/time_within_train_step": 2.6654953956604004, "step": 6944} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 6944} {"info/global_step": 6945, "train_info/time_within_train_step": 2.722820997238159, "step": 6945} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 6945} {"info/global_step": 6946, "train_info/time_within_train_step": 2.676633834838867, "step": 6946} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 6946} {"info/global_step": 6947, "train_info/time_within_train_step": 2.6400482654571533, "step": 6947} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 6947} {"info/global_step": 6948, "train_info/time_within_train_step": 2.6422624588012695, "step": 6948} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 6948} {"info/global_step": 6949, "train_info/time_within_train_step": 2.654449462890625, "step": 6949} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 6949} {"info/global_step": 6950, "train_info/time_within_train_step": 2.6544811725616455, "step": 6950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746916927, "_runtime": 19525}, "step": 6950} {"logs": {"train/loss": 3.2999, "train/learning_rate": 0.00020333333333333333, "train/epoch": 8.0, "_timestamp": 1746916927, "_runtime": 19525}, "step": 6950} {"train_info/time_between_train_steps": 0.024305105209350586, "step": 6950} {"info/global_step": 6951, "train_info/time_within_train_step": 2.6447906494140625, "step": 6951} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 6951} {"info/global_step": 6952, "train_info/time_within_train_step": 2.651423931121826, "step": 6952} {"train_info/time_between_train_steps": 0.003584623336791992, "step": 6952} {"info/global_step": 6953, "train_info/time_within_train_step": 2.647311210632324, "step": 6953} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 6953} {"info/global_step": 6954, "train_info/time_within_train_step": 2.6676220893859863, "step": 6954} {"train_info/time_between_train_steps": 0.0031092166900634766, "step": 6954} {"info/global_step": 6955, "train_info/time_within_train_step": 2.6983377933502197, "step": 6955} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 6955} {"info/global_step": 6956, "train_info/time_within_train_step": 2.6405229568481445, "step": 6956} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 6956} {"info/global_step": 6957, "train_info/time_within_train_step": 2.6498448848724365, "step": 6957} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 6957} {"info/global_step": 6958, "train_info/time_within_train_step": 2.6508467197418213, "step": 6958} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 6958} {"info/global_step": 6959, "train_info/time_within_train_step": 2.646491289138794, "step": 6959} {"train_info/time_between_train_steps": 0.0031249523162841797, "step": 6959} {"info/global_step": 6960, "train_info/time_within_train_step": 2.6555821895599365, "step": 6960} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 6960} {"info/global_step": 6961, "train_info/time_within_train_step": 2.644411087036133, "step": 6961} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 6961} {"info/global_step": 6962, "train_info/time_within_train_step": 2.6461410522460938, "step": 6962} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 6962} {"info/global_step": 6963, "train_info/time_within_train_step": 2.6703100204467773, "step": 6963} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 6963} {"info/global_step": 6964, "train_info/time_within_train_step": 2.6669373512268066, "step": 6964} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 6964} {"info/global_step": 6965, "train_info/time_within_train_step": 2.6570630073547363, "step": 6965} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 6965} {"info/global_step": 6966, "train_info/time_within_train_step": 2.688755750656128, "step": 6966} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 6966} {"info/global_step": 6967, "train_info/time_within_train_step": 2.783935308456421, "step": 6967} {"train_info/time_between_train_steps": 0.003267526626586914, "step": 6967} {"info/global_step": 6968, "train_info/time_within_train_step": 2.6742796897888184, "step": 6968} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 6968} {"info/global_step": 6969, "train_info/time_within_train_step": 2.6422197818756104, "step": 6969} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 6969} {"info/global_step": 6970, "train_info/time_within_train_step": 2.6559438705444336, "step": 6970} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 6970} {"info/global_step": 6971, "train_info/time_within_train_step": 2.6581919193267822, "step": 6971} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 6971} {"info/global_step": 6972, "train_info/time_within_train_step": 2.6533455848693848, "step": 6972} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 6972} {"info/global_step": 6973, "train_info/time_within_train_step": 2.652655839920044, "step": 6973} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 6973} {"info/global_step": 6974, "train_info/time_within_train_step": 2.6477408409118652, "step": 6974} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 6974} {"info/global_step": 6975, "train_info/time_within_train_step": 2.663642406463623, "step": 6975} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 6975} {"info/global_step": 6976, "train_info/time_within_train_step": 2.6609160900115967, "step": 6976} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 6976} {"info/global_step": 6977, "train_info/time_within_train_step": 2.656547784805298, "step": 6977} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 6977} {"info/global_step": 6978, "train_info/time_within_train_step": 2.708038568496704, "step": 6978} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 6978} {"info/global_step": 6979, "train_info/time_within_train_step": 2.644617795944214, "step": 6979} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 6979} {"info/global_step": 6980, "train_info/time_within_train_step": 2.647387981414795, "step": 6980} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 6980} {"info/global_step": 6981, "train_info/time_within_train_step": 2.6591923236846924, "step": 6981} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 6981} {"info/global_step": 6982, "train_info/time_within_train_step": 2.6415412425994873, "step": 6982} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 6982} {"info/global_step": 6983, "train_info/time_within_train_step": 2.6447277069091797, "step": 6983} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 6983} {"info/global_step": 6984, "train_info/time_within_train_step": 2.6518585681915283, "step": 6984} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 6984} {"info/global_step": 6985, "train_info/time_within_train_step": 2.6522040367126465, "step": 6985} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 6985} {"info/global_step": 6986, "train_info/time_within_train_step": 2.660031318664551, "step": 6986} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 6986} {"info/global_step": 6987, "train_info/time_within_train_step": 2.701174020767212, "step": 6987} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 6987} {"info/global_step": 6988, "train_info/time_within_train_step": 2.719160556793213, "step": 6988} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 6988} {"info/global_step": 6989, "train_info/time_within_train_step": 2.64241886138916, "step": 6989} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 6989} {"info/global_step": 6990, "train_info/time_within_train_step": 2.640500068664551, "step": 6990} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 6990} {"info/global_step": 6991, "train_info/time_within_train_step": 2.6628904342651367, "step": 6991} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 6991} {"info/global_step": 6992, "train_info/time_within_train_step": 2.6515328884124756, "step": 6992} {"train_info/time_between_train_steps": 0.0032482147216796875, "step": 6992} {"info/global_step": 6993, "train_info/time_within_train_step": 2.6435515880584717, "step": 6993} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 6993} {"info/global_step": 6994, "train_info/time_within_train_step": 2.6523265838623047, "step": 6994} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 6994} {"info/global_step": 6995, "train_info/time_within_train_step": 2.649026393890381, "step": 6995} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 6995} {"info/global_step": 6996, "train_info/time_within_train_step": 2.6646454334259033, "step": 6996} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 6996} {"info/global_step": 6997, "train_info/time_within_train_step": 2.65269136428833, "step": 6997} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 6997} {"info/global_step": 6998, "train_info/time_within_train_step": 3.254153251647949, "step": 6998} {"train_info/time_between_train_steps": 0.006617307662963867, "step": 6998} {"info/global_step": 6999, "train_info/time_within_train_step": 2.6427600383758545, "step": 6999} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 6999} {"info/global_step": 7000, "train_info/time_within_train_step": 2.6647913455963135, "step": 7000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917062, "_runtime": 19660}, "step": 7000} {"logs": {"train/loss": 3.2643, "train/learning_rate": 0.00019999999999999998, "train/epoch": 8.01, "_timestamp": 1746917062, "_runtime": 19660}, "step": 7000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917067, "_runtime": 19665}, "step": 7000} {"logs": {"eval/loss": 4.694533824920654, "eval/runtime": 5.1656, "eval/samples_per_second": 37.169, "eval/steps_per_second": 1.162, "train/epoch": 8.01, "_timestamp": 1746917067, "_runtime": 19665}, "step": 7000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917067, "_runtime": 19665}, "step": 7000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.694533824920654, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 109.34782152889794, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1656, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.169, "train/epoch": 8.01, "_timestamp": 1746917067, "_runtime": 19665}, "step": 7000} {"train_info/time_between_train_steps": 18.767412900924683, "step": 7000} {"info/global_step": 7001, "train_info/time_within_train_step": 2.701033115386963, "step": 7001} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 7001} {"info/global_step": 7002, "train_info/time_within_train_step": 2.444946527481079, "step": 7002} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 7002} {"info/global_step": 7003, "train_info/time_within_train_step": 2.6123995780944824, "step": 7003} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 7003} {"info/global_step": 7004, "train_info/time_within_train_step": 2.6415324211120605, "step": 7004} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 7004} {"info/global_step": 7005, "train_info/time_within_train_step": 2.64154314994812, "step": 7005} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 7005} {"info/global_step": 7006, "train_info/time_within_train_step": 2.6630971431732178, "step": 7006} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 7006} {"info/global_step": 7007, "train_info/time_within_train_step": 2.661365032196045, "step": 7007} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 7007} {"info/global_step": 7008, "train_info/time_within_train_step": 2.656038999557495, "step": 7008} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 7008} {"info/global_step": 7009, "train_info/time_within_train_step": 2.7080507278442383, "step": 7009} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 7009} {"info/global_step": 7010, "train_info/time_within_train_step": 2.647719621658325, "step": 7010} {"train_info/time_between_train_steps": 0.006523847579956055, "step": 7010} {"info/global_step": 7011, "train_info/time_within_train_step": 2.6470987796783447, "step": 7011} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 7011} {"info/global_step": 7012, "train_info/time_within_train_step": 2.6522116661071777, "step": 7012} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 7012} {"info/global_step": 7013, "train_info/time_within_train_step": 2.651057720184326, "step": 7013} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 7013} {"info/global_step": 7014, "train_info/time_within_train_step": 2.6513843536376953, "step": 7014} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 7014} {"info/global_step": 7015, "train_info/time_within_train_step": 2.6464810371398926, "step": 7015} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 7015} {"info/global_step": 7016, "train_info/time_within_train_step": 2.6568849086761475, "step": 7016} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 7016} {"info/global_step": 7017, "train_info/time_within_train_step": 2.6587090492248535, "step": 7017} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 7017} {"info/global_step": 7018, "train_info/time_within_train_step": 2.6701042652130127, "step": 7018} {"train_info/time_between_train_steps": 0.003107786178588867, "step": 7018} {"info/global_step": 7019, "train_info/time_within_train_step": 2.7304558753967285, "step": 7019} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 7019} {"info/global_step": 7020, "train_info/time_within_train_step": 2.661879301071167, "step": 7020} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 7020} {"info/global_step": 7021, "train_info/time_within_train_step": 2.642056465148926, "step": 7021} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 7021} {"info/global_step": 7022, "train_info/time_within_train_step": 2.65273380279541, "step": 7022} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 7022} {"info/global_step": 7023, "train_info/time_within_train_step": 2.6513519287109375, "step": 7023} {"train_info/time_between_train_steps": 0.003362417221069336, "step": 7023} {"info/global_step": 7024, "train_info/time_within_train_step": 2.65464186668396, "step": 7024} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 7024} {"info/global_step": 7025, "train_info/time_within_train_step": 2.6456971168518066, "step": 7025} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 7025} {"info/global_step": 7026, "train_info/time_within_train_step": 2.6475634574890137, "step": 7026} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 7026} {"info/global_step": 7027, "train_info/time_within_train_step": 2.662651300430298, "step": 7027} {"train_info/time_between_train_steps": 0.003324270248413086, "step": 7027} {"info/global_step": 7028, "train_info/time_within_train_step": 2.6692094802856445, "step": 7028} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 7028} {"info/global_step": 7029, "train_info/time_within_train_step": 2.6983132362365723, "step": 7029} {"train_info/time_between_train_steps": 0.12769079208374023, "step": 7029} {"info/global_step": 7030, "train_info/time_within_train_step": 2.6711368560791016, "step": 7030} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 7030} {"info/global_step": 7031, "train_info/time_within_train_step": 2.6930954456329346, "step": 7031} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 7031} {"info/global_step": 7032, "train_info/time_within_train_step": 2.651155710220337, "step": 7032} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 7032} {"info/global_step": 7033, "train_info/time_within_train_step": 2.644319534301758, "step": 7033} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 7033} {"info/global_step": 7034, "train_info/time_within_train_step": 2.6558620929718018, "step": 7034} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 7034} {"info/global_step": 7035, "train_info/time_within_train_step": 2.6510260105133057, "step": 7035} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 7035} {"info/global_step": 7036, "train_info/time_within_train_step": 2.649819850921631, "step": 7036} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 7036} {"info/global_step": 7037, "train_info/time_within_train_step": 2.6459343433380127, "step": 7037} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 7037} {"info/global_step": 7038, "train_info/time_within_train_step": 2.6476824283599854, "step": 7038} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 7038} {"info/global_step": 7039, "train_info/time_within_train_step": 2.673539638519287, "step": 7039} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 7039} {"info/global_step": 7040, "train_info/time_within_train_step": 2.6673643589019775, "step": 7040} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 7040} {"info/global_step": 7041, "train_info/time_within_train_step": 2.6670100688934326, "step": 7041} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 7041} {"info/global_step": 7042, "train_info/time_within_train_step": 2.6780526638031006, "step": 7042} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 7042} {"info/global_step": 7043, "train_info/time_within_train_step": 2.644019842147827, "step": 7043} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 7043} {"info/global_step": 7044, "train_info/time_within_train_step": 2.656013250350952, "step": 7044} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 7044} {"info/global_step": 7045, "train_info/time_within_train_step": 2.652708053588867, "step": 7045} {"train_info/time_between_train_steps": 0.003116607666015625, "step": 7045} {"info/global_step": 7046, "train_info/time_within_train_step": 2.643479108810425, "step": 7046} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 7046} {"info/global_step": 7047, "train_info/time_within_train_step": 2.6470203399658203, "step": 7047} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 7047} {"info/global_step": 7048, "train_info/time_within_train_step": 2.6516218185424805, "step": 7048} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 7048} {"info/global_step": 7049, "train_info/time_within_train_step": 2.6605749130249023, "step": 7049} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 7049} {"info/global_step": 7050, "train_info/time_within_train_step": 2.6696715354919434, "step": 7050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917215, "_runtime": 19813}, "step": 7050} {"logs": {"train/loss": 3.2616, "train/learning_rate": 0.00019666666666666666, "train/epoch": 8.01, "_timestamp": 1746917215, "_runtime": 19813}, "step": 7050} {"train_info/time_between_train_steps": 0.024704456329345703, "step": 7050} {"info/global_step": 7051, "train_info/time_within_train_step": 2.6726951599121094, "step": 7051} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 7051} {"info/global_step": 7052, "train_info/time_within_train_step": 2.6772172451019287, "step": 7052} {"train_info/time_between_train_steps": 0.003314971923828125, "step": 7052} {"info/global_step": 7053, "train_info/time_within_train_step": 2.645676851272583, "step": 7053} {"train_info/time_between_train_steps": 0.0032982826232910156, "step": 7053} {"info/global_step": 7054, "train_info/time_within_train_step": 2.647442102432251, "step": 7054} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 7054} {"info/global_step": 7055, "train_info/time_within_train_step": 2.6458957195281982, "step": 7055} {"train_info/time_between_train_steps": 0.003387928009033203, "step": 7055} {"info/global_step": 7056, "train_info/time_within_train_step": 2.6462395191192627, "step": 7056} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 7056} {"info/global_step": 7057, "train_info/time_within_train_step": 2.646958827972412, "step": 7057} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 7057} {"info/global_step": 7058, "train_info/time_within_train_step": 2.659332752227783, "step": 7058} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 7058} {"info/global_step": 7059, "train_info/time_within_train_step": 2.641986846923828, "step": 7059} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 7059} {"info/global_step": 7060, "train_info/time_within_train_step": 2.639437437057495, "step": 7060} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 7060} {"info/global_step": 7061, "train_info/time_within_train_step": 2.712263345718384, "step": 7061} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 7061} {"info/global_step": 7062, "train_info/time_within_train_step": 2.6515588760375977, "step": 7062} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 7062} {"info/global_step": 7063, "train_info/time_within_train_step": 2.6631574630737305, "step": 7063} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 7063} {"info/global_step": 7064, "train_info/time_within_train_step": 2.6413204669952393, "step": 7064} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 7064} {"info/global_step": 7065, "train_info/time_within_train_step": 2.6547799110412598, "step": 7065} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 7065} {"info/global_step": 7066, "train_info/time_within_train_step": 2.663177251815796, "step": 7066} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 7066} {"info/global_step": 7067, "train_info/time_within_train_step": 2.644310235977173, "step": 7067} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 7067} {"info/global_step": 7068, "train_info/time_within_train_step": 2.6534066200256348, "step": 7068} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 7068} {"info/global_step": 7069, "train_info/time_within_train_step": 2.6602089405059814, "step": 7069} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 7069} {"info/global_step": 7070, "train_info/time_within_train_step": 2.6711666584014893, "step": 7070} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 7070} {"info/global_step": 7071, "train_info/time_within_train_step": 2.6812655925750732, "step": 7071} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 7071} {"info/global_step": 7072, "train_info/time_within_train_step": 2.650486469268799, "step": 7072} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 7072} {"info/global_step": 7073, "train_info/time_within_train_step": 2.6831576824188232, "step": 7073} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 7073} {"info/global_step": 7074, "train_info/time_within_train_step": 2.641603469848633, "step": 7074} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 7074} {"info/global_step": 7075, "train_info/time_within_train_step": 2.647444486618042, "step": 7075} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 7075} {"info/global_step": 7076, "train_info/time_within_train_step": 2.666317939758301, "step": 7076} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 7076} {"info/global_step": 7077, "train_info/time_within_train_step": 2.6744384765625, "step": 7077} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 7077} {"info/global_step": 7078, "train_info/time_within_train_step": 2.6450583934783936, "step": 7078} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 7078} {"info/global_step": 7079, "train_info/time_within_train_step": 2.6435306072235107, "step": 7079} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 7079} {"info/global_step": 7080, "train_info/time_within_train_step": 2.640993118286133, "step": 7080} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 7080} {"info/global_step": 7081, "train_info/time_within_train_step": 2.6418795585632324, "step": 7081} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 7081} {"info/global_step": 7082, "train_info/time_within_train_step": 2.6668543815612793, "step": 7082} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 7082} {"info/global_step": 7083, "train_info/time_within_train_step": 2.6481237411499023, "step": 7083} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 7083} {"info/global_step": 7084, "train_info/time_within_train_step": 2.643409490585327, "step": 7084} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 7084} {"info/global_step": 7085, "train_info/time_within_train_step": 2.6606740951538086, "step": 7085} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 7085} {"info/global_step": 7086, "train_info/time_within_train_step": 2.6568892002105713, "step": 7086} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 7086} {"info/global_step": 7087, "train_info/time_within_train_step": 2.660588026046753, "step": 7087} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 7087} {"info/global_step": 7088, "train_info/time_within_train_step": 2.7014780044555664, "step": 7088} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 7088} {"info/global_step": 7089, "train_info/time_within_train_step": 2.7029237747192383, "step": 7089} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 7089} {"info/global_step": 7090, "train_info/time_within_train_step": 2.6407101154327393, "step": 7090} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 7090} {"info/global_step": 7091, "train_info/time_within_train_step": 2.6408183574676514, "step": 7091} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 7091} {"info/global_step": 7092, "train_info/time_within_train_step": 2.7734031677246094, "step": 7092} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 7092} {"info/global_step": 7093, "train_info/time_within_train_step": 2.643104314804077, "step": 7093} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 7093} {"info/global_step": 7094, "train_info/time_within_train_step": 2.6549763679504395, "step": 7094} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 7094} {"info/global_step": 7095, "train_info/time_within_train_step": 2.6531031131744385, "step": 7095} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 7095} {"info/global_step": 7096, "train_info/time_within_train_step": 2.642929792404175, "step": 7096} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 7096} {"info/global_step": 7097, "train_info/time_within_train_step": 2.649040937423706, "step": 7097} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 7097} {"info/global_step": 7098, "train_info/time_within_train_step": 2.6597297191619873, "step": 7098} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 7098} {"info/global_step": 7099, "train_info/time_within_train_step": 2.6699259281158447, "step": 7099} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 7099} {"info/global_step": 7100, "train_info/time_within_train_step": 2.6987080574035645, "step": 7100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917350, "_runtime": 19948}, "step": 7100} {"logs": {"train/loss": 3.2475, "train/learning_rate": 0.00019333333333333333, "train/epoch": 8.02, "_timestamp": 1746917350, "_runtime": 19948}, "step": 7100} {"train_info/time_between_train_steps": 0.02440643310546875, "step": 7100} {"info/global_step": 7101, "train_info/time_within_train_step": 2.709073543548584, "step": 7101} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 7101} {"info/global_step": 7102, "train_info/time_within_train_step": 2.9100868701934814, "step": 7102} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 7102} {"info/global_step": 7103, "train_info/time_within_train_step": 2.648332357406616, "step": 7103} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 7103} {"info/global_step": 7104, "train_info/time_within_train_step": 2.668642044067383, "step": 7104} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 7104} {"info/global_step": 7105, "train_info/time_within_train_step": 2.6998772621154785, "step": 7105} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 7105} {"info/global_step": 7106, "train_info/time_within_train_step": 2.6541473865509033, "step": 7106} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 7106} {"info/global_step": 7107, "train_info/time_within_train_step": 2.6628806591033936, "step": 7107} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 7107} {"info/global_step": 7108, "train_info/time_within_train_step": 2.6481804847717285, "step": 7108} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 7108} {"info/global_step": 7109, "train_info/time_within_train_step": 2.6458582878112793, "step": 7109} {"train_info/time_between_train_steps": 0.003246784210205078, "step": 7109} {"info/global_step": 7110, "train_info/time_within_train_step": 2.658578872680664, "step": 7110} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 7110} {"info/global_step": 7111, "train_info/time_within_train_step": 2.644207715988159, "step": 7111} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 7111} {"info/global_step": 7112, "train_info/time_within_train_step": 2.645477294921875, "step": 7112} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 7112} {"info/global_step": 7113, "train_info/time_within_train_step": 2.6697962284088135, "step": 7113} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 7113} {"info/global_step": 7114, "train_info/time_within_train_step": 2.6662795543670654, "step": 7114} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 7114} {"info/global_step": 7115, "train_info/time_within_train_step": 2.6707358360290527, "step": 7115} {"train_info/time_between_train_steps": 0.0032501220703125, "step": 7115} {"info/global_step": 7116, "train_info/time_within_train_step": 2.670356273651123, "step": 7116} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 7116} {"info/global_step": 7117, "train_info/time_within_train_step": 2.6424176692962646, "step": 7117} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 7117} {"info/global_step": 7118, "train_info/time_within_train_step": 2.6545193195343018, "step": 7118} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 7118} {"info/global_step": 7119, "train_info/time_within_train_step": 2.655967950820923, "step": 7119} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 7119} {"info/global_step": 7120, "train_info/time_within_train_step": 2.642801284790039, "step": 7120} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 7120} {"info/global_step": 7121, "train_info/time_within_train_step": 2.6442840099334717, "step": 7121} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 7121} {"info/global_step": 7122, "train_info/time_within_train_step": 2.6445987224578857, "step": 7122} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 7122} {"info/global_step": 7123, "train_info/time_within_train_step": 2.6481568813323975, "step": 7123} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 7123} {"info/global_step": 7124, "train_info/time_within_train_step": 2.6481683254241943, "step": 7124} {"train_info/time_between_train_steps": 0.0035364627838134766, "step": 7124} {"info/global_step": 7125, "train_info/time_within_train_step": 2.6491870880126953, "step": 7125} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 7125} {"info/global_step": 7126, "train_info/time_within_train_step": 2.6466193199157715, "step": 7126} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 7126} {"info/global_step": 7127, "train_info/time_within_train_step": 2.6538660526275635, "step": 7127} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 7127} {"info/global_step": 7128, "train_info/time_within_train_step": 2.6575961112976074, "step": 7128} {"train_info/time_between_train_steps": 0.0032460689544677734, "step": 7128} {"info/global_step": 7129, "train_info/time_within_train_step": 2.6765758991241455, "step": 7129} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 7129} {"info/global_step": 7130, "train_info/time_within_train_step": 2.727734327316284, "step": 7130} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 7130} {"info/global_step": 7131, "train_info/time_within_train_step": 2.653475284576416, "step": 7131} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 7131} {"info/global_step": 7132, "train_info/time_within_train_step": 2.6414477825164795, "step": 7132} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 7132} {"info/global_step": 7133, "train_info/time_within_train_step": 2.6603848934173584, "step": 7133} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 7133} {"info/global_step": 7134, "train_info/time_within_train_step": 2.6494696140289307, "step": 7134} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 7134} {"info/global_step": 7135, "train_info/time_within_train_step": 2.6563916206359863, "step": 7135} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 7135} {"info/global_step": 7136, "train_info/time_within_train_step": 2.6465837955474854, "step": 7136} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 7136} {"info/global_step": 7137, "train_info/time_within_train_step": 2.6471853256225586, "step": 7137} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 7137} {"info/global_step": 7138, "train_info/time_within_train_step": 2.6643147468566895, "step": 7138} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 7138} {"info/global_step": 7139, "train_info/time_within_train_step": 2.667877435684204, "step": 7139} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 7139} {"info/global_step": 7140, "train_info/time_within_train_step": 2.6873295307159424, "step": 7140} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 7140} {"info/global_step": 7141, "train_info/time_within_train_step": 2.651536464691162, "step": 7141} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 7141} {"info/global_step": 7142, "train_info/time_within_train_step": 2.6449413299560547, "step": 7142} {"train_info/time_between_train_steps": 0.003239870071411133, "step": 7142} {"info/global_step": 7143, "train_info/time_within_train_step": 2.656017780303955, "step": 7143} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 7143} {"info/global_step": 7144, "train_info/time_within_train_step": 2.653026580810547, "step": 7144} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 7144} {"info/global_step": 7145, "train_info/time_within_train_step": 2.6443116664886475, "step": 7145} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 7145} {"info/global_step": 7146, "train_info/time_within_train_step": 2.6435370445251465, "step": 7146} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 7146} {"info/global_step": 7147, "train_info/time_within_train_step": 2.648764133453369, "step": 7147} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 7147} {"info/global_step": 7148, "train_info/time_within_train_step": 2.670499801635742, "step": 7148} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 7148} {"info/global_step": 7149, "train_info/time_within_train_step": 2.6714565753936768, "step": 7149} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 7149} {"info/global_step": 7150, "train_info/time_within_train_step": 2.657165050506592, "step": 7150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917484, "_runtime": 20082}, "step": 7150} {"logs": {"train/loss": 3.242, "train/learning_rate": 0.00018999999999999998, "train/epoch": 8.02, "_timestamp": 1746917484, "_runtime": 20082}, "step": 7150} {"train_info/time_between_train_steps": 0.024483442306518555, "step": 7150} {"info/global_step": 7151, "train_info/time_within_train_step": 2.6568286418914795, "step": 7151} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 7151} {"info/global_step": 7152, "train_info/time_within_train_step": 2.6531729698181152, "step": 7152} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 7152} {"info/global_step": 7153, "train_info/time_within_train_step": 2.6474361419677734, "step": 7153} {"train_info/time_between_train_steps": 0.003282308578491211, "step": 7153} {"info/global_step": 7154, "train_info/time_within_train_step": 2.643541097640991, "step": 7154} {"train_info/time_between_train_steps": 0.13747048377990723, "step": 7154} {"info/global_step": 7155, "train_info/time_within_train_step": 2.674863815307617, "step": 7155} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 7155} {"info/global_step": 7156, "train_info/time_within_train_step": 2.6487746238708496, "step": 7156} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 7156} {"info/global_step": 7157, "train_info/time_within_train_step": 2.666945695877075, "step": 7157} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 7157} {"info/global_step": 7158, "train_info/time_within_train_step": 2.6501684188842773, "step": 7158} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 7158} {"info/global_step": 7159, "train_info/time_within_train_step": 2.644653797149658, "step": 7159} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 7159} {"info/global_step": 7160, "train_info/time_within_train_step": 2.6661875247955322, "step": 7160} {"train_info/time_between_train_steps": 0.0032646656036376953, "step": 7160} {"info/global_step": 7161, "train_info/time_within_train_step": 2.660374164581299, "step": 7161} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 7161} {"info/global_step": 7162, "train_info/time_within_train_step": 2.660344362258911, "step": 7162} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 7162} {"info/global_step": 7163, "train_info/time_within_train_step": 2.929133176803589, "step": 7163} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 7163} {"info/global_step": 7164, "train_info/time_within_train_step": 2.6674695014953613, "step": 7164} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 7164} {"info/global_step": 7165, "train_info/time_within_train_step": 2.6473019123077393, "step": 7165} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 7165} {"info/global_step": 7166, "train_info/time_within_train_step": 2.641446828842163, "step": 7166} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 7166} {"info/global_step": 7167, "train_info/time_within_train_step": 2.661386251449585, "step": 7167} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 7167} {"info/global_step": 7168, "train_info/time_within_train_step": 2.653745174407959, "step": 7168} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 7168} {"info/global_step": 7169, "train_info/time_within_train_step": 2.645681142807007, "step": 7169} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 7169} {"info/global_step": 7170, "train_info/time_within_train_step": 2.6605236530303955, "step": 7170} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 7170} {"info/global_step": 7171, "train_info/time_within_train_step": 2.6539502143859863, "step": 7171} {"train_info/time_between_train_steps": 0.0032296180725097656, "step": 7171} {"info/global_step": 7172, "train_info/time_within_train_step": 2.660303831100464, "step": 7172} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 7172} {"info/global_step": 7173, "train_info/time_within_train_step": 2.703836441040039, "step": 7173} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 7173} {"info/global_step": 7174, "train_info/time_within_train_step": 2.69545578956604, "step": 7174} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 7174} {"info/global_step": 7175, "train_info/time_within_train_step": 2.641486644744873, "step": 7175} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 7175} {"info/global_step": 7176, "train_info/time_within_train_step": 2.641169548034668, "step": 7176} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 7176} {"info/global_step": 7177, "train_info/time_within_train_step": 2.6580610275268555, "step": 7177} {"train_info/time_between_train_steps": 0.006536245346069336, "step": 7177} {"info/global_step": 7178, "train_info/time_within_train_step": 2.6530697345733643, "step": 7178} {"train_info/time_between_train_steps": 0.0032961368560791016, "step": 7178} {"info/global_step": 7179, "train_info/time_within_train_step": 2.6439428329467773, "step": 7179} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 7179} {"info/global_step": 7180, "train_info/time_within_train_step": 2.651426076889038, "step": 7180} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 7180} {"info/global_step": 7181, "train_info/time_within_train_step": 2.6455984115600586, "step": 7181} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 7181} {"info/global_step": 7182, "train_info/time_within_train_step": 2.6705126762390137, "step": 7182} {"train_info/time_between_train_steps": 0.003597736358642578, "step": 7182} {"info/global_step": 7183, "train_info/time_within_train_step": 2.687426805496216, "step": 7183} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 7183} {"info/global_step": 7184, "train_info/time_within_train_step": 2.6794018745422363, "step": 7184} {"train_info/time_between_train_steps": 0.003216266632080078, "step": 7184} {"info/global_step": 7185, "train_info/time_within_train_step": 2.6548054218292236, "step": 7185} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 7185} {"info/global_step": 7186, "train_info/time_within_train_step": 2.641772508621216, "step": 7186} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 7186} {"info/global_step": 7187, "train_info/time_within_train_step": 2.6497323513031006, "step": 7187} {"train_info/time_between_train_steps": 0.003173828125, "step": 7187} {"info/global_step": 7188, "train_info/time_within_train_step": 2.6431519985198975, "step": 7188} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 7188} {"info/global_step": 7189, "train_info/time_within_train_step": 2.6449379920959473, "step": 7189} {"train_info/time_between_train_steps": 0.006553173065185547, "step": 7189} {"info/global_step": 7190, "train_info/time_within_train_step": 2.672945261001587, "step": 7190} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 7190} {"info/global_step": 7191, "train_info/time_within_train_step": 2.6654245853424072, "step": 7191} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 7191} {"info/global_step": 7192, "train_info/time_within_train_step": 2.673542022705078, "step": 7192} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 7192} {"info/global_step": 7193, "train_info/time_within_train_step": 2.6667068004608154, "step": 7193} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 7193} {"info/global_step": 7194, "train_info/time_within_train_step": 2.6495542526245117, "step": 7194} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 7194} {"info/global_step": 7195, "train_info/time_within_train_step": 2.65004825592041, "step": 7195} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 7195} {"info/global_step": 7196, "train_info/time_within_train_step": 2.6458990573883057, "step": 7196} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 7196} {"info/global_step": 7197, "train_info/time_within_train_step": 2.649893283843994, "step": 7197} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 7197} {"info/global_step": 7198, "train_info/time_within_train_step": 2.6503121852874756, "step": 7198} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 7198} {"info/global_step": 7199, "train_info/time_within_train_step": 2.6600308418273926, "step": 7199} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 7199} {"info/global_step": 7200, "train_info/time_within_train_step": 2.666443109512329, "step": 7200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917619, "_runtime": 20217}, "step": 7200} {"logs": {"train/loss": 3.2276, "train/learning_rate": 0.00018666666666666666, "train/epoch": 8.03, "_timestamp": 1746917619, "_runtime": 20217}, "step": 7200} {"train_info/time_between_train_steps": 13.507788896560669, "step": 7200} {"info/global_step": 7201, "train_info/time_within_train_step": 2.4336650371551514, "step": 7201} {"train_info/time_between_train_steps": 0.0032958984375, "step": 7201} {"info/global_step": 7202, "train_info/time_within_train_step": 2.4507088661193848, "step": 7202} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 7202} {"info/global_step": 7203, "train_info/time_within_train_step": 2.592449426651001, "step": 7203} {"train_info/time_between_train_steps": 0.0032465457916259766, "step": 7203} {"info/global_step": 7204, "train_info/time_within_train_step": 2.638674259185791, "step": 7204} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 7204} {"info/global_step": 7205, "train_info/time_within_train_step": 2.660745859146118, "step": 7205} {"train_info/time_between_train_steps": 0.003260374069213867, "step": 7205} {"info/global_step": 7206, "train_info/time_within_train_step": 2.665379524230957, "step": 7206} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 7206} {"info/global_step": 7207, "train_info/time_within_train_step": 2.6610300540924072, "step": 7207} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 7207} {"info/global_step": 7208, "train_info/time_within_train_step": 2.9458019733428955, "step": 7208} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 7208} {"info/global_step": 7209, "train_info/time_within_train_step": 2.6711087226867676, "step": 7209} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 7209} {"info/global_step": 7210, "train_info/time_within_train_step": 2.6672565937042236, "step": 7210} {"train_info/time_between_train_steps": 0.003485441207885742, "step": 7210} {"info/global_step": 7211, "train_info/time_within_train_step": 2.6835954189300537, "step": 7211} {"train_info/time_between_train_steps": 0.0032389163970947266, "step": 7211} {"info/global_step": 7212, "train_info/time_within_train_step": 2.66184663772583, "step": 7212} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 7212} {"info/global_step": 7213, "train_info/time_within_train_step": 2.6559457778930664, "step": 7213} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 7213} {"info/global_step": 7214, "train_info/time_within_train_step": 2.648775100708008, "step": 7214} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 7214} {"info/global_step": 7215, "train_info/time_within_train_step": 2.6468231678009033, "step": 7215} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 7215} {"info/global_step": 7216, "train_info/time_within_train_step": 2.659245014190674, "step": 7216} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 7216} {"info/global_step": 7217, "train_info/time_within_train_step": 2.7923452854156494, "step": 7217} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 7217} {"info/global_step": 7218, "train_info/time_within_train_step": 2.6447956562042236, "step": 7218} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 7218} {"info/global_step": 7219, "train_info/time_within_train_step": 2.647442102432251, "step": 7219} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 7219} {"info/global_step": 7220, "train_info/time_within_train_step": 2.65041446685791, "step": 7220} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 7220} {"info/global_step": 7221, "train_info/time_within_train_step": 2.6712186336517334, "step": 7221} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 7221} {"info/global_step": 7222, "train_info/time_within_train_step": 2.662959337234497, "step": 7222} {"train_info/time_between_train_steps": 0.003344297409057617, "step": 7222} {"info/global_step": 7223, "train_info/time_within_train_step": 2.6629905700683594, "step": 7223} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 7223} {"info/global_step": 7224, "train_info/time_within_train_step": 2.7012903690338135, "step": 7224} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 7224} {"info/global_step": 7225, "train_info/time_within_train_step": 2.6617977619171143, "step": 7225} {"train_info/time_between_train_steps": 0.006524324417114258, "step": 7225} {"info/global_step": 7226, "train_info/time_within_train_step": 2.6484384536743164, "step": 7226} {"train_info/time_between_train_steps": 0.006558656692504883, "step": 7226} {"info/global_step": 7227, "train_info/time_within_train_step": 2.643261194229126, "step": 7227} {"train_info/time_between_train_steps": 0.006529331207275391, "step": 7227} {"info/global_step": 7228, "train_info/time_within_train_step": 2.6590428352355957, "step": 7228} {"train_info/time_between_train_steps": 0.006502628326416016, "step": 7228} {"info/global_step": 7229, "train_info/time_within_train_step": 2.6541359424591064, "step": 7229} {"train_info/time_between_train_steps": 0.006543636322021484, "step": 7229} {"info/global_step": 7230, "train_info/time_within_train_step": 2.645475149154663, "step": 7230} {"train_info/time_between_train_steps": 0.00652623176574707, "step": 7230} {"info/global_step": 7231, "train_info/time_within_train_step": 2.66070294380188, "step": 7231} {"train_info/time_between_train_steps": 0.006547689437866211, "step": 7231} {"info/global_step": 7232, "train_info/time_within_train_step": 2.65338134765625, "step": 7232} {"train_info/time_between_train_steps": 0.006541013717651367, "step": 7232} {"info/global_step": 7233, "train_info/time_within_train_step": 2.660569190979004, "step": 7233} {"train_info/time_between_train_steps": 0.0065882205963134766, "step": 7233} {"info/global_step": 7234, "train_info/time_within_train_step": 2.6943023204803467, "step": 7234} {"train_info/time_between_train_steps": 0.006582975387573242, "step": 7234} {"info/global_step": 7235, "train_info/time_within_train_step": 2.729465961456299, "step": 7235} {"train_info/time_between_train_steps": 0.0065174102783203125, "step": 7235} {"info/global_step": 7236, "train_info/time_within_train_step": 2.656370162963867, "step": 7236} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 7236} {"info/global_step": 7237, "train_info/time_within_train_step": 2.644514799118042, "step": 7237} {"train_info/time_between_train_steps": 0.006452083587646484, "step": 7237} {"info/global_step": 7238, "train_info/time_within_train_step": 2.64898943901062, "step": 7238} {"train_info/time_between_train_steps": 0.006549358367919922, "step": 7238} {"info/global_step": 7239, "train_info/time_within_train_step": 2.6557555198669434, "step": 7239} {"train_info/time_between_train_steps": 0.00649571418762207, "step": 7239} {"info/global_step": 7240, "train_info/time_within_train_step": 2.655564546585083, "step": 7240} {"train_info/time_between_train_steps": 0.006439924240112305, "step": 7240} {"info/global_step": 7241, "train_info/time_within_train_step": 2.645246982574463, "step": 7241} {"train_info/time_between_train_steps": 0.006493330001831055, "step": 7241} {"info/global_step": 7242, "train_info/time_within_train_step": 2.652078866958618, "step": 7242} {"train_info/time_between_train_steps": 0.006516456604003906, "step": 7242} {"info/global_step": 7243, "train_info/time_within_train_step": 2.653893232345581, "step": 7243} {"train_info/time_between_train_steps": 0.006491422653198242, "step": 7243} {"info/global_step": 7244, "train_info/time_within_train_step": 2.6694743633270264, "step": 7244} {"train_info/time_between_train_steps": 0.006571054458618164, "step": 7244} {"info/global_step": 7245, "train_info/time_within_train_step": 2.710036039352417, "step": 7245} {"train_info/time_between_train_steps": 0.006533622741699219, "step": 7245} {"info/global_step": 7246, "train_info/time_within_train_step": 2.6481149196624756, "step": 7246} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 7246} {"info/global_step": 7247, "train_info/time_within_train_step": 2.677757501602173, "step": 7247} {"train_info/time_between_train_steps": 0.0065653324127197266, "step": 7247} {"info/global_step": 7248, "train_info/time_within_train_step": 3.260270118713379, "step": 7248} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 7248} {"info/global_step": 7249, "train_info/time_within_train_step": 2.6525511741638184, "step": 7249} {"train_info/time_between_train_steps": 0.006499528884887695, "step": 7249} {"info/global_step": 7250, "train_info/time_within_train_step": 2.645617961883545, "step": 7250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917767, "_runtime": 20365}, "step": 7250} {"logs": {"train/loss": 3.2354, "train/learning_rate": 0.00018333333333333334, "train/epoch": 8.03, "_timestamp": 1746917767, "_runtime": 20365}, "step": 7250} {"train_info/time_between_train_steps": 0.024606704711914062, "step": 7250} {"info/global_step": 7251, "train_info/time_within_train_step": 2.664994478225708, "step": 7251} {"train_info/time_between_train_steps": 0.0034592151641845703, "step": 7251} {"info/global_step": 7252, "train_info/time_within_train_step": 2.916621446609497, "step": 7252} {"train_info/time_between_train_steps": 0.006512641906738281, "step": 7252} {"info/global_step": 7253, "train_info/time_within_train_step": 2.644104242324829, "step": 7253} {"train_info/time_between_train_steps": 0.006575345993041992, "step": 7253} {"info/global_step": 7254, "train_info/time_within_train_step": 2.6487479209899902, "step": 7254} {"train_info/time_between_train_steps": 0.006547212600708008, "step": 7254} {"info/global_step": 7255, "train_info/time_within_train_step": 2.656726121902466, "step": 7255} {"train_info/time_between_train_steps": 0.0065135955810546875, "step": 7255} {"info/global_step": 7256, "train_info/time_within_train_step": 2.6686058044433594, "step": 7256} {"train_info/time_between_train_steps": 0.006540536880493164, "step": 7256} {"info/global_step": 7257, "train_info/time_within_train_step": 2.645082950592041, "step": 7257} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 7257} {"info/global_step": 7258, "train_info/time_within_train_step": 2.664669990539551, "step": 7258} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 7258} {"info/global_step": 7259, "train_info/time_within_train_step": 2.6495440006256104, "step": 7259} {"train_info/time_between_train_steps": 0.0033576488494873047, "step": 7259} {"info/global_step": 7260, "train_info/time_within_train_step": 2.6456387042999268, "step": 7260} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 7260} {"info/global_step": 7261, "train_info/time_within_train_step": 2.650742292404175, "step": 7261} {"train_info/time_between_train_steps": 0.0034427642822265625, "step": 7261} {"info/global_step": 7262, "train_info/time_within_train_step": 2.6477320194244385, "step": 7262} {"train_info/time_between_train_steps": 0.00354766845703125, "step": 7262} {"info/global_step": 7263, "train_info/time_within_train_step": 2.64499831199646, "step": 7263} {"train_info/time_between_train_steps": 0.003345012664794922, "step": 7263} {"info/global_step": 7264, "train_info/time_within_train_step": 2.648855209350586, "step": 7264} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 7264} {"info/global_step": 7265, "train_info/time_within_train_step": 2.657317638397217, "step": 7265} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 7265} {"info/global_step": 7266, "train_info/time_within_train_step": 2.6676955223083496, "step": 7266} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 7266} {"info/global_step": 7267, "train_info/time_within_train_step": 2.6430327892303467, "step": 7267} {"train_info/time_between_train_steps": 0.006462812423706055, "step": 7267} {"info/global_step": 7268, "train_info/time_within_train_step": 2.645221710205078, "step": 7268} {"train_info/time_between_train_steps": 0.0065958499908447266, "step": 7268} {"info/global_step": 7269, "train_info/time_within_train_step": 2.6523306369781494, "step": 7269} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 7269} {"info/global_step": 7270, "train_info/time_within_train_step": 2.6527459621429443, "step": 7270} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 7270} {"info/global_step": 7271, "train_info/time_within_train_step": 2.6678647994995117, "step": 7271} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 7271} {"info/global_step": 7272, "train_info/time_within_train_step": 2.711117744445801, "step": 7272} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 7272} {"info/global_step": 7273, "train_info/time_within_train_step": 2.645979166030884, "step": 7273} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 7273} {"info/global_step": 7274, "train_info/time_within_train_step": 2.6583969593048096, "step": 7274} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 7274} {"info/global_step": 7275, "train_info/time_within_train_step": 2.647677183151245, "step": 7275} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 7275} {"info/global_step": 7276, "train_info/time_within_train_step": 2.646420955657959, "step": 7276} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 7276} {"info/global_step": 7277, "train_info/time_within_train_step": 2.6553542613983154, "step": 7277} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 7277} {"info/global_step": 7278, "train_info/time_within_train_step": 2.6439757347106934, "step": 7278} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 7278} {"info/global_step": 7279, "train_info/time_within_train_step": 2.645298957824707, "step": 7279} {"train_info/time_between_train_steps": 0.1330878734588623, "step": 7279} {"info/global_step": 7280, "train_info/time_within_train_step": 2.643953800201416, "step": 7280} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 7280} {"info/global_step": 7281, "train_info/time_within_train_step": 2.649845838546753, "step": 7281} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 7281} {"info/global_step": 7282, "train_info/time_within_train_step": 2.651512861251831, "step": 7282} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 7282} {"info/global_step": 7283, "train_info/time_within_train_step": 2.6471214294433594, "step": 7283} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 7283} {"info/global_step": 7284, "train_info/time_within_train_step": 2.6649911403656006, "step": 7284} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 7284} {"info/global_step": 7285, "train_info/time_within_train_step": 2.644421339035034, "step": 7285} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 7285} {"info/global_step": 7286, "train_info/time_within_train_step": 2.649324417114258, "step": 7286} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 7286} {"info/global_step": 7287, "train_info/time_within_train_step": 2.667948007583618, "step": 7287} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 7287} {"info/global_step": 7288, "train_info/time_within_train_step": 2.6597859859466553, "step": 7288} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 7288} {"info/global_step": 7289, "train_info/time_within_train_step": 2.67657208442688, "step": 7289} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 7289} {"info/global_step": 7290, "train_info/time_within_train_step": 2.6704659461975098, "step": 7290} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 7290} {"info/global_step": 7291, "train_info/time_within_train_step": 2.677736520767212, "step": 7291} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 7291} {"info/global_step": 7292, "train_info/time_within_train_step": 2.640873432159424, "step": 7292} {"train_info/time_between_train_steps": 0.003204345703125, "step": 7292} {"info/global_step": 7293, "train_info/time_within_train_step": 2.640923023223877, "step": 7293} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 7293} {"info/global_step": 7294, "train_info/time_within_train_step": 2.6577112674713135, "step": 7294} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 7294} {"info/global_step": 7295, "train_info/time_within_train_step": 2.6534080505371094, "step": 7295} {"train_info/time_between_train_steps": 0.003267526626586914, "step": 7295} {"info/global_step": 7296, "train_info/time_within_train_step": 2.6438937187194824, "step": 7296} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 7296} {"info/global_step": 7297, "train_info/time_within_train_step": 2.659087896347046, "step": 7297} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 7297} {"info/global_step": 7298, "train_info/time_within_train_step": 2.654010534286499, "step": 7298} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 7298} {"info/global_step": 7299, "train_info/time_within_train_step": 2.664933919906616, "step": 7299} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 7299} {"info/global_step": 7300, "train_info/time_within_train_step": 2.722747564315796, "step": 7300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746917903, "_runtime": 20501}, "step": 7300} {"logs": {"train/loss": 3.2122, "train/learning_rate": 0.00017999999999999998, "train/epoch": 8.04, "_timestamp": 1746917903, "_runtime": 20501}, "step": 7300} {"train_info/time_between_train_steps": 0.024677276611328125, "step": 7300} {"info/global_step": 7301, "train_info/time_within_train_step": 2.7285289764404297, "step": 7301} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 7301} {"info/global_step": 7302, "train_info/time_within_train_step": 2.662320137023926, "step": 7302} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 7302} {"info/global_step": 7303, "train_info/time_within_train_step": 2.641231060028076, "step": 7303} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 7303} {"info/global_step": 7304, "train_info/time_within_train_step": 2.652867555618286, "step": 7304} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 7304} {"info/global_step": 7305, "train_info/time_within_train_step": 2.648430824279785, "step": 7305} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 7305} {"info/global_step": 7306, "train_info/time_within_train_step": 2.6495938301086426, "step": 7306} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 7306} {"info/global_step": 7307, "train_info/time_within_train_step": 2.6453840732574463, "step": 7307} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 7307} {"info/global_step": 7308, "train_info/time_within_train_step": 2.6467556953430176, "step": 7308} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 7308} {"info/global_step": 7309, "train_info/time_within_train_step": 2.661080837249756, "step": 7309} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 7309} {"info/global_step": 7310, "train_info/time_within_train_step": 2.6641647815704346, "step": 7310} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 7310} {"info/global_step": 7311, "train_info/time_within_train_step": 2.695784091949463, "step": 7311} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 7311} {"info/global_step": 7312, "train_info/time_within_train_step": 2.646557331085205, "step": 7312} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 7312} {"info/global_step": 7313, "train_info/time_within_train_step": 2.641134023666382, "step": 7313} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 7313} {"info/global_step": 7314, "train_info/time_within_train_step": 2.65681529045105, "step": 7314} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 7314} {"info/global_step": 7315, "train_info/time_within_train_step": 2.6581320762634277, "step": 7315} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 7315} {"info/global_step": 7316, "train_info/time_within_train_step": 2.6438400745391846, "step": 7316} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 7316} {"info/global_step": 7317, "train_info/time_within_train_step": 2.6515262126922607, "step": 7317} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 7317} {"info/global_step": 7318, "train_info/time_within_train_step": 2.6859567165374756, "step": 7318} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 7318} {"info/global_step": 7319, "train_info/time_within_train_step": 2.6549415588378906, "step": 7319} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 7319} {"info/global_step": 7320, "train_info/time_within_train_step": 2.6565604209899902, "step": 7320} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 7320} {"info/global_step": 7321, "train_info/time_within_train_step": 2.646954298019409, "step": 7321} {"train_info/time_between_train_steps": 0.003249645233154297, "step": 7321} {"info/global_step": 7322, "train_info/time_within_train_step": 2.647686719894409, "step": 7322} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 7322} {"info/global_step": 7323, "train_info/time_within_train_step": 2.6502928733825684, "step": 7323} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 7323} {"info/global_step": 7324, "train_info/time_within_train_step": 2.6489460468292236, "step": 7324} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 7324} {"info/global_step": 7325, "train_info/time_within_train_step": 2.643069267272949, "step": 7325} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 7325} {"info/global_step": 7326, "train_info/time_within_train_step": 2.6413185596466064, "step": 7326} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 7326} {"info/global_step": 7327, "train_info/time_within_train_step": 2.64129900932312, "step": 7327} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 7327} {"info/global_step": 7328, "train_info/time_within_train_step": 2.6554148197174072, "step": 7328} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 7328} {"info/global_step": 7329, "train_info/time_within_train_step": 2.653369903564453, "step": 7329} {"train_info/time_between_train_steps": 0.0032553672790527344, "step": 7329} {"info/global_step": 7330, "train_info/time_within_train_step": 2.6436049938201904, "step": 7330} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 7330} {"info/global_step": 7331, "train_info/time_within_train_step": 2.6622650623321533, "step": 7331} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 7331} {"info/global_step": 7332, "train_info/time_within_train_step": 2.6538519859313965, "step": 7332} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 7332} {"info/global_step": 7333, "train_info/time_within_train_step": 2.6667964458465576, "step": 7333} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 7333} {"info/global_step": 7334, "train_info/time_within_train_step": 2.7250218391418457, "step": 7334} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 7334} {"info/global_step": 7335, "train_info/time_within_train_step": 2.6714563369750977, "step": 7335} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 7335} {"info/global_step": 7336, "train_info/time_within_train_step": 2.6402297019958496, "step": 7336} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 7336} {"info/global_step": 7337, "train_info/time_within_train_step": 2.6462910175323486, "step": 7337} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 7337} {"info/global_step": 7338, "train_info/time_within_train_step": 2.654400587081909, "step": 7338} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 7338} {"info/global_step": 7339, "train_info/time_within_train_step": 2.6533291339874268, "step": 7339} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 7339} {"info/global_step": 7340, "train_info/time_within_train_step": 2.643557071685791, "step": 7340} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 7340} {"info/global_step": 7341, "train_info/time_within_train_step": 2.64654803276062, "step": 7341} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 7341} {"info/global_step": 7342, "train_info/time_within_train_step": 2.7896642684936523, "step": 7342} {"train_info/time_between_train_steps": 0.0032961368560791016, "step": 7342} {"info/global_step": 7343, "train_info/time_within_train_step": 2.6499462127685547, "step": 7343} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 7343} {"info/global_step": 7344, "train_info/time_within_train_step": 2.6595914363861084, "step": 7344} {"train_info/time_between_train_steps": 0.003367900848388672, "step": 7344} {"info/global_step": 7345, "train_info/time_within_train_step": 2.66565203666687, "step": 7345} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 7345} {"info/global_step": 7346, "train_info/time_within_train_step": 2.6989662647247314, "step": 7346} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 7346} {"info/global_step": 7347, "train_info/time_within_train_step": 2.6449244022369385, "step": 7347} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 7347} {"info/global_step": 7348, "train_info/time_within_train_step": 2.6454973220825195, "step": 7348} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 7348} {"info/global_step": 7349, "train_info/time_within_train_step": 2.6556544303894043, "step": 7349} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 7349} {"info/global_step": 7350, "train_info/time_within_train_step": 2.6525425910949707, "step": 7350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746918037, "_runtime": 20635}, "step": 7350} {"logs": {"train/loss": 3.2177, "train/learning_rate": 0.00017666666666666666, "train/epoch": 8.04, "_timestamp": 1746918037, "_runtime": 20635}, "step": 7350} {"train_info/time_between_train_steps": 0.02416539192199707, "step": 7350} {"info/global_step": 7351, "train_info/time_within_train_step": 2.6628506183624268, "step": 7351} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 7351} {"info/global_step": 7352, "train_info/time_within_train_step": 2.6446051597595215, "step": 7352} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 7352} {"info/global_step": 7353, "train_info/time_within_train_step": 2.919835329055786, "step": 7353} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 7353} {"info/global_step": 7354, "train_info/time_within_train_step": 2.648500680923462, "step": 7354} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 7354} {"info/global_step": 7355, "train_info/time_within_train_step": 2.659526824951172, "step": 7355} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 7355} {"info/global_step": 7356, "train_info/time_within_train_step": 2.643326759338379, "step": 7356} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 7356} {"info/global_step": 7357, "train_info/time_within_train_step": 2.6458191871643066, "step": 7357} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 7357} {"info/global_step": 7358, "train_info/time_within_train_step": 2.6695756912231445, "step": 7358} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 7358} {"info/global_step": 7359, "train_info/time_within_train_step": 2.6657397747039795, "step": 7359} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 7359} {"info/global_step": 7360, "train_info/time_within_train_step": 2.6718087196350098, "step": 7360} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 7360} {"info/global_step": 7361, "train_info/time_within_train_step": 2.6705901622772217, "step": 7361} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 7361} {"info/global_step": 7362, "train_info/time_within_train_step": 2.6442453861236572, "step": 7362} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 7362} {"info/global_step": 7363, "train_info/time_within_train_step": 2.641602039337158, "step": 7363} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 7363} {"info/global_step": 7364, "train_info/time_within_train_step": 2.659801483154297, "step": 7364} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 7364} {"info/global_step": 7365, "train_info/time_within_train_step": 2.64789080619812, "step": 7365} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 7365} {"info/global_step": 7366, "train_info/time_within_train_step": 2.653022527694702, "step": 7366} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 7366} {"info/global_step": 7367, "train_info/time_within_train_step": 2.660374641418457, "step": 7367} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 7367} {"info/global_step": 7368, "train_info/time_within_train_step": 2.673696756362915, "step": 7368} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 7368} {"info/global_step": 7369, "train_info/time_within_train_step": 2.663403272628784, "step": 7369} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 7369} {"info/global_step": 7370, "train_info/time_within_train_step": 2.707360029220581, "step": 7370} {"train_info/time_between_train_steps": 0.0032570362091064453, "step": 7370} {"info/global_step": 7371, "train_info/time_within_train_step": 2.640359878540039, "step": 7371} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 7371} {"info/global_step": 7372, "train_info/time_within_train_step": 2.6484739780426025, "step": 7372} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 7372} {"info/global_step": 7373, "train_info/time_within_train_step": 2.6608126163482666, "step": 7373} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 7373} {"info/global_step": 7374, "train_info/time_within_train_step": 2.6470117568969727, "step": 7374} {"train_info/time_between_train_steps": 0.0032892227172851562, "step": 7374} {"info/global_step": 7375, "train_info/time_within_train_step": 2.644097089767456, "step": 7375} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 7375} {"info/global_step": 7376, "train_info/time_within_train_step": 2.6597044467926025, "step": 7376} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 7376} {"info/global_step": 7377, "train_info/time_within_train_step": 2.657719373703003, "step": 7377} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 7377} {"info/global_step": 7378, "train_info/time_within_train_step": 2.6603989601135254, "step": 7378} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 7378} {"info/global_step": 7379, "train_info/time_within_train_step": 2.6833386421203613, "step": 7379} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 7379} {"info/global_step": 7380, "train_info/time_within_train_step": 2.724210262298584, "step": 7380} {"train_info/time_between_train_steps": 0.0033102035522460938, "step": 7380} {"info/global_step": 7381, "train_info/time_within_train_step": 2.6531970500946045, "step": 7381} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 7381} {"info/global_step": 7382, "train_info/time_within_train_step": 2.6475789546966553, "step": 7382} {"train_info/time_between_train_steps": 0.003239870071411133, "step": 7382} {"info/global_step": 7383, "train_info/time_within_train_step": 2.649401903152466, "step": 7383} {"train_info/time_between_train_steps": 0.0032501220703125, "step": 7383} {"info/global_step": 7384, "train_info/time_within_train_step": 2.6451871395111084, "step": 7384} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 7384} {"info/global_step": 7385, "train_info/time_within_train_step": 2.6459085941314697, "step": 7385} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 7385} {"info/global_step": 7386, "train_info/time_within_train_step": 2.6616618633270264, "step": 7386} {"train_info/time_between_train_steps": 0.0036492347717285156, "step": 7386} {"info/global_step": 7387, "train_info/time_within_train_step": 2.665076494216919, "step": 7387} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 7387} {"info/global_step": 7388, "train_info/time_within_train_step": 2.6980435848236084, "step": 7388} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 7388} {"info/global_step": 7389, "train_info/time_within_train_step": 2.6454954147338867, "step": 7389} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 7389} {"info/global_step": 7390, "train_info/time_within_train_step": 2.6440067291259766, "step": 7390} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 7390} {"info/global_step": 7391, "train_info/time_within_train_step": 2.6528754234313965, "step": 7391} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 7391} {"info/global_step": 7392, "train_info/time_within_train_step": 2.651310920715332, "step": 7392} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 7392} {"info/global_step": 7393, "train_info/time_within_train_step": 2.642670154571533, "step": 7393} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 7393} {"info/global_step": 7394, "train_info/time_within_train_step": 2.643765449523926, "step": 7394} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 7394} {"info/global_step": 7395, "train_info/time_within_train_step": 2.665849208831787, "step": 7395} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 7395} {"info/global_step": 7396, "train_info/time_within_train_step": 2.6688177585601807, "step": 7396} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 7396} {"info/global_step": 7397, "train_info/time_within_train_step": 2.6669888496398926, "step": 7397} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 7397} {"info/global_step": 7398, "train_info/time_within_train_step": 2.663705348968506, "step": 7398} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 7398} {"info/global_step": 7399, "train_info/time_within_train_step": 2.6758251190185547, "step": 7399} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 7399} {"info/global_step": 7400, "train_info/time_within_train_step": 2.640883684158325, "step": 7400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746918171, "_runtime": 20769}, "step": 7400} {"logs": {"train/loss": 3.2034, "train/learning_rate": 0.0001733333333333333, "train/epoch": 8.05, "_timestamp": 1746918171, "_runtime": 20769}, "step": 7400} {"train_info/time_between_train_steps": 13.230282545089722, "step": 7400} {"info/global_step": 7401, "train_info/time_within_train_step": 2.4401800632476807, "step": 7401} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 7401} {"info/global_step": 7402, "train_info/time_within_train_step": 2.4329755306243896, "step": 7402} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 7402} {"info/global_step": 7403, "train_info/time_within_train_step": 2.6566991806030273, "step": 7403} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 7403} {"info/global_step": 7404, "train_info/time_within_train_step": 2.643354892730713, "step": 7404} {"train_info/time_between_train_steps": 0.11408734321594238, "step": 7404} {"info/global_step": 7405, "train_info/time_within_train_step": 2.707854747772217, "step": 7405} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 7405} {"info/global_step": 7406, "train_info/time_within_train_step": 2.6393280029296875, "step": 7406} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 7406} {"info/global_step": 7407, "train_info/time_within_train_step": 2.6507973670959473, "step": 7407} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 7407} {"info/global_step": 7408, "train_info/time_within_train_step": 2.6524550914764404, "step": 7408} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 7408} {"info/global_step": 7409, "train_info/time_within_train_step": 2.6506271362304688, "step": 7409} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 7409} {"info/global_step": 7410, "train_info/time_within_train_step": 2.6492669582366943, "step": 7410} {"train_info/time_between_train_steps": 0.0065042972564697266, "step": 7410} {"info/global_step": 7411, "train_info/time_within_train_step": 2.645188570022583, "step": 7411} {"train_info/time_between_train_steps": 0.006567955017089844, "step": 7411} {"info/global_step": 7412, "train_info/time_within_train_step": 2.6482341289520264, "step": 7412} {"train_info/time_between_train_steps": 0.006598234176635742, "step": 7412} {"info/global_step": 7413, "train_info/time_within_train_step": 2.67040753364563, "step": 7413} {"train_info/time_between_train_steps": 0.006594181060791016, "step": 7413} {"info/global_step": 7414, "train_info/time_within_train_step": 2.6818346977233887, "step": 7414} {"train_info/time_between_train_steps": 0.006510257720947266, "step": 7414} {"info/global_step": 7415, "train_info/time_within_train_step": 2.6524806022644043, "step": 7415} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 7415} {"info/global_step": 7416, "train_info/time_within_train_step": 2.692997932434082, "step": 7416} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 7416} {"info/global_step": 7417, "train_info/time_within_train_step": 2.642333984375, "step": 7417} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 7417} {"info/global_step": 7418, "train_info/time_within_train_step": 2.6494858264923096, "step": 7418} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 7418} {"info/global_step": 7419, "train_info/time_within_train_step": 2.6607205867767334, "step": 7419} {"train_info/time_between_train_steps": 0.0033102035522460938, "step": 7419} {"info/global_step": 7420, "train_info/time_within_train_step": 2.665194272994995, "step": 7420} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 7420} {"info/global_step": 7421, "train_info/time_within_train_step": 2.970573902130127, "step": 7421} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 7421} {"info/global_step": 7422, "train_info/time_within_train_step": 2.656744956970215, "step": 7422} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 7422} {"info/global_step": 7423, "train_info/time_within_train_step": 2.662519931793213, "step": 7423} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 7423} {"info/global_step": 7424, "train_info/time_within_train_step": 2.6771719455718994, "step": 7424} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 7424} {"info/global_step": 7425, "train_info/time_within_train_step": 2.6649973392486572, "step": 7425} {"train_info/time_between_train_steps": 0.00323486328125, "step": 7425} {"info/global_step": 7426, "train_info/time_within_train_step": 2.701503038406372, "step": 7426} {"train_info/time_between_train_steps": 0.006540060043334961, "step": 7426} {"info/global_step": 7427, "train_info/time_within_train_step": 2.642017126083374, "step": 7427} {"train_info/time_between_train_steps": 0.0065038204193115234, "step": 7427} {"info/global_step": 7428, "train_info/time_within_train_step": 2.6499106884002686, "step": 7428} {"train_info/time_between_train_steps": 0.0066204071044921875, "step": 7428} {"info/global_step": 7429, "train_info/time_within_train_step": 2.6605966091156006, "step": 7429} {"train_info/time_between_train_steps": 0.006535530090332031, "step": 7429} {"info/global_step": 7430, "train_info/time_within_train_step": 2.643033027648926, "step": 7430} {"train_info/time_between_train_steps": 0.0065500736236572266, "step": 7430} {"info/global_step": 7431, "train_info/time_within_train_step": 2.6507651805877686, "step": 7431} {"train_info/time_between_train_steps": 0.006573200225830078, "step": 7431} {"info/global_step": 7432, "train_info/time_within_train_step": 2.6467971801757812, "step": 7432} {"train_info/time_between_train_steps": 0.006578207015991211, "step": 7432} {"info/global_step": 7433, "train_info/time_within_train_step": 2.656381845474243, "step": 7433} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 7433} {"info/global_step": 7434, "train_info/time_within_train_step": 2.6570329666137695, "step": 7434} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 7434} {"info/global_step": 7435, "train_info/time_within_train_step": 2.672356367111206, "step": 7435} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 7435} {"info/global_step": 7436, "train_info/time_within_train_step": 2.7288618087768555, "step": 7436} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 7436} {"info/global_step": 7437, "train_info/time_within_train_step": 2.662748098373413, "step": 7437} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 7437} {"info/global_step": 7438, "train_info/time_within_train_step": 2.6424262523651123, "step": 7438} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 7438} {"info/global_step": 7439, "train_info/time_within_train_step": 2.655278205871582, "step": 7439} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 7439} {"info/global_step": 7440, "train_info/time_within_train_step": 2.6487538814544678, "step": 7440} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 7440} {"info/global_step": 7441, "train_info/time_within_train_step": 2.654371738433838, "step": 7441} {"train_info/time_between_train_steps": 0.003335714340209961, "step": 7441} {"info/global_step": 7442, "train_info/time_within_train_step": 2.6594953536987305, "step": 7442} {"train_info/time_between_train_steps": 0.0032989978790283203, "step": 7442} {"info/global_step": 7443, "train_info/time_within_train_step": 2.665550947189331, "step": 7443} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 7443} {"info/global_step": 7444, "train_info/time_within_train_step": 2.696528434753418, "step": 7444} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 7444} {"info/global_step": 7445, "train_info/time_within_train_step": 2.6468212604522705, "step": 7445} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 7445} {"info/global_step": 7446, "train_info/time_within_train_step": 2.6436216831207275, "step": 7446} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 7446} {"info/global_step": 7447, "train_info/time_within_train_step": 2.6541097164154053, "step": 7447} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 7447} {"info/global_step": 7448, "train_info/time_within_train_step": 2.6528263092041016, "step": 7448} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 7448} {"info/global_step": 7449, "train_info/time_within_train_step": 2.6456611156463623, "step": 7449} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 7449} {"info/global_step": 7450, "train_info/time_within_train_step": 2.6457042694091797, "step": 7450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746918319, "_runtime": 20917}, "step": 7450} {"logs": {"train/loss": 3.1885, "train/learning_rate": 0.00016999999999999999, "train/epoch": 8.05, "_timestamp": 1746918319, "_runtime": 20917}, "step": 7450} {"train_info/time_between_train_steps": 0.02452707290649414, "step": 7450} {"info/global_step": 7451, "train_info/time_within_train_step": 2.6445460319519043, "step": 7451} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 7451} {"info/global_step": 7452, "train_info/time_within_train_step": 2.6650125980377197, "step": 7452} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 7452} {"info/global_step": 7453, "train_info/time_within_train_step": 2.66556978225708, "step": 7453} {"train_info/time_between_train_steps": 0.006539583206176758, "step": 7453} {"info/global_step": 7454, "train_info/time_within_train_step": 2.6880717277526855, "step": 7454} {"train_info/time_between_train_steps": 0.006585597991943359, "step": 7454} {"info/global_step": 7455, "train_info/time_within_train_step": 2.680208683013916, "step": 7455} {"train_info/time_between_train_steps": 0.006066322326660156, "step": 7455} {"info/global_step": 7456, "train_info/time_within_train_step": 2.68373966217041, "step": 7456} {"train_info/time_between_train_steps": 0.00608515739440918, "step": 7456} {"info/global_step": 7457, "train_info/time_within_train_step": 2.6398637294769287, "step": 7457} {"train_info/time_between_train_steps": 0.006059885025024414, "step": 7457} {"info/global_step": 7458, "train_info/time_within_train_step": 2.651449203491211, "step": 7458} {"train_info/time_between_train_steps": 0.005490303039550781, "step": 7458} {"info/global_step": 7459, "train_info/time_within_train_step": 2.658480167388916, "step": 7459} {"train_info/time_between_train_steps": 0.006060600280761719, "step": 7459} {"info/global_step": 7460, "train_info/time_within_train_step": 2.647416830062866, "step": 7460} {"train_info/time_between_train_steps": 0.006139039993286133, "step": 7460} {"info/global_step": 7461, "train_info/time_within_train_step": 2.6439437866210938, "step": 7461} {"train_info/time_between_train_steps": 0.006116390228271484, "step": 7461} {"info/global_step": 7462, "train_info/time_within_train_step": 2.6552700996398926, "step": 7462} {"train_info/time_between_train_steps": 0.006137847900390625, "step": 7462} {"info/global_step": 7463, "train_info/time_within_train_step": 2.6605165004730225, "step": 7463} {"train_info/time_between_train_steps": 0.006044149398803711, "step": 7463} {"info/global_step": 7464, "train_info/time_within_train_step": 2.651215076446533, "step": 7464} {"train_info/time_between_train_steps": 0.0030710697174072266, "step": 7464} {"info/global_step": 7465, "train_info/time_within_train_step": 2.6452882289886475, "step": 7465} {"train_info/time_between_train_steps": 0.0030586719512939453, "step": 7465} {"info/global_step": 7466, "train_info/time_within_train_step": 2.6444082260131836, "step": 7466} {"train_info/time_between_train_steps": 0.0030241012573242188, "step": 7466} {"info/global_step": 7467, "train_info/time_within_train_step": 2.645240545272827, "step": 7467} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 7467} {"info/global_step": 7468, "train_info/time_within_train_step": 2.643496513366699, "step": 7468} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 7468} {"info/global_step": 7469, "train_info/time_within_train_step": 2.647784948348999, "step": 7469} {"train_info/time_between_train_steps": 0.005312681198120117, "step": 7469} {"info/global_step": 7470, "train_info/time_within_train_step": 2.6534340381622314, "step": 7470} {"train_info/time_between_train_steps": 0.006073951721191406, "step": 7470} {"info/global_step": 7471, "train_info/time_within_train_step": 2.6402695178985596, "step": 7471} {"train_info/time_between_train_steps": 0.006091117858886719, "step": 7471} {"info/global_step": 7472, "train_info/time_within_train_step": 2.6745290756225586, "step": 7472} {"train_info/time_between_train_steps": 0.005968570709228516, "step": 7472} {"info/global_step": 7473, "train_info/time_within_train_step": 2.6647908687591553, "step": 7473} {"train_info/time_between_train_steps": 0.0030252933502197266, "step": 7473} {"info/global_step": 7474, "train_info/time_within_train_step": 2.6646957397460938, "step": 7474} {"train_info/time_between_train_steps": 0.006110429763793945, "step": 7474} {"info/global_step": 7475, "train_info/time_within_train_step": 2.7072534561157227, "step": 7475} {"train_info/time_between_train_steps": 0.006214618682861328, "step": 7475} {"info/global_step": 7476, "train_info/time_within_train_step": 2.64064884185791, "step": 7476} {"train_info/time_between_train_steps": 0.0060672760009765625, "step": 7476} {"info/global_step": 7477, "train_info/time_within_train_step": 2.6542928218841553, "step": 7477} {"train_info/time_between_train_steps": 0.00608062744140625, "step": 7477} {"info/global_step": 7478, "train_info/time_within_train_step": 2.6451525688171387, "step": 7478} {"train_info/time_between_train_steps": 0.0060803890228271484, "step": 7478} {"info/global_step": 7479, "train_info/time_within_train_step": 2.6448147296905518, "step": 7479} {"train_info/time_between_train_steps": 0.006051778793334961, "step": 7479} {"info/global_step": 7480, "train_info/time_within_train_step": 2.656062364578247, "step": 7480} {"train_info/time_between_train_steps": 0.006090641021728516, "step": 7480} {"info/global_step": 7481, "train_info/time_within_train_step": 2.6418113708496094, "step": 7481} {"train_info/time_between_train_steps": 0.006085872650146484, "step": 7481} {"info/global_step": 7482, "train_info/time_within_train_step": 2.648925542831421, "step": 7482} {"train_info/time_between_train_steps": 0.006093740463256836, "step": 7482} {"info/global_step": 7483, "train_info/time_within_train_step": 2.6672322750091553, "step": 7483} {"train_info/time_between_train_steps": 0.006069660186767578, "step": 7483} {"info/global_step": 7484, "train_info/time_within_train_step": 2.8911783695220947, "step": 7484} {"train_info/time_between_train_steps": 0.003040313720703125, "step": 7484} {"info/global_step": 7485, "train_info/time_within_train_step": 2.6427981853485107, "step": 7485} {"train_info/time_between_train_steps": 0.006020069122314453, "step": 7485} {"info/global_step": 7486, "train_info/time_within_train_step": 2.659209966659546, "step": 7486} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 7486} {"info/global_step": 7487, "train_info/time_within_train_step": 2.6668214797973633, "step": 7487} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 7487} {"info/global_step": 7488, "train_info/time_within_train_step": 2.685073137283325, "step": 7488} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 7488} {"info/global_step": 7489, "train_info/time_within_train_step": 2.6514246463775635, "step": 7489} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 7489} {"info/global_step": 7490, "train_info/time_within_train_step": 2.673412799835205, "step": 7490} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 7490} {"info/global_step": 7491, "train_info/time_within_train_step": 2.641601800918579, "step": 7491} {"train_info/time_between_train_steps": 0.0028731822967529297, "step": 7491} {"info/global_step": 7492, "train_info/time_within_train_step": 2.662959098815918, "step": 7492} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 7492} {"info/global_step": 7493, "train_info/time_within_train_step": 2.6567447185516357, "step": 7493} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 7493} {"info/global_step": 7494, "train_info/time_within_train_step": 2.659154176712036, "step": 7494} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 7494} {"info/global_step": 7495, "train_info/time_within_train_step": 2.7000181674957275, "step": 7495} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 7495} {"info/global_step": 7496, "train_info/time_within_train_step": 2.652796983718872, "step": 7496} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 7496} {"info/global_step": 7497, "train_info/time_within_train_step": 2.646597146987915, "step": 7497} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 7497} {"info/global_step": 7498, "train_info/time_within_train_step": 3.23522686958313, "step": 7498} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 7498} {"info/global_step": 7499, "train_info/time_within_train_step": 2.643944025039673, "step": 7499} {"train_info/time_between_train_steps": 0.002960205078125, "step": 7499} {"info/global_step": 7500, "train_info/time_within_train_step": 2.65010929107666, "step": 7500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746918455, "_runtime": 21053}, "step": 7500} {"logs": {"train/loss": 3.1837, "train/learning_rate": 0.00016666666666666666, "train/epoch": 8.06, "_timestamp": 1746918455, "_runtime": 21053}, "step": 7500} {"train_info/time_between_train_steps": 0.02362990379333496, "step": 7500} {"info/global_step": 7501, "train_info/time_within_train_step": 2.664339065551758, "step": 7501} {"train_info/time_between_train_steps": 0.002959728240966797, "step": 7501} {"info/global_step": 7502, "train_info/time_within_train_step": 2.6546781063079834, "step": 7502} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 7502} {"info/global_step": 7503, "train_info/time_within_train_step": 2.6630852222442627, "step": 7503} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 7503} {"info/global_step": 7504, "train_info/time_within_train_step": 2.6916873455047607, "step": 7504} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 7504} {"info/global_step": 7505, "train_info/time_within_train_step": 2.649545907974243, "step": 7505} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 7505} {"info/global_step": 7506, "train_info/time_within_train_step": 2.6462485790252686, "step": 7506} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 7506} {"info/global_step": 7507, "train_info/time_within_train_step": 2.65771484375, "step": 7507} {"train_info/time_between_train_steps": 0.002940654754638672, "step": 7507} {"info/global_step": 7508, "train_info/time_within_train_step": 2.6423017978668213, "step": 7508} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 7508} {"info/global_step": 7509, "train_info/time_within_train_step": 2.652132511138916, "step": 7509} {"train_info/time_between_train_steps": 0.002933502197265625, "step": 7509} {"info/global_step": 7510, "train_info/time_within_train_step": 2.660633087158203, "step": 7510} {"train_info/time_between_train_steps": 0.002977609634399414, "step": 7510} {"info/global_step": 7511, "train_info/time_within_train_step": 2.6987833976745605, "step": 7511} {"train_info/time_between_train_steps": 0.002926349639892578, "step": 7511} {"info/global_step": 7512, "train_info/time_within_train_step": 2.7027482986450195, "step": 7512} {"train_info/time_between_train_steps": 0.0029649734497070312, "step": 7512} {"info/global_step": 7513, "train_info/time_within_train_step": 2.6404337882995605, "step": 7513} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 7513} {"info/global_step": 7514, "train_info/time_within_train_step": 2.6461448669433594, "step": 7514} {"train_info/time_between_train_steps": 0.0029449462890625, "step": 7514} {"info/global_step": 7515, "train_info/time_within_train_step": 2.6484146118164062, "step": 7515} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 7515} {"info/global_step": 7516, "train_info/time_within_train_step": 2.6481521129608154, "step": 7516} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 7516} {"info/global_step": 7517, "train_info/time_within_train_step": 2.644773006439209, "step": 7517} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 7517} {"info/global_step": 7518, "train_info/time_within_train_step": 2.64392352104187, "step": 7518} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 7518} {"info/global_step": 7519, "train_info/time_within_train_step": 2.665012836456299, "step": 7519} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 7519} {"info/global_step": 7520, "train_info/time_within_train_step": 2.6687159538269043, "step": 7520} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 7520} {"info/global_step": 7521, "train_info/time_within_train_step": 2.6758649349212646, "step": 7521} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 7521} {"info/global_step": 7522, "train_info/time_within_train_step": 2.6519980430603027, "step": 7522} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 7522} {"info/global_step": 7523, "train_info/time_within_train_step": 2.686516761779785, "step": 7523} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 7523} {"info/global_step": 7524, "train_info/time_within_train_step": 2.6399714946746826, "step": 7524} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 7524} {"info/global_step": 7525, "train_info/time_within_train_step": 2.647172451019287, "step": 7525} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 7525} {"info/global_step": 7526, "train_info/time_within_train_step": 2.664638042449951, "step": 7526} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 7526} {"info/global_step": 7527, "train_info/time_within_train_step": 2.6452205181121826, "step": 7527} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 7527} {"info/global_step": 7528, "train_info/time_within_train_step": 2.6434648036956787, "step": 7528} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 7528} {"info/global_step": 7529, "train_info/time_within_train_step": 2.6645002365112305, "step": 7529} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 7529} {"info/global_step": 7530, "train_info/time_within_train_step": 2.665619373321533, "step": 7530} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 7530} {"info/global_step": 7531, "train_info/time_within_train_step": 2.8447718620300293, "step": 7531} {"train_info/time_between_train_steps": 0.0030138492584228516, "step": 7531} {"info/global_step": 7532, "train_info/time_within_train_step": 2.662128210067749, "step": 7532} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 7532} {"info/global_step": 7533, "train_info/time_within_train_step": 2.6614151000976562, "step": 7533} {"train_info/time_between_train_steps": 0.006143808364868164, "step": 7533} {"info/global_step": 7534, "train_info/time_within_train_step": 2.673067331314087, "step": 7534} {"train_info/time_between_train_steps": 0.006051540374755859, "step": 7534} {"info/global_step": 7535, "train_info/time_within_train_step": 2.6638286113739014, "step": 7535} {"train_info/time_between_train_steps": 0.0061511993408203125, "step": 7535} {"info/global_step": 7536, "train_info/time_within_train_step": 2.7015719413757324, "step": 7536} {"train_info/time_between_train_steps": 0.006062507629394531, "step": 7536} {"info/global_step": 7537, "train_info/time_within_train_step": 2.639885187149048, "step": 7537} {"train_info/time_between_train_steps": 0.004857301712036133, "step": 7537} {"info/global_step": 7538, "train_info/time_within_train_step": 2.6475212574005127, "step": 7538} {"train_info/time_between_train_steps": 0.006069660186767578, "step": 7538} {"info/global_step": 7539, "train_info/time_within_train_step": 2.662419557571411, "step": 7539} {"train_info/time_between_train_steps": 0.006107330322265625, "step": 7539} {"info/global_step": 7540, "train_info/time_within_train_step": 2.6419525146484375, "step": 7540} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 7540} {"info/global_step": 7541, "train_info/time_within_train_step": 2.6445443630218506, "step": 7541} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 7541} {"info/global_step": 7542, "train_info/time_within_train_step": 2.64990234375, "step": 7542} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 7542} {"info/global_step": 7543, "train_info/time_within_train_step": 2.6521706581115723, "step": 7543} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 7543} {"info/global_step": 7544, "train_info/time_within_train_step": 2.659381151199341, "step": 7544} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 7544} {"info/global_step": 7545, "train_info/time_within_train_step": 2.6847944259643555, "step": 7545} {"train_info/time_between_train_steps": 0.002984285354614258, "step": 7545} {"info/global_step": 7546, "train_info/time_within_train_step": 2.7358462810516357, "step": 7546} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 7546} {"info/global_step": 7547, "train_info/time_within_train_step": 2.6548969745635986, "step": 7547} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 7547} {"info/global_step": 7548, "train_info/time_within_train_step": 2.639894962310791, "step": 7548} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 7548} {"info/global_step": 7549, "train_info/time_within_train_step": 2.656351327896118, "step": 7549} {"train_info/time_between_train_steps": 0.0029540061950683594, "step": 7549} {"info/global_step": 7550, "train_info/time_within_train_step": 2.648142099380493, "step": 7550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746918589, "_runtime": 21187}, "step": 7550} {"logs": {"train/loss": 3.1742, "train/learning_rate": 0.0001633333333333333, "train/epoch": 8.06, "_timestamp": 1746918589, "_runtime": 21187}, "step": 7550} {"train_info/time_between_train_steps": 0.024023771286010742, "step": 7550} {"info/global_step": 7551, "train_info/time_within_train_step": 2.653574228286743, "step": 7551} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 7551} {"info/global_step": 7552, "train_info/time_within_train_step": 2.6434216499328613, "step": 7552} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 7552} {"info/global_step": 7553, "train_info/time_within_train_step": 2.6482467651367188, "step": 7553} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 7553} {"info/global_step": 7554, "train_info/time_within_train_step": 2.6584312915802, "step": 7554} {"train_info/time_between_train_steps": 0.0029718875885009766, "step": 7554} {"info/global_step": 7555, "train_info/time_within_train_step": 2.6656835079193115, "step": 7555} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 7555} {"info/global_step": 7556, "train_info/time_within_train_step": 2.6984705924987793, "step": 7556} {"train_info/time_between_train_steps": 0.0028824806213378906, "step": 7556} {"info/global_step": 7557, "train_info/time_within_train_step": 2.644131898880005, "step": 7557} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 7557} {"info/global_step": 7558, "train_info/time_within_train_step": 2.645503044128418, "step": 7558} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 7558} {"info/global_step": 7559, "train_info/time_within_train_step": 2.655194044113159, "step": 7559} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 7559} {"info/global_step": 7560, "train_info/time_within_train_step": 2.654331922531128, "step": 7560} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 7560} {"info/global_step": 7561, "train_info/time_within_train_step": 2.643054962158203, "step": 7561} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 7561} {"info/global_step": 7562, "train_info/time_within_train_step": 2.6430373191833496, "step": 7562} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 7562} {"info/global_step": 7563, "train_info/time_within_train_step": 2.6586830615997314, "step": 7563} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 7563} {"info/global_step": 7564, "train_info/time_within_train_step": 2.666918992996216, "step": 7564} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 7564} {"info/global_step": 7565, "train_info/time_within_train_step": 2.6851627826690674, "step": 7565} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 7565} {"info/global_step": 7566, "train_info/time_within_train_step": 2.6492528915405273, "step": 7566} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 7566} {"info/global_step": 7567, "train_info/time_within_train_step": 2.680732488632202, "step": 7567} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 7567} {"info/global_step": 7568, "train_info/time_within_train_step": 2.6416244506835938, "step": 7568} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 7568} {"info/global_step": 7569, "train_info/time_within_train_step": 2.6475653648376465, "step": 7569} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 7569} {"info/global_step": 7570, "train_info/time_within_train_step": 2.665299892425537, "step": 7570} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 7570} {"info/global_step": 7571, "train_info/time_within_train_step": 2.645211935043335, "step": 7571} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 7571} {"info/global_step": 7572, "train_info/time_within_train_step": 2.6506636142730713, "step": 7572} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 7572} {"info/global_step": 7573, "train_info/time_within_train_step": 2.6703364849090576, "step": 7573} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 7573} {"info/global_step": 7574, "train_info/time_within_train_step": 2.658316135406494, "step": 7574} {"train_info/time_between_train_steps": 0.0029296875, "step": 7574} {"info/global_step": 7575, "train_info/time_within_train_step": 2.654005527496338, "step": 7575} {"train_info/time_between_train_steps": 0.0030717849731445312, "step": 7575} {"info/global_step": 7576, "train_info/time_within_train_step": 2.705371618270874, "step": 7576} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 7576} {"info/global_step": 7577, "train_info/time_within_train_step": 2.6462795734405518, "step": 7577} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 7577} {"info/global_step": 7578, "train_info/time_within_train_step": 2.647064447402954, "step": 7578} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 7578} {"info/global_step": 7579, "train_info/time_within_train_step": 2.6541409492492676, "step": 7579} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 7579} {"info/global_step": 7580, "train_info/time_within_train_step": 2.6498701572418213, "step": 7580} {"train_info/time_between_train_steps": 0.002894163131713867, "step": 7580} {"info/global_step": 7581, "train_info/time_within_train_step": 2.6910409927368164, "step": 7581} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 7581} {"info/global_step": 7582, "train_info/time_within_train_step": 2.6433653831481934, "step": 7582} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 7582} {"info/global_step": 7583, "train_info/time_within_train_step": 2.654130697250366, "step": 7583} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 7583} {"info/global_step": 7584, "train_info/time_within_train_step": 2.651042938232422, "step": 7584} {"train_info/time_between_train_steps": 0.0028905868530273438, "step": 7584} {"info/global_step": 7585, "train_info/time_within_train_step": 2.6588430404663086, "step": 7585} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 7585} {"info/global_step": 7586, "train_info/time_within_train_step": 2.694751262664795, "step": 7586} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 7586} {"info/global_step": 7587, "train_info/time_within_train_step": 2.7124433517456055, "step": 7587} {"train_info/time_between_train_steps": 0.002960205078125, "step": 7587} {"info/global_step": 7588, "train_info/time_within_train_step": 2.641296863555908, "step": 7588} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 7588} {"info/global_step": 7589, "train_info/time_within_train_step": 2.6403465270996094, "step": 7589} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 7589} {"info/global_step": 7590, "train_info/time_within_train_step": 2.6632513999938965, "step": 7590} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 7590} {"info/global_step": 7591, "train_info/time_within_train_step": 2.648616075515747, "step": 7591} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 7591} {"info/global_step": 7592, "train_info/time_within_train_step": 2.643538236618042, "step": 7592} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 7592} {"info/global_step": 7593, "train_info/time_within_train_step": 2.648754119873047, "step": 7593} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 7593} {"info/global_step": 7594, "train_info/time_within_train_step": 2.6456897258758545, "step": 7594} {"train_info/time_between_train_steps": 0.006120204925537109, "step": 7594} {"info/global_step": 7595, "train_info/time_within_train_step": 2.6695995330810547, "step": 7595} {"train_info/time_between_train_steps": 0.006102561950683594, "step": 7595} {"info/global_step": 7596, "train_info/time_within_train_step": 2.6434996128082275, "step": 7596} {"train_info/time_between_train_steps": 0.0054531097412109375, "step": 7596} {"info/global_step": 7597, "train_info/time_within_train_step": 2.648340940475464, "step": 7597} {"train_info/time_between_train_steps": 0.002899169921875, "step": 7597} {"info/global_step": 7598, "train_info/time_within_train_step": 2.659484624862671, "step": 7598} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 7598} {"info/global_step": 7599, "train_info/time_within_train_step": 2.6433260440826416, "step": 7599} {"train_info/time_between_train_steps": 0.0028972625732421875, "step": 7599} {"info/global_step": 7600, "train_info/time_within_train_step": 2.644152879714966, "step": 7600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746918723, "_runtime": 21321}, "step": 7600} {"logs": {"train/loss": 3.1707, "train/learning_rate": 0.00015999999999999999, "train/epoch": 8.07, "_timestamp": 1746918723, "_runtime": 21321}, "step": 7600} {"train_info/time_between_train_steps": 12.704705476760864, "step": 7600} {"info/global_step": 7601, "train_info/time_within_train_step": 2.435805320739746, "step": 7601} {"train_info/time_between_train_steps": 0.003013134002685547, "step": 7601} {"info/global_step": 7602, "train_info/time_within_train_step": 2.448441743850708, "step": 7602} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 7602} {"info/global_step": 7603, "train_info/time_within_train_step": 2.617061138153076, "step": 7603} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 7603} {"info/global_step": 7604, "train_info/time_within_train_step": 2.656599283218384, "step": 7604} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 7604} {"info/global_step": 7605, "train_info/time_within_train_step": 2.64062762260437, "step": 7605} {"train_info/time_between_train_steps": 0.0030007362365722656, "step": 7605} {"info/global_step": 7606, "train_info/time_within_train_step": 2.642000436782837, "step": 7606} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 7606} {"info/global_step": 7607, "train_info/time_within_train_step": 2.664585828781128, "step": 7607} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 7607} {"info/global_step": 7608, "train_info/time_within_train_step": 2.661834239959717, "step": 7608} {"train_info/time_between_train_steps": 0.002956390380859375, "step": 7608} {"info/global_step": 7609, "train_info/time_within_train_step": 2.6753299236297607, "step": 7609} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 7609} {"info/global_step": 7610, "train_info/time_within_train_step": 2.6619932651519775, "step": 7610} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 7610} {"info/global_step": 7611, "train_info/time_within_train_step": 2.649258852005005, "step": 7611} {"train_info/time_between_train_steps": 0.0060710906982421875, "step": 7611} {"info/global_step": 7612, "train_info/time_within_train_step": 2.6525118350982666, "step": 7612} {"train_info/time_between_train_steps": 0.006131172180175781, "step": 7612} {"info/global_step": 7613, "train_info/time_within_train_step": 2.6482067108154297, "step": 7613} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 7613} {"info/global_step": 7614, "train_info/time_within_train_step": 2.6494386196136475, "step": 7614} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 7614} {"info/global_step": 7615, "train_info/time_within_train_step": 2.649348258972168, "step": 7615} {"train_info/time_between_train_steps": 0.0029914379119873047, "step": 7615} {"info/global_step": 7616, "train_info/time_within_train_step": 2.64677095413208, "step": 7616} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 7616} {"info/global_step": 7617, "train_info/time_within_train_step": 2.6662840843200684, "step": 7617} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 7617} {"info/global_step": 7618, "train_info/time_within_train_step": 2.667227268218994, "step": 7618} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 7618} {"info/global_step": 7619, "train_info/time_within_train_step": 2.662853717803955, "step": 7619} {"train_info/time_between_train_steps": 0.006074428558349609, "step": 7619} {"info/global_step": 7620, "train_info/time_within_train_step": 2.7116780281066895, "step": 7620} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 7620} {"info/global_step": 7621, "train_info/time_within_train_step": 2.6486454010009766, "step": 7621} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 7621} {"info/global_step": 7622, "train_info/time_within_train_step": 2.6481032371520996, "step": 7622} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 7622} {"info/global_step": 7623, "train_info/time_within_train_step": 2.655228853225708, "step": 7623} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 7623} {"info/global_step": 7624, "train_info/time_within_train_step": 2.648737907409668, "step": 7624} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 7624} {"info/global_step": 7625, "train_info/time_within_train_step": 2.650416374206543, "step": 7625} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 7625} {"info/global_step": 7626, "train_info/time_within_train_step": 2.6447324752807617, "step": 7626} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 7626} {"info/global_step": 7627, "train_info/time_within_train_step": 2.65434193611145, "step": 7627} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 7627} {"info/global_step": 7628, "train_info/time_within_train_step": 2.656022071838379, "step": 7628} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 7628} {"info/global_step": 7629, "train_info/time_within_train_step": 2.6691908836364746, "step": 7629} {"train_info/time_between_train_steps": 0.002974271774291992, "step": 7629} {"info/global_step": 7630, "train_info/time_within_train_step": 2.727692127227783, "step": 7630} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 7630} {"info/global_step": 7631, "train_info/time_within_train_step": 2.665616989135742, "step": 7631} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 7631} {"info/global_step": 7632, "train_info/time_within_train_step": 2.6409752368927, "step": 7632} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 7632} {"info/global_step": 7633, "train_info/time_within_train_step": 2.652881383895874, "step": 7633} {"train_info/time_between_train_steps": 0.0029654502868652344, "step": 7633} {"info/global_step": 7634, "train_info/time_within_train_step": 2.6494193077087402, "step": 7634} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 7634} {"info/global_step": 7635, "train_info/time_within_train_step": 2.6520962715148926, "step": 7635} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 7635} {"info/global_step": 7636, "train_info/time_within_train_step": 2.645507335662842, "step": 7636} {"train_info/time_between_train_steps": 0.0029687881469726562, "step": 7636} {"info/global_step": 7637, "train_info/time_within_train_step": 2.648040533065796, "step": 7637} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 7637} {"info/global_step": 7638, "train_info/time_within_train_step": 2.660313129425049, "step": 7638} {"train_info/time_between_train_steps": 0.0029964447021484375, "step": 7638} {"info/global_step": 7639, "train_info/time_within_train_step": 2.6652565002441406, "step": 7639} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 7639} {"info/global_step": 7640, "train_info/time_within_train_step": 2.701227903366089, "step": 7640} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 7640} {"info/global_step": 7641, "train_info/time_within_train_step": 2.643874406814575, "step": 7641} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 7641} {"info/global_step": 7642, "train_info/time_within_train_step": 2.6487557888031006, "step": 7642} {"train_info/time_between_train_steps": 0.002902984619140625, "step": 7642} {"info/global_step": 7643, "train_info/time_within_train_step": 2.649510622024536, "step": 7643} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 7643} {"info/global_step": 7644, "train_info/time_within_train_step": 2.645960569381714, "step": 7644} {"train_info/time_between_train_steps": 0.003092527389526367, "step": 7644} {"info/global_step": 7645, "train_info/time_within_train_step": 2.65559458732605, "step": 7645} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 7645} {"info/global_step": 7646, "train_info/time_within_train_step": 2.6433064937591553, "step": 7646} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 7646} {"info/global_step": 7647, "train_info/time_within_train_step": 2.769994020462036, "step": 7647} {"train_info/time_between_train_steps": 0.0030078887939453125, "step": 7647} {"info/global_step": 7648, "train_info/time_within_train_step": 2.6438348293304443, "step": 7648} {"train_info/time_between_train_steps": 0.002927064895629883, "step": 7648} {"info/global_step": 7649, "train_info/time_within_train_step": 2.6476969718933105, "step": 7649} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 7649} {"info/global_step": 7650, "train_info/time_within_train_step": 2.669570207595825, "step": 7650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746918870, "_runtime": 21468}, "step": 7650} {"logs": {"train/loss": 3.1571, "train/learning_rate": 0.00015666666666666666, "train/epoch": 8.07, "_timestamp": 1746918870, "_runtime": 21468}, "step": 7650} {"train_info/time_between_train_steps": 0.024092674255371094, "step": 7650} {"info/global_step": 7651, "train_info/time_within_train_step": 2.6673202514648438, "step": 7651} {"train_info/time_between_train_steps": 0.0029060840606689453, "step": 7651} {"info/global_step": 7652, "train_info/time_within_train_step": 2.685037136077881, "step": 7652} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 7652} {"info/global_step": 7653, "train_info/time_within_train_step": 2.650175094604492, "step": 7653} {"train_info/time_between_train_steps": 0.0029060840606689453, "step": 7653} {"info/global_step": 7654, "train_info/time_within_train_step": 2.6841092109680176, "step": 7654} {"train_info/time_between_train_steps": 0.0029425621032714844, "step": 7654} {"info/global_step": 7655, "train_info/time_within_train_step": 2.6413733959198, "step": 7655} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 7655} {"info/global_step": 7656, "train_info/time_within_train_step": 2.6481122970581055, "step": 7656} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 7656} {"info/global_step": 7657, "train_info/time_within_train_step": 2.659611463546753, "step": 7657} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 7657} {"info/global_step": 7658, "train_info/time_within_train_step": 2.665738105773926, "step": 7658} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 7658} {"info/global_step": 7659, "train_info/time_within_train_step": 2.662118911743164, "step": 7659} {"train_info/time_between_train_steps": 0.002941608428955078, "step": 7659} {"info/global_step": 7660, "train_info/time_within_train_step": 2.659027338027954, "step": 7660} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 7660} {"info/global_step": 7661, "train_info/time_within_train_step": 2.7045950889587402, "step": 7661} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 7661} {"info/global_step": 7662, "train_info/time_within_train_step": 2.6483190059661865, "step": 7662} {"train_info/time_between_train_steps": 0.0029370784759521484, "step": 7662} {"info/global_step": 7663, "train_info/time_within_train_step": 2.647047758102417, "step": 7663} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 7663} {"info/global_step": 7664, "train_info/time_within_train_step": 2.6543939113616943, "step": 7664} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 7664} {"info/global_step": 7665, "train_info/time_within_train_step": 2.64571213722229, "step": 7665} {"train_info/time_between_train_steps": 0.002944469451904297, "step": 7665} {"info/global_step": 7666, "train_info/time_within_train_step": 2.648536443710327, "step": 7666} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 7666} {"info/global_step": 7667, "train_info/time_within_train_step": 2.6460697650909424, "step": 7667} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 7667} {"info/global_step": 7668, "train_info/time_within_train_step": 2.65338134765625, "step": 7668} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 7668} {"info/global_step": 7669, "train_info/time_within_train_step": 2.6541712284088135, "step": 7669} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 7669} {"info/global_step": 7670, "train_info/time_within_train_step": 2.644078254699707, "step": 7670} {"train_info/time_between_train_steps": 0.0030210018157958984, "step": 7670} {"info/global_step": 7671, "train_info/time_within_train_step": 2.642869472503662, "step": 7671} {"train_info/time_between_train_steps": 0.0030279159545898438, "step": 7671} {"info/global_step": 7672, "train_info/time_within_train_step": 2.6430282592773438, "step": 7672} {"train_info/time_between_train_steps": 0.0030508041381835938, "step": 7672} {"info/global_step": 7673, "train_info/time_within_train_step": 2.6450626850128174, "step": 7673} {"train_info/time_between_train_steps": 0.003078460693359375, "step": 7673} {"info/global_step": 7674, "train_info/time_within_train_step": 2.643000364303589, "step": 7674} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 7674} {"info/global_step": 7675, "train_info/time_within_train_step": 2.665170907974243, "step": 7675} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 7675} {"info/global_step": 7676, "train_info/time_within_train_step": 2.670470714569092, "step": 7676} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 7676} {"info/global_step": 7677, "train_info/time_within_train_step": 2.641968011856079, "step": 7677} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 7677} {"info/global_step": 7678, "train_info/time_within_train_step": 2.6459836959838867, "step": 7678} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 7678} {"info/global_step": 7679, "train_info/time_within_train_step": 2.658273935317993, "step": 7679} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 7679} {"info/global_step": 7680, "train_info/time_within_train_step": 2.646792411804199, "step": 7680} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 7680} {"info/global_step": 7681, "train_info/time_within_train_step": 2.643728494644165, "step": 7681} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 7681} {"info/global_step": 7682, "train_info/time_within_train_step": 2.653989791870117, "step": 7682} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 7682} {"info/global_step": 7683, "train_info/time_within_train_step": 2.6497743129730225, "step": 7683} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 7683} {"info/global_step": 7684, "train_info/time_within_train_step": 2.6577556133270264, "step": 7684} {"train_info/time_between_train_steps": 0.003116607666015625, "step": 7684} {"info/global_step": 7685, "train_info/time_within_train_step": 2.678652286529541, "step": 7685} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 7685} {"info/global_step": 7686, "train_info/time_within_train_step": 2.7256622314453125, "step": 7686} {"train_info/time_between_train_steps": 0.002956867218017578, "step": 7686} {"info/global_step": 7687, "train_info/time_within_train_step": 2.655123233795166, "step": 7687} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 7687} {"info/global_step": 7688, "train_info/time_within_train_step": 2.638704299926758, "step": 7688} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 7688} {"info/global_step": 7689, "train_info/time_within_train_step": 2.657280206680298, "step": 7689} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 7689} {"info/global_step": 7690, "train_info/time_within_train_step": 2.6482012271881104, "step": 7690} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 7690} {"info/global_step": 7691, "train_info/time_within_train_step": 2.6468517780303955, "step": 7691} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 7691} {"info/global_step": 7692, "train_info/time_within_train_step": 2.6477560997009277, "step": 7692} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 7692} {"info/global_step": 7693, "train_info/time_within_train_step": 2.643249034881592, "step": 7693} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 7693} {"info/global_step": 7694, "train_info/time_within_train_step": 2.6668238639831543, "step": 7694} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 7694} {"info/global_step": 7695, "train_info/time_within_train_step": 2.6698801517486572, "step": 7695} {"train_info/time_between_train_steps": 0.002954244613647461, "step": 7695} {"info/global_step": 7696, "train_info/time_within_train_step": 2.6836748123168945, "step": 7696} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 7696} {"info/global_step": 7697, "train_info/time_within_train_step": 2.6512815952301025, "step": 7697} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 7697} {"info/global_step": 7698, "train_info/time_within_train_step": 2.6394715309143066, "step": 7698} {"train_info/time_between_train_steps": 0.002889871597290039, "step": 7698} {"info/global_step": 7699, "train_info/time_within_train_step": 2.655885934829712, "step": 7699} {"train_info/time_between_train_steps": 0.0029103755950927734, "step": 7699} {"info/global_step": 7700, "train_info/time_within_train_step": 2.6564016342163086, "step": 7700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919005, "_runtime": 21603}, "step": 7700} {"logs": {"train/loss": 3.1504, "train/learning_rate": 0.0001533333333333333, "train/epoch": 8.08, "_timestamp": 1746919005, "_runtime": 21603}, "step": 7700} {"train_info/time_between_train_steps": 0.02395915985107422, "step": 7700} {"info/global_step": 7701, "train_info/time_within_train_step": 2.655677080154419, "step": 7701} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 7701} {"info/global_step": 7702, "train_info/time_within_train_step": 2.640899658203125, "step": 7702} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 7702} {"info/global_step": 7703, "train_info/time_within_train_step": 2.650085926055908, "step": 7703} {"train_info/time_between_train_steps": 0.0029001235961914062, "step": 7703} {"info/global_step": 7704, "train_info/time_within_train_step": 2.668013572692871, "step": 7704} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 7704} {"info/global_step": 7705, "train_info/time_within_train_step": 2.671617269515991, "step": 7705} {"train_info/time_between_train_steps": 0.003094911575317383, "step": 7705} {"info/global_step": 7706, "train_info/time_within_train_step": 2.6511316299438477, "step": 7706} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 7706} {"info/global_step": 7707, "train_info/time_within_train_step": 2.684685707092285, "step": 7707} {"train_info/time_between_train_steps": 0.0029528141021728516, "step": 7707} {"info/global_step": 7708, "train_info/time_within_train_step": 2.7246530055999756, "step": 7708} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 7708} {"info/global_step": 7709, "train_info/time_within_train_step": 2.6399455070495605, "step": 7709} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 7709} {"info/global_step": 7710, "train_info/time_within_train_step": 2.6511948108673096, "step": 7710} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 7710} {"info/global_step": 7711, "train_info/time_within_train_step": 2.665550947189331, "step": 7711} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 7711} {"info/global_step": 7712, "train_info/time_within_train_step": 2.6425302028656006, "step": 7712} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 7712} {"info/global_step": 7713, "train_info/time_within_train_step": 2.6416547298431396, "step": 7713} {"train_info/time_between_train_steps": 0.0028867721557617188, "step": 7713} {"info/global_step": 7714, "train_info/time_within_train_step": 2.6499173641204834, "step": 7714} {"train_info/time_between_train_steps": 0.002912282943725586, "step": 7714} {"info/global_step": 7715, "train_info/time_within_train_step": 2.660604476928711, "step": 7715} {"train_info/time_between_train_steps": 0.0029077529907226562, "step": 7715} {"info/global_step": 7716, "train_info/time_within_train_step": 2.671159267425537, "step": 7716} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 7716} {"info/global_step": 7717, "train_info/time_within_train_step": 2.6606407165527344, "step": 7717} {"train_info/time_between_train_steps": 0.003029346466064453, "step": 7717} {"info/global_step": 7718, "train_info/time_within_train_step": 2.7038912773132324, "step": 7718} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 7718} {"info/global_step": 7719, "train_info/time_within_train_step": 2.638604164123535, "step": 7719} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 7719} {"info/global_step": 7720, "train_info/time_within_train_step": 2.6489803791046143, "step": 7720} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 7720} {"info/global_step": 7721, "train_info/time_within_train_step": 2.642746686935425, "step": 7721} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 7721} {"info/global_step": 7722, "train_info/time_within_train_step": 2.657519817352295, "step": 7722} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 7722} {"info/global_step": 7723, "train_info/time_within_train_step": 2.650998115539551, "step": 7723} {"train_info/time_between_train_steps": 0.0030052661895751953, "step": 7723} {"info/global_step": 7724, "train_info/time_within_train_step": 2.665363311767578, "step": 7724} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 7724} {"info/global_step": 7725, "train_info/time_within_train_step": 2.7131764888763428, "step": 7725} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 7725} {"info/global_step": 7726, "train_info/time_within_train_step": 2.6405317783355713, "step": 7726} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 7726} {"info/global_step": 7727, "train_info/time_within_train_step": 2.6395559310913086, "step": 7727} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 7727} {"info/global_step": 7728, "train_info/time_within_train_step": 2.6536755561828613, "step": 7728} {"train_info/time_between_train_steps": 0.0030333995819091797, "step": 7728} {"info/global_step": 7729, "train_info/time_within_train_step": 2.6550068855285645, "step": 7729} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 7729} {"info/global_step": 7730, "train_info/time_within_train_step": 2.642566204071045, "step": 7730} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 7730} {"info/global_step": 7731, "train_info/time_within_train_step": 2.649942636489868, "step": 7731} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 7731} {"info/global_step": 7732, "train_info/time_within_train_step": 2.6521027088165283, "step": 7732} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 7732} {"info/global_step": 7733, "train_info/time_within_train_step": 2.706054449081421, "step": 7733} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 7733} {"info/global_step": 7734, "train_info/time_within_train_step": 2.6952028274536133, "step": 7734} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 7734} {"info/global_step": 7735, "train_info/time_within_train_step": 2.6613149642944336, "step": 7735} {"train_info/time_between_train_steps": 0.003034353256225586, "step": 7735} {"info/global_step": 7736, "train_info/time_within_train_step": 2.662508964538574, "step": 7736} {"train_info/time_between_train_steps": 0.003052234649658203, "step": 7736} {"info/global_step": 7737, "train_info/time_within_train_step": 2.640632390975952, "step": 7737} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 7737} {"info/global_step": 7738, "train_info/time_within_train_step": 2.653602123260498, "step": 7738} {"train_info/time_between_train_steps": 0.002972126007080078, "step": 7738} {"info/global_step": 7739, "train_info/time_within_train_step": 2.656299591064453, "step": 7739} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 7739} {"info/global_step": 7740, "train_info/time_within_train_step": 2.6441526412963867, "step": 7740} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 7740} {"info/global_step": 7741, "train_info/time_within_train_step": 2.6435792446136475, "step": 7741} {"train_info/time_between_train_steps": 0.0030701160430908203, "step": 7741} {"info/global_step": 7742, "train_info/time_within_train_step": 2.6566386222839355, "step": 7742} {"train_info/time_between_train_steps": 0.0029799938201904297, "step": 7742} {"info/global_step": 7743, "train_info/time_within_train_step": 2.681756019592285, "step": 7743} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 7743} {"info/global_step": 7744, "train_info/time_within_train_step": 2.675740957260132, "step": 7744} {"train_info/time_between_train_steps": 0.0030028820037841797, "step": 7744} {"info/global_step": 7745, "train_info/time_within_train_step": 2.6522939205169678, "step": 7745} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 7745} {"info/global_step": 7746, "train_info/time_within_train_step": 2.6884984970092773, "step": 7746} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 7746} {"info/global_step": 7747, "train_info/time_within_train_step": 2.6450061798095703, "step": 7747} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 7747} {"info/global_step": 7748, "train_info/time_within_train_step": 3.265691041946411, "step": 7748} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 7748} {"info/global_step": 7749, "train_info/time_within_train_step": 2.6484897136688232, "step": 7749} {"train_info/time_between_train_steps": 0.003036975860595703, "step": 7749} {"info/global_step": 7750, "train_info/time_within_train_step": 2.643052816390991, "step": 7750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919140, "_runtime": 21738}, "step": 7750} {"logs": {"train/loss": 3.1469, "train/learning_rate": 0.00015, "train/epoch": 8.08, "_timestamp": 1746919140, "_runtime": 21738}, "step": 7750} {"train_info/time_between_train_steps": 0.024363994598388672, "step": 7750} {"info/global_step": 7751, "train_info/time_within_train_step": 2.698490619659424, "step": 7751} {"train_info/time_between_train_steps": 0.0034058094024658203, "step": 7751} {"info/global_step": 7752, "train_info/time_within_train_step": 2.645017147064209, "step": 7752} {"train_info/time_between_train_steps": 0.0032613277435302734, "step": 7752} {"info/global_step": 7753, "train_info/time_within_train_step": 2.6676342487335205, "step": 7753} {"train_info/time_between_train_steps": 0.003058910369873047, "step": 7753} {"info/global_step": 7754, "train_info/time_within_train_step": 2.6641294956207275, "step": 7754} {"train_info/time_between_train_steps": 0.0032444000244140625, "step": 7754} {"info/global_step": 7755, "train_info/time_within_train_step": 2.6741955280303955, "step": 7755} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 7755} {"info/global_step": 7756, "train_info/time_within_train_step": 2.666590929031372, "step": 7756} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 7756} {"info/global_step": 7757, "train_info/time_within_train_step": 2.650043487548828, "step": 7757} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 7757} {"info/global_step": 7758, "train_info/time_within_train_step": 2.650289535522461, "step": 7758} {"train_info/time_between_train_steps": 0.0035419464111328125, "step": 7758} {"info/global_step": 7759, "train_info/time_within_train_step": 2.6463494300842285, "step": 7759} {"train_info/time_between_train_steps": 0.003567218780517578, "step": 7759} {"info/global_step": 7760, "train_info/time_within_train_step": 2.6529550552368164, "step": 7760} {"train_info/time_between_train_steps": 0.003415346145629883, "step": 7760} {"info/global_step": 7761, "train_info/time_within_train_step": 2.6503591537475586, "step": 7761} {"train_info/time_between_train_steps": 0.003564596176147461, "step": 7761} {"info/global_step": 7762, "train_info/time_within_train_step": 2.6467204093933105, "step": 7762} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 7762} {"info/global_step": 7763, "train_info/time_within_train_step": 2.665649175643921, "step": 7763} {"train_info/time_between_train_steps": 0.003484010696411133, "step": 7763} {"info/global_step": 7764, "train_info/time_within_train_step": 2.6601691246032715, "step": 7764} {"train_info/time_between_train_steps": 0.0035037994384765625, "step": 7764} {"info/global_step": 7765, "train_info/time_within_train_step": 2.6589627265930176, "step": 7765} {"train_info/time_between_train_steps": 0.0035364627838134766, "step": 7765} {"info/global_step": 7766, "train_info/time_within_train_step": 2.7050909996032715, "step": 7766} {"train_info/time_between_train_steps": 0.00429081916809082, "step": 7766} {"info/global_step": 7767, "train_info/time_within_train_step": 2.6595113277435303, "step": 7767} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 7767} {"train_info/time_between_train_steps": 2.367147922515869, "step": 7767} {"info/global_step": 7768, "train_info/time_within_train_step": 2.614790678024292, "step": 7768} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 7768} {"info/global_step": 7769, "train_info/time_within_train_step": 2.6649274826049805, "step": 7769} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 7769} {"info/global_step": 7770, "train_info/time_within_train_step": 2.72715425491333, "step": 7770} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 7770} {"info/global_step": 7771, "train_info/time_within_train_step": 2.6573750972747803, "step": 7771} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 7771} {"info/global_step": 7772, "train_info/time_within_train_step": 2.6406140327453613, "step": 7772} {"train_info/time_between_train_steps": 0.0033562183380126953, "step": 7772} {"info/global_step": 7773, "train_info/time_within_train_step": 2.6518449783325195, "step": 7773} {"train_info/time_between_train_steps": 0.0035266876220703125, "step": 7773} {"info/global_step": 7774, "train_info/time_within_train_step": 2.6491916179656982, "step": 7774} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 7774} {"info/global_step": 7775, "train_info/time_within_train_step": 2.650533676147461, "step": 7775} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 7775} {"info/global_step": 7776, "train_info/time_within_train_step": 2.652317762374878, "step": 7776} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 7776} {"info/global_step": 7777, "train_info/time_within_train_step": 2.8728299140930176, "step": 7777} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 7777} {"info/global_step": 7778, "train_info/time_within_train_step": 2.6467976570129395, "step": 7778} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 7778} {"info/global_step": 7779, "train_info/time_within_train_step": 2.6628575325012207, "step": 7779} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 7779} {"info/global_step": 7780, "train_info/time_within_train_step": 2.644831895828247, "step": 7780} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 7780} {"info/global_step": 7781, "train_info/time_within_train_step": 2.6487762928009033, "step": 7781} {"train_info/time_between_train_steps": 0.003368854522705078, "step": 7781} {"info/global_step": 7782, "train_info/time_within_train_step": 2.6855204105377197, "step": 7782} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 7782} {"info/global_step": 7783, "train_info/time_within_train_step": 2.6509921550750732, "step": 7783} {"train_info/time_between_train_steps": 0.0034432411193847656, "step": 7783} {"info/global_step": 7784, "train_info/time_within_train_step": 2.6845200061798096, "step": 7784} {"train_info/time_between_train_steps": 0.0034503936767578125, "step": 7784} {"info/global_step": 7785, "train_info/time_within_train_step": 2.6409196853637695, "step": 7785} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 7785} {"info/global_step": 7786, "train_info/time_within_train_step": 2.649693012237549, "step": 7786} {"train_info/time_between_train_steps": 0.0034220218658447266, "step": 7786} {"info/global_step": 7787, "train_info/time_within_train_step": 2.6627445220947266, "step": 7787} {"train_info/time_between_train_steps": 0.003428936004638672, "step": 7787} {"info/global_step": 7788, "train_info/time_within_train_step": 2.6437294483184814, "step": 7788} {"train_info/time_between_train_steps": 0.0033643245697021484, "step": 7788} {"info/global_step": 7789, "train_info/time_within_train_step": 2.6448521614074707, "step": 7789} {"train_info/time_between_train_steps": 0.003434896469116211, "step": 7789} {"info/global_step": 7790, "train_info/time_within_train_step": 2.6567461490631104, "step": 7790} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 7790} {"info/global_step": 7791, "train_info/time_within_train_step": 2.6701462268829346, "step": 7791} {"train_info/time_between_train_steps": 0.003420114517211914, "step": 7791} {"info/global_step": 7792, "train_info/time_within_train_step": 2.661508083343506, "step": 7792} {"train_info/time_between_train_steps": 0.0035233497619628906, "step": 7792} {"info/global_step": 7793, "train_info/time_within_train_step": 2.6619529724121094, "step": 7793} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 7793} {"info/global_step": 7794, "train_info/time_within_train_step": 2.706787109375, "step": 7794} {"train_info/time_between_train_steps": 0.0034627914428710938, "step": 7794} {"info/global_step": 7795, "train_info/time_within_train_step": 2.6509182453155518, "step": 7795} {"train_info/time_between_train_steps": 0.0034606456756591797, "step": 7795} {"info/global_step": 7796, "train_info/time_within_train_step": 2.648590326309204, "step": 7796} {"train_info/time_between_train_steps": 0.0034422874450683594, "step": 7796} {"info/global_step": 7797, "train_info/time_within_train_step": 2.649014949798584, "step": 7797} {"train_info/time_between_train_steps": 0.003444194793701172, "step": 7797} {"info/global_step": 7798, "train_info/time_within_train_step": 2.650240898132324, "step": 7798} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 7798} {"info/global_step": 7799, "train_info/time_within_train_step": 2.694305181503296, "step": 7799} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 7799} {"info/global_step": 7800, "train_info/time_within_train_step": 2.646205425262451, "step": 7800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919277, "_runtime": 21875}, "step": 7800} {"logs": {"train/loss": 3.1595, "train/learning_rate": 0.00014666666666666664, "train/epoch": 9.0, "_timestamp": 1746919277, "_runtime": 21875}, "step": 7800} {"train_info/time_between_train_steps": 13.04564642906189, "step": 7800} {"info/global_step": 7801, "train_info/time_within_train_step": 2.433269739151001, "step": 7801} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 7801} {"info/global_step": 7802, "train_info/time_within_train_step": 2.4271366596221924, "step": 7802} {"train_info/time_between_train_steps": 0.0035636425018310547, "step": 7802} {"info/global_step": 7803, "train_info/time_within_train_step": 2.603719711303711, "step": 7803} {"train_info/time_between_train_steps": 0.0033783912658691406, "step": 7803} {"info/global_step": 7804, "train_info/time_within_train_step": 2.64497709274292, "step": 7804} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 7804} {"info/global_step": 7805, "train_info/time_within_train_step": 2.643782377243042, "step": 7805} {"train_info/time_between_train_steps": 0.003470182418823242, "step": 7805} {"info/global_step": 7806, "train_info/time_within_train_step": 2.662696361541748, "step": 7806} {"train_info/time_between_train_steps": 0.0033714771270751953, "step": 7806} {"info/global_step": 7807, "train_info/time_within_train_step": 2.6583878993988037, "step": 7807} {"train_info/time_between_train_steps": 0.0034325122833251953, "step": 7807} {"info/global_step": 7808, "train_info/time_within_train_step": 2.6704211235046387, "step": 7808} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 7808} {"info/global_step": 7809, "train_info/time_within_train_step": 2.6761224269866943, "step": 7809} {"train_info/time_between_train_steps": 0.0033440589904785156, "step": 7809} {"info/global_step": 7810, "train_info/time_within_train_step": 2.668938159942627, "step": 7810} {"train_info/time_between_train_steps": 0.003412485122680664, "step": 7810} {"info/global_step": 7811, "train_info/time_within_train_step": 2.6426897048950195, "step": 7811} {"train_info/time_between_train_steps": 0.0033872127532958984, "step": 7811} {"info/global_step": 7812, "train_info/time_within_train_step": 2.6431424617767334, "step": 7812} {"train_info/time_between_train_steps": 0.0034317970275878906, "step": 7812} {"info/global_step": 7813, "train_info/time_within_train_step": 2.6641976833343506, "step": 7813} {"train_info/time_between_train_steps": 0.0034027099609375, "step": 7813} {"info/global_step": 7814, "train_info/time_within_train_step": 2.6527276039123535, "step": 7814} {"train_info/time_between_train_steps": 0.003398895263671875, "step": 7814} {"info/global_step": 7815, "train_info/time_within_train_step": 2.6462528705596924, "step": 7815} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 7815} {"info/global_step": 7816, "train_info/time_within_train_step": 2.658635139465332, "step": 7816} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 7816} {"info/global_step": 7817, "train_info/time_within_train_step": 2.646554946899414, "step": 7817} {"train_info/time_between_train_steps": 0.003419160842895508, "step": 7817} {"info/global_step": 7818, "train_info/time_within_train_step": 2.672273874282837, "step": 7818} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 7818} {"info/global_step": 7819, "train_info/time_within_train_step": 2.729980230331421, "step": 7819} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 7819} {"info/global_step": 7820, "train_info/time_within_train_step": 2.6756839752197266, "step": 7820} {"train_info/time_between_train_steps": 0.00341796875, "step": 7820} {"info/global_step": 7821, "train_info/time_within_train_step": 2.6460304260253906, "step": 7821} {"train_info/time_between_train_steps": 0.003426790237426758, "step": 7821} {"info/global_step": 7822, "train_info/time_within_train_step": 2.6570887565612793, "step": 7822} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 7822} {"info/global_step": 7823, "train_info/time_within_train_step": 2.6462886333465576, "step": 7823} {"train_info/time_between_train_steps": 0.003429412841796875, "step": 7823} {"info/global_step": 7824, "train_info/time_within_train_step": 2.6490261554718018, "step": 7824} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 7824} {"info/global_step": 7825, "train_info/time_within_train_step": 2.647603988647461, "step": 7825} {"train_info/time_between_train_steps": 0.0036804676055908203, "step": 7825} {"info/global_step": 7826, "train_info/time_within_train_step": 2.6656808853149414, "step": 7826} {"train_info/time_between_train_steps": 0.0034432411193847656, "step": 7826} {"info/global_step": 7827, "train_info/time_within_train_step": 2.6698789596557617, "step": 7827} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 7827} {"info/global_step": 7828, "train_info/time_within_train_step": 2.940478563308716, "step": 7828} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 7828} {"info/global_step": 7829, "train_info/time_within_train_step": 2.6507515907287598, "step": 7829} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 7829} {"info/global_step": 7830, "train_info/time_within_train_step": 2.7783877849578857, "step": 7830} {"train_info/time_between_train_steps": 0.003238677978515625, "step": 7830} {"info/global_step": 7831, "train_info/time_within_train_step": 2.650383710861206, "step": 7831} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 7831} {"info/global_step": 7832, "train_info/time_within_train_step": 2.6552884578704834, "step": 7832} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 7832} {"info/global_step": 7833, "train_info/time_within_train_step": 2.671395778656006, "step": 7833} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 7833} {"info/global_step": 7834, "train_info/time_within_train_step": 2.711996555328369, "step": 7834} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 7834} {"info/global_step": 7835, "train_info/time_within_train_step": 2.649178981781006, "step": 7835} {"train_info/time_between_train_steps": 0.0032958984375, "step": 7835} {"info/global_step": 7836, "train_info/time_within_train_step": 2.6651697158813477, "step": 7836} {"train_info/time_between_train_steps": 0.003468036651611328, "step": 7836} {"info/global_step": 7837, "train_info/time_within_train_step": 2.642920970916748, "step": 7837} {"train_info/time_between_train_steps": 0.003454923629760742, "step": 7837} {"info/global_step": 7838, "train_info/time_within_train_step": 2.653200387954712, "step": 7838} {"train_info/time_between_train_steps": 0.0034933090209960938, "step": 7838} {"info/global_step": 7839, "train_info/time_within_train_step": 2.704936981201172, "step": 7839} {"train_info/time_between_train_steps": 0.003437519073486328, "step": 7839} {"info/global_step": 7840, "train_info/time_within_train_step": 2.657743453979492, "step": 7840} {"train_info/time_between_train_steps": 0.003450155258178711, "step": 7840} {"info/global_step": 7841, "train_info/time_within_train_step": 2.64497447013855, "step": 7841} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 7841} {"info/global_step": 7842, "train_info/time_within_train_step": 2.6458022594451904, "step": 7842} {"train_info/time_between_train_steps": 0.0034928321838378906, "step": 7842} {"info/global_step": 7843, "train_info/time_within_train_step": 2.669820785522461, "step": 7843} {"train_info/time_between_train_steps": 0.003446340560913086, "step": 7843} {"info/global_step": 7844, "train_info/time_within_train_step": 2.6652743816375732, "step": 7844} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 7844} {"info/global_step": 7845, "train_info/time_within_train_step": 2.6824700832366943, "step": 7845} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 7845} {"info/global_step": 7846, "train_info/time_within_train_step": 2.660818099975586, "step": 7846} {"train_info/time_between_train_steps": 0.0034551620483398438, "step": 7846} {"info/global_step": 7847, "train_info/time_within_train_step": 2.6626110076904297, "step": 7847} {"train_info/time_between_train_steps": 0.0034379959106445312, "step": 7847} {"info/global_step": 7848, "train_info/time_within_train_step": 2.6491968631744385, "step": 7848} {"train_info/time_between_train_steps": 0.003373384475708008, "step": 7848} {"info/global_step": 7849, "train_info/time_within_train_step": 2.64493727684021, "step": 7849} {"train_info/time_between_train_steps": 0.0034766197204589844, "step": 7849} {"info/global_step": 7850, "train_info/time_within_train_step": 2.6592397689819336, "step": 7850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919424, "_runtime": 22022}, "step": 7850} {"logs": {"train/loss": 3.1275, "train/learning_rate": 0.00014333333333333334, "train/epoch": 9.01, "_timestamp": 1746919424, "_runtime": 22022}, "step": 7850} {"train_info/time_between_train_steps": 0.024475574493408203, "step": 7850} {"info/global_step": 7851, "train_info/time_within_train_step": 2.6433095932006836, "step": 7851} {"train_info/time_between_train_steps": 0.0034165382385253906, "step": 7851} {"info/global_step": 7852, "train_info/time_within_train_step": 2.6462292671203613, "step": 7852} {"train_info/time_between_train_steps": 0.0034766197204589844, "step": 7852} {"info/global_step": 7853, "train_info/time_within_train_step": 2.6586079597473145, "step": 7853} {"train_info/time_between_train_steps": 0.0034575462341308594, "step": 7853} {"info/global_step": 7854, "train_info/time_within_train_step": 2.6609723567962646, "step": 7854} {"train_info/time_between_train_steps": 0.003491640090942383, "step": 7854} {"info/global_step": 7855, "train_info/time_within_train_step": 2.6754391193389893, "step": 7855} {"train_info/time_between_train_steps": 0.0034813880920410156, "step": 7855} {"info/global_step": 7856, "train_info/time_within_train_step": 2.6686534881591797, "step": 7856} {"train_info/time_between_train_steps": 0.003488302230834961, "step": 7856} {"info/global_step": 7857, "train_info/time_within_train_step": 2.703382968902588, "step": 7857} {"train_info/time_between_train_steps": 0.003418445587158203, "step": 7857} {"info/global_step": 7858, "train_info/time_within_train_step": 2.6424388885498047, "step": 7858} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 7858} {"info/global_step": 7859, "train_info/time_within_train_step": 2.645954132080078, "step": 7859} {"train_info/time_between_train_steps": 0.0034825801849365234, "step": 7859} {"info/global_step": 7860, "train_info/time_within_train_step": 2.664828300476074, "step": 7860} {"train_info/time_between_train_steps": 0.003425121307373047, "step": 7860} {"info/global_step": 7861, "train_info/time_within_train_step": 2.653921604156494, "step": 7861} {"train_info/time_between_train_steps": 0.003438711166381836, "step": 7861} {"info/global_step": 7862, "train_info/time_within_train_step": 2.6502931118011475, "step": 7862} {"train_info/time_between_train_steps": 0.003456592559814453, "step": 7862} {"info/global_step": 7863, "train_info/time_within_train_step": 2.65537428855896, "step": 7863} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 7863} {"info/global_step": 7864, "train_info/time_within_train_step": 2.652869701385498, "step": 7864} {"train_info/time_between_train_steps": 0.0035169124603271484, "step": 7864} {"info/global_step": 7865, "train_info/time_within_train_step": 2.661060333251953, "step": 7865} {"train_info/time_between_train_steps": 0.0034415721893310547, "step": 7865} {"info/global_step": 7866, "train_info/time_within_train_step": 2.6855857372283936, "step": 7866} {"train_info/time_between_train_steps": 0.00348663330078125, "step": 7866} {"info/global_step": 7867, "train_info/time_within_train_step": 2.7254137992858887, "step": 7867} {"train_info/time_between_train_steps": 0.003493785858154297, "step": 7867} {"info/global_step": 7868, "train_info/time_within_train_step": 2.6502175331115723, "step": 7868} {"train_info/time_between_train_steps": 0.0033953189849853516, "step": 7868} {"info/global_step": 7869, "train_info/time_within_train_step": 2.641561508178711, "step": 7869} {"train_info/time_between_train_steps": 0.003455638885498047, "step": 7869} {"info/global_step": 7870, "train_info/time_within_train_step": 2.660705089569092, "step": 7870} {"train_info/time_between_train_steps": 0.0034596920013427734, "step": 7870} {"info/global_step": 7871, "train_info/time_within_train_step": 2.984640121459961, "step": 7871} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 7871} {"info/global_step": 7872, "train_info/time_within_train_step": 2.725245237350464, "step": 7872} {"train_info/time_between_train_steps": 0.0036284923553466797, "step": 7872} {"info/global_step": 7873, "train_info/time_within_train_step": 2.651036500930786, "step": 7873} {"train_info/time_between_train_steps": 0.0035276412963867188, "step": 7873} {"info/global_step": 7874, "train_info/time_within_train_step": 2.6445271968841553, "step": 7874} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 7874} {"info/global_step": 7875, "train_info/time_within_train_step": 2.6484227180480957, "step": 7875} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 7875} {"info/global_step": 7876, "train_info/time_within_train_step": 2.6457226276397705, "step": 7876} {"train_info/time_between_train_steps": 0.003411531448364258, "step": 7876} {"info/global_step": 7877, "train_info/time_within_train_step": 2.644571542739868, "step": 7877} {"train_info/time_between_train_steps": 0.0033631324768066406, "step": 7877} {"info/global_step": 7878, "train_info/time_within_train_step": 2.644343137741089, "step": 7878} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 7878} {"info/global_step": 7879, "train_info/time_within_train_step": 2.6480798721313477, "step": 7879} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 7879} {"info/global_step": 7880, "train_info/time_within_train_step": 2.6570558547973633, "step": 7880} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 7880} {"info/global_step": 7881, "train_info/time_within_train_step": 2.6416141986846924, "step": 7881} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 7881} {"info/global_step": 7882, "train_info/time_within_train_step": 2.671666145324707, "step": 7882} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 7882} {"info/global_step": 7883, "train_info/time_within_train_step": 2.6564292907714844, "step": 7883} {"train_info/time_between_train_steps": 0.003252267837524414, "step": 7883} {"info/global_step": 7884, "train_info/time_within_train_step": 2.6716208457946777, "step": 7884} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 7884} {"info/global_step": 7885, "train_info/time_within_train_step": 2.706605911254883, "step": 7885} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 7885} {"info/global_step": 7886, "train_info/time_within_train_step": 2.6397008895874023, "step": 7886} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 7886} {"info/global_step": 7887, "train_info/time_within_train_step": 2.649873971939087, "step": 7887} {"train_info/time_between_train_steps": 0.0035784244537353516, "step": 7887} {"info/global_step": 7888, "train_info/time_within_train_step": 2.651277780532837, "step": 7888} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 7888} {"info/global_step": 7889, "train_info/time_within_train_step": 2.6471352577209473, "step": 7889} {"train_info/time_between_train_steps": 0.0032444000244140625, "step": 7889} {"info/global_step": 7890, "train_info/time_within_train_step": 2.6505725383758545, "step": 7890} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 7890} {"info/global_step": 7891, "train_info/time_within_train_step": 2.643439769744873, "step": 7891} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 7891} {"info/global_step": 7892, "train_info/time_within_train_step": 2.6475799083709717, "step": 7892} {"train_info/time_between_train_steps": 0.137040376663208, "step": 7892} {"info/global_step": 7893, "train_info/time_within_train_step": 2.6444098949432373, "step": 7893} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 7893} {"info/global_step": 7894, "train_info/time_within_train_step": 2.6489193439483643, "step": 7894} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 7894} {"info/global_step": 7895, "train_info/time_within_train_step": 2.668084144592285, "step": 7895} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 7895} {"info/global_step": 7896, "train_info/time_within_train_step": 2.672356367111206, "step": 7896} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 7896} {"info/global_step": 7897, "train_info/time_within_train_step": 2.6497299671173096, "step": 7897} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 7897} {"info/global_step": 7898, "train_info/time_within_train_step": 2.684175968170166, "step": 7898} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 7898} {"info/global_step": 7899, "train_info/time_within_train_step": 2.641047954559326, "step": 7899} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 7899} {"info/global_step": 7900, "train_info/time_within_train_step": 2.6485042572021484, "step": 7900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919559, "_runtime": 22157}, "step": 7900} {"logs": {"train/loss": 3.1217, "train/learning_rate": 0.00014, "train/epoch": 9.01, "_timestamp": 1746919559, "_runtime": 22157}, "step": 7900} {"train_info/time_between_train_steps": 0.02415943145751953, "step": 7900} {"info/global_step": 7901, "train_info/time_within_train_step": 2.648414373397827, "step": 7901} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 7901} {"info/global_step": 7902, "train_info/time_within_train_step": 2.644467830657959, "step": 7902} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 7902} {"info/global_step": 7903, "train_info/time_within_train_step": 2.648604154586792, "step": 7903} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 7903} {"info/global_step": 7904, "train_info/time_within_train_step": 2.648174285888672, "step": 7904} {"train_info/time_between_train_steps": 0.003290414810180664, "step": 7904} {"info/global_step": 7905, "train_info/time_within_train_step": 2.6648659706115723, "step": 7905} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 7905} {"info/global_step": 7906, "train_info/time_within_train_step": 2.6605310440063477, "step": 7906} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 7906} {"info/global_step": 7907, "train_info/time_within_train_step": 2.655111312866211, "step": 7907} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 7907} {"info/global_step": 7908, "train_info/time_within_train_step": 2.706265687942505, "step": 7908} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 7908} {"info/global_step": 7909, "train_info/time_within_train_step": 2.649118423461914, "step": 7909} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 7909} {"info/global_step": 7910, "train_info/time_within_train_step": 2.646278142929077, "step": 7910} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 7910} {"info/global_step": 7911, "train_info/time_within_train_step": 2.6530933380126953, "step": 7911} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 7911} {"info/global_step": 7912, "train_info/time_within_train_step": 2.6475911140441895, "step": 7912} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 7912} {"info/global_step": 7913, "train_info/time_within_train_step": 2.6485090255737305, "step": 7913} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 7913} {"info/global_step": 7914, "train_info/time_within_train_step": 2.6489734649658203, "step": 7914} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 7914} {"info/global_step": 7915, "train_info/time_within_train_step": 2.653235912322998, "step": 7915} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 7915} {"info/global_step": 7916, "train_info/time_within_train_step": 2.6721887588500977, "step": 7916} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 7916} {"info/global_step": 7917, "train_info/time_within_train_step": 2.66664981842041, "step": 7917} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 7917} {"info/global_step": 7918, "train_info/time_within_train_step": 2.723036289215088, "step": 7918} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 7918} {"info/global_step": 7919, "train_info/time_within_train_step": 2.669332504272461, "step": 7919} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 7919} {"info/global_step": 7920, "train_info/time_within_train_step": 2.6459572315216064, "step": 7920} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 7920} {"info/global_step": 7921, "train_info/time_within_train_step": 2.640897512435913, "step": 7921} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 7921} {"info/global_step": 7922, "train_info/time_within_train_step": 2.65541410446167, "step": 7922} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 7922} {"info/global_step": 7923, "train_info/time_within_train_step": 2.6551966667175293, "step": 7923} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 7923} {"info/global_step": 7924, "train_info/time_within_train_step": 2.6446638107299805, "step": 7924} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 7924} {"info/global_step": 7925, "train_info/time_within_train_step": 2.6520447731018066, "step": 7925} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 7925} {"info/global_step": 7926, "train_info/time_within_train_step": 2.6548705101013184, "step": 7926} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 7926} {"info/global_step": 7927, "train_info/time_within_train_step": 2.6663978099823, "step": 7927} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 7927} {"info/global_step": 7928, "train_info/time_within_train_step": 2.7113144397735596, "step": 7928} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 7928} {"info/global_step": 7929, "train_info/time_within_train_step": 2.6442649364471436, "step": 7929} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 7929} {"info/global_step": 7930, "train_info/time_within_train_step": 2.6572229862213135, "step": 7930} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 7930} {"info/global_step": 7931, "train_info/time_within_train_step": 2.654686689376831, "step": 7931} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 7931} {"info/global_step": 7932, "train_info/time_within_train_step": 2.648970127105713, "step": 7932} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 7932} {"info/global_step": 7933, "train_info/time_within_train_step": 2.6519858837127686, "step": 7933} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 7933} {"info/global_step": 7934, "train_info/time_within_train_step": 2.644766330718994, "step": 7934} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 7934} {"info/global_step": 7935, "train_info/time_within_train_step": 2.6487443447113037, "step": 7935} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 7935} {"info/global_step": 7936, "train_info/time_within_train_step": 2.6726932525634766, "step": 7936} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 7936} {"info/global_step": 7937, "train_info/time_within_train_step": 2.664367198944092, "step": 7937} {"train_info/time_between_train_steps": 0.003246307373046875, "step": 7937} {"info/global_step": 7938, "train_info/time_within_train_step": 2.664142608642578, "step": 7938} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 7938} {"info/global_step": 7939, "train_info/time_within_train_step": 2.6785433292388916, "step": 7939} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 7939} {"info/global_step": 7940, "train_info/time_within_train_step": 2.643190622329712, "step": 7940} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 7940} {"info/global_step": 7941, "train_info/time_within_train_step": 2.6555871963500977, "step": 7941} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 7941} {"info/global_step": 7942, "train_info/time_within_train_step": 2.651315450668335, "step": 7942} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 7942} {"info/global_step": 7943, "train_info/time_within_train_step": 2.648301839828491, "step": 7943} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 7943} {"info/global_step": 7944, "train_info/time_within_train_step": 2.6611173152923584, "step": 7944} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 7944} {"info/global_step": 7945, "train_info/time_within_train_step": 2.6657259464263916, "step": 7945} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 7945} {"info/global_step": 7946, "train_info/time_within_train_step": 2.660684108734131, "step": 7946} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 7946} {"info/global_step": 7947, "train_info/time_within_train_step": 2.709197759628296, "step": 7947} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 7947} {"info/global_step": 7948, "train_info/time_within_train_step": 2.642052173614502, "step": 7948} {"train_info/time_between_train_steps": 0.0032935142517089844, "step": 7948} {"info/global_step": 7949, "train_info/time_within_train_step": 2.648991584777832, "step": 7949} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 7949} {"info/global_step": 7950, "train_info/time_within_train_step": 2.6641576290130615, "step": 7950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919694, "_runtime": 22292}, "step": 7950} {"logs": {"train/loss": 3.1176, "train/learning_rate": 0.00013666666666666666, "train/epoch": 9.02, "_timestamp": 1746919694, "_runtime": 22292}, "step": 7950} {"train_info/time_between_train_steps": 0.024286508560180664, "step": 7950} {"info/global_step": 7951, "train_info/time_within_train_step": 2.6527411937713623, "step": 7951} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 7951} {"info/global_step": 7952, "train_info/time_within_train_step": 2.653873920440674, "step": 7952} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 7952} {"info/global_step": 7953, "train_info/time_within_train_step": 2.64455509185791, "step": 7953} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 7953} {"info/global_step": 7954, "train_info/time_within_train_step": 2.658050298690796, "step": 7954} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 7954} {"info/global_step": 7955, "train_info/time_within_train_step": 2.7797446250915527, "step": 7955} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 7955} {"info/global_step": 7956, "train_info/time_within_train_step": 2.659708261489868, "step": 7956} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 7956} {"info/global_step": 7957, "train_info/time_within_train_step": 2.6521971225738525, "step": 7957} {"train_info/time_between_train_steps": 0.0032525062561035156, "step": 7957} {"info/global_step": 7958, "train_info/time_within_train_step": 2.6652932167053223, "step": 7958} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 7958} {"info/global_step": 7959, "train_info/time_within_train_step": 2.7248518466949463, "step": 7959} {"train_info/time_between_train_steps": 0.0032389163970947266, "step": 7959} {"info/global_step": 7960, "train_info/time_within_train_step": 2.665431499481201, "step": 7960} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 7960} {"info/global_step": 7961, "train_info/time_within_train_step": 2.6445205211639404, "step": 7961} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 7961} {"info/global_step": 7962, "train_info/time_within_train_step": 2.649610996246338, "step": 7962} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 7962} {"info/global_step": 7963, "train_info/time_within_train_step": 2.644212245941162, "step": 7963} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 7963} {"info/global_step": 7964, "train_info/time_within_train_step": 2.6688425540924072, "step": 7964} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 7964} {"info/global_step": 7965, "train_info/time_within_train_step": 2.673121929168701, "step": 7965} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 7965} {"info/global_step": 7966, "train_info/time_within_train_step": 2.6951894760131836, "step": 7966} {"train_info/time_between_train_steps": 0.0032958984375, "step": 7966} {"info/global_step": 7967, "train_info/time_within_train_step": 2.6485249996185303, "step": 7967} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 7967} {"info/global_step": 7968, "train_info/time_within_train_step": 2.6446590423583984, "step": 7968} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 7968} {"info/global_step": 7969, "train_info/time_within_train_step": 2.6540777683258057, "step": 7969} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 7969} {"info/global_step": 7970, "train_info/time_within_train_step": 2.893375873565674, "step": 7970} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 7970} {"info/global_step": 7971, "train_info/time_within_train_step": 2.664829730987549, "step": 7971} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 7971} {"info/global_step": 7972, "train_info/time_within_train_step": 2.64182186126709, "step": 7972} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 7972} {"info/global_step": 7973, "train_info/time_within_train_step": 2.6926321983337402, "step": 7973} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 7973} {"info/global_step": 7974, "train_info/time_within_train_step": 2.646498441696167, "step": 7974} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 7974} {"info/global_step": 7975, "train_info/time_within_train_step": 2.6560275554656982, "step": 7975} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 7975} {"info/global_step": 7976, "train_info/time_within_train_step": 2.6441023349761963, "step": 7976} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 7976} {"info/global_step": 7977, "train_info/time_within_train_step": 2.6474196910858154, "step": 7977} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 7977} {"info/global_step": 7978, "train_info/time_within_train_step": 2.670930862426758, "step": 7978} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 7978} {"info/global_step": 7979, "train_info/time_within_train_step": 2.665530204772949, "step": 7979} {"train_info/time_between_train_steps": 0.0032799243927001953, "step": 7979} {"info/global_step": 7980, "train_info/time_within_train_step": 2.6552574634552, "step": 7980} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 7980} {"info/global_step": 7981, "train_info/time_within_train_step": 2.6844730377197266, "step": 7981} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 7981} {"info/global_step": 7982, "train_info/time_within_train_step": 2.642003059387207, "step": 7982} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 7982} {"info/global_step": 7983, "train_info/time_within_train_step": 2.643768548965454, "step": 7983} {"train_info/time_between_train_steps": 0.0032863616943359375, "step": 7983} {"info/global_step": 7984, "train_info/time_within_train_step": 2.6652629375457764, "step": 7984} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 7984} {"info/global_step": 7985, "train_info/time_within_train_step": 2.6520919799804688, "step": 7985} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 7985} {"info/global_step": 7986, "train_info/time_within_train_step": 2.6443886756896973, "step": 7986} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 7986} {"info/global_step": 7987, "train_info/time_within_train_step": 2.6615803241729736, "step": 7987} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 7987} {"info/global_step": 7988, "train_info/time_within_train_step": 2.6581263542175293, "step": 7988} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 7988} {"info/global_step": 7989, "train_info/time_within_train_step": 2.6686294078826904, "step": 7989} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 7989} {"info/global_step": 7990, "train_info/time_within_train_step": 2.6761889457702637, "step": 7990} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 7990} {"info/global_step": 7991, "train_info/time_within_train_step": 2.6706910133361816, "step": 7991} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 7991} {"info/global_step": 7992, "train_info/time_within_train_step": 2.6408746242523193, "step": 7992} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 7992} {"info/global_step": 7993, "train_info/time_within_train_step": 2.640193223953247, "step": 7993} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 7993} {"info/global_step": 7994, "train_info/time_within_train_step": 2.656989336013794, "step": 7994} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 7994} {"info/global_step": 7995, "train_info/time_within_train_step": 2.653573513031006, "step": 7995} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 7995} {"info/global_step": 7996, "train_info/time_within_train_step": 2.647256374359131, "step": 7996} {"train_info/time_between_train_steps": 0.0032274723052978516, "step": 7996} {"info/global_step": 7997, "train_info/time_within_train_step": 2.6604700088500977, "step": 7997} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 7997} {"info/global_step": 7998, "train_info/time_within_train_step": 3.270179033279419, "step": 7998} {"train_info/time_between_train_steps": 0.0064775943756103516, "step": 7998} {"info/global_step": 7999, "train_info/time_within_train_step": 2.6680052280426025, "step": 7999} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 7999} {"info/global_step": 8000, "train_info/time_within_train_step": 2.693721055984497, "step": 8000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919829, "_runtime": 22427}, "step": 8000} {"logs": {"train/loss": 3.0998, "train/learning_rate": 0.0001333333333333333, "train/epoch": 9.02, "_timestamp": 1746919829, "_runtime": 22427}, "step": 8000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919834, "_runtime": 22432}, "step": 8000} {"logs": {"eval/loss": 4.757665157318115, "eval/runtime": 5.1899, "eval/samples_per_second": 36.995, "eval/steps_per_second": 1.156, "train/epoch": 9.02, "_timestamp": 1746919834, "_runtime": 22432}, "step": 8000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919834, "_runtime": 22432}, "step": 8000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.757665157318115, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 116.4736605003892, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1899, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.995, "train/epoch": 9.02, "_timestamp": 1746919834, "_runtime": 22432}, "step": 8000} {"train_info/time_between_train_steps": 18.95218825340271, "step": 8000} {"info/global_step": 8001, "train_info/time_within_train_step": 2.4692342281341553, "step": 8001} {"train_info/time_between_train_steps": 0.006540775299072266, "step": 8001} {"info/global_step": 8002, "train_info/time_within_train_step": 2.437635660171509, "step": 8002} {"train_info/time_between_train_steps": 0.00650787353515625, "step": 8002} {"info/global_step": 8003, "train_info/time_within_train_step": 2.5793263912200928, "step": 8003} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 8003} {"info/global_step": 8004, "train_info/time_within_train_step": 2.6637351512908936, "step": 8004} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 8004} {"info/global_step": 8005, "train_info/time_within_train_step": 2.6802029609680176, "step": 8005} {"train_info/time_between_train_steps": 0.003265380859375, "step": 8005} {"info/global_step": 8006, "train_info/time_within_train_step": 2.646951913833618, "step": 8006} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 8006} {"info/global_step": 8007, "train_info/time_within_train_step": 2.681896686553955, "step": 8007} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 8007} {"info/global_step": 8008, "train_info/time_within_train_step": 2.641162395477295, "step": 8008} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 8008} {"info/global_step": 8009, "train_info/time_within_train_step": 2.6488659381866455, "step": 8009} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 8009} {"info/global_step": 8010, "train_info/time_within_train_step": 2.6665945053100586, "step": 8010} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 8010} {"info/global_step": 8011, "train_info/time_within_train_step": 2.643578290939331, "step": 8011} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 8011} {"info/global_step": 8012, "train_info/time_within_train_step": 2.646557092666626, "step": 8012} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 8012} {"info/global_step": 8013, "train_info/time_within_train_step": 2.651965379714966, "step": 8013} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 8013} {"info/global_step": 8014, "train_info/time_within_train_step": 2.641879081726074, "step": 8014} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 8014} {"info/global_step": 8015, "train_info/time_within_train_step": 2.6434803009033203, "step": 8015} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 8015} {"info/global_step": 8016, "train_info/time_within_train_step": 2.661511182785034, "step": 8016} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 8016} {"info/global_step": 8017, "train_info/time_within_train_step": 2.655087471008301, "step": 8017} {"train_info/time_between_train_steps": 0.13071370124816895, "step": 8017} {"info/global_step": 8018, "train_info/time_within_train_step": 2.655945062637329, "step": 8018} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 8018} {"info/global_step": 8019, "train_info/time_within_train_step": 2.6564600467681885, "step": 8019} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 8019} {"info/global_step": 8020, "train_info/time_within_train_step": 2.906130790710449, "step": 8020} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 8020} {"info/global_step": 8021, "train_info/time_within_train_step": 2.6589882373809814, "step": 8021} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 8021} {"info/global_step": 8022, "train_info/time_within_train_step": 2.6442630290985107, "step": 8022} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 8022} {"info/global_step": 8023, "train_info/time_within_train_step": 2.6484732627868652, "step": 8023} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 8023} {"info/global_step": 8024, "train_info/time_within_train_step": 2.651261568069458, "step": 8024} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 8024} {"info/global_step": 8025, "train_info/time_within_train_step": 2.646967649459839, "step": 8025} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 8025} {"info/global_step": 8026, "train_info/time_within_train_step": 2.6481237411499023, "step": 8026} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 8026} {"info/global_step": 8027, "train_info/time_within_train_step": 2.6641223430633545, "step": 8027} {"train_info/time_between_train_steps": 0.003332853317260742, "step": 8027} {"info/global_step": 8028, "train_info/time_within_train_step": 2.666961908340454, "step": 8028} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 8028} {"info/global_step": 8029, "train_info/time_within_train_step": 2.7130966186523438, "step": 8029} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 8029} {"info/global_step": 8030, "train_info/time_within_train_step": 2.649462938308716, "step": 8030} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 8030} {"info/global_step": 8031, "train_info/time_within_train_step": 2.6642327308654785, "step": 8031} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 8031} {"info/global_step": 8032, "train_info/time_within_train_step": 2.6430466175079346, "step": 8032} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 8032} {"info/global_step": 8033, "train_info/time_within_train_step": 2.6543660163879395, "step": 8033} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 8033} {"info/global_step": 8034, "train_info/time_within_train_step": 2.65427827835083, "step": 8034} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 8034} {"info/global_step": 8035, "train_info/time_within_train_step": 2.643656015396118, "step": 8035} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 8035} {"info/global_step": 8036, "train_info/time_within_train_step": 2.651475429534912, "step": 8036} {"train_info/time_between_train_steps": 0.0036334991455078125, "step": 8036} {"info/global_step": 8037, "train_info/time_within_train_step": 2.6713995933532715, "step": 8037} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 8037} {"info/global_step": 8038, "train_info/time_within_train_step": 2.6719868183135986, "step": 8038} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 8038} {"info/global_step": 8039, "train_info/time_within_train_step": 2.6556777954101562, "step": 8039} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 8039} {"info/global_step": 8040, "train_info/time_within_train_step": 2.683267593383789, "step": 8040} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 8040} {"info/global_step": 8041, "train_info/time_within_train_step": 2.648787498474121, "step": 8041} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 8041} {"info/global_step": 8042, "train_info/time_within_train_step": 2.6501853466033936, "step": 8042} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 8042} {"info/global_step": 8043, "train_info/time_within_train_step": 2.646461009979248, "step": 8043} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 8043} {"info/global_step": 8044, "train_info/time_within_train_step": 2.652289867401123, "step": 8044} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 8044} {"info/global_step": 8045, "train_info/time_within_train_step": 2.6537158489227295, "step": 8045} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 8045} {"info/global_step": 8046, "train_info/time_within_train_step": 2.6452555656433105, "step": 8046} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 8046} {"info/global_step": 8047, "train_info/time_within_train_step": 2.675917863845825, "step": 8047} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 8047} {"info/global_step": 8048, "train_info/time_within_train_step": 2.656944513320923, "step": 8048} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 8048} {"info/global_step": 8049, "train_info/time_within_train_step": 2.662198781967163, "step": 8049} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 8049} {"info/global_step": 8050, "train_info/time_within_train_step": 2.699138879776001, "step": 8050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746919982, "_runtime": 22580}, "step": 8050} {"logs": {"train/loss": 3.0984, "train/learning_rate": 0.00013, "train/epoch": 9.03, "_timestamp": 1746919982, "_runtime": 22580}, "step": 8050} {"train_info/time_between_train_steps": 0.0248415470123291, "step": 8050} {"info/global_step": 8051, "train_info/time_within_train_step": 2.7076618671417236, "step": 8051} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 8051} {"info/global_step": 8052, "train_info/time_within_train_step": 2.6406848430633545, "step": 8052} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 8052} {"info/global_step": 8053, "train_info/time_within_train_step": 2.6488144397735596, "step": 8053} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 8053} {"info/global_step": 8054, "train_info/time_within_train_step": 2.663137435913086, "step": 8054} {"train_info/time_between_train_steps": 0.0032880306243896484, "step": 8054} {"info/global_step": 8055, "train_info/time_within_train_step": 2.6452908515930176, "step": 8055} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 8055} {"info/global_step": 8056, "train_info/time_within_train_step": 2.652306079864502, "step": 8056} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 8056} {"info/global_step": 8057, "train_info/time_within_train_step": 2.6485350131988525, "step": 8057} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 8057} {"info/global_step": 8058, "train_info/time_within_train_step": 2.642777919769287, "step": 8058} {"train_info/time_between_train_steps": 0.0032787322998046875, "step": 8058} {"info/global_step": 8059, "train_info/time_within_train_step": 2.6410746574401855, "step": 8059} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 8059} {"info/global_step": 8060, "train_info/time_within_train_step": 2.663619041442871, "step": 8060} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 8060} {"info/global_step": 8061, "train_info/time_within_train_step": 2.6476495265960693, "step": 8061} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 8061} {"info/global_step": 8062, "train_info/time_within_train_step": 2.646927833557129, "step": 8062} {"train_info/time_between_train_steps": 0.003368854522705078, "step": 8062} {"info/global_step": 8063, "train_info/time_within_train_step": 2.6496949195861816, "step": 8063} {"train_info/time_between_train_steps": 0.0035054683685302734, "step": 8063} {"info/global_step": 8064, "train_info/time_within_train_step": 2.6594767570495605, "step": 8064} {"train_info/time_between_train_steps": 0.0034627914428710938, "step": 8064} {"info/global_step": 8065, "train_info/time_within_train_step": 2.6910173892974854, "step": 8065} {"train_info/time_between_train_steps": 0.0034415721893310547, "step": 8065} {"info/global_step": 8066, "train_info/time_within_train_step": 2.6527957916259766, "step": 8066} {"train_info/time_between_train_steps": 0.0035724639892578125, "step": 8066} {"info/global_step": 8067, "train_info/time_within_train_step": 2.6498117446899414, "step": 8067} {"train_info/time_between_train_steps": 0.0036764144897460938, "step": 8067} {"info/global_step": 8068, "train_info/time_within_train_step": 2.6558594703674316, "step": 8068} {"train_info/time_between_train_steps": 0.003490924835205078, "step": 8068} {"info/global_step": 8069, "train_info/time_within_train_step": 2.6505396366119385, "step": 8069} {"train_info/time_between_train_steps": 0.0035178661346435547, "step": 8069} {"info/global_step": 8070, "train_info/time_within_train_step": 2.6518912315368652, "step": 8070} {"train_info/time_between_train_steps": 0.0034494400024414062, "step": 8070} {"info/global_step": 8071, "train_info/time_within_train_step": 2.644880533218384, "step": 8071} {"train_info/time_between_train_steps": 0.0034499168395996094, "step": 8071} {"info/global_step": 8072, "train_info/time_within_train_step": 2.649160146713257, "step": 8072} {"train_info/time_between_train_steps": 0.003507375717163086, "step": 8072} {"info/global_step": 8073, "train_info/time_within_train_step": 2.6711297035217285, "step": 8073} {"train_info/time_between_train_steps": 0.003432750701904297, "step": 8073} {"info/global_step": 8074, "train_info/time_within_train_step": 2.6664793491363525, "step": 8074} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 8074} {"info/global_step": 8075, "train_info/time_within_train_step": 2.6669788360595703, "step": 8075} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 8075} {"info/global_step": 8076, "train_info/time_within_train_step": 2.667043685913086, "step": 8076} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 8076} {"info/global_step": 8077, "train_info/time_within_train_step": 2.660648822784424, "step": 8077} {"train_info/time_between_train_steps": 0.003589153289794922, "step": 8077} {"info/global_step": 8078, "train_info/time_within_train_step": 2.6484930515289307, "step": 8078} {"train_info/time_between_train_steps": 0.0035021305084228516, "step": 8078} {"info/global_step": 8079, "train_info/time_within_train_step": 2.6535487174987793, "step": 8079} {"train_info/time_between_train_steps": 0.003591775894165039, "step": 8079} {"info/global_step": 8080, "train_info/time_within_train_step": 2.8099513053894043, "step": 8080} {"train_info/time_between_train_steps": 0.0034110546112060547, "step": 8080} {"info/global_step": 8081, "train_info/time_within_train_step": 2.6465258598327637, "step": 8081} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 8081} {"info/global_step": 8082, "train_info/time_within_train_step": 2.6495203971862793, "step": 8082} {"train_info/time_between_train_steps": 0.003344297409057617, "step": 8082} {"info/global_step": 8083, "train_info/time_within_train_step": 2.6559150218963623, "step": 8083} {"train_info/time_between_train_steps": 0.0032949447631835938, "step": 8083} {"info/global_step": 8084, "train_info/time_within_train_step": 2.647820472717285, "step": 8084} {"train_info/time_between_train_steps": 0.003356456756591797, "step": 8084} {"info/global_step": 8085, "train_info/time_within_train_step": 2.6573445796966553, "step": 8085} {"train_info/time_between_train_steps": 0.0033059120178222656, "step": 8085} {"info/global_step": 8086, "train_info/time_within_train_step": 2.7228212356567383, "step": 8086} {"train_info/time_between_train_steps": 0.003383636474609375, "step": 8086} {"info/global_step": 8087, "train_info/time_within_train_step": 2.64691162109375, "step": 8087} {"train_info/time_between_train_steps": 0.003275156021118164, "step": 8087} {"info/global_step": 8088, "train_info/time_within_train_step": 2.641493797302246, "step": 8088} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 8088} {"info/global_step": 8089, "train_info/time_within_train_step": 2.6638848781585693, "step": 8089} {"train_info/time_between_train_steps": 0.0033059120178222656, "step": 8089} {"info/global_step": 8090, "train_info/time_within_train_step": 2.648827075958252, "step": 8090} {"train_info/time_between_train_steps": 0.003347635269165039, "step": 8090} {"info/global_step": 8091, "train_info/time_within_train_step": 2.6453733444213867, "step": 8091} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 8091} {"info/global_step": 8092, "train_info/time_within_train_step": 2.65384840965271, "step": 8092} {"train_info/time_between_train_steps": 0.0034101009368896484, "step": 8092} {"info/global_step": 8093, "train_info/time_within_train_step": 2.645585536956787, "step": 8093} {"train_info/time_between_train_steps": 0.0034055709838867188, "step": 8093} {"info/global_step": 8094, "train_info/time_within_train_step": 2.6671018600463867, "step": 8094} {"train_info/time_between_train_steps": 0.003390789031982422, "step": 8094} {"info/global_step": 8095, "train_info/time_within_train_step": 2.671734571456909, "step": 8095} {"train_info/time_between_train_steps": 0.00347137451171875, "step": 8095} {"info/global_step": 8096, "train_info/time_within_train_step": 2.691882848739624, "step": 8096} {"train_info/time_between_train_steps": 0.003484964370727539, "step": 8096} {"info/global_step": 8097, "train_info/time_within_train_step": 2.6494638919830322, "step": 8097} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 8097} {"info/global_step": 8098, "train_info/time_within_train_step": 2.6429150104522705, "step": 8098} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 8098} {"info/global_step": 8099, "train_info/time_within_train_step": 2.6597390174865723, "step": 8099} {"train_info/time_between_train_steps": 0.0034787654876708984, "step": 8099} {"info/global_step": 8100, "train_info/time_within_train_step": 2.6546878814697266, "step": 8100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746920117, "_runtime": 22715}, "step": 8100} {"logs": {"train/loss": 3.0951, "train/learning_rate": 0.00012666666666666666, "train/epoch": 9.03, "_timestamp": 1746920117, "_runtime": 22715}, "step": 8100} {"train_info/time_between_train_steps": 0.02449512481689453, "step": 8100} {"info/global_step": 8101, "train_info/time_within_train_step": 2.654252052307129, "step": 8101} {"train_info/time_between_train_steps": 0.0034685134887695312, "step": 8101} {"info/global_step": 8102, "train_info/time_within_train_step": 2.6455442905426025, "step": 8102} {"train_info/time_between_train_steps": 0.0034656524658203125, "step": 8102} {"info/global_step": 8103, "train_info/time_within_train_step": 2.647742509841919, "step": 8103} {"train_info/time_between_train_steps": 0.0035347938537597656, "step": 8103} {"info/global_step": 8104, "train_info/time_within_train_step": 2.670456647872925, "step": 8104} {"train_info/time_between_train_steps": 0.003458738327026367, "step": 8104} {"info/global_step": 8105, "train_info/time_within_train_step": 2.6669399738311768, "step": 8105} {"train_info/time_between_train_steps": 0.0035240650177001953, "step": 8105} {"info/global_step": 8106, "train_info/time_within_train_step": 2.669365167617798, "step": 8106} {"train_info/time_between_train_steps": 0.003529071807861328, "step": 8106} {"info/global_step": 8107, "train_info/time_within_train_step": 2.672924280166626, "step": 8107} {"train_info/time_between_train_steps": 0.0034592151641845703, "step": 8107} {"info/global_step": 8108, "train_info/time_within_train_step": 2.6479475498199463, "step": 8108} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 8108} {"info/global_step": 8109, "train_info/time_within_train_step": 2.655099630355835, "step": 8109} {"train_info/time_between_train_steps": 0.0034842491149902344, "step": 8109} {"info/global_step": 8110, "train_info/time_within_train_step": 2.651782751083374, "step": 8110} {"train_info/time_between_train_steps": 0.003520965576171875, "step": 8110} {"info/global_step": 8111, "train_info/time_within_train_step": 2.646498203277588, "step": 8111} {"train_info/time_between_train_steps": 0.0034842491149902344, "step": 8111} {"info/global_step": 8112, "train_info/time_within_train_step": 2.6494927406311035, "step": 8112} {"train_info/time_between_train_steps": 0.0034172534942626953, "step": 8112} {"info/global_step": 8113, "train_info/time_within_train_step": 2.6490228176116943, "step": 8113} {"train_info/time_between_train_steps": 0.0034770965576171875, "step": 8113} {"info/global_step": 8114, "train_info/time_within_train_step": 2.6756460666656494, "step": 8114} {"train_info/time_between_train_steps": 0.003425121307373047, "step": 8114} {"info/global_step": 8115, "train_info/time_within_train_step": 2.65922212600708, "step": 8115} {"train_info/time_between_train_steps": 0.0034322738647460938, "step": 8115} {"info/global_step": 8116, "train_info/time_within_train_step": 2.662503957748413, "step": 8116} {"train_info/time_between_train_steps": 0.0035042762756347656, "step": 8116} {"info/global_step": 8117, "train_info/time_within_train_step": 2.698058843612671, "step": 8117} {"train_info/time_between_train_steps": 0.0034029483795166016, "step": 8117} {"info/global_step": 8118, "train_info/time_within_train_step": 2.65217924118042, "step": 8118} {"train_info/time_between_train_steps": 0.0034835338592529297, "step": 8118} {"info/global_step": 8119, "train_info/time_within_train_step": 2.6442837715148926, "step": 8119} {"train_info/time_between_train_steps": 0.0034554004669189453, "step": 8119} {"info/global_step": 8120, "train_info/time_within_train_step": 3.001927614212036, "step": 8120} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 8120} {"info/global_step": 8121, "train_info/time_within_train_step": 2.6419575214385986, "step": 8121} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 8121} {"info/global_step": 8122, "train_info/time_within_train_step": 2.663367748260498, "step": 8122} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 8122} {"info/global_step": 8123, "train_info/time_within_train_step": 2.656660318374634, "step": 8123} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 8123} {"info/global_step": 8124, "train_info/time_within_train_step": 2.6453871726989746, "step": 8124} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 8124} {"info/global_step": 8125, "train_info/time_within_train_step": 2.6597630977630615, "step": 8125} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 8125} {"info/global_step": 8126, "train_info/time_within_train_step": 2.65354061126709, "step": 8126} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 8126} {"info/global_step": 8127, "train_info/time_within_train_step": 2.660311698913574, "step": 8127} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 8127} {"info/global_step": 8128, "train_info/time_within_train_step": 2.7006595134735107, "step": 8128} {"train_info/time_between_train_steps": 0.0032644271850585938, "step": 8128} {"info/global_step": 8129, "train_info/time_within_train_step": 2.712392568588257, "step": 8129} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 8129} {"info/global_step": 8130, "train_info/time_within_train_step": 2.6418039798736572, "step": 8130} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 8130} {"info/global_step": 8131, "train_info/time_within_train_step": 2.643099546432495, "step": 8131} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 8131} {"info/global_step": 8132, "train_info/time_within_train_step": 2.6611502170562744, "step": 8132} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 8132} {"info/global_step": 8133, "train_info/time_within_train_step": 2.652475357055664, "step": 8133} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 8133} {"info/global_step": 8134, "train_info/time_within_train_step": 2.646989107131958, "step": 8134} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 8134} {"info/global_step": 8135, "train_info/time_within_train_step": 2.668687105178833, "step": 8135} {"train_info/time_between_train_steps": 0.00327301025390625, "step": 8135} {"info/global_step": 8136, "train_info/time_within_train_step": 2.6946122646331787, "step": 8136} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 8136} {"info/global_step": 8137, "train_info/time_within_train_step": 2.665969133377075, "step": 8137} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 8137} {"info/global_step": 8138, "train_info/time_within_train_step": 2.660112142562866, "step": 8138} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 8138} {"info/global_step": 8139, "train_info/time_within_train_step": 2.641230583190918, "step": 8139} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 8139} {"info/global_step": 8140, "train_info/time_within_train_step": 2.657836675643921, "step": 8140} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 8140} {"info/global_step": 8141, "train_info/time_within_train_step": 2.6551413536071777, "step": 8141} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 8141} {"info/global_step": 8142, "train_info/time_within_train_step": 2.643230438232422, "step": 8142} {"train_info/time_between_train_steps": 0.1369020938873291, "step": 8142} {"info/global_step": 8143, "train_info/time_within_train_step": 2.657050371170044, "step": 8143} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 8143} {"info/global_step": 8144, "train_info/time_within_train_step": 2.644531726837158, "step": 8144} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 8144} {"info/global_step": 8145, "train_info/time_within_train_step": 2.645054817199707, "step": 8145} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 8145} {"info/global_step": 8146, "train_info/time_within_train_step": 2.6620144844055176, "step": 8146} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 8146} {"info/global_step": 8147, "train_info/time_within_train_step": 2.668415069580078, "step": 8147} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 8147} {"info/global_step": 8148, "train_info/time_within_train_step": 2.686168909072876, "step": 8148} {"train_info/time_between_train_steps": 0.003276348114013672, "step": 8148} {"info/global_step": 8149, "train_info/time_within_train_step": 2.651651382446289, "step": 8149} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 8149} {"info/global_step": 8150, "train_info/time_within_train_step": 2.6847500801086426, "step": 8150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746920251, "_runtime": 22849}, "step": 8150} {"logs": {"train/loss": 3.0792, "train/learning_rate": 0.0001233333333333333, "train/epoch": 9.04, "_timestamp": 1746920251, "_runtime": 22849}, "step": 8150} {"train_info/time_between_train_steps": 0.02417278289794922, "step": 8150} {"info/global_step": 8151, "train_info/time_within_train_step": 2.660626173019409, "step": 8151} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 8151} {"info/global_step": 8152, "train_info/time_within_train_step": 2.6483912467956543, "step": 8152} {"train_info/time_between_train_steps": 0.003322601318359375, "step": 8152} {"info/global_step": 8153, "train_info/time_within_train_step": 2.6427791118621826, "step": 8153} {"train_info/time_between_train_steps": 0.0033168792724609375, "step": 8153} {"info/global_step": 8154, "train_info/time_within_train_step": 2.6618123054504395, "step": 8154} {"train_info/time_between_train_steps": 0.003383159637451172, "step": 8154} {"info/global_step": 8155, "train_info/time_within_train_step": 2.662449598312378, "step": 8155} {"train_info/time_between_train_steps": 0.0034875869750976562, "step": 8155} {"info/global_step": 8156, "train_info/time_within_train_step": 2.645429849624634, "step": 8156} {"train_info/time_between_train_steps": 0.003566741943359375, "step": 8156} {"info/global_step": 8157, "train_info/time_within_train_step": 2.6621577739715576, "step": 8157} {"train_info/time_between_train_steps": 0.003484964370727539, "step": 8157} {"info/global_step": 8158, "train_info/time_within_train_step": 2.660754442214966, "step": 8158} {"train_info/time_between_train_steps": 0.003528594970703125, "step": 8158} {"info/global_step": 8159, "train_info/time_within_train_step": 2.683166742324829, "step": 8159} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 8159} {"info/global_step": 8160, "train_info/time_within_train_step": 2.6663076877593994, "step": 8160} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 8160} {"info/global_step": 8161, "train_info/time_within_train_step": 2.7021002769470215, "step": 8161} {"train_info/time_between_train_steps": 0.003533601760864258, "step": 8161} {"info/global_step": 8162, "train_info/time_within_train_step": 2.6409177780151367, "step": 8162} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 8162} {"info/global_step": 8163, "train_info/time_within_train_step": 2.64829158782959, "step": 8163} {"train_info/time_between_train_steps": 0.0034203529357910156, "step": 8163} {"info/global_step": 8164, "train_info/time_within_train_step": 2.6665444374084473, "step": 8164} {"train_info/time_between_train_steps": 0.003452777862548828, "step": 8164} {"info/global_step": 8165, "train_info/time_within_train_step": 2.6470818519592285, "step": 8165} {"train_info/time_between_train_steps": 0.0035080909729003906, "step": 8165} {"info/global_step": 8166, "train_info/time_within_train_step": 2.6460471153259277, "step": 8166} {"train_info/time_between_train_steps": 0.003451824188232422, "step": 8166} {"info/global_step": 8167, "train_info/time_within_train_step": 2.6540439128875732, "step": 8167} {"train_info/time_between_train_steps": 0.0034401416778564453, "step": 8167} {"info/global_step": 8168, "train_info/time_within_train_step": 2.653925895690918, "step": 8168} {"train_info/time_between_train_steps": 0.003454923629760742, "step": 8168} {"info/global_step": 8169, "train_info/time_within_train_step": 2.6610395908355713, "step": 8169} {"train_info/time_between_train_steps": 0.003523588180541992, "step": 8169} {"info/global_step": 8170, "train_info/time_within_train_step": 2.6818206310272217, "step": 8170} {"train_info/time_between_train_steps": 0.0034034252166748047, "step": 8170} {"info/global_step": 8171, "train_info/time_within_train_step": 2.729165554046631, "step": 8171} {"train_info/time_between_train_steps": 0.0035228729248046875, "step": 8171} {"info/global_step": 8172, "train_info/time_within_train_step": 2.6603970527648926, "step": 8172} {"train_info/time_between_train_steps": 0.0035347938537597656, "step": 8172} {"info/global_step": 8173, "train_info/time_within_train_step": 2.64243745803833, "step": 8173} {"train_info/time_between_train_steps": 0.0034427642822265625, "step": 8173} {"info/global_step": 8174, "train_info/time_within_train_step": 2.650561809539795, "step": 8174} {"train_info/time_between_train_steps": 0.0034275054931640625, "step": 8174} {"info/global_step": 8175, "train_info/time_within_train_step": 2.6557912826538086, "step": 8175} {"train_info/time_between_train_steps": 0.0035200119018554688, "step": 8175} {"info/global_step": 8176, "train_info/time_within_train_step": 2.655363082885742, "step": 8176} {"train_info/time_between_train_steps": 0.003490447998046875, "step": 8176} {"info/global_step": 8177, "train_info/time_within_train_step": 2.645940065383911, "step": 8177} {"train_info/time_between_train_steps": 0.003431081771850586, "step": 8177} {"info/global_step": 8178, "train_info/time_within_train_step": 2.65140700340271, "step": 8178} {"train_info/time_between_train_steps": 0.0034885406494140625, "step": 8178} {"info/global_step": 8179, "train_info/time_within_train_step": 2.654981851577759, "step": 8179} {"train_info/time_between_train_steps": 0.0035724639892578125, "step": 8179} {"info/global_step": 8180, "train_info/time_within_train_step": 3.023510694503784, "step": 8180} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 8180} {"info/global_step": 8181, "train_info/time_within_train_step": 2.6546788215637207, "step": 8181} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 8181} {"info/global_step": 8182, "train_info/time_within_train_step": 2.6453258991241455, "step": 8182} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 8182} {"info/global_step": 8183, "train_info/time_within_train_step": 2.6489827632904053, "step": 8183} {"train_info/time_between_train_steps": 0.003407716751098633, "step": 8183} {"info/global_step": 8184, "train_info/time_within_train_step": 2.662433624267578, "step": 8184} {"train_info/time_between_train_steps": 0.0034837722778320312, "step": 8184} {"info/global_step": 8185, "train_info/time_within_train_step": 2.668614149093628, "step": 8185} {"train_info/time_between_train_steps": 0.0033872127532958984, "step": 8185} {"info/global_step": 8186, "train_info/time_within_train_step": 2.711977243423462, "step": 8186} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 8186} {"info/global_step": 8187, "train_info/time_within_train_step": 2.645585536956787, "step": 8187} {"train_info/time_between_train_steps": 0.003437519073486328, "step": 8187} {"info/global_step": 8188, "train_info/time_within_train_step": 2.6653809547424316, "step": 8188} {"train_info/time_between_train_steps": 0.003468036651611328, "step": 8188} {"info/global_step": 8189, "train_info/time_within_train_step": 2.642246961593628, "step": 8189} {"train_info/time_between_train_steps": 0.0034987926483154297, "step": 8189} {"info/global_step": 8190, "train_info/time_within_train_step": 2.652132749557495, "step": 8190} {"train_info/time_between_train_steps": 0.003414630889892578, "step": 8190} {"info/global_step": 8191, "train_info/time_within_train_step": 2.6665453910827637, "step": 8191} {"train_info/time_between_train_steps": 0.003462553024291992, "step": 8191} {"info/global_step": 8192, "train_info/time_within_train_step": 2.6458189487457275, "step": 8192} {"train_info/time_between_train_steps": 0.0033981800079345703, "step": 8192} {"info/global_step": 8193, "train_info/time_within_train_step": 2.6460063457489014, "step": 8193} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 8193} {"info/global_step": 8194, "train_info/time_within_train_step": 2.6579601764678955, "step": 8194} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 8194} {"info/global_step": 8195, "train_info/time_within_train_step": 2.6686017513275146, "step": 8195} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 8195} {"info/global_step": 8196, "train_info/time_within_train_step": 2.677440643310547, "step": 8196} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 8196} {"info/global_step": 8197, "train_info/time_within_train_step": 2.6430137157440186, "step": 8197} {"train_info/time_between_train_steps": 0.003566265106201172, "step": 8197} {"info/global_step": 8198, "train_info/time_within_train_step": 2.651761293411255, "step": 8198} {"train_info/time_between_train_steps": 0.00341033935546875, "step": 8198} {"info/global_step": 8199, "train_info/time_within_train_step": 2.6633331775665283, "step": 8199} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 8199} {"info/global_step": 8200, "train_info/time_within_train_step": 2.6444435119628906, "step": 8200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746920386, "_runtime": 22984}, "step": 8200} {"logs": {"train/loss": 3.0863, "train/learning_rate": 0.00011999999999999999, "train/epoch": 9.04, "_timestamp": 1746920386, "_runtime": 22984}, "step": 8200} {"train_info/time_between_train_steps": 13.018187522888184, "step": 8200} {"info/global_step": 8201, "train_info/time_within_train_step": 2.441059112548828, "step": 8201} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 8201} {"info/global_step": 8202, "train_info/time_within_train_step": 2.4361963272094727, "step": 8202} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 8202} {"info/global_step": 8203, "train_info/time_within_train_step": 2.637533664703369, "step": 8203} {"train_info/time_between_train_steps": 0.0034220218658447266, "step": 8203} {"info/global_step": 8204, "train_info/time_within_train_step": 2.6496803760528564, "step": 8204} {"train_info/time_between_train_steps": 0.0033833980560302734, "step": 8204} {"info/global_step": 8205, "train_info/time_within_train_step": 2.867600440979004, "step": 8205} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 8205} {"info/global_step": 8206, "train_info/time_within_train_step": 2.6845364570617676, "step": 8206} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 8206} {"info/global_step": 8207, "train_info/time_within_train_step": 2.6537771224975586, "step": 8207} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 8207} {"info/global_step": 8208, "train_info/time_within_train_step": 2.6608269214630127, "step": 8208} {"train_info/time_between_train_steps": 0.0032486915588378906, "step": 8208} {"info/global_step": 8209, "train_info/time_within_train_step": 2.6484498977661133, "step": 8209} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 8209} {"info/global_step": 8210, "train_info/time_within_train_step": 2.6598546504974365, "step": 8210} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 8210} {"info/global_step": 8211, "train_info/time_within_train_step": 2.676417589187622, "step": 8211} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 8211} {"info/global_step": 8212, "train_info/time_within_train_step": 2.6657044887542725, "step": 8212} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 8212} {"info/global_step": 8213, "train_info/time_within_train_step": 2.7033441066741943, "step": 8213} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 8213} {"info/global_step": 8214, "train_info/time_within_train_step": 2.6430768966674805, "step": 8214} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 8214} {"info/global_step": 8215, "train_info/time_within_train_step": 2.6507883071899414, "step": 8215} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 8215} {"info/global_step": 8216, "train_info/time_within_train_step": 2.664727210998535, "step": 8216} {"train_info/time_between_train_steps": 0.0032668113708496094, "step": 8216} {"info/global_step": 8217, "train_info/time_within_train_step": 2.6452252864837646, "step": 8217} {"train_info/time_between_train_steps": 0.0032978057861328125, "step": 8217} {"info/global_step": 8218, "train_info/time_within_train_step": 2.6469712257385254, "step": 8218} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 8218} {"info/global_step": 8219, "train_info/time_within_train_step": 2.6504428386688232, "step": 8219} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 8219} {"info/global_step": 8220, "train_info/time_within_train_step": 2.6545817852020264, "step": 8220} {"train_info/time_between_train_steps": 0.0034074783325195312, "step": 8220} {"info/global_step": 8221, "train_info/time_within_train_step": 2.661206007003784, "step": 8221} {"train_info/time_between_train_steps": 0.003444671630859375, "step": 8221} {"info/global_step": 8222, "train_info/time_within_train_step": 2.673337936401367, "step": 8222} {"train_info/time_between_train_steps": 0.0033881664276123047, "step": 8222} {"info/global_step": 8223, "train_info/time_within_train_step": 2.732285499572754, "step": 8223} {"train_info/time_between_train_steps": 0.0035588741302490234, "step": 8223} {"info/global_step": 8224, "train_info/time_within_train_step": 2.66957950592041, "step": 8224} {"train_info/time_between_train_steps": 0.003446340560913086, "step": 8224} {"info/global_step": 8225, "train_info/time_within_train_step": 2.6445627212524414, "step": 8225} {"train_info/time_between_train_steps": 0.0034923553466796875, "step": 8225} {"info/global_step": 8226, "train_info/time_within_train_step": 2.6486923694610596, "step": 8226} {"train_info/time_between_train_steps": 0.0034444332122802734, "step": 8226} {"info/global_step": 8227, "train_info/time_within_train_step": 2.6585381031036377, "step": 8227} {"train_info/time_between_train_steps": 0.003488779067993164, "step": 8227} {"info/global_step": 8228, "train_info/time_within_train_step": 2.6578164100646973, "step": 8228} {"train_info/time_between_train_steps": 0.0035257339477539062, "step": 8228} {"info/global_step": 8229, "train_info/time_within_train_step": 2.65539813041687, "step": 8229} {"train_info/time_between_train_steps": 0.0034525394439697266, "step": 8229} {"info/global_step": 8230, "train_info/time_within_train_step": 2.646209716796875, "step": 8230} {"train_info/time_between_train_steps": 0.0035228729248046875, "step": 8230} {"info/global_step": 8231, "train_info/time_within_train_step": 2.6694464683532715, "step": 8231} {"train_info/time_between_train_steps": 0.003562450408935547, "step": 8231} {"info/global_step": 8232, "train_info/time_within_train_step": 3.043407917022705, "step": 8232} {"train_info/time_between_train_steps": 0.003403902053833008, "step": 8232} {"info/global_step": 8233, "train_info/time_within_train_step": 2.6520209312438965, "step": 8233} {"train_info/time_between_train_steps": 0.003862619400024414, "step": 8233} {"info/global_step": 8234, "train_info/time_within_train_step": 2.646519422531128, "step": 8234} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 8234} {"info/global_step": 8235, "train_info/time_within_train_step": 2.651653289794922, "step": 8235} {"train_info/time_between_train_steps": 0.003416776657104492, "step": 8235} {"info/global_step": 8236, "train_info/time_within_train_step": 2.647641897201538, "step": 8236} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 8236} {"info/global_step": 8237, "train_info/time_within_train_step": 2.6699957847595215, "step": 8237} {"train_info/time_between_train_steps": 0.0036249160766601562, "step": 8237} {"info/global_step": 8238, "train_info/time_within_train_step": 2.673196792602539, "step": 8238} {"train_info/time_between_train_steps": 0.0035772323608398438, "step": 8238} {"info/global_step": 8239, "train_info/time_within_train_step": 2.704437255859375, "step": 8239} {"train_info/time_between_train_steps": 0.0035500526428222656, "step": 8239} {"info/global_step": 8240, "train_info/time_within_train_step": 2.645564317703247, "step": 8240} {"train_info/time_between_train_steps": 0.0034613609313964844, "step": 8240} {"info/global_step": 8241, "train_info/time_within_train_step": 2.6546969413757324, "step": 8241} {"train_info/time_between_train_steps": 0.0034914016723632812, "step": 8241} {"info/global_step": 8242, "train_info/time_within_train_step": 2.650937557220459, "step": 8242} {"train_info/time_between_train_steps": 0.0035293102264404297, "step": 8242} {"info/global_step": 8243, "train_info/time_within_train_step": 2.6493287086486816, "step": 8243} {"train_info/time_between_train_steps": 0.0034782886505126953, "step": 8243} {"info/global_step": 8244, "train_info/time_within_train_step": 2.6615731716156006, "step": 8244} {"train_info/time_between_train_steps": 0.003847360610961914, "step": 8244} {"info/global_step": 8245, "train_info/time_within_train_step": 2.6477527618408203, "step": 8245} {"train_info/time_between_train_steps": 0.0034923553466796875, "step": 8245} {"info/global_step": 8246, "train_info/time_within_train_step": 2.646374464035034, "step": 8246} {"train_info/time_between_train_steps": 0.0034804344177246094, "step": 8246} {"info/global_step": 8247, "train_info/time_within_train_step": 2.6715481281280518, "step": 8247} {"train_info/time_between_train_steps": 0.0036454200744628906, "step": 8247} {"info/global_step": 8248, "train_info/time_within_train_step": 3.302438259124756, "step": 8248} {"train_info/time_between_train_steps": 0.0035049915313720703, "step": 8248} {"info/global_step": 8249, "train_info/time_within_train_step": 2.6517109870910645, "step": 8249} {"train_info/time_between_train_steps": 0.003432750701904297, "step": 8249} {"info/global_step": 8250, "train_info/time_within_train_step": 2.665332794189453, "step": 8250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746920534, "_runtime": 23132}, "step": 8250} {"logs": {"train/loss": 3.0699, "train/learning_rate": 0.00011666666666666665, "train/epoch": 9.05, "_timestamp": 1746920534, "_runtime": 23132}, "step": 8250} {"train_info/time_between_train_steps": 0.03967881202697754, "step": 8250} {"info/global_step": 8251, "train_info/time_within_train_step": 2.66363525390625, "step": 8251} {"train_info/time_between_train_steps": 0.003458738327026367, "step": 8251} {"info/global_step": 8252, "train_info/time_within_train_step": 2.6481025218963623, "step": 8252} {"train_info/time_between_train_steps": 0.003491640090942383, "step": 8252} {"info/global_step": 8253, "train_info/time_within_train_step": 2.6508543491363525, "step": 8253} {"train_info/time_between_train_steps": 0.0034139156341552734, "step": 8253} {"info/global_step": 8254, "train_info/time_within_train_step": 2.6632730960845947, "step": 8254} {"train_info/time_between_train_steps": 0.0035347938537597656, "step": 8254} {"info/global_step": 8255, "train_info/time_within_train_step": 2.6459100246429443, "step": 8255} {"train_info/time_between_train_steps": 0.0035665035247802734, "step": 8255} {"info/global_step": 8256, "train_info/time_within_train_step": 2.6725411415100098, "step": 8256} {"train_info/time_between_train_steps": 0.0034694671630859375, "step": 8256} {"info/global_step": 8257, "train_info/time_within_train_step": 2.689955711364746, "step": 8257} {"train_info/time_between_train_steps": 0.0034797191619873047, "step": 8257} {"info/global_step": 8258, "train_info/time_within_train_step": 2.6535677909851074, "step": 8258} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 8258} {"info/global_step": 8259, "train_info/time_within_train_step": 2.6886050701141357, "step": 8259} {"train_info/time_between_train_steps": 0.003505229949951172, "step": 8259} {"info/global_step": 8260, "train_info/time_within_train_step": 2.6420669555664062, "step": 8260} {"train_info/time_between_train_steps": 0.0034813880920410156, "step": 8260} {"info/global_step": 8261, "train_info/time_within_train_step": 2.651163339614868, "step": 8261} {"train_info/time_between_train_steps": 0.0035016536712646484, "step": 8261} {"info/global_step": 8262, "train_info/time_within_train_step": 2.664928436279297, "step": 8262} {"train_info/time_between_train_steps": 0.003429889678955078, "step": 8262} {"info/global_step": 8263, "train_info/time_within_train_step": 2.644636869430542, "step": 8263} {"train_info/time_between_train_steps": 0.003439188003540039, "step": 8263} {"info/global_step": 8264, "train_info/time_within_train_step": 2.6457417011260986, "step": 8264} {"train_info/time_between_train_steps": 0.0034940242767333984, "step": 8264} {"info/global_step": 8265, "train_info/time_within_train_step": 2.655150890350342, "step": 8265} {"train_info/time_between_train_steps": 0.0035228729248046875, "step": 8265} {"info/global_step": 8266, "train_info/time_within_train_step": 2.662364959716797, "step": 8266} {"train_info/time_between_train_steps": 0.0034427642822265625, "step": 8266} {"info/global_step": 8267, "train_info/time_within_train_step": 2.6723053455352783, "step": 8267} {"train_info/time_between_train_steps": 0.14556574821472168, "step": 8267} {"info/global_step": 8268, "train_info/time_within_train_step": 2.6660218238830566, "step": 8268} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 8268} {"info/global_step": 8269, "train_info/time_within_train_step": 2.6632611751556396, "step": 8269} {"train_info/time_between_train_steps": 0.0033342838287353516, "step": 8269} {"info/global_step": 8270, "train_info/time_within_train_step": 2.6629018783569336, "step": 8270} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 8270} {"info/global_step": 8271, "train_info/time_within_train_step": 2.647322177886963, "step": 8271} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 8271} {"info/global_step": 8272, "train_info/time_within_train_step": 2.6456785202026367, "step": 8272} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 8272} {"info/global_step": 8273, "train_info/time_within_train_step": 2.651355266571045, "step": 8273} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 8273} {"info/global_step": 8274, "train_info/time_within_train_step": 2.652575969696045, "step": 8274} {"train_info/time_between_train_steps": 0.0033249855041503906, "step": 8274} {"info/global_step": 8275, "train_info/time_within_train_step": 3.0013022422790527, "step": 8275} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 8275} {"info/global_step": 8276, "train_info/time_within_train_step": 2.644174337387085, "step": 8276} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 8276} {"info/global_step": 8277, "train_info/time_within_train_step": 2.648404359817505, "step": 8277} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 8277} {"info/global_step": 8278, "train_info/time_within_train_step": 2.6482021808624268, "step": 8278} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 8278} {"info/global_step": 8279, "train_info/time_within_train_step": 2.651618242263794, "step": 8279} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 8279} {"info/global_step": 8280, "train_info/time_within_train_step": 2.6609320640563965, "step": 8280} {"train_info/time_between_train_steps": 0.003363370895385742, "step": 8280} {"info/global_step": 8281, "train_info/time_within_train_step": 2.6792380809783936, "step": 8281} {"train_info/time_between_train_steps": 0.003454446792602539, "step": 8281} {"info/global_step": 8282, "train_info/time_within_train_step": 2.644890785217285, "step": 8282} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 8282} {"info/global_step": 8283, "train_info/time_within_train_step": 2.6585750579833984, "step": 8283} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 8283} {"info/global_step": 8284, "train_info/time_within_train_step": 2.659856081008911, "step": 8284} {"train_info/time_between_train_steps": 0.003324270248413086, "step": 8284} {"info/global_step": 8285, "train_info/time_within_train_step": 2.6475863456726074, "step": 8285} {"train_info/time_between_train_steps": 0.0035185813903808594, "step": 8285} {"info/global_step": 8286, "train_info/time_within_train_step": 2.646702289581299, "step": 8286} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 8286} {"info/global_step": 8287, "train_info/time_within_train_step": 2.645909070968628, "step": 8287} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 8287} {"info/global_step": 8288, "train_info/time_within_train_step": 2.6453373432159424, "step": 8288} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 8288} {"info/global_step": 8289, "train_info/time_within_train_step": 2.6754019260406494, "step": 8289} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 8289} {"info/global_step": 8290, "train_info/time_within_train_step": 2.6656620502471924, "step": 8290} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 8290} {"info/global_step": 8291, "train_info/time_within_train_step": 2.647789239883423, "step": 8291} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 8291} {"info/global_step": 8292, "train_info/time_within_train_step": 2.649993896484375, "step": 8292} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 8292} {"info/global_step": 8293, "train_info/time_within_train_step": 2.641784191131592, "step": 8293} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 8293} {"info/global_step": 8294, "train_info/time_within_train_step": 2.6559934616088867, "step": 8294} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 8294} {"info/global_step": 8295, "train_info/time_within_train_step": 2.6564924716949463, "step": 8295} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 8295} {"info/global_step": 8296, "train_info/time_within_train_step": 2.6441824436187744, "step": 8296} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 8296} {"info/global_step": 8297, "train_info/time_within_train_step": 2.645549774169922, "step": 8297} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 8297} {"info/global_step": 8298, "train_info/time_within_train_step": 2.6642987728118896, "step": 8298} {"train_info/time_between_train_steps": 0.0035462379455566406, "step": 8298} {"info/global_step": 8299, "train_info/time_within_train_step": 2.6658594608306885, "step": 8299} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 8299} {"info/global_step": 8300, "train_info/time_within_train_step": 2.694737434387207, "step": 8300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746920669, "_runtime": 23267}, "step": 8300} {"logs": {"train/loss": 3.0619, "train/learning_rate": 0.00011333333333333331, "train/epoch": 9.05, "_timestamp": 1746920669, "_runtime": 23267}, "step": 8300} {"train_info/time_between_train_steps": 0.023940086364746094, "step": 8300} {"info/global_step": 8301, "train_info/time_within_train_step": 2.663592576980591, "step": 8301} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 8301} {"info/global_step": 8302, "train_info/time_within_train_step": 2.6642961502075195, "step": 8302} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 8302} {"info/global_step": 8303, "train_info/time_within_train_step": 2.6407666206359863, "step": 8303} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 8303} {"info/global_step": 8304, "train_info/time_within_train_step": 2.6521472930908203, "step": 8304} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 8304} {"info/global_step": 8305, "train_info/time_within_train_step": 2.6630642414093018, "step": 8305} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 8305} {"info/global_step": 8306, "train_info/time_within_train_step": 2.6435253620147705, "step": 8306} {"train_info/time_between_train_steps": 0.00323486328125, "step": 8306} {"info/global_step": 8307, "train_info/time_within_train_step": 2.644490957260132, "step": 8307} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 8307} {"info/global_step": 8308, "train_info/time_within_train_step": 2.6644623279571533, "step": 8308} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 8308} {"info/global_step": 8309, "train_info/time_within_train_step": 2.6662838459014893, "step": 8309} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 8309} {"info/global_step": 8310, "train_info/time_within_train_step": 2.685141086578369, "step": 8310} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 8310} {"info/global_step": 8311, "train_info/time_within_train_step": 2.656463384628296, "step": 8311} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 8311} {"info/global_step": 8312, "train_info/time_within_train_step": 2.6421031951904297, "step": 8312} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 8312} {"info/global_step": 8313, "train_info/time_within_train_step": 2.6537604331970215, "step": 8313} {"train_info/time_between_train_steps": 0.003297090530395508, "step": 8313} {"info/global_step": 8314, "train_info/time_within_train_step": 2.6630213260650635, "step": 8314} {"train_info/time_between_train_steps": 0.0032994747161865234, "step": 8314} {"info/global_step": 8315, "train_info/time_within_train_step": 2.6433165073394775, "step": 8315} {"train_info/time_between_train_steps": 0.0035953521728515625, "step": 8315} {"info/global_step": 8316, "train_info/time_within_train_step": 2.645289421081543, "step": 8316} {"train_info/time_between_train_steps": 0.0034515857696533203, "step": 8316} {"info/global_step": 8317, "train_info/time_within_train_step": 2.658085584640503, "step": 8317} {"train_info/time_between_train_steps": 0.0034399032592773438, "step": 8317} {"info/global_step": 8318, "train_info/time_within_train_step": 2.7005810737609863, "step": 8318} {"train_info/time_between_train_steps": 0.003092527389526367, "step": 8318} {"info/global_step": 8319, "train_info/time_within_train_step": 2.6576762199401855, "step": 8319} {"train_info/time_between_train_steps": 0.0030786991119384766, "step": 8319} {"info/global_step": 8320, "train_info/time_within_train_step": 2.667701244354248, "step": 8320} {"train_info/time_between_train_steps": 0.0030379295349121094, "step": 8320} {"info/global_step": 8321, "train_info/time_within_train_step": 2.64306378364563, "step": 8321} {"train_info/time_between_train_steps": 0.003031015396118164, "step": 8321} {"info/global_step": 8322, "train_info/time_within_train_step": 2.647993326187134, "step": 8322} {"train_info/time_between_train_steps": 0.003064870834350586, "step": 8322} {"info/global_step": 8323, "train_info/time_within_train_step": 2.6491761207580566, "step": 8323} {"train_info/time_between_train_steps": 0.002991199493408203, "step": 8323} {"info/global_step": 8324, "train_info/time_within_train_step": 2.6523654460906982, "step": 8324} {"train_info/time_between_train_steps": 0.003031015396118164, "step": 8324} {"info/global_step": 8325, "train_info/time_within_train_step": 2.661228656768799, "step": 8325} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 8325} {"info/global_step": 8326, "train_info/time_within_train_step": 2.6811509132385254, "step": 8326} {"train_info/time_between_train_steps": 0.0033206939697265625, "step": 8326} {"info/global_step": 8327, "train_info/time_within_train_step": 2.688189744949341, "step": 8327} {"train_info/time_between_train_steps": 0.0030679702758789062, "step": 8327} {"info/global_step": 8328, "train_info/time_within_train_step": 2.660872220993042, "step": 8328} {"train_info/time_between_train_steps": 0.003025531768798828, "step": 8328} {"info/global_step": 8329, "train_info/time_within_train_step": 2.6460201740264893, "step": 8329} {"train_info/time_between_train_steps": 0.0030002593994140625, "step": 8329} {"info/global_step": 8330, "train_info/time_within_train_step": 2.6437015533447266, "step": 8330} {"train_info/time_between_train_steps": 0.0029892921447753906, "step": 8330} {"info/global_step": 8331, "train_info/time_within_train_step": 2.6523449420928955, "step": 8331} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 8331} {"info/global_step": 8332, "train_info/time_within_train_step": 2.6456947326660156, "step": 8332} {"train_info/time_between_train_steps": 0.00304412841796875, "step": 8332} {"info/global_step": 8333, "train_info/time_within_train_step": 2.6703836917877197, "step": 8333} {"train_info/time_between_train_steps": 0.003076791763305664, "step": 8333} {"info/global_step": 8334, "train_info/time_within_train_step": 2.6892893314361572, "step": 8334} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 8334} {"info/global_step": 8335, "train_info/time_within_train_step": 2.670337438583374, "step": 8335} {"train_info/time_between_train_steps": 0.003078460693359375, "step": 8335} {"info/global_step": 8336, "train_info/time_within_train_step": 2.659362316131592, "step": 8336} {"train_info/time_between_train_steps": 0.002997875213623047, "step": 8336} {"info/global_step": 8337, "train_info/time_within_train_step": 2.641204357147217, "step": 8337} {"train_info/time_between_train_steps": 0.0029993057250976562, "step": 8337} {"info/global_step": 8338, "train_info/time_within_train_step": 2.6538193225860596, "step": 8338} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 8338} {"info/global_step": 8339, "train_info/time_within_train_step": 2.6584367752075195, "step": 8339} {"train_info/time_between_train_steps": 0.0030846595764160156, "step": 8339} {"info/global_step": 8340, "train_info/time_within_train_step": 2.644047737121582, "step": 8340} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 8340} {"info/global_step": 8341, "train_info/time_within_train_step": 2.642500638961792, "step": 8341} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 8341} {"info/global_step": 8342, "train_info/time_within_train_step": 2.6646835803985596, "step": 8342} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 8342} {"info/global_step": 8343, "train_info/time_within_train_step": 2.6694278717041016, "step": 8343} {"train_info/time_between_train_steps": 0.003067493438720703, "step": 8343} {"info/global_step": 8344, "train_info/time_within_train_step": 2.688504695892334, "step": 8344} {"train_info/time_between_train_steps": 0.002996206283569336, "step": 8344} {"info/global_step": 8345, "train_info/time_within_train_step": 2.650996446609497, "step": 8345} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 8345} {"info/global_step": 8346, "train_info/time_within_train_step": 2.6745765209198, "step": 8346} {"train_info/time_between_train_steps": 0.0030155181884765625, "step": 8346} {"info/global_step": 8347, "train_info/time_within_train_step": 2.6413185596466064, "step": 8347} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 8347} {"info/global_step": 8348, "train_info/time_within_train_step": 2.641153335571289, "step": 8348} {"train_info/time_between_train_steps": 0.002996206283569336, "step": 8348} {"info/global_step": 8349, "train_info/time_within_train_step": 2.6636109352111816, "step": 8349} {"train_info/time_between_train_steps": 0.0030984878540039062, "step": 8349} {"info/global_step": 8350, "train_info/time_within_train_step": 2.6496822834014893, "step": 8350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746920803, "_runtime": 23401}, "step": 8350} {"logs": {"train/loss": 3.0533, "train/learning_rate": 0.00010999999999999998, "train/epoch": 9.06, "_timestamp": 1746920803, "_runtime": 23401}, "step": 8350} {"train_info/time_between_train_steps": 0.02396702766418457, "step": 8350} {"info/global_step": 8351, "train_info/time_within_train_step": 2.6598060131073, "step": 8351} {"train_info/time_between_train_steps": 0.0030241012573242188, "step": 8351} {"info/global_step": 8352, "train_info/time_within_train_step": 2.6470561027526855, "step": 8352} {"train_info/time_between_train_steps": 0.003032684326171875, "step": 8352} {"info/global_step": 8353, "train_info/time_within_train_step": 2.6633293628692627, "step": 8353} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 8353} {"info/global_step": 8354, "train_info/time_within_train_step": 2.662856101989746, "step": 8354} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 8354} {"info/global_step": 8355, "train_info/time_within_train_step": 2.657902479171753, "step": 8355} {"train_info/time_between_train_steps": 0.003009319305419922, "step": 8355} {"info/global_step": 8356, "train_info/time_within_train_step": 2.709862470626831, "step": 8356} {"train_info/time_between_train_steps": 0.0030393600463867188, "step": 8356} {"info/global_step": 8357, "train_info/time_within_train_step": 2.650873899459839, "step": 8357} {"train_info/time_between_train_steps": 0.0030639171600341797, "step": 8357} {"info/global_step": 8358, "train_info/time_within_train_step": 2.6482951641082764, "step": 8358} {"train_info/time_between_train_steps": 0.003033161163330078, "step": 8358} {"info/global_step": 8359, "train_info/time_within_train_step": 2.6591897010803223, "step": 8359} {"train_info/time_between_train_steps": 0.0030710697174072266, "step": 8359} {"info/global_step": 8360, "train_info/time_within_train_step": 2.6456823348999023, "step": 8360} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 8360} {"info/global_step": 8361, "train_info/time_within_train_step": 2.649179458618164, "step": 8361} {"train_info/time_between_train_steps": 0.0030350685119628906, "step": 8361} {"info/global_step": 8362, "train_info/time_within_train_step": 2.6492249965667725, "step": 8362} {"train_info/time_between_train_steps": 0.0030040740966796875, "step": 8362} {"info/global_step": 8363, "train_info/time_within_train_step": 2.65090274810791, "step": 8363} {"train_info/time_between_train_steps": 0.0030477046966552734, "step": 8363} {"info/global_step": 8364, "train_info/time_within_train_step": 2.6601898670196533, "step": 8364} {"train_info/time_between_train_steps": 0.0030460357666015625, "step": 8364} {"info/global_step": 8365, "train_info/time_within_train_step": 2.726802349090576, "step": 8365} {"train_info/time_between_train_steps": 0.0030221939086914062, "step": 8365} {"info/global_step": 8366, "train_info/time_within_train_step": 2.6544694900512695, "step": 8366} {"train_info/time_between_train_steps": 0.0030171871185302734, "step": 8366} {"info/global_step": 8367, "train_info/time_within_train_step": 2.6413333415985107, "step": 8367} {"train_info/time_between_train_steps": 0.0030329227447509766, "step": 8367} {"info/global_step": 8368, "train_info/time_within_train_step": 2.654724359512329, "step": 8368} {"train_info/time_between_train_steps": 0.0030460357666015625, "step": 8368} {"info/global_step": 8369, "train_info/time_within_train_step": 2.6485002040863037, "step": 8369} {"train_info/time_between_train_steps": 0.003057241439819336, "step": 8369} {"info/global_step": 8370, "train_info/time_within_train_step": 2.651212215423584, "step": 8370} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 8370} {"info/global_step": 8371, "train_info/time_within_train_step": 2.645009994506836, "step": 8371} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 8371} {"info/global_step": 8372, "train_info/time_within_train_step": 2.645296335220337, "step": 8372} {"train_info/time_between_train_steps": 0.003064393997192383, "step": 8372} {"info/global_step": 8373, "train_info/time_within_train_step": 2.6643059253692627, "step": 8373} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 8373} {"info/global_step": 8374, "train_info/time_within_train_step": 2.670654058456421, "step": 8374} {"train_info/time_between_train_steps": 0.0030574798583984375, "step": 8374} {"info/global_step": 8375, "train_info/time_within_train_step": 2.7096307277679443, "step": 8375} {"train_info/time_between_train_steps": 0.00301361083984375, "step": 8375} {"info/global_step": 8376, "train_info/time_within_train_step": 2.6433796882629395, "step": 8376} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 8376} {"info/global_step": 8377, "train_info/time_within_train_step": 2.65421462059021, "step": 8377} {"train_info/time_between_train_steps": 0.003023386001586914, "step": 8377} {"info/global_step": 8378, "train_info/time_within_train_step": 2.648921251296997, "step": 8378} {"train_info/time_between_train_steps": 0.0030133724212646484, "step": 8378} {"info/global_step": 8379, "train_info/time_within_train_step": 2.648419141769409, "step": 8379} {"train_info/time_between_train_steps": 0.003084897994995117, "step": 8379} {"info/global_step": 8380, "train_info/time_within_train_step": 2.659459114074707, "step": 8380} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 8380} {"info/global_step": 8381, "train_info/time_within_train_step": 2.6450693607330322, "step": 8381} {"train_info/time_between_train_steps": 0.0030019283294677734, "step": 8381} {"info/global_step": 8382, "train_info/time_within_train_step": 2.643350839614868, "step": 8382} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 8382} {"info/global_step": 8383, "train_info/time_within_train_step": 2.670473098754883, "step": 8383} {"train_info/time_between_train_steps": 0.0030088424682617188, "step": 8383} {"info/global_step": 8384, "train_info/time_within_train_step": 2.665271520614624, "step": 8384} {"train_info/time_between_train_steps": 0.003063678741455078, "step": 8384} {"info/global_step": 8385, "train_info/time_within_train_step": 2.6871795654296875, "step": 8385} {"train_info/time_between_train_steps": 0.0030350685119628906, "step": 8385} {"info/global_step": 8386, "train_info/time_within_train_step": 2.655667304992676, "step": 8386} {"train_info/time_between_train_steps": 0.0029883384704589844, "step": 8386} {"info/global_step": 8387, "train_info/time_within_train_step": 2.9321835041046143, "step": 8387} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 8387} {"info/global_step": 8388, "train_info/time_within_train_step": 2.6684045791625977, "step": 8388} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 8388} {"info/global_step": 8389, "train_info/time_within_train_step": 2.6884982585906982, "step": 8389} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 8389} {"info/global_step": 8390, "train_info/time_within_train_step": 2.6529862880706787, "step": 8390} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 8390} {"info/global_step": 8391, "train_info/time_within_train_step": 2.6763319969177246, "step": 8391} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 8391} {"info/global_step": 8392, "train_info/time_within_train_step": 2.6610803604125977, "step": 8392} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 8392} {"info/global_step": 8393, "train_info/time_within_train_step": 2.642481803894043, "step": 8393} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 8393} {"info/global_step": 8394, "train_info/time_within_train_step": 2.6435182094573975, "step": 8394} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 8394} {"info/global_step": 8395, "train_info/time_within_train_step": 2.660417318344116, "step": 8395} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 8395} {"info/global_step": 8396, "train_info/time_within_train_step": 2.6607866287231445, "step": 8396} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 8396} {"info/global_step": 8397, "train_info/time_within_train_step": 2.676798105239868, "step": 8397} {"train_info/time_between_train_steps": 0.002954721450805664, "step": 8397} {"info/global_step": 8398, "train_info/time_within_train_step": 2.669793128967285, "step": 8398} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 8398} {"info/global_step": 8399, "train_info/time_within_train_step": 2.6904404163360596, "step": 8399} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 8399} {"info/global_step": 8400, "train_info/time_within_train_step": 2.6396660804748535, "step": 8400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746920938, "_runtime": 23536}, "step": 8400} {"logs": {"train/loss": 3.0474, "train/learning_rate": 0.00010666666666666667, "train/epoch": 9.06, "_timestamp": 1746920938, "_runtime": 23536}, "step": 8400} {"train_info/time_between_train_steps": 15.319575309753418, "step": 8400} {"info/global_step": 8401, "train_info/time_within_train_step": 2.4481921195983887, "step": 8401} {"train_info/time_between_train_steps": 0.002882242202758789, "step": 8401} {"info/global_step": 8402, "train_info/time_within_train_step": 2.42151141166687, "step": 8402} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 8402} {"info/global_step": 8403, "train_info/time_within_train_step": 2.5973401069641113, "step": 8403} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 8403} {"info/global_step": 8404, "train_info/time_within_train_step": 2.6501529216766357, "step": 8404} {"train_info/time_between_train_steps": 0.003126859664916992, "step": 8404} {"info/global_step": 8405, "train_info/time_within_train_step": 2.6705148220062256, "step": 8405} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 8405} {"info/global_step": 8406, "train_info/time_within_train_step": 2.7254385948181152, "step": 8406} {"train_info/time_between_train_steps": 0.002918720245361328, "step": 8406} {"info/global_step": 8407, "train_info/time_within_train_step": 2.65480637550354, "step": 8407} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 8407} {"info/global_step": 8408, "train_info/time_within_train_step": 2.6398203372955322, "step": 8408} {"train_info/time_between_train_steps": 0.006324052810668945, "step": 8408} {"info/global_step": 8409, "train_info/time_within_train_step": 2.653740167617798, "step": 8409} {"train_info/time_between_train_steps": 0.006309032440185547, "step": 8409} {"info/global_step": 8410, "train_info/time_within_train_step": 2.649170160293579, "step": 8410} {"train_info/time_between_train_steps": 0.0064144134521484375, "step": 8410} {"info/global_step": 8411, "train_info/time_within_train_step": 2.655313014984131, "step": 8411} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 8411} {"info/global_step": 8412, "train_info/time_within_train_step": 2.6447150707244873, "step": 8412} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 8412} {"info/global_step": 8413, "train_info/time_within_train_step": 2.644270658493042, "step": 8413} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 8413} {"info/global_step": 8414, "train_info/time_within_train_step": 2.644040584564209, "step": 8414} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 8414} {"info/global_step": 8415, "train_info/time_within_train_step": 2.6590330600738525, "step": 8415} {"train_info/time_between_train_steps": 0.0031366348266601562, "step": 8415} {"info/global_step": 8416, "train_info/time_within_train_step": 2.6562564373016357, "step": 8416} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 8416} {"info/global_step": 8417, "train_info/time_within_train_step": 2.645653247833252, "step": 8417} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 8417} {"info/global_step": 8418, "train_info/time_within_train_step": 2.645923614501953, "step": 8418} {"train_info/time_between_train_steps": 0.0031080245971679688, "step": 8418} {"info/global_step": 8419, "train_info/time_within_train_step": 2.6597630977630615, "step": 8419} {"train_info/time_between_train_steps": 0.003105640411376953, "step": 8419} {"info/global_step": 8420, "train_info/time_within_train_step": 2.6707723140716553, "step": 8420} {"train_info/time_between_train_steps": 0.0030753612518310547, "step": 8420} {"info/global_step": 8421, "train_info/time_within_train_step": 2.687404155731201, "step": 8421} {"train_info/time_between_train_steps": 0.003118276596069336, "step": 8421} {"info/global_step": 8422, "train_info/time_within_train_step": 2.6506896018981934, "step": 8422} {"train_info/time_between_train_steps": 0.003107309341430664, "step": 8422} {"info/global_step": 8423, "train_info/time_within_train_step": 2.685833215713501, "step": 8423} {"train_info/time_between_train_steps": 0.0030777454376220703, "step": 8423} {"info/global_step": 8424, "train_info/time_within_train_step": 2.643136739730835, "step": 8424} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 8424} {"info/global_step": 8425, "train_info/time_within_train_step": 2.649257183074951, "step": 8425} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 8425} {"info/global_step": 8426, "train_info/time_within_train_step": 2.656222105026245, "step": 8426} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 8426} {"info/global_step": 8427, "train_info/time_within_train_step": 2.649407148361206, "step": 8427} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 8427} {"info/global_step": 8428, "train_info/time_within_train_step": 2.646949291229248, "step": 8428} {"train_info/time_between_train_steps": 0.003096342086791992, "step": 8428} {"info/global_step": 8429, "train_info/time_within_train_step": 2.6647400856018066, "step": 8429} {"train_info/time_between_train_steps": 0.003065824508666992, "step": 8429} {"info/global_step": 8430, "train_info/time_within_train_step": 2.6650707721710205, "step": 8430} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 8430} {"info/global_step": 8431, "train_info/time_within_train_step": 2.6590490341186523, "step": 8431} {"train_info/time_between_train_steps": 0.00307464599609375, "step": 8431} {"info/global_step": 8432, "train_info/time_within_train_step": 2.710989475250244, "step": 8432} {"train_info/time_between_train_steps": 0.0030596256256103516, "step": 8432} {"info/global_step": 8433, "train_info/time_within_train_step": 2.644577741622925, "step": 8433} {"train_info/time_between_train_steps": 0.0030717849731445312, "step": 8433} {"info/global_step": 8434, "train_info/time_within_train_step": 2.6483073234558105, "step": 8434} {"train_info/time_between_train_steps": 0.003114938735961914, "step": 8434} {"info/global_step": 8435, "train_info/time_within_train_step": 2.679762125015259, "step": 8435} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 8435} {"info/global_step": 8436, "train_info/time_within_train_step": 2.6478641033172607, "step": 8436} {"train_info/time_between_train_steps": 0.003107309341430664, "step": 8436} {"info/global_step": 8437, "train_info/time_within_train_step": 2.645453929901123, "step": 8437} {"train_info/time_between_train_steps": 0.003072500228881836, "step": 8437} {"info/global_step": 8438, "train_info/time_within_train_step": 2.65871262550354, "step": 8438} {"train_info/time_between_train_steps": 0.003047943115234375, "step": 8438} {"info/global_step": 8439, "train_info/time_within_train_step": 2.6522374153137207, "step": 8439} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 8439} {"info/global_step": 8440, "train_info/time_within_train_step": 2.6677498817443848, "step": 8440} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 8440} {"info/global_step": 8441, "train_info/time_within_train_step": 2.7322301864624023, "step": 8441} {"train_info/time_between_train_steps": 0.0030493736267089844, "step": 8441} {"info/global_step": 8442, "train_info/time_within_train_step": 2.6862025260925293, "step": 8442} {"train_info/time_between_train_steps": 0.0030832290649414062, "step": 8442} {"info/global_step": 8443, "train_info/time_within_train_step": 2.642106294631958, "step": 8443} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 8443} {"info/global_step": 8444, "train_info/time_within_train_step": 2.641258478164673, "step": 8444} {"train_info/time_between_train_steps": 0.003087282180786133, "step": 8444} {"info/global_step": 8445, "train_info/time_within_train_step": 2.6610288619995117, "step": 8445} {"train_info/time_between_train_steps": 0.0030815601348876953, "step": 8445} {"info/global_step": 8446, "train_info/time_within_train_step": 2.656859874725342, "step": 8446} {"train_info/time_between_train_steps": 0.0031023025512695312, "step": 8446} {"info/global_step": 8447, "train_info/time_within_train_step": 2.6438498497009277, "step": 8447} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 8447} {"info/global_step": 8448, "train_info/time_within_train_step": 2.6525728702545166, "step": 8448} {"train_info/time_between_train_steps": 0.003059864044189453, "step": 8448} {"info/global_step": 8449, "train_info/time_within_train_step": 2.652836561203003, "step": 8449} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 8449} {"info/global_step": 8450, "train_info/time_within_train_step": 2.6708261966705322, "step": 8450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746921087, "_runtime": 23685}, "step": 8450} {"logs": {"train/loss": 3.0369, "train/learning_rate": 0.00010333333333333333, "train/epoch": 9.07, "_timestamp": 1746921087, "_runtime": 23685}, "step": 8450} {"train_info/time_between_train_steps": 0.02423882484436035, "step": 8450} {"info/global_step": 8451, "train_info/time_within_train_step": 2.6920371055603027, "step": 8451} {"train_info/time_between_train_steps": 0.003114938735961914, "step": 8451} {"info/global_step": 8452, "train_info/time_within_train_step": 2.667691707611084, "step": 8452} {"train_info/time_between_train_steps": 0.003015756607055664, "step": 8452} {"info/global_step": 8453, "train_info/time_within_train_step": 2.662548542022705, "step": 8453} {"train_info/time_between_train_steps": 0.003044605255126953, "step": 8453} {"info/global_step": 8454, "train_info/time_within_train_step": 2.642136335372925, "step": 8454} {"train_info/time_between_train_steps": 0.003084897994995117, "step": 8454} {"info/global_step": 8455, "train_info/time_within_train_step": 2.654909133911133, "step": 8455} {"train_info/time_between_train_steps": 0.0030782222747802734, "step": 8455} {"info/global_step": 8456, "train_info/time_within_train_step": 2.6563265323638916, "step": 8456} {"train_info/time_between_train_steps": 0.0030748844146728516, "step": 8456} {"info/global_step": 8457, "train_info/time_within_train_step": 2.6457784175872803, "step": 8457} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 8457} {"info/global_step": 8458, "train_info/time_within_train_step": 2.644702911376953, "step": 8458} {"train_info/time_between_train_steps": 0.003055572509765625, "step": 8458} {"info/global_step": 8459, "train_info/time_within_train_step": 2.6596431732177734, "step": 8459} {"train_info/time_between_train_steps": 0.003049612045288086, "step": 8459} {"info/global_step": 8460, "train_info/time_within_train_step": 2.6712613105773926, "step": 8460} {"train_info/time_between_train_steps": 0.0030968189239501953, "step": 8460} {"info/global_step": 8461, "train_info/time_within_train_step": 2.6839075088500977, "step": 8461} {"train_info/time_between_train_steps": 0.0030515193939208984, "step": 8461} {"info/global_step": 8462, "train_info/time_within_train_step": 2.670562982559204, "step": 8462} {"train_info/time_between_train_steps": 0.0030808448791503906, "step": 8462} {"info/global_step": 8463, "train_info/time_within_train_step": 2.677856683731079, "step": 8463} {"train_info/time_between_train_steps": 0.003045320510864258, "step": 8463} {"info/global_step": 8464, "train_info/time_within_train_step": 2.642089366912842, "step": 8464} {"train_info/time_between_train_steps": 0.0030896663665771484, "step": 8464} {"info/global_step": 8465, "train_info/time_within_train_step": 2.6554152965545654, "step": 8465} {"train_info/time_between_train_steps": 0.0030066967010498047, "step": 8465} {"info/global_step": 8466, "train_info/time_within_train_step": 2.653128147125244, "step": 8466} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 8466} {"info/global_step": 8467, "train_info/time_within_train_step": 2.6438708305358887, "step": 8467} {"train_info/time_between_train_steps": 0.0030579566955566406, "step": 8467} {"info/global_step": 8468, "train_info/time_within_train_step": 2.6481165885925293, "step": 8468} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 8468} {"info/global_step": 8469, "train_info/time_within_train_step": 2.6490797996520996, "step": 8469} {"train_info/time_between_train_steps": 0.003078937530517578, "step": 8469} {"info/global_step": 8470, "train_info/time_within_train_step": 2.665724039077759, "step": 8470} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 8470} {"info/global_step": 8471, "train_info/time_within_train_step": 2.662367582321167, "step": 8471} {"train_info/time_between_train_steps": 0.0030646324157714844, "step": 8471} {"info/global_step": 8472, "train_info/time_within_train_step": 2.656378984451294, "step": 8472} {"train_info/time_between_train_steps": 0.0030107498168945312, "step": 8472} {"info/global_step": 8473, "train_info/time_within_train_step": 2.7103512287139893, "step": 8473} {"train_info/time_between_train_steps": 0.003042936325073242, "step": 8473} {"info/global_step": 8474, "train_info/time_within_train_step": 2.646954298019409, "step": 8474} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 8474} {"info/global_step": 8475, "train_info/time_within_train_step": 2.6489973068237305, "step": 8475} {"train_info/time_between_train_steps": 0.003021240234375, "step": 8475} {"info/global_step": 8476, "train_info/time_within_train_step": 2.6575844287872314, "step": 8476} {"train_info/time_between_train_steps": 0.003092050552368164, "step": 8476} {"info/global_step": 8477, "train_info/time_within_train_step": 2.6448769569396973, "step": 8477} {"train_info/time_between_train_steps": 0.003086566925048828, "step": 8477} {"info/global_step": 8478, "train_info/time_within_train_step": 2.660330295562744, "step": 8478} {"train_info/time_between_train_steps": 0.0031142234802246094, "step": 8478} {"info/global_step": 8479, "train_info/time_within_train_step": 2.700746774673462, "step": 8479} {"train_info/time_between_train_steps": 0.003036975860595703, "step": 8479} {"info/global_step": 8480, "train_info/time_within_train_step": 2.7142815589904785, "step": 8480} {"train_info/time_between_train_steps": 0.003126382827758789, "step": 8480} {"info/global_step": 8481, "train_info/time_within_train_step": 2.6419527530670166, "step": 8481} {"train_info/time_between_train_steps": 0.0031042098999023438, "step": 8481} {"info/global_step": 8482, "train_info/time_within_train_step": 2.6420109272003174, "step": 8482} {"train_info/time_between_train_steps": 0.003056049346923828, "step": 8482} {"info/global_step": 8483, "train_info/time_within_train_step": 2.663729667663574, "step": 8483} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 8483} {"info/global_step": 8484, "train_info/time_within_train_step": 2.6510350704193115, "step": 8484} {"train_info/time_between_train_steps": 0.0031065940856933594, "step": 8484} {"info/global_step": 8485, "train_info/time_within_train_step": 2.6443448066711426, "step": 8485} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 8485} {"info/global_step": 8486, "train_info/time_within_train_step": 2.6504740715026855, "step": 8486} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 8486} {"info/global_step": 8487, "train_info/time_within_train_step": 2.6462180614471436, "step": 8487} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 8487} {"info/global_step": 8488, "train_info/time_within_train_step": 2.6713414192199707, "step": 8488} {"train_info/time_between_train_steps": 0.003120899200439453, "step": 8488} {"info/global_step": 8489, "train_info/time_within_train_step": 2.6431667804718018, "step": 8489} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 8489} {"info/global_step": 8490, "train_info/time_within_train_step": 2.6434695720672607, "step": 8490} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 8490} {"info/global_step": 8491, "train_info/time_within_train_step": 2.6428885459899902, "step": 8491} {"train_info/time_between_train_steps": 0.0033278465270996094, "step": 8491} {"info/global_step": 8492, "train_info/time_within_train_step": 3.6155128479003906, "step": 8492} {"train_info/time_between_train_steps": 0.003496885299682617, "step": 8492} {"info/global_step": 8493, "train_info/time_within_train_step": 2.602438449859619, "step": 8493} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 8493} {"info/global_step": 8494, "train_info/time_within_train_step": 2.826235294342041, "step": 8494} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 8494} {"info/global_step": 8495, "train_info/time_within_train_step": 2.6378278732299805, "step": 8495} {"train_info/time_between_train_steps": 0.003052234649658203, "step": 8495} {"info/global_step": 8496, "train_info/time_within_train_step": 2.6372082233428955, "step": 8496} {"train_info/time_between_train_steps": 0.0032389163970947266, "step": 8496} {"info/global_step": 8497, "train_info/time_within_train_step": 2.6303484439849854, "step": 8497} {"train_info/time_between_train_steps": 0.003071308135986328, "step": 8497} {"info/global_step": 8498, "train_info/time_within_train_step": 3.0509731769561768, "step": 8498} {"train_info/time_between_train_steps": 0.003039836883544922, "step": 8498} {"info/global_step": 8499, "train_info/time_within_train_step": 2.57116961479187, "step": 8499} {"train_info/time_between_train_steps": 0.0033071041107177734, "step": 8499} {"info/global_step": 8500, "train_info/time_within_train_step": 2.6156656742095947, "step": 8500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746921230, "_runtime": 23828}, "step": 8500} {"logs": {"train/loss": 3.0332, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 9.07, "_timestamp": 1746921230, "_runtime": 23828}, "step": 8500} {"train_info/time_between_train_steps": 0.023288965225219727, "step": 8500} {"info/global_step": 8501, "train_info/time_within_train_step": 2.6550192832946777, "step": 8501} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 8501} {"info/global_step": 8502, "train_info/time_within_train_step": 2.6467783451080322, "step": 8502} {"train_info/time_between_train_steps": 0.002902984619140625, "step": 8502} {"info/global_step": 8503, "train_info/time_within_train_step": 2.655029773712158, "step": 8503} {"train_info/time_between_train_steps": 0.0029981136322021484, "step": 8503} {"info/global_step": 8504, "train_info/time_within_train_step": 2.641820192337036, "step": 8504} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 8504} {"info/global_step": 8505, "train_info/time_within_train_step": 2.6720998287200928, "step": 8505} {"train_info/time_between_train_steps": 0.0029747486114501953, "step": 8505} {"info/global_step": 8506, "train_info/time_within_train_step": 2.6583497524261475, "step": 8506} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 8506} {"info/global_step": 8507, "train_info/time_within_train_step": 2.6620123386383057, "step": 8507} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 8507} {"info/global_step": 8508, "train_info/time_within_train_step": 2.639955520629883, "step": 8508} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 8508} {"info/global_step": 8509, "train_info/time_within_train_step": 2.6512351036071777, "step": 8509} {"train_info/time_between_train_steps": 0.0029935836791992188, "step": 8509} {"info/global_step": 8510, "train_info/time_within_train_step": 2.6618380546569824, "step": 8510} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 8510} {"info/global_step": 8511, "train_info/time_within_train_step": 2.6428322792053223, "step": 8511} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 8511} {"info/global_step": 8512, "train_info/time_within_train_step": 2.6462957859039307, "step": 8512} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 8512} {"info/global_step": 8513, "train_info/time_within_train_step": 2.6694393157958984, "step": 8513} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 8513} {"info/global_step": 8514, "train_info/time_within_train_step": 2.665862560272217, "step": 8514} {"train_info/time_between_train_steps": 0.0029714107513427734, "step": 8514} {"info/global_step": 8515, "train_info/time_within_train_step": 2.6727874279022217, "step": 8515} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 8515} {"info/global_step": 8516, "train_info/time_within_train_step": 2.6665709018707275, "step": 8516} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 8516} {"info/global_step": 8517, "train_info/time_within_train_step": 2.6488728523254395, "step": 8517} {"train_info/time_between_train_steps": 0.0030870437622070312, "step": 8517} {"info/global_step": 8518, "train_info/time_within_train_step": 2.6533093452453613, "step": 8518} {"train_info/time_between_train_steps": 0.003094196319580078, "step": 8518} {"info/global_step": 8519, "train_info/time_within_train_step": 2.6512975692749023, "step": 8519} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 8519} {"info/global_step": 8520, "train_info/time_within_train_step": 2.6430001258850098, "step": 8520} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 8520} {"info/global_step": 8521, "train_info/time_within_train_step": 2.6489205360412598, "step": 8521} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 8521} {"info/global_step": 8522, "train_info/time_within_train_step": 2.64945387840271, "step": 8522} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 8522} {"info/global_step": 8523, "train_info/time_within_train_step": 2.663120985031128, "step": 8523} {"train_info/time_between_train_steps": 0.003103017807006836, "step": 8523} {"info/global_step": 8524, "train_info/time_within_train_step": 2.662871837615967, "step": 8524} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 8524} {"info/global_step": 8525, "train_info/time_within_train_step": 2.658459424972534, "step": 8525} {"train_info/time_between_train_steps": 0.003103017807006836, "step": 8525} {"info/global_step": 8526, "train_info/time_within_train_step": 2.7288174629211426, "step": 8526} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 8526} {"info/global_step": 8527, "train_info/time_within_train_step": 2.6929619312286377, "step": 8527} {"train_info/time_between_train_steps": 0.003072977066040039, "step": 8527} {"info/global_step": 8528, "train_info/time_within_train_step": 2.640951633453369, "step": 8528} {"train_info/time_between_train_steps": 0.003098011016845703, "step": 8528} {"info/global_step": 8529, "train_info/time_within_train_step": 2.6416282653808594, "step": 8529} {"train_info/time_between_train_steps": 0.0030612945556640625, "step": 8529} {"info/global_step": 8530, "train_info/time_within_train_step": 2.6670615673065186, "step": 8530} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 8530} {"info/global_step": 8531, "train_info/time_within_train_step": 2.6515159606933594, "step": 8531} {"train_info/time_between_train_steps": 0.0030934810638427734, "step": 8531} {"info/global_step": 8532, "train_info/time_within_train_step": 2.6444339752197266, "step": 8532} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 8532} {"info/global_step": 8533, "train_info/time_within_train_step": 2.658068895339966, "step": 8533} {"train_info/time_between_train_steps": 0.0030944347381591797, "step": 8533} {"info/global_step": 8534, "train_info/time_within_train_step": 2.6528570652008057, "step": 8534} {"train_info/time_between_train_steps": 0.003103494644165039, "step": 8534} {"info/global_step": 8535, "train_info/time_within_train_step": 2.662095308303833, "step": 8535} {"train_info/time_between_train_steps": 0.003570079803466797, "step": 8535} {"info/global_step": 8536, "train_info/time_within_train_step": 2.6954991817474365, "step": 8536} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 8536} {"info/global_step": 8537, "train_info/time_within_train_step": 2.7207419872283936, "step": 8537} {"train_info/time_between_train_steps": 0.003069639205932617, "step": 8537} {"info/global_step": 8538, "train_info/time_within_train_step": 2.647932529449463, "step": 8538} {"train_info/time_between_train_steps": 0.003095865249633789, "step": 8538} {"info/global_step": 8539, "train_info/time_within_train_step": 2.6430587768554688, "step": 8539} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 8539} {"info/global_step": 8540, "train_info/time_within_train_step": 2.6566388607025146, "step": 8540} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 8540} {"info/global_step": 8541, "train_info/time_within_train_step": 2.650191068649292, "step": 8541} {"train_info/time_between_train_steps": 0.0030694007873535156, "step": 8541} {"info/global_step": 8542, "train_info/time_within_train_step": 2.6514475345611572, "step": 8542} {"train_info/time_between_train_steps": 0.003085613250732422, "step": 8542} {"info/global_step": 8543, "train_info/time_within_train_step": 2.6480655670166016, "step": 8543} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 8543} {"info/global_step": 8544, "train_info/time_within_train_step": 2.6459438800811768, "step": 8544} {"train_info/time_between_train_steps": 0.0030896663665771484, "step": 8544} {"info/global_step": 8545, "train_info/time_within_train_step": 2.6688551902770996, "step": 8545} {"train_info/time_between_train_steps": 0.003322124481201172, "step": 8545} {"info/global_step": 8546, "train_info/time_within_train_step": 2.6704695224761963, "step": 8546} {"train_info/time_between_train_steps": 0.003068208694458008, "step": 8546} {"info/global_step": 8547, "train_info/time_within_train_step": 2.7124557495117188, "step": 8547} {"train_info/time_between_train_steps": 0.0030863285064697266, "step": 8547} {"info/global_step": 8548, "train_info/time_within_train_step": 2.650242567062378, "step": 8548} {"train_info/time_between_train_steps": 0.0030298233032226562, "step": 8548} {"info/global_step": 8549, "train_info/time_within_train_step": 2.6636743545532227, "step": 8549} {"train_info/time_between_train_steps": 0.0030875205993652344, "step": 8549} {"info/global_step": 8550, "train_info/time_within_train_step": 2.6423099040985107, "step": 8550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746921364, "_runtime": 23962}, "step": 8550} {"logs": {"train/loss": 3.0246, "train/learning_rate": 9.666666666666667e-05, "train/epoch": 9.08, "_timestamp": 1746921364, "_runtime": 23962}, "step": 8550} {"train_info/time_between_train_steps": 0.023613691329956055, "step": 8550} {"info/global_step": 8551, "train_info/time_within_train_step": 2.6502082347869873, "step": 8551} {"train_info/time_between_train_steps": 0.003059864044189453, "step": 8551} {"info/global_step": 8552, "train_info/time_within_train_step": 2.6482925415039062, "step": 8552} {"train_info/time_between_train_steps": 0.0030655860900878906, "step": 8552} {"info/global_step": 8553, "train_info/time_within_train_step": 2.6448709964752197, "step": 8553} {"train_info/time_between_train_steps": 0.003053426742553711, "step": 8553} {"info/global_step": 8554, "train_info/time_within_train_step": 2.665719985961914, "step": 8554} {"train_info/time_between_train_steps": 0.0030646324157714844, "step": 8554} {"info/global_step": 8555, "train_info/time_within_train_step": 2.662719488143921, "step": 8555} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 8555} {"info/global_step": 8556, "train_info/time_within_train_step": 2.7869319915771484, "step": 8556} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 8556} {"info/global_step": 8557, "train_info/time_within_train_step": 2.692704916000366, "step": 8557} {"train_info/time_between_train_steps": 0.0029354095458984375, "step": 8557} {"info/global_step": 8558, "train_info/time_within_train_step": 2.6671602725982666, "step": 8558} {"train_info/time_between_train_steps": 0.003007650375366211, "step": 8558} {"info/global_step": 8559, "train_info/time_within_train_step": 2.6612651348114014, "step": 8559} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 8559} {"info/global_step": 8560, "train_info/time_within_train_step": 2.7101891040802, "step": 8560} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 8560} {"info/global_step": 8561, "train_info/time_within_train_step": 2.6449849605560303, "step": 8561} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 8561} {"info/global_step": 8562, "train_info/time_within_train_step": 2.646770477294922, "step": 8562} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 8562} {"info/global_step": 8563, "train_info/time_within_train_step": 2.6585943698883057, "step": 8563} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 8563} {"info/global_step": 8564, "train_info/time_within_train_step": 2.6447813510894775, "step": 8564} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 8564} {"info/global_step": 8565, "train_info/time_within_train_step": 2.6500372886657715, "step": 8565} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 8565} {"info/global_step": 8566, "train_info/time_within_train_step": 2.6458871364593506, "step": 8566} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 8566} {"info/global_step": 8567, "train_info/time_within_train_step": 2.6551008224487305, "step": 8567} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 8567} {"info/global_step": 8568, "train_info/time_within_train_step": 2.6575186252593994, "step": 8568} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 8568} {"info/global_step": 8569, "train_info/time_within_train_step": 2.669729471206665, "step": 8569} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 8569} {"info/global_step": 8570, "train_info/time_within_train_step": 2.7265639305114746, "step": 8570} {"train_info/time_between_train_steps": 0.002963542938232422, "step": 8570} {"info/global_step": 8571, "train_info/time_within_train_step": 2.6734602451324463, "step": 8571} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 8571} {"info/global_step": 8572, "train_info/time_within_train_step": 2.6433727741241455, "step": 8572} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 8572} {"info/global_step": 8573, "train_info/time_within_train_step": 2.6415977478027344, "step": 8573} {"train_info/time_between_train_steps": 0.0029735565185546875, "step": 8573} {"info/global_step": 8574, "train_info/time_within_train_step": 2.6568222045898438, "step": 8574} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 8574} {"info/global_step": 8575, "train_info/time_within_train_step": 2.6583423614501953, "step": 8575} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 8575} {"info/global_step": 8576, "train_info/time_within_train_step": 2.64345383644104, "step": 8576} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 8576} {"info/global_step": 8577, "train_info/time_within_train_step": 2.65160870552063, "step": 8577} {"train_info/time_between_train_steps": 0.002938985824584961, "step": 8577} {"info/global_step": 8578, "train_info/time_within_train_step": 2.650622844696045, "step": 8578} {"train_info/time_between_train_steps": 0.002995729446411133, "step": 8578} {"info/global_step": 8579, "train_info/time_within_train_step": 2.672050952911377, "step": 8579} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 8579} {"info/global_step": 8580, "train_info/time_within_train_step": 2.708651304244995, "step": 8580} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 8580} {"info/global_step": 8581, "train_info/time_within_train_step": 2.6517369747161865, "step": 8581} {"train_info/time_between_train_steps": 0.0028886795043945312, "step": 8581} {"info/global_step": 8582, "train_info/time_within_train_step": 2.664074659347534, "step": 8582} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 8582} {"info/global_step": 8583, "train_info/time_within_train_step": 2.6418204307556152, "step": 8583} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 8583} {"info/global_step": 8584, "train_info/time_within_train_step": 2.661957263946533, "step": 8584} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 8584} {"info/global_step": 8585, "train_info/time_within_train_step": 2.652838706970215, "step": 8585} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 8585} {"info/global_step": 8586, "train_info/time_within_train_step": 2.645616292953491, "step": 8586} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 8586} {"info/global_step": 8587, "train_info/time_within_train_step": 2.644930839538574, "step": 8587} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 8587} {"info/global_step": 8588, "train_info/time_within_train_step": 2.6494176387786865, "step": 8588} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 8588} {"info/global_step": 8589, "train_info/time_within_train_step": 2.6726272106170654, "step": 8589} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 8589} {"info/global_step": 8590, "train_info/time_within_train_step": 2.67203950881958, "step": 8590} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 8590} {"info/global_step": 8591, "train_info/time_within_train_step": 2.6569695472717285, "step": 8591} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 8591} {"info/global_step": 8592, "train_info/time_within_train_step": 2.6869492530822754, "step": 8592} {"train_info/time_between_train_steps": 0.0029320716857910156, "step": 8592} {"info/global_step": 8593, "train_info/time_within_train_step": 2.6415185928344727, "step": 8593} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 8593} {"info/global_step": 8594, "train_info/time_within_train_step": 2.6513588428497314, "step": 8594} {"train_info/time_between_train_steps": 0.002940654754638672, "step": 8594} {"info/global_step": 8595, "train_info/time_within_train_step": 2.659360885620117, "step": 8595} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 8595} {"info/global_step": 8596, "train_info/time_within_train_step": 2.6505939960479736, "step": 8596} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 8596} {"info/global_step": 8597, "train_info/time_within_train_step": 2.6563711166381836, "step": 8597} {"train_info/time_between_train_steps": 0.0030164718627929688, "step": 8597} {"info/global_step": 8598, "train_info/time_within_train_step": 2.721897840499878, "step": 8598} {"train_info/time_between_train_steps": 0.0030918121337890625, "step": 8598} {"info/global_step": 8599, "train_info/time_within_train_step": 2.6576743125915527, "step": 8599} {"train_info/time_between_train_steps": 0.0030546188354492188, "step": 8599} {"info/global_step": 8600, "train_info/time_within_train_step": 2.702777624130249, "step": 8600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746921499, "_runtime": 24097}, "step": 8600} {"logs": {"train/loss": 3.0191, "train/learning_rate": 9.333333333333333e-05, "train/epoch": 9.08, "_timestamp": 1746921499, "_runtime": 24097}, "step": 8600} {"train_info/time_between_train_steps": 49.4975368976593, "step": 8600} {"info/global_step": 8601, "train_info/time_within_train_step": 2.4394736289978027, "step": 8601} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 8601} {"info/global_step": 8602, "train_info/time_within_train_step": 2.4472100734710693, "step": 8602} {"train_info/time_between_train_steps": 0.0030028820037841797, "step": 8602} {"info/global_step": 8603, "train_info/time_within_train_step": 2.5514583587646484, "step": 8603} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 8603} {"info/global_step": 8604, "train_info/time_within_train_step": 2.6305108070373535, "step": 8604} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 8604} {"info/global_step": 8605, "train_info/time_within_train_step": 2.6348817348480225, "step": 8605} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 8605} {"info/global_step": 8606, "train_info/time_within_train_step": 2.64751935005188, "step": 8606} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 8606} {"info/global_step": 8607, "train_info/time_within_train_step": 2.645725727081299, "step": 8607} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 8607} {"info/global_step": 8608, "train_info/time_within_train_step": 2.6670429706573486, "step": 8608} {"train_info/time_between_train_steps": 0.0031366348266601562, "step": 8608} {"info/global_step": 8609, "train_info/time_within_train_step": 2.6988210678100586, "step": 8609} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 8609} {"info/global_step": 8610, "train_info/time_within_train_step": 2.6625587940216064, "step": 8610} {"train_info/time_between_train_steps": 0.0030634403228759766, "step": 8610} {"info/global_step": 8611, "train_info/time_within_train_step": 2.6645779609680176, "step": 8611} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 8611} {"info/global_step": 8612, "train_info/time_within_train_step": 2.6418447494506836, "step": 8612} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 8612} {"info/global_step": 8613, "train_info/time_within_train_step": 2.6551220417022705, "step": 8613} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 8613} {"info/global_step": 8614, "train_info/time_within_train_step": 2.6574103832244873, "step": 8614} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 8614} {"info/global_step": 8615, "train_info/time_within_train_step": 2.645979404449463, "step": 8615} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 8615} {"info/global_step": 8616, "train_info/time_within_train_step": 2.6446077823638916, "step": 8616} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 8616} {"info/global_step": 8617, "train_info/time_within_train_step": 2.6541316509246826, "step": 8617} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 8617} {"info/global_step": 8618, "train_info/time_within_train_step": 2.674459457397461, "step": 8618} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 8618} {"info/global_step": 8619, "train_info/time_within_train_step": 2.670341730117798, "step": 8619} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 8619} {"info/global_step": 8620, "train_info/time_within_train_step": 2.6726019382476807, "step": 8620} {"train_info/time_between_train_steps": 0.0030851364135742188, "step": 8620} {"info/global_step": 8621, "train_info/time_within_train_step": 2.6716198921203613, "step": 8621} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 8621} {"info/global_step": 8622, "train_info/time_within_train_step": 2.6515285968780518, "step": 8622} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 8622} {"info/global_step": 8623, "train_info/time_within_train_step": 2.6527011394500732, "step": 8623} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 8623} {"info/global_step": 8624, "train_info/time_within_train_step": 2.650160312652588, "step": 8624} {"train_info/time_between_train_steps": 0.0034761428833007812, "step": 8624} {"info/global_step": 8625, "train_info/time_within_train_step": 2.654472589492798, "step": 8625} {"train_info/time_between_train_steps": 0.003355741500854492, "step": 8625} {"info/global_step": 8626, "train_info/time_within_train_step": 2.650599956512451, "step": 8626} {"train_info/time_between_train_steps": 0.003532886505126953, "step": 8626} {"info/global_step": 8627, "train_info/time_within_train_step": 2.645867109298706, "step": 8627} {"train_info/time_between_train_steps": 0.003562450408935547, "step": 8627} {"info/global_step": 8628, "train_info/time_within_train_step": 2.6722536087036133, "step": 8628} {"train_info/time_between_train_steps": 0.003725767135620117, "step": 8628} {"info/global_step": 8629, "train_info/time_within_train_step": 2.6694746017456055, "step": 8629} {"train_info/time_between_train_steps": 0.0040361881256103516, "step": 8629} {"info/global_step": 8630, "train_info/time_within_train_step": 2.685729742050171, "step": 8630} {"train_info/time_between_train_steps": 0.0031147003173828125, "step": 8630} {"train_info/time_between_train_steps": 2.559445381164551, "step": 8630} {"info/global_step": 8631, "train_info/time_within_train_step": 2.639941453933716, "step": 8631} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 8631} {"info/global_step": 8632, "train_info/time_within_train_step": 2.6555614471435547, "step": 8632} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 8632} {"info/global_step": 8633, "train_info/time_within_train_step": 2.639200210571289, "step": 8633} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 8633} {"info/global_step": 8634, "train_info/time_within_train_step": 2.6364893913269043, "step": 8634} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 8634} {"info/global_step": 8635, "train_info/time_within_train_step": 2.6408493518829346, "step": 8635} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 8635} {"info/global_step": 8636, "train_info/time_within_train_step": 2.660536766052246, "step": 8636} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 8636} {"info/global_step": 8637, "train_info/time_within_train_step": 2.6473922729492188, "step": 8637} {"train_info/time_between_train_steps": 0.00323486328125, "step": 8637} {"info/global_step": 8638, "train_info/time_within_train_step": 2.648804187774658, "step": 8638} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 8638} {"info/global_step": 8639, "train_info/time_within_train_step": 2.652927875518799, "step": 8639} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 8639} {"info/global_step": 8640, "train_info/time_within_train_step": 2.6495840549468994, "step": 8640} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 8640} {"info/global_step": 8641, "train_info/time_within_train_step": 2.668830633163452, "step": 8641} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 8641} {"info/global_step": 8642, "train_info/time_within_train_step": 2.706169366836548, "step": 8642} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 8642} {"info/global_step": 8643, "train_info/time_within_train_step": 2.66776967048645, "step": 8643} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 8643} {"info/global_step": 8644, "train_info/time_within_train_step": 2.660872459411621, "step": 8644} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 8644} {"info/global_step": 8645, "train_info/time_within_train_step": 2.6421451568603516, "step": 8645} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 8645} {"info/global_step": 8646, "train_info/time_within_train_step": 2.6552960872650146, "step": 8646} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 8646} {"info/global_step": 8647, "train_info/time_within_train_step": 2.6591169834136963, "step": 8647} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 8647} {"info/global_step": 8648, "train_info/time_within_train_step": 2.6462111473083496, "step": 8648} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 8648} {"info/global_step": 8649, "train_info/time_within_train_step": 2.6469438076019287, "step": 8649} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 8649} {"info/global_step": 8650, "train_info/time_within_train_step": 2.652580976486206, "step": 8650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746921686, "_runtime": 24284}, "step": 8650} {"logs": {"train/loss": 3.039, "train/learning_rate": 8.999999999999999e-05, "train/epoch": 10.0, "_timestamp": 1746921686, "_runtime": 24284}, "step": 8650} {"train_info/time_between_train_steps": 0.02551102638244629, "step": 8650} {"info/global_step": 8651, "train_info/time_within_train_step": 2.6601414680480957, "step": 8651} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 8651} {"info/global_step": 8652, "train_info/time_within_train_step": 2.671416997909546, "step": 8652} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 8652} {"info/global_step": 8653, "train_info/time_within_train_step": 2.6785526275634766, "step": 8653} {"train_info/time_between_train_steps": 0.003496885299682617, "step": 8653} {"info/global_step": 8654, "train_info/time_within_train_step": 2.6538867950439453, "step": 8654} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 8654} {"info/global_step": 8655, "train_info/time_within_train_step": 2.6886305809020996, "step": 8655} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 8655} {"info/global_step": 8656, "train_info/time_within_train_step": 2.6443493366241455, "step": 8656} {"train_info/time_between_train_steps": 0.0034198760986328125, "step": 8656} {"info/global_step": 8657, "train_info/time_within_train_step": 2.657438278198242, "step": 8657} {"train_info/time_between_train_steps": 0.0034270286560058594, "step": 8657} {"info/global_step": 8658, "train_info/time_within_train_step": 2.654109477996826, "step": 8658} {"train_info/time_between_train_steps": 0.0033953189849853516, "step": 8658} {"info/global_step": 8659, "train_info/time_within_train_step": 2.6479287147521973, "step": 8659} {"train_info/time_between_train_steps": 0.0034379959106445312, "step": 8659} {"info/global_step": 8660, "train_info/time_within_train_step": 2.650405168533325, "step": 8660} {"train_info/time_between_train_steps": 0.0033898353576660156, "step": 8660} {"info/global_step": 8661, "train_info/time_within_train_step": 2.647852659225464, "step": 8661} {"train_info/time_between_train_steps": 0.0034890174865722656, "step": 8661} {"info/global_step": 8662, "train_info/time_within_train_step": 2.668041706085205, "step": 8662} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 8662} {"info/global_step": 8663, "train_info/time_within_train_step": 2.670280933380127, "step": 8663} {"train_info/time_between_train_steps": 0.0033605098724365234, "step": 8663} {"info/global_step": 8664, "train_info/time_within_train_step": 2.6546497344970703, "step": 8664} {"train_info/time_between_train_steps": 0.003412008285522461, "step": 8664} {"info/global_step": 8665, "train_info/time_within_train_step": 2.7092127799987793, "step": 8665} {"train_info/time_between_train_steps": 0.003420114517211914, "step": 8665} {"info/global_step": 8666, "train_info/time_within_train_step": 2.6511924266815186, "step": 8666} {"train_info/time_between_train_steps": 0.0033774375915527344, "step": 8666} {"info/global_step": 8667, "train_info/time_within_train_step": 2.6498963832855225, "step": 8667} {"train_info/time_between_train_steps": 0.003345012664794922, "step": 8667} {"info/global_step": 8668, "train_info/time_within_train_step": 2.650092124938965, "step": 8668} {"train_info/time_between_train_steps": 0.003446817398071289, "step": 8668} {"info/global_step": 8669, "train_info/time_within_train_step": 2.6518778800964355, "step": 8669} {"train_info/time_between_train_steps": 0.0034151077270507812, "step": 8669} {"info/global_step": 8670, "train_info/time_within_train_step": 2.6533353328704834, "step": 8670} {"train_info/time_between_train_steps": 0.003389596939086914, "step": 8670} {"info/global_step": 8671, "train_info/time_within_train_step": 2.6567912101745605, "step": 8671} {"train_info/time_between_train_steps": 0.003366231918334961, "step": 8671} {"info/global_step": 8672, "train_info/time_within_train_step": 2.6948862075805664, "step": 8672} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 8672} {"info/global_step": 8673, "train_info/time_within_train_step": 2.6553385257720947, "step": 8673} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 8673} {"info/global_step": 8674, "train_info/time_within_train_step": 2.6618247032165527, "step": 8674} {"train_info/time_between_train_steps": 0.0034928321838378906, "step": 8674} {"info/global_step": 8675, "train_info/time_within_train_step": 2.67714524269104, "step": 8675} {"train_info/time_between_train_steps": 0.0034897327423095703, "step": 8675} {"info/global_step": 8676, "train_info/time_within_train_step": 2.7312190532684326, "step": 8676} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 8676} {"info/global_step": 8677, "train_info/time_within_train_step": 2.67024564743042, "step": 8677} {"train_info/time_between_train_steps": 0.0034706592559814453, "step": 8677} {"info/global_step": 8678, "train_info/time_within_train_step": 2.643427848815918, "step": 8678} {"train_info/time_between_train_steps": 0.0034706592559814453, "step": 8678} {"info/global_step": 8679, "train_info/time_within_train_step": 2.64296555519104, "step": 8679} {"train_info/time_between_train_steps": 0.0033795833587646484, "step": 8679} {"info/global_step": 8680, "train_info/time_within_train_step": 2.661220073699951, "step": 8680} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 8680} {"info/global_step": 8681, "train_info/time_within_train_step": 2.6717793941497803, "step": 8681} {"train_info/time_between_train_steps": 0.003595113754272461, "step": 8681} {"info/global_step": 8682, "train_info/time_within_train_step": 2.6457622051239014, "step": 8682} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 8682} {"info/global_step": 8683, "train_info/time_within_train_step": 2.653867721557617, "step": 8683} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 8683} {"info/global_step": 8684, "train_info/time_within_train_step": 2.648149013519287, "step": 8684} {"train_info/time_between_train_steps": 0.0034096240997314453, "step": 8684} {"info/global_step": 8685, "train_info/time_within_train_step": 2.6713573932647705, "step": 8685} {"train_info/time_between_train_steps": 0.003536701202392578, "step": 8685} {"info/global_step": 8686, "train_info/time_within_train_step": 2.6718533039093018, "step": 8686} {"train_info/time_between_train_steps": 0.0034189224243164062, "step": 8686} {"info/global_step": 8687, "train_info/time_within_train_step": 2.6625256538391113, "step": 8687} {"train_info/time_between_train_steps": 0.003403902053833008, "step": 8687} {"info/global_step": 8688, "train_info/time_within_train_step": 2.6647403240203857, "step": 8688} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 8688} {"info/global_step": 8689, "train_info/time_within_train_step": 2.6433119773864746, "step": 8689} {"train_info/time_between_train_steps": 0.0033915042877197266, "step": 8689} {"info/global_step": 8690, "train_info/time_within_train_step": 2.6446409225463867, "step": 8690} {"train_info/time_between_train_steps": 0.003522634506225586, "step": 8690} {"info/global_step": 8691, "train_info/time_within_train_step": 2.644268035888672, "step": 8691} {"train_info/time_between_train_steps": 0.003699779510498047, "step": 8691} {"info/global_step": 8692, "train_info/time_within_train_step": 2.630415439605713, "step": 8692} {"train_info/time_between_train_steps": 0.003610849380493164, "step": 8692} {"info/global_step": 8693, "train_info/time_within_train_step": 3.7368505001068115, "step": 8693} {"train_info/time_between_train_steps": 0.003641366958618164, "step": 8693} {"info/global_step": 8694, "train_info/time_within_train_step": 2.561554431915283, "step": 8694} {"train_info/time_between_train_steps": 0.0036001205444335938, "step": 8694} {"info/global_step": 8695, "train_info/time_within_train_step": 2.624744176864624, "step": 8695} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 8695} {"info/global_step": 8696, "train_info/time_within_train_step": 2.610429048538208, "step": 8696} {"train_info/time_between_train_steps": 0.0034101009368896484, "step": 8696} {"info/global_step": 8697, "train_info/time_within_train_step": 2.954284191131592, "step": 8697} {"train_info/time_between_train_steps": 0.0034072399139404297, "step": 8697} {"info/global_step": 8698, "train_info/time_within_train_step": 2.5733277797698975, "step": 8698} {"train_info/time_between_train_steps": 0.0033876895904541016, "step": 8698} {"info/global_step": 8699, "train_info/time_within_train_step": 2.572225332260132, "step": 8699} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 8699} {"info/global_step": 8700, "train_info/time_within_train_step": 2.814438819885254, "step": 8700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746921833, "_runtime": 24431}, "step": 8700} {"logs": {"train/loss": 3.0014, "train/learning_rate": 8.666666666666665e-05, "train/epoch": 10.01, "_timestamp": 1746921833, "_runtime": 24431}, "step": 8700} {"train_info/time_between_train_steps": 1.250016689300537, "step": 8700} {"info/global_step": 8701, "train_info/time_within_train_step": 2.443787097930908, "step": 8701} {"train_info/time_between_train_steps": 0.003445863723754883, "step": 8701} {"info/global_step": 8702, "train_info/time_within_train_step": 3.3906092643737793, "step": 8702} {"train_info/time_between_train_steps": 0.003684520721435547, "step": 8702} {"info/global_step": 8703, "train_info/time_within_train_step": 2.598992109298706, "step": 8703} {"train_info/time_between_train_steps": 0.003407716751098633, "step": 8703} {"info/global_step": 8704, "train_info/time_within_train_step": 2.4853296279907227, "step": 8704} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 8704} {"info/global_step": 8705, "train_info/time_within_train_step": 2.5368332862854004, "step": 8705} {"train_info/time_between_train_steps": 0.0036001205444335938, "step": 8705} {"info/global_step": 8706, "train_info/time_within_train_step": 2.565194606781006, "step": 8706} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 8706} {"info/global_step": 8707, "train_info/time_within_train_step": 2.6500842571258545, "step": 8707} {"train_info/time_between_train_steps": 0.003322601318359375, "step": 8707} {"info/global_step": 8708, "train_info/time_within_train_step": 2.6375811100006104, "step": 8708} {"train_info/time_between_train_steps": 0.003370046615600586, "step": 8708} {"info/global_step": 8709, "train_info/time_within_train_step": 2.708831548690796, "step": 8709} {"train_info/time_between_train_steps": 0.0033249855041503906, "step": 8709} {"info/global_step": 8710, "train_info/time_within_train_step": 2.6509573459625244, "step": 8710} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 8710} {"info/global_step": 8711, "train_info/time_within_train_step": 2.647376537322998, "step": 8711} {"train_info/time_between_train_steps": 0.0032701492309570312, "step": 8711} {"info/global_step": 8712, "train_info/time_within_train_step": 2.9799983501434326, "step": 8712} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 8712} {"info/global_step": 8713, "train_info/time_within_train_step": 2.6741957664489746, "step": 8713} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 8713} {"info/global_step": 8714, "train_info/time_within_train_step": 2.6555535793304443, "step": 8714} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 8714} {"info/global_step": 8715, "train_info/time_within_train_step": 2.6396098136901855, "step": 8715} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 8715} {"info/global_step": 8716, "train_info/time_within_train_step": 2.653625011444092, "step": 8716} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 8716} {"info/global_step": 8717, "train_info/time_within_train_step": 2.6552958488464355, "step": 8717} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 8717} {"info/global_step": 8718, "train_info/time_within_train_step": 2.6562492847442627, "step": 8718} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 8718} {"info/global_step": 8719, "train_info/time_within_train_step": 2.643517017364502, "step": 8719} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 8719} {"info/global_step": 8720, "train_info/time_within_train_step": 2.656463623046875, "step": 8720} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 8720} {"info/global_step": 8721, "train_info/time_within_train_step": 2.6687674522399902, "step": 8721} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 8721} {"info/global_step": 8722, "train_info/time_within_train_step": 2.6861801147460938, "step": 8722} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 8722} {"info/global_step": 8723, "train_info/time_within_train_step": 2.6497485637664795, "step": 8723} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 8723} {"info/global_step": 8724, "train_info/time_within_train_step": 2.6632773876190186, "step": 8724} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 8724} {"info/global_step": 8725, "train_info/time_within_train_step": 2.6489524841308594, "step": 8725} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 8725} {"info/global_step": 8726, "train_info/time_within_train_step": 2.648899793624878, "step": 8726} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 8726} {"info/global_step": 8727, "train_info/time_within_train_step": 2.6454215049743652, "step": 8727} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 8727} {"info/global_step": 8728, "train_info/time_within_train_step": 2.6472175121307373, "step": 8728} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 8728} {"info/global_step": 8729, "train_info/time_within_train_step": 2.6496808528900146, "step": 8729} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 8729} {"info/global_step": 8730, "train_info/time_within_train_step": 2.6618034839630127, "step": 8730} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 8730} {"info/global_step": 8731, "train_info/time_within_train_step": 2.6779253482818604, "step": 8731} {"train_info/time_between_train_steps": 0.0036020278930664062, "step": 8731} {"info/global_step": 8732, "train_info/time_within_train_step": 2.6545825004577637, "step": 8732} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 8732} {"info/global_step": 8733, "train_info/time_within_train_step": 2.711791753768921, "step": 8733} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 8733} {"info/global_step": 8734, "train_info/time_within_train_step": 2.645259380340576, "step": 8734} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 8734} {"info/global_step": 8735, "train_info/time_within_train_step": 2.650118350982666, "step": 8735} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 8735} {"info/global_step": 8736, "train_info/time_within_train_step": 2.6604340076446533, "step": 8736} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 8736} {"info/global_step": 8737, "train_info/time_within_train_step": 2.6485300064086914, "step": 8737} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 8737} {"info/global_step": 8738, "train_info/time_within_train_step": 2.647226333618164, "step": 8738} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 8738} {"info/global_step": 8739, "train_info/time_within_train_step": 2.6494646072387695, "step": 8739} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 8739} {"info/global_step": 8740, "train_info/time_within_train_step": 2.6525967121124268, "step": 8740} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 8740} {"info/global_step": 8741, "train_info/time_within_train_step": 2.6619701385498047, "step": 8741} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 8741} {"info/global_step": 8742, "train_info/time_within_train_step": 2.6824772357940674, "step": 8742} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 8742} {"info/global_step": 8743, "train_info/time_within_train_step": 2.730996608734131, "step": 8743} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 8743} {"info/global_step": 8744, "train_info/time_within_train_step": 2.661255121231079, "step": 8744} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 8744} {"info/global_step": 8745, "train_info/time_within_train_step": 2.646968364715576, "step": 8745} {"train_info/time_between_train_steps": 0.003388643264770508, "step": 8745} {"info/global_step": 8746, "train_info/time_within_train_step": 2.648030996322632, "step": 8746} {"train_info/time_between_train_steps": 0.0033915042877197266, "step": 8746} {"info/global_step": 8747, "train_info/time_within_train_step": 2.6549665927886963, "step": 8747} {"train_info/time_between_train_steps": 0.0033898353576660156, "step": 8747} {"info/global_step": 8748, "train_info/time_within_train_step": 3.2701327800750732, "step": 8748} {"train_info/time_between_train_steps": 0.0033600330352783203, "step": 8748} {"info/global_step": 8749, "train_info/time_within_train_step": 2.6620845794677734, "step": 8749} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 8749} {"info/global_step": 8750, "train_info/time_within_train_step": 2.6550636291503906, "step": 8750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746921976, "_runtime": 24574}, "step": 8750} {"logs": {"train/loss": 2.9998, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 10.01, "_timestamp": 1746921976, "_runtime": 24574}, "step": 8750} {"train_info/time_between_train_steps": 0.02579021453857422, "step": 8750} {"info/global_step": 8751, "train_info/time_within_train_step": 2.6562578678131104, "step": 8751} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 8751} {"info/global_step": 8752, "train_info/time_within_train_step": 2.670973539352417, "step": 8752} {"train_info/time_between_train_steps": 0.003484487533569336, "step": 8752} {"info/global_step": 8753, "train_info/time_within_train_step": 2.7276010513305664, "step": 8753} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 8753} {"info/global_step": 8754, "train_info/time_within_train_step": 2.6878159046173096, "step": 8754} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 8754} {"info/global_step": 8755, "train_info/time_within_train_step": 2.6424357891082764, "step": 8755} {"train_info/time_between_train_steps": 0.16026949882507324, "step": 8755} {"info/global_step": 8756, "train_info/time_within_train_step": 2.7356159687042236, "step": 8756} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 8756} {"info/global_step": 8757, "train_info/time_within_train_step": 2.6455047130584717, "step": 8757} {"train_info/time_between_train_steps": 0.003267526626586914, "step": 8757} {"info/global_step": 8758, "train_info/time_within_train_step": 2.6425552368164062, "step": 8758} {"train_info/time_between_train_steps": 0.0032961368560791016, "step": 8758} {"info/global_step": 8759, "train_info/time_within_train_step": 2.662062883377075, "step": 8759} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 8759} {"info/global_step": 8760, "train_info/time_within_train_step": 2.6508443355560303, "step": 8760} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 8760} {"info/global_step": 8761, "train_info/time_within_train_step": 2.651658535003662, "step": 8761} {"train_info/time_between_train_steps": 0.003288745880126953, "step": 8761} {"info/global_step": 8762, "train_info/time_within_train_step": 2.6492550373077393, "step": 8762} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 8762} {"info/global_step": 8763, "train_info/time_within_train_step": 2.645406484603882, "step": 8763} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 8763} {"info/global_step": 8764, "train_info/time_within_train_step": 2.668649911880493, "step": 8764} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 8764} {"info/global_step": 8765, "train_info/time_within_train_step": 2.6694858074188232, "step": 8765} {"train_info/time_between_train_steps": 0.003298044204711914, "step": 8765} {"info/global_step": 8766, "train_info/time_within_train_step": 2.718844175338745, "step": 8766} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 8766} {"info/global_step": 8767, "train_info/time_within_train_step": 2.653273820877075, "step": 8767} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 8767} {"info/global_step": 8768, "train_info/time_within_train_step": 2.6462016105651855, "step": 8768} {"train_info/time_between_train_steps": 0.00335693359375, "step": 8768} {"info/global_step": 8769, "train_info/time_within_train_step": 2.6613008975982666, "step": 8769} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 8769} {"info/global_step": 8770, "train_info/time_within_train_step": 2.654371500015259, "step": 8770} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 8770} {"info/global_step": 8771, "train_info/time_within_train_step": 2.6623222827911377, "step": 8771} {"train_info/time_between_train_steps": 0.0032880306243896484, "step": 8771} {"info/global_step": 8772, "train_info/time_within_train_step": 2.700075149536133, "step": 8772} {"train_info/time_between_train_steps": 0.0033223628997802734, "step": 8772} {"info/global_step": 8773, "train_info/time_within_train_step": 2.9520010948181152, "step": 8773} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 8773} {"info/global_step": 8774, "train_info/time_within_train_step": 2.6578104496002197, "step": 8774} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 8774} {"info/global_step": 8775, "train_info/time_within_train_step": 2.6606669425964355, "step": 8775} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 8775} {"info/global_step": 8776, "train_info/time_within_train_step": 2.671823501586914, "step": 8776} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 8776} {"info/global_step": 8777, "train_info/time_within_train_step": 2.6888041496276855, "step": 8777} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 8777} {"info/global_step": 8778, "train_info/time_within_train_step": 2.6418488025665283, "step": 8778} {"train_info/time_between_train_steps": 0.0032444000244140625, "step": 8778} {"info/global_step": 8779, "train_info/time_within_train_step": 2.643862009048462, "step": 8779} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 8779} {"info/global_step": 8780, "train_info/time_within_train_step": 2.6610500812530518, "step": 8780} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 8780} {"info/global_step": 8781, "train_info/time_within_train_step": 2.6562955379486084, "step": 8781} {"train_info/time_between_train_steps": 0.0034322738647460938, "step": 8781} {"info/global_step": 8782, "train_info/time_within_train_step": 2.6451594829559326, "step": 8782} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 8782} {"info/global_step": 8783, "train_info/time_within_train_step": 2.653855562210083, "step": 8783} {"train_info/time_between_train_steps": 0.0035469532012939453, "step": 8783} {"info/global_step": 8784, "train_info/time_within_train_step": 2.651287078857422, "step": 8784} {"train_info/time_between_train_steps": 0.0038771629333496094, "step": 8784} {"info/global_step": 8785, "train_info/time_within_train_step": 2.6701881885528564, "step": 8785} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 8785} {"info/global_step": 8786, "train_info/time_within_train_step": 2.6995737552642822, "step": 8786} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 8786} {"info/global_step": 8787, "train_info/time_within_train_step": 2.671778917312622, "step": 8787} {"train_info/time_between_train_steps": 0.003525257110595703, "step": 8787} {"info/global_step": 8788, "train_info/time_within_train_step": 2.659374952316284, "step": 8788} {"train_info/time_between_train_steps": 0.0034482479095458984, "step": 8788} {"info/global_step": 8789, "train_info/time_within_train_step": 2.642296075820923, "step": 8789} {"train_info/time_between_train_steps": 0.003487110137939453, "step": 8789} {"info/global_step": 8790, "train_info/time_within_train_step": 2.6550323963165283, "step": 8790} {"train_info/time_between_train_steps": 0.0033903121948242188, "step": 8790} {"info/global_step": 8791, "train_info/time_within_train_step": 2.659428834915161, "step": 8791} {"train_info/time_between_train_steps": 0.003545999526977539, "step": 8791} {"info/global_step": 8792, "train_info/time_within_train_step": 2.6462454795837402, "step": 8792} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 8792} {"info/global_step": 8793, "train_info/time_within_train_step": 2.6471314430236816, "step": 8793} {"train_info/time_between_train_steps": 0.003488302230834961, "step": 8793} {"info/global_step": 8794, "train_info/time_within_train_step": 2.6669654846191406, "step": 8794} {"train_info/time_between_train_steps": 0.003451824188232422, "step": 8794} {"info/global_step": 8795, "train_info/time_within_train_step": 2.6683976650238037, "step": 8795} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 8795} {"info/global_step": 8796, "train_info/time_within_train_step": 2.687448263168335, "step": 8796} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 8796} {"info/global_step": 8797, "train_info/time_within_train_step": 2.649874448776245, "step": 8797} {"train_info/time_between_train_steps": 0.0034058094024658203, "step": 8797} {"info/global_step": 8798, "train_info/time_within_train_step": 2.6878602504730225, "step": 8798} {"train_info/time_between_train_steps": 0.003445863723754883, "step": 8798} {"info/global_step": 8799, "train_info/time_within_train_step": 2.6442015171051025, "step": 8799} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 8799} {"info/global_step": 8800, "train_info/time_within_train_step": 2.6426260471343994, "step": 8800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922112, "_runtime": 24710}, "step": 8800} {"logs": {"train/loss": 2.9954, "train/learning_rate": 7.999999999999999e-05, "train/epoch": 10.02, "_timestamp": 1746922112, "_runtime": 24710}, "step": 8800} {"train_info/time_between_train_steps": 17.204218864440918, "step": 8800} {"info/global_step": 8801, "train_info/time_within_train_step": 2.4548377990722656, "step": 8801} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 8801} {"info/global_step": 8802, "train_info/time_within_train_step": 2.446929693222046, "step": 8802} {"train_info/time_between_train_steps": 0.0034079551696777344, "step": 8802} {"info/global_step": 8803, "train_info/time_within_train_step": 2.5160083770751953, "step": 8803} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 8803} {"info/global_step": 8804, "train_info/time_within_train_step": 2.640183925628662, "step": 8804} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 8804} {"info/global_step": 8805, "train_info/time_within_train_step": 2.6589250564575195, "step": 8805} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 8805} {"info/global_step": 8806, "train_info/time_within_train_step": 2.668431043624878, "step": 8806} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 8806} {"info/global_step": 8807, "train_info/time_within_train_step": 2.688051223754883, "step": 8807} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 8807} {"info/global_step": 8808, "train_info/time_within_train_step": 2.651130437850952, "step": 8808} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 8808} {"info/global_step": 8809, "train_info/time_within_train_step": 2.684854030609131, "step": 8809} {"train_info/time_between_train_steps": 0.003476381301879883, "step": 8809} {"info/global_step": 8810, "train_info/time_within_train_step": 2.6431238651275635, "step": 8810} {"train_info/time_between_train_steps": 0.0034716129302978516, "step": 8810} {"info/global_step": 8811, "train_info/time_within_train_step": 2.6438918113708496, "step": 8811} {"train_info/time_between_train_steps": 0.0033571720123291016, "step": 8811} {"info/global_step": 8812, "train_info/time_within_train_step": 2.665829658508301, "step": 8812} {"train_info/time_between_train_steps": 0.0033822059631347656, "step": 8812} {"info/global_step": 8813, "train_info/time_within_train_step": 2.64473819732666, "step": 8813} {"train_info/time_between_train_steps": 0.003393411636352539, "step": 8813} {"info/global_step": 8814, "train_info/time_within_train_step": 2.646742343902588, "step": 8814} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 8814} {"info/global_step": 8815, "train_info/time_within_train_step": 2.663443088531494, "step": 8815} {"train_info/time_between_train_steps": 0.0036039352416992188, "step": 8815} {"info/global_step": 8816, "train_info/time_within_train_step": 2.6622002124786377, "step": 8816} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 8816} {"info/global_step": 8817, "train_info/time_within_train_step": 2.6762616634368896, "step": 8817} {"train_info/time_between_train_steps": 0.0034322738647460938, "step": 8817} {"info/global_step": 8818, "train_info/time_within_train_step": 2.8224778175354004, "step": 8818} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 8818} {"info/global_step": 8819, "train_info/time_within_train_step": 2.664889335632324, "step": 8819} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 8819} {"info/global_step": 8820, "train_info/time_within_train_step": 2.656139850616455, "step": 8820} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 8820} {"info/global_step": 8821, "train_info/time_within_train_step": 2.709977388381958, "step": 8821} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 8821} {"info/global_step": 8822, "train_info/time_within_train_step": 2.985342264175415, "step": 8822} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 8822} {"info/global_step": 8823, "train_info/time_within_train_step": 2.668058156967163, "step": 8823} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 8823} {"info/global_step": 8824, "train_info/time_within_train_step": 2.659236192703247, "step": 8824} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 8824} {"info/global_step": 8825, "train_info/time_within_train_step": 2.666997194290161, "step": 8825} {"train_info/time_between_train_steps": 0.005396127700805664, "step": 8825} {"info/global_step": 8826, "train_info/time_within_train_step": 2.654141664505005, "step": 8826} {"train_info/time_between_train_steps": 0.003348827362060547, "step": 8826} {"info/global_step": 8827, "train_info/time_within_train_step": 2.643648386001587, "step": 8827} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 8827} {"info/global_step": 8828, "train_info/time_within_train_step": 2.6588199138641357, "step": 8828} {"train_info/time_between_train_steps": 0.003320932388305664, "step": 8828} {"info/global_step": 8829, "train_info/time_within_train_step": 2.660198211669922, "step": 8829} {"train_info/time_between_train_steps": 0.003475189208984375, "step": 8829} {"info/global_step": 8830, "train_info/time_within_train_step": 2.644716262817383, "step": 8830} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 8830} {"info/global_step": 8831, "train_info/time_within_train_step": 2.6623055934906006, "step": 8831} {"train_info/time_between_train_steps": 0.0033147335052490234, "step": 8831} {"info/global_step": 8832, "train_info/time_within_train_step": 2.6503102779388428, "step": 8832} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 8832} {"info/global_step": 8833, "train_info/time_within_train_step": 2.662935495376587, "step": 8833} {"train_info/time_between_train_steps": 0.0034363269805908203, "step": 8833} {"info/global_step": 8834, "train_info/time_within_train_step": 2.714630603790283, "step": 8834} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 8834} {"info/global_step": 8835, "train_info/time_within_train_step": 2.70035457611084, "step": 8835} {"train_info/time_between_train_steps": 0.003405332565307617, "step": 8835} {"info/global_step": 8836, "train_info/time_within_train_step": 2.6426470279693604, "step": 8836} {"train_info/time_between_train_steps": 0.0035572052001953125, "step": 8836} {"info/global_step": 8837, "train_info/time_within_train_step": 2.642643928527832, "step": 8837} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 8837} {"info/global_step": 8838, "train_info/time_within_train_step": 2.6596262454986572, "step": 8838} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 8838} {"info/global_step": 8839, "train_info/time_within_train_step": 2.653926134109497, "step": 8839} {"train_info/time_between_train_steps": 0.0034835338592529297, "step": 8839} {"info/global_step": 8840, "train_info/time_within_train_step": 2.644031286239624, "step": 8840} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 8840} {"info/global_step": 8841, "train_info/time_within_train_step": 2.652723550796509, "step": 8841} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 8841} {"info/global_step": 8842, "train_info/time_within_train_step": 2.650456428527832, "step": 8842} {"train_info/time_between_train_steps": 0.003568887710571289, "step": 8842} {"info/global_step": 8843, "train_info/time_within_train_step": 2.669076919555664, "step": 8843} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 8843} {"info/global_step": 8844, "train_info/time_within_train_step": 2.705141305923462, "step": 8844} {"train_info/time_between_train_steps": 0.0033431053161621094, "step": 8844} {"info/global_step": 8845, "train_info/time_within_train_step": 2.662266731262207, "step": 8845} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 8845} {"info/global_step": 8846, "train_info/time_within_train_step": 2.6625876426696777, "step": 8846} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 8846} {"info/global_step": 8847, "train_info/time_within_train_step": 2.6423447132110596, "step": 8847} {"train_info/time_between_train_steps": 0.003312349319458008, "step": 8847} {"info/global_step": 8848, "train_info/time_within_train_step": 2.6554856300354004, "step": 8848} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 8848} {"info/global_step": 8849, "train_info/time_within_train_step": 2.65596079826355, "step": 8849} {"train_info/time_between_train_steps": 0.0033936500549316406, "step": 8849} {"info/global_step": 8850, "train_info/time_within_train_step": 2.6460330486297607, "step": 8850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922263, "_runtime": 24861}, "step": 8850} {"logs": {"train/loss": 2.9779, "train/learning_rate": 7.666666666666666e-05, "train/epoch": 10.02, "_timestamp": 1746922263, "_runtime": 24861}, "step": 8850} {"train_info/time_between_train_steps": 0.031045913696289062, "step": 8850} {"info/global_step": 8851, "train_info/time_within_train_step": 2.6448028087615967, "step": 8851} {"train_info/time_between_train_steps": 0.0032978057861328125, "step": 8851} {"info/global_step": 8852, "train_info/time_within_train_step": 2.6446800231933594, "step": 8852} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 8852} {"info/global_step": 8853, "train_info/time_within_train_step": 2.6724390983581543, "step": 8853} {"train_info/time_between_train_steps": 0.0033690929412841797, "step": 8853} {"info/global_step": 8854, "train_info/time_within_train_step": 2.6736526489257812, "step": 8854} {"train_info/time_between_train_steps": 0.00337982177734375, "step": 8854} {"info/global_step": 8855, "train_info/time_within_train_step": 2.651315212249756, "step": 8855} {"train_info/time_between_train_steps": 0.0033524036407470703, "step": 8855} {"info/global_step": 8856, "train_info/time_within_train_step": 2.6881144046783447, "step": 8856} {"train_info/time_between_train_steps": 0.0033342838287353516, "step": 8856} {"info/global_step": 8857, "train_info/time_within_train_step": 2.641451835632324, "step": 8857} {"train_info/time_between_train_steps": 0.003260374069213867, "step": 8857} {"info/global_step": 8858, "train_info/time_within_train_step": 2.6566474437713623, "step": 8858} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 8858} {"info/global_step": 8859, "train_info/time_within_train_step": 2.661792755126953, "step": 8859} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 8859} {"info/global_step": 8860, "train_info/time_within_train_step": 2.6458404064178467, "step": 8860} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 8860} {"info/global_step": 8861, "train_info/time_within_train_step": 2.644824743270874, "step": 8861} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 8861} {"info/global_step": 8862, "train_info/time_within_train_step": 2.6541645526885986, "step": 8862} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 8862} {"info/global_step": 8863, "train_info/time_within_train_step": 2.661412477493286, "step": 8863} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 8863} {"info/global_step": 8864, "train_info/time_within_train_step": 2.672445297241211, "step": 8864} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 8864} {"info/global_step": 8865, "train_info/time_within_train_step": 2.6617960929870605, "step": 8865} {"train_info/time_between_train_steps": 0.0032896995544433594, "step": 8865} {"info/global_step": 8866, "train_info/time_within_train_step": 2.7081544399261475, "step": 8866} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 8866} {"info/global_step": 8867, "train_info/time_within_train_step": 2.9552297592163086, "step": 8867} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 8867} {"info/global_step": 8868, "train_info/time_within_train_step": 2.660768985748291, "step": 8868} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 8868} {"info/global_step": 8869, "train_info/time_within_train_step": 2.67464542388916, "step": 8869} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 8869} {"info/global_step": 8870, "train_info/time_within_train_step": 2.6660714149475098, "step": 8870} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 8870} {"info/global_step": 8871, "train_info/time_within_train_step": 2.699747085571289, "step": 8871} {"train_info/time_between_train_steps": 0.003266572952270508, "step": 8871} {"info/global_step": 8872, "train_info/time_within_train_step": 2.6433322429656982, "step": 8872} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 8872} {"info/global_step": 8873, "train_info/time_within_train_step": 2.642810344696045, "step": 8873} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 8873} {"info/global_step": 8874, "train_info/time_within_train_step": 2.6627132892608643, "step": 8874} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 8874} {"info/global_step": 8875, "train_info/time_within_train_step": 2.6480391025543213, "step": 8875} {"train_info/time_between_train_steps": 0.003367185592651367, "step": 8875} {"info/global_step": 8876, "train_info/time_within_train_step": 2.643618583679199, "step": 8876} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 8876} {"info/global_step": 8877, "train_info/time_within_train_step": 2.658957004547119, "step": 8877} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 8877} {"info/global_step": 8878, "train_info/time_within_train_step": 2.6523633003234863, "step": 8878} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 8878} {"info/global_step": 8879, "train_info/time_within_train_step": 2.661135673522949, "step": 8879} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 8879} {"info/global_step": 8880, "train_info/time_within_train_step": 2.6974334716796875, "step": 8880} {"train_info/time_between_train_steps": 0.1363086700439453, "step": 8880} {"info/global_step": 8881, "train_info/time_within_train_step": 2.697909355163574, "step": 8881} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 8881} {"info/global_step": 8882, "train_info/time_within_train_step": 2.661177158355713, "step": 8882} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 8882} {"info/global_step": 8883, "train_info/time_within_train_step": 2.7177226543426514, "step": 8883} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 8883} {"info/global_step": 8884, "train_info/time_within_train_step": 2.674288272857666, "step": 8884} {"train_info/time_between_train_steps": 0.00323486328125, "step": 8884} {"info/global_step": 8885, "train_info/time_within_train_step": 2.641406297683716, "step": 8885} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 8885} {"info/global_step": 8886, "train_info/time_within_train_step": 2.65311598777771, "step": 8886} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 8886} {"info/global_step": 8887, "train_info/time_within_train_step": 2.651928663253784, "step": 8887} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 8887} {"info/global_step": 8888, "train_info/time_within_train_step": 2.6503992080688477, "step": 8888} {"train_info/time_between_train_steps": 0.0032775402069091797, "step": 8888} {"info/global_step": 8889, "train_info/time_within_train_step": 2.643564462661743, "step": 8889} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 8889} {"info/global_step": 8890, "train_info/time_within_train_step": 2.6731913089752197, "step": 8890} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 8890} {"info/global_step": 8891, "train_info/time_within_train_step": 2.662904739379883, "step": 8891} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 8891} {"info/global_step": 8892, "train_info/time_within_train_step": 2.659046173095703, "step": 8892} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 8892} {"info/global_step": 8893, "train_info/time_within_train_step": 2.641571044921875, "step": 8893} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 8893} {"info/global_step": 8894, "train_info/time_within_train_step": 2.6525230407714844, "step": 8894} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 8894} {"info/global_step": 8895, "train_info/time_within_train_step": 2.659198045730591, "step": 8895} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 8895} {"info/global_step": 8896, "train_info/time_within_train_step": 2.6476948261260986, "step": 8896} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 8896} {"info/global_step": 8897, "train_info/time_within_train_step": 2.64188814163208, "step": 8897} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 8897} {"info/global_step": 8898, "train_info/time_within_train_step": 2.6509082317352295, "step": 8898} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 8898} {"info/global_step": 8899, "train_info/time_within_train_step": 2.654222249984741, "step": 8899} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 8899} {"info/global_step": 8900, "train_info/time_within_train_step": 2.6549315452575684, "step": 8900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922398, "_runtime": 24996}, "step": 8900} {"logs": {"train/loss": 2.9791, "train/learning_rate": 7.333333333333332e-05, "train/epoch": 10.03, "_timestamp": 1746922398, "_runtime": 24996}, "step": 8900} {"train_info/time_between_train_steps": 0.04965543746948242, "step": 8900} {"info/global_step": 8901, "train_info/time_within_train_step": 2.661996603012085, "step": 8901} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 8901} {"info/global_step": 8902, "train_info/time_within_train_step": 2.648622751235962, "step": 8902} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 8902} {"info/global_step": 8903, "train_info/time_within_train_step": 2.6585395336151123, "step": 8903} {"train_info/time_between_train_steps": 0.0032427310943603516, "step": 8903} {"info/global_step": 8904, "train_info/time_within_train_step": 2.6643905639648438, "step": 8904} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 8904} {"info/global_step": 8905, "train_info/time_within_train_step": 2.643394708633423, "step": 8905} {"train_info/time_between_train_steps": 0.003406524658203125, "step": 8905} {"info/global_step": 8906, "train_info/time_within_train_step": 2.645444869995117, "step": 8906} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 8906} {"info/global_step": 8907, "train_info/time_within_train_step": 2.645456075668335, "step": 8907} {"train_info/time_between_train_steps": 0.0033957958221435547, "step": 8907} {"info/global_step": 8908, "train_info/time_within_train_step": 2.6458826065063477, "step": 8908} {"train_info/time_between_train_steps": 0.003307342529296875, "step": 8908} {"info/global_step": 8909, "train_info/time_within_train_step": 2.6468703746795654, "step": 8909} {"train_info/time_between_train_steps": 0.003543853759765625, "step": 8909} {"info/global_step": 8910, "train_info/time_within_train_step": 2.6490232944488525, "step": 8910} {"train_info/time_between_train_steps": 0.003267526626586914, "step": 8910} {"info/global_step": 8911, "train_info/time_within_train_step": 2.6414895057678223, "step": 8911} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 8911} {"info/global_step": 8912, "train_info/time_within_train_step": 2.697352170944214, "step": 8912} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 8912} {"info/global_step": 8913, "train_info/time_within_train_step": 2.654297351837158, "step": 8913} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 8913} {"info/global_step": 8914, "train_info/time_within_train_step": 2.643160581588745, "step": 8914} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 8914} {"info/global_step": 8915, "train_info/time_within_train_step": 2.6492347717285156, "step": 8915} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 8915} {"info/global_step": 8916, "train_info/time_within_train_step": 2.6527655124664307, "step": 8916} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 8916} {"info/global_step": 8917, "train_info/time_within_train_step": 2.661316394805908, "step": 8917} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 8917} {"info/global_step": 8918, "train_info/time_within_train_step": 2.6753976345062256, "step": 8918} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 8918} {"info/global_step": 8919, "train_info/time_within_train_step": 2.666774034500122, "step": 8919} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 8919} {"info/global_step": 8920, "train_info/time_within_train_step": 2.6887118816375732, "step": 8920} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 8920} {"info/global_step": 8921, "train_info/time_within_train_step": 2.6480352878570557, "step": 8921} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 8921} {"info/global_step": 8922, "train_info/time_within_train_step": 2.646561622619629, "step": 8922} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 8922} {"info/global_step": 8923, "train_info/time_within_train_step": 2.649263620376587, "step": 8923} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 8923} {"info/global_step": 8924, "train_info/time_within_train_step": 2.6492252349853516, "step": 8924} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 8924} {"info/global_step": 8925, "train_info/time_within_train_step": 2.6615867614746094, "step": 8925} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 8925} {"info/global_step": 8926, "train_info/time_within_train_step": 2.6542911529541016, "step": 8926} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 8926} {"info/global_step": 8927, "train_info/time_within_train_step": 2.6595213413238525, "step": 8927} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 8927} {"info/global_step": 8928, "train_info/time_within_train_step": 2.687901258468628, "step": 8928} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 8928} {"info/global_step": 8929, "train_info/time_within_train_step": 2.7246274948120117, "step": 8929} {"train_info/time_between_train_steps": 0.003252267837524414, "step": 8929} {"info/global_step": 8930, "train_info/time_within_train_step": 2.647754669189453, "step": 8930} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 8930} {"info/global_step": 8931, "train_info/time_within_train_step": 2.642072916030884, "step": 8931} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 8931} {"info/global_step": 8932, "train_info/time_within_train_step": 2.657250165939331, "step": 8932} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 8932} {"info/global_step": 8933, "train_info/time_within_train_step": 2.6527621746063232, "step": 8933} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 8933} {"info/global_step": 8934, "train_info/time_within_train_step": 2.6429712772369385, "step": 8934} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 8934} {"info/global_step": 8935, "train_info/time_within_train_step": 2.6463570594787598, "step": 8935} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 8935} {"info/global_step": 8936, "train_info/time_within_train_step": 2.6581294536590576, "step": 8936} {"train_info/time_between_train_steps": 0.0035028457641601562, "step": 8936} {"info/global_step": 8937, "train_info/time_within_train_step": 2.669017791748047, "step": 8937} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 8937} {"info/global_step": 8938, "train_info/time_within_train_step": 2.710045099258423, "step": 8938} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 8938} {"info/global_step": 8939, "train_info/time_within_train_step": 2.6403229236602783, "step": 8939} {"train_info/time_between_train_steps": 0.006643056869506836, "step": 8939} {"info/global_step": 8940, "train_info/time_within_train_step": 2.6592202186584473, "step": 8940} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 8940} {"info/global_step": 8941, "train_info/time_within_train_step": 2.6481661796569824, "step": 8941} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 8941} {"info/global_step": 8942, "train_info/time_within_train_step": 2.6474788188934326, "step": 8942} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 8942} {"info/global_step": 8943, "train_info/time_within_train_step": 2.7983484268188477, "step": 8943} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 8943} {"info/global_step": 8944, "train_info/time_within_train_step": 2.652925491333008, "step": 8944} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 8944} {"info/global_step": 8945, "train_info/time_within_train_step": 2.652719736099243, "step": 8945} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 8945} {"info/global_step": 8946, "train_info/time_within_train_step": 2.644085168838501, "step": 8946} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 8946} {"info/global_step": 8947, "train_info/time_within_train_step": 2.6497161388397217, "step": 8947} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 8947} {"info/global_step": 8948, "train_info/time_within_train_step": 2.6712965965270996, "step": 8948} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 8948} {"info/global_step": 8949, "train_info/time_within_train_step": 2.669448137283325, "step": 8949} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 8949} {"info/global_step": 8950, "train_info/time_within_train_step": 2.6560189723968506, "step": 8950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922534, "_runtime": 25132}, "step": 8950} {"logs": {"train/loss": 2.9763, "train/learning_rate": 7e-05, "train/epoch": 10.03, "_timestamp": 1746922534, "_runtime": 25132}, "step": 8950} {"train_info/time_between_train_steps": 0.030391216278076172, "step": 8950} {"info/global_step": 8951, "train_info/time_within_train_step": 2.6580636501312256, "step": 8951} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 8951} {"info/global_step": 8952, "train_info/time_within_train_step": 2.665879726409912, "step": 8952} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 8952} {"info/global_step": 8953, "train_info/time_within_train_step": 2.648707151412964, "step": 8953} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 8953} {"info/global_step": 8954, "train_info/time_within_train_step": 2.650830030441284, "step": 8954} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 8954} {"info/global_step": 8955, "train_info/time_within_train_step": 2.6507749557495117, "step": 8955} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 8955} {"info/global_step": 8956, "train_info/time_within_train_step": 2.6484081745147705, "step": 8956} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 8956} {"info/global_step": 8957, "train_info/time_within_train_step": 2.650831460952759, "step": 8957} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 8957} {"info/global_step": 8958, "train_info/time_within_train_step": 2.6607234477996826, "step": 8958} {"train_info/time_between_train_steps": 0.0032775402069091797, "step": 8958} {"info/global_step": 8959, "train_info/time_within_train_step": 2.6419808864593506, "step": 8959} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 8959} {"info/global_step": 8960, "train_info/time_within_train_step": 2.647191286087036, "step": 8960} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 8960} {"info/global_step": 8961, "train_info/time_within_train_step": 2.663574695587158, "step": 8961} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 8961} {"info/global_step": 8962, "train_info/time_within_train_step": 2.664937973022461, "step": 8962} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 8962} {"info/global_step": 8963, "train_info/time_within_train_step": 2.6458792686462402, "step": 8963} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 8963} {"info/global_step": 8964, "train_info/time_within_train_step": 2.659487247467041, "step": 8964} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 8964} {"info/global_step": 8965, "train_info/time_within_train_step": 2.6446354389190674, "step": 8965} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 8965} {"info/global_step": 8966, "train_info/time_within_train_step": 2.652810573577881, "step": 8966} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 8966} {"info/global_step": 8967, "train_info/time_within_train_step": 2.649030923843384, "step": 8967} {"train_info/time_between_train_steps": 0.0032944679260253906, "step": 8967} {"info/global_step": 8968, "train_info/time_within_train_step": 2.909052610397339, "step": 8968} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 8968} {"info/global_step": 8969, "train_info/time_within_train_step": 2.6420559883117676, "step": 8969} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 8969} {"info/global_step": 8970, "train_info/time_within_train_step": 2.658400297164917, "step": 8970} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 8970} {"info/global_step": 8971, "train_info/time_within_train_step": 2.6516501903533936, "step": 8971} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 8971} {"info/global_step": 8972, "train_info/time_within_train_step": 2.6478805541992188, "step": 8972} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 8972} {"info/global_step": 8973, "train_info/time_within_train_step": 2.6421358585357666, "step": 8973} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 8973} {"info/global_step": 8974, "train_info/time_within_train_step": 2.66805362701416, "step": 8974} {"train_info/time_between_train_steps": 0.0032622814178466797, "step": 8974} {"info/global_step": 8975, "train_info/time_within_train_step": 2.668394088745117, "step": 8975} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 8975} {"info/global_step": 8976, "train_info/time_within_train_step": 2.658489227294922, "step": 8976} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 8976} {"info/global_step": 8977, "train_info/time_within_train_step": 2.6619532108306885, "step": 8977} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 8977} {"info/global_step": 8978, "train_info/time_within_train_step": 2.642547369003296, "step": 8978} {"train_info/time_between_train_steps": 0.006504058837890625, "step": 8978} {"info/global_step": 8979, "train_info/time_within_train_step": 2.654942274093628, "step": 8979} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 8979} {"info/global_step": 8980, "train_info/time_within_train_step": 2.656681537628174, "step": 8980} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 8980} {"info/global_step": 8981, "train_info/time_within_train_step": 2.643604040145874, "step": 8981} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 8981} {"info/global_step": 8982, "train_info/time_within_train_step": 2.646629571914673, "step": 8982} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 8982} {"info/global_step": 8983, "train_info/time_within_train_step": 2.6673243045806885, "step": 8983} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 8983} {"info/global_step": 8984, "train_info/time_within_train_step": 2.6652143001556396, "step": 8984} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 8984} {"info/global_step": 8985, "train_info/time_within_train_step": 2.6580097675323486, "step": 8985} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 8985} {"info/global_step": 8986, "train_info/time_within_train_step": 2.6854379177093506, "step": 8986} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 8986} {"info/global_step": 8987, "train_info/time_within_train_step": 2.641683578491211, "step": 8987} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 8987} {"info/global_step": 8988, "train_info/time_within_train_step": 2.648090362548828, "step": 8988} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 8988} {"info/global_step": 8989, "train_info/time_within_train_step": 2.659184455871582, "step": 8989} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 8989} {"info/global_step": 8990, "train_info/time_within_train_step": 2.6431097984313965, "step": 8990} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 8990} {"info/global_step": 8991, "train_info/time_within_train_step": 2.643995761871338, "step": 8991} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 8991} {"info/global_step": 8992, "train_info/time_within_train_step": 2.6845109462738037, "step": 8992} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 8992} {"info/global_step": 8993, "train_info/time_within_train_step": 2.6603806018829346, "step": 8993} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 8993} {"info/global_step": 8994, "train_info/time_within_train_step": 2.6769309043884277, "step": 8994} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 8994} {"info/global_step": 8995, "train_info/time_within_train_step": 2.6625638008117676, "step": 8995} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 8995} {"info/global_step": 8996, "train_info/time_within_train_step": 2.700519323348999, "step": 8996} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 8996} {"info/global_step": 8997, "train_info/time_within_train_step": 2.6425061225891113, "step": 8997} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 8997} {"info/global_step": 8998, "train_info/time_within_train_step": 3.2287161350250244, "step": 8998} {"train_info/time_between_train_steps": 0.0033750534057617188, "step": 8998} {"info/global_step": 8999, "train_info/time_within_train_step": 2.646024465560913, "step": 8999} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 8999} {"info/global_step": 9000, "train_info/time_within_train_step": 2.643956422805786, "step": 9000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922669, "_runtime": 25267}, "step": 9000} {"logs": {"train/loss": 2.9657, "train/learning_rate": 6.666666666666666e-05, "train/epoch": 10.04, "_timestamp": 1746922669, "_runtime": 25267}, "step": 9000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922674, "_runtime": 25272}, "step": 9000} {"logs": {"eval/loss": 4.799495697021484, "eval/runtime": 5.2028, "eval/samples_per_second": 36.903, "eval/steps_per_second": 1.153, "train/epoch": 10.04, "_timestamp": 1746922674, "_runtime": 25272}, "step": 9000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922674, "_runtime": 25272}, "step": 9000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.799495697021484, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 121.44915490201791, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.2028, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.903, "train/epoch": 10.04, "_timestamp": 1746922674, "_runtime": 25272}, "step": 9000} {"train_info/time_between_train_steps": 19.44720196723938, "step": 9000} {"info/global_step": 9001, "train_info/time_within_train_step": 2.4501535892486572, "step": 9001} {"train_info/time_between_train_steps": 0.003391265869140625, "step": 9001} {"info/global_step": 9002, "train_info/time_within_train_step": 2.426285982131958, "step": 9002} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 9002} {"info/global_step": 9003, "train_info/time_within_train_step": 2.5399913787841797, "step": 9003} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 9003} {"info/global_step": 9004, "train_info/time_within_train_step": 2.6497044563293457, "step": 9004} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 9004} {"info/global_step": 9005, "train_info/time_within_train_step": 2.6508970260620117, "step": 9005} {"train_info/time_between_train_steps": 0.13057637214660645, "step": 9005} {"info/global_step": 9006, "train_info/time_within_train_step": 2.649946451187134, "step": 9006} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 9006} {"info/global_step": 9007, "train_info/time_within_train_step": 2.6555545330047607, "step": 9007} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 9007} {"info/global_step": 9008, "train_info/time_within_train_step": 2.6431522369384766, "step": 9008} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 9008} {"info/global_step": 9009, "train_info/time_within_train_step": 2.645437002182007, "step": 9009} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 9009} {"info/global_step": 9010, "train_info/time_within_train_step": 2.673671007156372, "step": 9010} {"train_info/time_between_train_steps": 0.0032701492309570312, "step": 9010} {"info/global_step": 9011, "train_info/time_within_train_step": 2.6704890727996826, "step": 9011} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 9011} {"info/global_step": 9012, "train_info/time_within_train_step": 2.660222291946411, "step": 9012} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 9012} {"info/global_step": 9013, "train_info/time_within_train_step": 2.6758649349212646, "step": 9013} {"train_info/time_between_train_steps": 0.003253459930419922, "step": 9013} {"info/global_step": 9014, "train_info/time_within_train_step": 2.644407033920288, "step": 9014} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 9014} {"info/global_step": 9015, "train_info/time_within_train_step": 2.6569159030914307, "step": 9015} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 9015} {"info/global_step": 9016, "train_info/time_within_train_step": 2.6465699672698975, "step": 9016} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 9016} {"info/global_step": 9017, "train_info/time_within_train_step": 2.64810848236084, "step": 9017} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 9017} {"info/global_step": 9018, "train_info/time_within_train_step": 2.667773962020874, "step": 9018} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 9018} {"info/global_step": 9019, "train_info/time_within_train_step": 2.660602569580078, "step": 9019} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 9019} {"info/global_step": 9020, "train_info/time_within_train_step": 2.6569294929504395, "step": 9020} {"train_info/time_between_train_steps": 0.003313302993774414, "step": 9020} {"info/global_step": 9021, "train_info/time_within_train_step": 2.7036447525024414, "step": 9021} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 9021} {"info/global_step": 9022, "train_info/time_within_train_step": 2.6578433513641357, "step": 9022} {"train_info/time_between_train_steps": 0.0033118724822998047, "step": 9022} {"info/global_step": 9023, "train_info/time_within_train_step": 2.6498966217041016, "step": 9023} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 9023} {"info/global_step": 9024, "train_info/time_within_train_step": 2.654040575027466, "step": 9024} {"train_info/time_between_train_steps": 0.0032651424407958984, "step": 9024} {"info/global_step": 9025, "train_info/time_within_train_step": 2.650864839553833, "step": 9025} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 9025} {"info/global_step": 9026, "train_info/time_within_train_step": 2.650202989578247, "step": 9026} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 9026} {"info/global_step": 9027, "train_info/time_within_train_step": 2.653824806213379, "step": 9027} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 9027} {"info/global_step": 9028, "train_info/time_within_train_step": 2.6549148559570312, "step": 9028} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 9028} {"info/global_step": 9029, "train_info/time_within_train_step": 2.6660141944885254, "step": 9029} {"train_info/time_between_train_steps": 0.003275632858276367, "step": 9029} {"info/global_step": 9030, "train_info/time_within_train_step": 2.6799819469451904, "step": 9030} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 9030} {"info/global_step": 9031, "train_info/time_within_train_step": 2.650763988494873, "step": 9031} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 9031} {"info/global_step": 9032, "train_info/time_within_train_step": 2.6424219608306885, "step": 9032} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 9032} {"info/global_step": 9033, "train_info/time_within_train_step": 2.657435178756714, "step": 9033} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 9033} {"info/global_step": 9034, "train_info/time_within_train_step": 2.6514596939086914, "step": 9034} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 9034} {"info/global_step": 9035, "train_info/time_within_train_step": 2.6506574153900146, "step": 9035} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 9035} {"info/global_step": 9036, "train_info/time_within_train_step": 2.649360418319702, "step": 9036} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 9036} {"info/global_step": 9037, "train_info/time_within_train_step": 2.644251585006714, "step": 9037} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 9037} {"info/global_step": 9038, "train_info/time_within_train_step": 2.670163631439209, "step": 9038} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 9038} {"info/global_step": 9039, "train_info/time_within_train_step": 2.6684179306030273, "step": 9039} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 9039} {"info/global_step": 9040, "train_info/time_within_train_step": 2.7128548622131348, "step": 9040} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 9040} {"info/global_step": 9041, "train_info/time_within_train_step": 2.643852710723877, "step": 9041} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 9041} {"info/global_step": 9042, "train_info/time_within_train_step": 2.6605937480926514, "step": 9042} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 9042} {"info/global_step": 9043, "train_info/time_within_train_step": 2.649705648422241, "step": 9043} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 9043} {"info/global_step": 9044, "train_info/time_within_train_step": 2.9611856937408447, "step": 9044} {"train_info/time_between_train_steps": 0.003204345703125, "step": 9044} {"info/global_step": 9045, "train_info/time_within_train_step": 2.6613214015960693, "step": 9045} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 9045} {"info/global_step": 9046, "train_info/time_within_train_step": 2.664463520050049, "step": 9046} {"train_info/time_between_train_steps": 0.0033659934997558594, "step": 9046} {"info/global_step": 9047, "train_info/time_within_train_step": 2.644045114517212, "step": 9047} {"train_info/time_between_train_steps": 0.0033981800079345703, "step": 9047} {"info/global_step": 9048, "train_info/time_within_train_step": 2.6597959995269775, "step": 9048} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 9048} {"info/global_step": 9049, "train_info/time_within_train_step": 2.669174909591675, "step": 9049} {"train_info/time_between_train_steps": 0.003473997116088867, "step": 9049} {"info/global_step": 9050, "train_info/time_within_train_step": 2.6859588623046875, "step": 9050} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922823, "_runtime": 25421}, "step": 9050} {"logs": {"train/loss": 2.962, "train/learning_rate": 6.333333333333333e-05, "train/epoch": 10.04, "_timestamp": 1746922823, "_runtime": 25421}, "step": 9050} {"train_info/time_between_train_steps": 0.031105518341064453, "step": 9050} {"info/global_step": 9051, "train_info/time_within_train_step": 2.6884264945983887, "step": 9051} {"train_info/time_between_train_steps": 0.0034558773040771484, "step": 9051} {"info/global_step": 9052, "train_info/time_within_train_step": 2.689572811126709, "step": 9052} {"train_info/time_between_train_steps": 0.0034825801849365234, "step": 9052} {"info/global_step": 9053, "train_info/time_within_train_step": 2.6809890270233154, "step": 9053} {"train_info/time_between_train_steps": 0.0034139156341552734, "step": 9053} {"info/global_step": 9054, "train_info/time_within_train_step": 2.6437339782714844, "step": 9054} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 9054} {"info/global_step": 9055, "train_info/time_within_train_step": 2.6536664962768555, "step": 9055} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 9055} {"info/global_step": 9056, "train_info/time_within_train_step": 2.656425952911377, "step": 9056} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 9056} {"info/global_step": 9057, "train_info/time_within_train_step": 2.6452600955963135, "step": 9057} {"train_info/time_between_train_steps": 0.003341197967529297, "step": 9057} {"info/global_step": 9058, "train_info/time_within_train_step": 2.6545960903167725, "step": 9058} {"train_info/time_between_train_steps": 0.0035300254821777344, "step": 9058} {"info/global_step": 9059, "train_info/time_within_train_step": 2.6441216468811035, "step": 9059} {"train_info/time_between_train_steps": 0.003461122512817383, "step": 9059} {"info/global_step": 9060, "train_info/time_within_train_step": 2.654892921447754, "step": 9060} {"train_info/time_between_train_steps": 0.003412485122680664, "step": 9060} {"info/global_step": 9061, "train_info/time_within_train_step": 2.6560702323913574, "step": 9061} {"train_info/time_between_train_steps": 0.0035834312438964844, "step": 9061} {"info/global_step": 9062, "train_info/time_within_train_step": 2.672131299972534, "step": 9062} {"train_info/time_between_train_steps": 0.003686666488647461, "step": 9062} {"info/global_step": 9063, "train_info/time_within_train_step": 2.724956750869751, "step": 9063} {"train_info/time_between_train_steps": 0.003423929214477539, "step": 9063} {"info/global_step": 9064, "train_info/time_within_train_step": 2.6675424575805664, "step": 9064} {"train_info/time_between_train_steps": 0.003489971160888672, "step": 9064} {"info/global_step": 9065, "train_info/time_within_train_step": 2.6420280933380127, "step": 9065} {"train_info/time_between_train_steps": 0.003428220748901367, "step": 9065} {"info/global_step": 9066, "train_info/time_within_train_step": 2.652993679046631, "step": 9066} {"train_info/time_between_train_steps": 0.0034935474395751953, "step": 9066} {"info/global_step": 9067, "train_info/time_within_train_step": 2.653791666030884, "step": 9067} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 9067} {"info/global_step": 9068, "train_info/time_within_train_step": 2.8182098865509033, "step": 9068} {"train_info/time_between_train_steps": 0.003313302993774414, "step": 9068} {"info/global_step": 9069, "train_info/time_within_train_step": 2.6593453884124756, "step": 9069} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 9069} {"info/global_step": 9070, "train_info/time_within_train_step": 2.6579601764678955, "step": 9070} {"train_info/time_between_train_steps": 0.003492116928100586, "step": 9070} {"info/global_step": 9071, "train_info/time_within_train_step": 2.6435093879699707, "step": 9071} {"train_info/time_between_train_steps": 0.0033707618713378906, "step": 9071} {"info/global_step": 9072, "train_info/time_within_train_step": 2.6472432613372803, "step": 9072} {"train_info/time_between_train_steps": 0.003671884536743164, "step": 9072} {"info/global_step": 9073, "train_info/time_within_train_step": 2.6612868309020996, "step": 9073} {"train_info/time_between_train_steps": 0.0034246444702148438, "step": 9073} {"info/global_step": 9074, "train_info/time_within_train_step": 2.6692159175872803, "step": 9074} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 9074} {"info/global_step": 9075, "train_info/time_within_train_step": 2.710787534713745, "step": 9075} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 9075} {"info/global_step": 9076, "train_info/time_within_train_step": 2.659029722213745, "step": 9076} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 9076} {"info/global_step": 9077, "train_info/time_within_train_step": 2.6641957759857178, "step": 9077} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 9077} {"info/global_step": 9078, "train_info/time_within_train_step": 2.64284348487854, "step": 9078} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 9078} {"info/global_step": 9079, "train_info/time_within_train_step": 2.651798963546753, "step": 9079} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 9079} {"info/global_step": 9080, "train_info/time_within_train_step": 2.66052508354187, "step": 9080} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 9080} {"info/global_step": 9081, "train_info/time_within_train_step": 2.660876750946045, "step": 9081} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 9081} {"info/global_step": 9082, "train_info/time_within_train_step": 2.6681742668151855, "step": 9082} {"train_info/time_between_train_steps": 0.003270864486694336, "step": 9082} {"info/global_step": 9083, "train_info/time_within_train_step": 2.6856377124786377, "step": 9083} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 9083} {"info/global_step": 9084, "train_info/time_within_train_step": 2.647963523864746, "step": 9084} {"train_info/time_between_train_steps": 0.003504037857055664, "step": 9084} {"info/global_step": 9085, "train_info/time_within_train_step": 2.6879286766052246, "step": 9085} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 9085} {"info/global_step": 9086, "train_info/time_within_train_step": 2.6423633098602295, "step": 9086} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 9086} {"info/global_step": 9087, "train_info/time_within_train_step": 2.649207830429077, "step": 9087} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 9087} {"info/global_step": 9088, "train_info/time_within_train_step": 2.6611599922180176, "step": 9088} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 9088} {"info/global_step": 9089, "train_info/time_within_train_step": 2.6440062522888184, "step": 9089} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 9089} {"info/global_step": 9090, "train_info/time_within_train_step": 2.6451969146728516, "step": 9090} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 9090} {"info/global_step": 9091, "train_info/time_within_train_step": 2.660676956176758, "step": 9091} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 9091} {"info/global_step": 9092, "train_info/time_within_train_step": 2.6616177558898926, "step": 9092} {"train_info/time_between_train_steps": 0.0032553672790527344, "step": 9092} {"info/global_step": 9093, "train_info/time_within_train_step": 2.675018072128296, "step": 9093} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 9093} {"info/global_step": 9094, "train_info/time_within_train_step": 2.668584108352661, "step": 9094} {"train_info/time_between_train_steps": 0.0033745765686035156, "step": 9094} {"info/global_step": 9095, "train_info/time_within_train_step": 2.6969497203826904, "step": 9095} {"train_info/time_between_train_steps": 0.0033147335052490234, "step": 9095} {"info/global_step": 9096, "train_info/time_within_train_step": 2.6414685249328613, "step": 9096} {"train_info/time_between_train_steps": 0.003377676010131836, "step": 9096} {"info/global_step": 9097, "train_info/time_within_train_step": 2.642317295074463, "step": 9097} {"train_info/time_between_train_steps": 0.0035037994384765625, "step": 9097} {"info/global_step": 9098, "train_info/time_within_train_step": 2.6636013984680176, "step": 9098} {"train_info/time_between_train_steps": 0.00342559814453125, "step": 9098} {"info/global_step": 9099, "train_info/time_within_train_step": 2.6486566066741943, "step": 9099} {"train_info/time_between_train_steps": 0.003461599349975586, "step": 9099} {"info/global_step": 9100, "train_info/time_within_train_step": 2.645279884338379, "step": 9100} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746922958, "_runtime": 25556}, "step": 9100} {"logs": {"train/loss": 2.9568, "train/learning_rate": 5.9999999999999995e-05, "train/epoch": 10.05, "_timestamp": 1746922958, "_runtime": 25556}, "step": 9100} {"train_info/time_between_train_steps": 0.04998421669006348, "step": 9100} {"info/global_step": 9101, "train_info/time_within_train_step": 2.6454668045043945, "step": 9101} {"train_info/time_between_train_steps": 0.003454446792602539, "step": 9101} {"info/global_step": 9102, "train_info/time_within_train_step": 2.6615121364593506, "step": 9102} {"train_info/time_between_train_steps": 0.0033905506134033203, "step": 9102} {"info/global_step": 9103, "train_info/time_within_train_step": 2.652449607849121, "step": 9103} {"train_info/time_between_train_steps": 0.0035490989685058594, "step": 9103} {"info/global_step": 9104, "train_info/time_within_train_step": 2.6618173122406006, "step": 9104} {"train_info/time_between_train_steps": 0.003524303436279297, "step": 9104} {"info/global_step": 9105, "train_info/time_within_train_step": 3.025118589401245, "step": 9105} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 9105} {"info/global_step": 9106, "train_info/time_within_train_step": 2.6433658599853516, "step": 9106} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 9106} {"info/global_step": 9107, "train_info/time_within_train_step": 2.658979892730713, "step": 9107} {"train_info/time_between_train_steps": 0.0033011436462402344, "step": 9107} {"info/global_step": 9108, "train_info/time_within_train_step": 2.6435821056365967, "step": 9108} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 9108} {"info/global_step": 9109, "train_info/time_within_train_step": 2.646772623062134, "step": 9109} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 9109} {"info/global_step": 9110, "train_info/time_within_train_step": 2.6500208377838135, "step": 9110} {"train_info/time_between_train_steps": 0.003479480743408203, "step": 9110} {"info/global_step": 9111, "train_info/time_within_train_step": 2.6442668437957764, "step": 9111} {"train_info/time_between_train_steps": 0.0033605098724365234, "step": 9111} {"info/global_step": 9112, "train_info/time_within_train_step": 2.6443283557891846, "step": 9112} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 9112} {"info/global_step": 9113, "train_info/time_within_train_step": 2.6517438888549805, "step": 9113} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 9113} {"info/global_step": 9114, "train_info/time_within_train_step": 2.641178846359253, "step": 9114} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 9114} {"info/global_step": 9115, "train_info/time_within_train_step": 2.689457893371582, "step": 9115} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 9115} {"info/global_step": 9116, "train_info/time_within_train_step": 2.659440040588379, "step": 9116} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 9116} {"info/global_step": 9117, "train_info/time_within_train_step": 2.6454074382781982, "step": 9117} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 9117} {"info/global_step": 9118, "train_info/time_within_train_step": 2.6497678756713867, "step": 9118} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 9118} {"info/global_step": 9119, "train_info/time_within_train_step": 2.6605958938598633, "step": 9119} {"train_info/time_between_train_steps": 0.003265380859375, "step": 9119} {"info/global_step": 9120, "train_info/time_within_train_step": 2.6609110832214355, "step": 9120} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 9120} {"info/global_step": 9121, "train_info/time_within_train_step": 2.673886299133301, "step": 9121} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 9121} {"info/global_step": 9122, "train_info/time_within_train_step": 2.6654632091522217, "step": 9122} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 9122} {"info/global_step": 9123, "train_info/time_within_train_step": 2.70259690284729, "step": 9123} {"train_info/time_between_train_steps": 0.0033142566680908203, "step": 9123} {"info/global_step": 9124, "train_info/time_within_train_step": 2.64239239692688, "step": 9124} {"train_info/time_between_train_steps": 0.0033473968505859375, "step": 9124} {"info/global_step": 9125, "train_info/time_within_train_step": 2.641991138458252, "step": 9125} {"train_info/time_between_train_steps": 0.0035123825073242188, "step": 9125} {"info/global_step": 9126, "train_info/time_within_train_step": 2.6663613319396973, "step": 9126} {"train_info/time_between_train_steps": 0.0034377574920654297, "step": 9126} {"info/global_step": 9127, "train_info/time_within_train_step": 2.6452395915985107, "step": 9127} {"train_info/time_between_train_steps": 0.0034685134887695312, "step": 9127} {"info/global_step": 9128, "train_info/time_within_train_step": 2.645765542984009, "step": 9128} {"train_info/time_between_train_steps": 0.0034990310668945312, "step": 9128} {"info/global_step": 9129, "train_info/time_within_train_step": 2.6549527645111084, "step": 9129} {"train_info/time_between_train_steps": 0.0034346580505371094, "step": 9129} {"info/global_step": 9130, "train_info/time_within_train_step": 2.6515238285064697, "step": 9130} {"train_info/time_between_train_steps": 0.1507425308227539, "step": 9130} {"info/global_step": 9131, "train_info/time_within_train_step": 2.652259111404419, "step": 9131} {"train_info/time_between_train_steps": 0.0034189224243164062, "step": 9131} {"info/global_step": 9132, "train_info/time_within_train_step": 2.666712522506714, "step": 9132} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 9132} {"info/global_step": 9133, "train_info/time_within_train_step": 2.6577534675598145, "step": 9133} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 9133} {"info/global_step": 9134, "train_info/time_within_train_step": 2.6725118160247803, "step": 9134} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 9134} {"info/global_step": 9135, "train_info/time_within_train_step": 2.670877695083618, "step": 9135} {"train_info/time_between_train_steps": 0.003323078155517578, "step": 9135} {"info/global_step": 9136, "train_info/time_within_train_step": 2.6457669734954834, "step": 9136} {"train_info/time_between_train_steps": 0.003249645233154297, "step": 9136} {"info/global_step": 9137, "train_info/time_within_train_step": 2.6513442993164062, "step": 9137} {"train_info/time_between_train_steps": 0.0033087730407714844, "step": 9137} {"info/global_step": 9138, "train_info/time_within_train_step": 2.6446900367736816, "step": 9138} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 9138} {"info/global_step": 9139, "train_info/time_within_train_step": 2.669524669647217, "step": 9139} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 9139} {"info/global_step": 9140, "train_info/time_within_train_step": 2.689765214920044, "step": 9140} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 9140} {"info/global_step": 9141, "train_info/time_within_train_step": 2.660262107849121, "step": 9141} {"train_info/time_between_train_steps": 0.003289461135864258, "step": 9141} {"info/global_step": 9142, "train_info/time_within_train_step": 2.663848638534546, "step": 9142} {"train_info/time_between_train_steps": 0.0033495426177978516, "step": 9142} {"info/global_step": 9143, "train_info/time_within_train_step": 2.640758752822876, "step": 9143} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 9143} {"info/global_step": 9144, "train_info/time_within_train_step": 2.6492538452148438, "step": 9144} {"train_info/time_between_train_steps": 0.003313779830932617, "step": 9144} {"info/global_step": 9145, "train_info/time_within_train_step": 2.660257339477539, "step": 9145} {"train_info/time_between_train_steps": 0.003283977508544922, "step": 9145} {"info/global_step": 9146, "train_info/time_within_train_step": 2.6448445320129395, "step": 9146} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 9146} {"info/global_step": 9147, "train_info/time_within_train_step": 2.645981550216675, "step": 9147} {"train_info/time_between_train_steps": 0.00335693359375, "step": 9147} {"info/global_step": 9148, "train_info/time_within_train_step": 2.671928882598877, "step": 9148} {"train_info/time_between_train_steps": 0.00328826904296875, "step": 9148} {"info/global_step": 9149, "train_info/time_within_train_step": 2.9749910831451416, "step": 9149} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 9149} {"info/global_step": 9150, "train_info/time_within_train_step": 2.6450083255767822, "step": 9150} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746923094, "_runtime": 25692}, "step": 9150} {"logs": {"train/loss": 2.9487, "train/learning_rate": 5.666666666666666e-05, "train/epoch": 10.05, "_timestamp": 1746923094, "_runtime": 25692}, "step": 9150} {"train_info/time_between_train_steps": 0.05298757553100586, "step": 9150} {"info/global_step": 9151, "train_info/time_within_train_step": 2.652662515640259, "step": 9151} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 9151} {"info/global_step": 9152, "train_info/time_within_train_step": 2.6706364154815674, "step": 9152} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 9152} {"info/global_step": 9153, "train_info/time_within_train_step": 2.677619695663452, "step": 9153} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 9153} {"info/global_step": 9154, "train_info/time_within_train_step": 2.649571180343628, "step": 9154} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 9154} {"info/global_step": 9155, "train_info/time_within_train_step": 2.686917304992676, "step": 9155} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 9155} {"info/global_step": 9156, "train_info/time_within_train_step": 2.648557424545288, "step": 9156} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 9156} {"info/global_step": 9157, "train_info/time_within_train_step": 2.6464364528656006, "step": 9157} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 9157} {"info/global_step": 9158, "train_info/time_within_train_step": 2.6498520374298096, "step": 9158} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 9158} {"info/global_step": 9159, "train_info/time_within_train_step": 2.6491379737854004, "step": 9159} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 9159} {"info/global_step": 9160, "train_info/time_within_train_step": 2.647866725921631, "step": 9160} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 9160} {"info/global_step": 9161, "train_info/time_within_train_step": 2.663477659225464, "step": 9161} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 9161} {"info/global_step": 9162, "train_info/time_within_train_step": 2.666386842727661, "step": 9162} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 9162} {"info/global_step": 9163, "train_info/time_within_train_step": 2.6574530601501465, "step": 9163} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 9163} {"info/global_step": 9164, "train_info/time_within_train_step": 2.708827495574951, "step": 9164} {"train_info/time_between_train_steps": 0.003300905227661133, "step": 9164} {"info/global_step": 9165, "train_info/time_within_train_step": 2.6423285007476807, "step": 9165} {"train_info/time_between_train_steps": 0.003529071807861328, "step": 9165} {"info/global_step": 9166, "train_info/time_within_train_step": 2.642300605773926, "step": 9166} {"train_info/time_between_train_steps": 0.003454446792602539, "step": 9166} {"info/global_step": 9167, "train_info/time_within_train_step": 2.6605658531188965, "step": 9167} {"train_info/time_between_train_steps": 0.003520488739013672, "step": 9167} {"info/global_step": 9168, "train_info/time_within_train_step": 2.6546688079833984, "step": 9168} {"train_info/time_between_train_steps": 0.0036208629608154297, "step": 9168} {"info/global_step": 9169, "train_info/time_within_train_step": 2.6447272300720215, "step": 9169} {"train_info/time_between_train_steps": 0.003523588180541992, "step": 9169} {"info/global_step": 9170, "train_info/time_within_train_step": 2.6603169441223145, "step": 9170} {"train_info/time_between_train_steps": 0.003501415252685547, "step": 9170} {"info/global_step": 9171, "train_info/time_within_train_step": 2.6523303985595703, "step": 9171} {"train_info/time_between_train_steps": 0.003576993942260742, "step": 9171} {"info/global_step": 9172, "train_info/time_within_train_step": 2.6627981662750244, "step": 9172} {"train_info/time_between_train_steps": 0.003541707992553711, "step": 9172} {"info/global_step": 9173, "train_info/time_within_train_step": 2.7097582817077637, "step": 9173} {"train_info/time_between_train_steps": 0.0034644603729248047, "step": 9173} {"info/global_step": 9174, "train_info/time_within_train_step": 2.7177321910858154, "step": 9174} {"train_info/time_between_train_steps": 0.0034444332122802734, "step": 9174} {"info/global_step": 9175, "train_info/time_within_train_step": 2.6414036750793457, "step": 9175} {"train_info/time_between_train_steps": 0.0036334991455078125, "step": 9175} {"info/global_step": 9176, "train_info/time_within_train_step": 2.64318585395813, "step": 9176} {"train_info/time_between_train_steps": 0.003445148468017578, "step": 9176} {"info/global_step": 9177, "train_info/time_within_train_step": 2.6648457050323486, "step": 9177} {"train_info/time_between_train_steps": 0.00348663330078125, "step": 9177} {"info/global_step": 9178, "train_info/time_within_train_step": 2.6555447578430176, "step": 9178} {"train_info/time_between_train_steps": 0.0034716129302978516, "step": 9178} {"info/global_step": 9179, "train_info/time_within_train_step": 2.6994662284851074, "step": 9179} {"train_info/time_between_train_steps": 0.003482341766357422, "step": 9179} {"info/global_step": 9180, "train_info/time_within_train_step": 2.663191080093384, "step": 9180} {"train_info/time_between_train_steps": 0.0035147666931152344, "step": 9180} {"info/global_step": 9181, "train_info/time_within_train_step": 2.6937360763549805, "step": 9181} {"train_info/time_between_train_steps": 0.0030422210693359375, "step": 9181} {"info/global_step": 9182, "train_info/time_within_train_step": 2.6582891941070557, "step": 9182} {"train_info/time_between_train_steps": 0.003033161163330078, "step": 9182} {"info/global_step": 9183, "train_info/time_within_train_step": 2.648613214492798, "step": 9183} {"train_info/time_between_train_steps": 0.003073453903198242, "step": 9183} {"info/global_step": 9184, "train_info/time_within_train_step": 2.65286922454834, "step": 9184} {"train_info/time_between_train_steps": 0.003021240234375, "step": 9184} {"info/global_step": 9185, "train_info/time_within_train_step": 2.6501729488372803, "step": 9185} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 9185} {"info/global_step": 9186, "train_info/time_within_train_step": 2.6424622535705566, "step": 9186} {"train_info/time_between_train_steps": 0.003024578094482422, "step": 9186} {"info/global_step": 9187, "train_info/time_within_train_step": 2.6505064964294434, "step": 9187} {"train_info/time_between_train_steps": 0.0030159950256347656, "step": 9187} {"info/global_step": 9188, "train_info/time_within_train_step": 2.669968605041504, "step": 9188} {"train_info/time_between_train_steps": 0.002996683120727539, "step": 9188} {"info/global_step": 9189, "train_info/time_within_train_step": 2.6732726097106934, "step": 9189} {"train_info/time_between_train_steps": 0.0031003952026367188, "step": 9189} {"info/global_step": 9190, "train_info/time_within_train_step": 2.6518495082855225, "step": 9190} {"train_info/time_between_train_steps": 0.0031065940856933594, "step": 9190} {"info/global_step": 9191, "train_info/time_within_train_step": 2.683340549468994, "step": 9191} {"train_info/time_between_train_steps": 0.0030984878540039062, "step": 9191} {"info/global_step": 9192, "train_info/time_within_train_step": 2.6407246589660645, "step": 9192} {"train_info/time_between_train_steps": 0.003048419952392578, "step": 9192} {"info/global_step": 9193, "train_info/time_within_train_step": 2.653322696685791, "step": 9193} {"train_info/time_between_train_steps": 0.0031087398529052734, "step": 9193} {"info/global_step": 9194, "train_info/time_within_train_step": 2.992250680923462, "step": 9194} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 9194} {"info/global_step": 9195, "train_info/time_within_train_step": 2.647233009338379, "step": 9195} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 9195} {"info/global_step": 9196, "train_info/time_within_train_step": 2.683927297592163, "step": 9196} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 9196} {"info/global_step": 9197, "train_info/time_within_train_step": 2.640152931213379, "step": 9197} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 9197} {"info/global_step": 9198, "train_info/time_within_train_step": 2.6447982788085938, "step": 9198} {"train_info/time_between_train_steps": 0.0029337406158447266, "step": 9198} {"info/global_step": 9199, "train_info/time_within_train_step": 2.661668062210083, "step": 9199} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 9199} {"info/global_step": 9200, "train_info/time_within_train_step": 2.6481873989105225, "step": 9200} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746923228, "_runtime": 25826}, "step": 9200} {"logs": {"train/loss": 2.9445, "train/learning_rate": 5.333333333333333e-05, "train/epoch": 10.06, "_timestamp": 1746923228, "_runtime": 25826}, "step": 9200} {"train_info/time_between_train_steps": 13.139978408813477, "step": 9200} {"info/global_step": 9201, "train_info/time_within_train_step": 2.4480338096618652, "step": 9201} {"train_info/time_between_train_steps": 0.0030236244201660156, "step": 9201} {"info/global_step": 9202, "train_info/time_within_train_step": 2.436511754989624, "step": 9202} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 9202} {"info/global_step": 9203, "train_info/time_within_train_step": 2.6016221046447754, "step": 9203} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 9203} {"info/global_step": 9204, "train_info/time_within_train_step": 2.637471914291382, "step": 9204} {"train_info/time_between_train_steps": 0.0029103755950927734, "step": 9204} {"info/global_step": 9205, "train_info/time_within_train_step": 2.6601662635803223, "step": 9205} {"train_info/time_between_train_steps": 0.002931356430053711, "step": 9205} {"info/global_step": 9206, "train_info/time_within_train_step": 2.6616170406341553, "step": 9206} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 9206} {"info/global_step": 9207, "train_info/time_within_train_step": 2.6811559200286865, "step": 9207} {"train_info/time_between_train_steps": 0.002939939498901367, "step": 9207} {"info/global_step": 9208, "train_info/time_within_train_step": 2.659069538116455, "step": 9208} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 9208} {"info/global_step": 9209, "train_info/time_within_train_step": 2.64449143409729, "step": 9209} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 9209} {"info/global_step": 9210, "train_info/time_within_train_step": 2.6485648155212402, "step": 9210} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 9210} {"info/global_step": 9211, "train_info/time_within_train_step": 2.6483511924743652, "step": 9211} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 9211} {"info/global_step": 9212, "train_info/time_within_train_step": 2.6632015705108643, "step": 9212} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 9212} {"info/global_step": 9213, "train_info/time_within_train_step": 2.6577396392822266, "step": 9213} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 9213} {"info/global_step": 9214, "train_info/time_within_train_step": 2.66615629196167, "step": 9214} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 9214} {"info/global_step": 9215, "train_info/time_within_train_step": 2.6852657794952393, "step": 9215} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 9215} {"info/global_step": 9216, "train_info/time_within_train_step": 2.663844347000122, "step": 9216} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 9216} {"info/global_step": 9217, "train_info/time_within_train_step": 2.648686170578003, "step": 9217} {"train_info/time_between_train_steps": 0.003007650375366211, "step": 9217} {"info/global_step": 9218, "train_info/time_within_train_step": 2.652024745941162, "step": 9218} {"train_info/time_between_train_steps": 0.002960205078125, "step": 9218} {"info/global_step": 9219, "train_info/time_within_train_step": 2.6493442058563232, "step": 9219} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 9219} {"info/global_step": 9220, "train_info/time_within_train_step": 2.6496286392211914, "step": 9220} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 9220} {"info/global_step": 9221, "train_info/time_within_train_step": 2.6465768814086914, "step": 9221} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 9221} {"info/global_step": 9222, "train_info/time_within_train_step": 2.655104160308838, "step": 9222} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 9222} {"info/global_step": 9223, "train_info/time_within_train_step": 2.6576833724975586, "step": 9223} {"train_info/time_between_train_steps": 0.003046751022338867, "step": 9223} {"info/global_step": 9224, "train_info/time_within_train_step": 2.6729164123535156, "step": 9224} {"train_info/time_between_train_steps": 0.002996206283569336, "step": 9224} {"info/global_step": 9225, "train_info/time_within_train_step": 2.7277936935424805, "step": 9225} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 9225} {"info/global_step": 9226, "train_info/time_within_train_step": 2.6602542400360107, "step": 9226} {"train_info/time_between_train_steps": 0.002938985824584961, "step": 9226} {"info/global_step": 9227, "train_info/time_within_train_step": 2.6421329975128174, "step": 9227} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 9227} {"info/global_step": 9228, "train_info/time_within_train_step": 2.660144567489624, "step": 9228} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 9228} {"info/global_step": 9229, "train_info/time_within_train_step": 2.6535117626190186, "step": 9229} {"train_info/time_between_train_steps": 0.002931356430053711, "step": 9229} {"info/global_step": 9230, "train_info/time_within_train_step": 2.6452066898345947, "step": 9230} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 9230} {"info/global_step": 9231, "train_info/time_within_train_step": 2.6535096168518066, "step": 9231} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 9231} {"info/global_step": 9232, "train_info/time_within_train_step": 2.649425506591797, "step": 9232} {"train_info/time_between_train_steps": 0.002979755401611328, "step": 9232} {"info/global_step": 9233, "train_info/time_within_train_step": 2.669706106185913, "step": 9233} {"train_info/time_between_train_steps": 0.003010272979736328, "step": 9233} {"info/global_step": 9234, "train_info/time_within_train_step": 2.701878547668457, "step": 9234} {"train_info/time_between_train_steps": 0.0030324459075927734, "step": 9234} {"info/global_step": 9235, "train_info/time_within_train_step": 2.657721519470215, "step": 9235} {"train_info/time_between_train_steps": 0.0030755996704101562, "step": 9235} {"info/global_step": 9236, "train_info/time_within_train_step": 2.664968490600586, "step": 9236} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 9236} {"info/global_step": 9237, "train_info/time_within_train_step": 2.642029047012329, "step": 9237} {"train_info/time_between_train_steps": 0.003084897994995117, "step": 9237} {"info/global_step": 9238, "train_info/time_within_train_step": 2.648851156234741, "step": 9238} {"train_info/time_between_train_steps": 0.003111124038696289, "step": 9238} {"info/global_step": 9239, "train_info/time_within_train_step": 2.6709697246551514, "step": 9239} {"train_info/time_between_train_steps": 0.0030982494354248047, "step": 9239} {"info/global_step": 9240, "train_info/time_within_train_step": 2.6437149047851562, "step": 9240} {"train_info/time_between_train_steps": 0.003091573715209961, "step": 9240} {"info/global_step": 9241, "train_info/time_within_train_step": 2.6452298164367676, "step": 9241} {"train_info/time_between_train_steps": 0.0031037330627441406, "step": 9241} {"info/global_step": 9242, "train_info/time_within_train_step": 2.666321039199829, "step": 9242} {"train_info/time_between_train_steps": 0.003061532974243164, "step": 9242} {"info/global_step": 9243, "train_info/time_within_train_step": 2.6645352840423584, "step": 9243} {"train_info/time_between_train_steps": 0.003065347671508789, "step": 9243} {"info/global_step": 9244, "train_info/time_within_train_step": 2.9285624027252197, "step": 9244} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 9244} {"info/global_step": 9245, "train_info/time_within_train_step": 2.643282413482666, "step": 9245} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 9245} {"info/global_step": 9246, "train_info/time_within_train_step": 2.668178081512451, "step": 9246} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 9246} {"info/global_step": 9247, "train_info/time_within_train_step": 2.6674492359161377, "step": 9247} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 9247} {"info/global_step": 9248, "train_info/time_within_train_step": 3.2100210189819336, "step": 9248} {"train_info/time_between_train_steps": 0.006132364273071289, "step": 9248} {"info/global_step": 9249, "train_info/time_within_train_step": 2.6462795734405518, "step": 9249} {"train_info/time_between_train_steps": 0.0030558109283447266, "step": 9249} {"info/global_step": 9250, "train_info/time_within_train_step": 2.6464200019836426, "step": 9250} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746923376, "_runtime": 25974}, "step": 9250} {"logs": {"train/loss": 2.9348, "train/learning_rate": 4.9999999999999996e-05, "train/epoch": 10.06, "_timestamp": 1746923376, "_runtime": 25974}, "step": 9250} {"train_info/time_between_train_steps": 0.02434682846069336, "step": 9250} {"info/global_step": 9251, "train_info/time_within_train_step": 2.652381658554077, "step": 9251} {"train_info/time_between_train_steps": 0.0030660629272460938, "step": 9251} {"info/global_step": 9252, "train_info/time_within_train_step": 2.643839120864868, "step": 9252} {"train_info/time_between_train_steps": 0.003045797348022461, "step": 9252} {"info/global_step": 9253, "train_info/time_within_train_step": 2.6430470943450928, "step": 9253} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 9253} {"info/global_step": 9254, "train_info/time_within_train_step": 2.661548376083374, "step": 9254} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 9254} {"info/global_step": 9255, "train_info/time_within_train_step": 2.664799213409424, "step": 9255} {"train_info/time_between_train_steps": 0.0030765533447265625, "step": 9255} {"info/global_step": 9256, "train_info/time_within_train_step": 2.682229995727539, "step": 9256} {"train_info/time_between_train_steps": 0.0031020641326904297, "step": 9256} {"info/global_step": 9257, "train_info/time_within_train_step": 2.6706666946411133, "step": 9257} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 9257} {"info/global_step": 9258, "train_info/time_within_train_step": 2.6825082302093506, "step": 9258} {"train_info/time_between_train_steps": 0.0030634403228759766, "step": 9258} {"info/global_step": 9259, "train_info/time_within_train_step": 2.642970561981201, "step": 9259} {"train_info/time_between_train_steps": 0.0030841827392578125, "step": 9259} {"info/global_step": 9260, "train_info/time_within_train_step": 2.6435658931732178, "step": 9260} {"train_info/time_between_train_steps": 0.0030875205993652344, "step": 9260} {"info/global_step": 9261, "train_info/time_within_train_step": 2.6622097492218018, "step": 9261} {"train_info/time_between_train_steps": 0.0030765533447265625, "step": 9261} {"info/global_step": 9262, "train_info/time_within_train_step": 2.6486005783081055, "step": 9262} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 9262} {"info/global_step": 9263, "train_info/time_within_train_step": 2.654284715652466, "step": 9263} {"train_info/time_between_train_steps": 0.0031061172485351562, "step": 9263} {"info/global_step": 9264, "train_info/time_within_train_step": 2.6593892574310303, "step": 9264} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 9264} {"info/global_step": 9265, "train_info/time_within_train_step": 2.6724624633789062, "step": 9265} {"train_info/time_between_train_steps": 0.0030739307403564453, "step": 9265} {"info/global_step": 9266, "train_info/time_within_train_step": 2.670748233795166, "step": 9266} {"train_info/time_between_train_steps": 0.003126859664916992, "step": 9266} {"info/global_step": 9267, "train_info/time_within_train_step": 2.6832683086395264, "step": 9267} {"train_info/time_between_train_steps": 0.0030889511108398438, "step": 9267} {"info/global_step": 9268, "train_info/time_within_train_step": 2.6424076557159424, "step": 9268} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 9268} {"info/global_step": 9269, "train_info/time_within_train_step": 2.657876968383789, "step": 9269} {"train_info/time_between_train_steps": 0.003053903579711914, "step": 9269} {"info/global_step": 9270, "train_info/time_within_train_step": 2.650933265686035, "step": 9270} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 9270} {"info/global_step": 9271, "train_info/time_within_train_step": 2.660648822784424, "step": 9271} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 9271} {"info/global_step": 9272, "train_info/time_within_train_step": 2.7169249057769775, "step": 9272} {"train_info/time_between_train_steps": 0.0030324459075927734, "step": 9272} {"info/global_step": 9273, "train_info/time_within_train_step": 2.640192985534668, "step": 9273} {"train_info/time_between_train_steps": 0.0031015872955322266, "step": 9273} {"info/global_step": 9274, "train_info/time_within_train_step": 2.665030002593994, "step": 9274} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 9274} {"info/global_step": 9275, "train_info/time_within_train_step": 2.6522536277770996, "step": 9275} {"train_info/time_between_train_steps": 0.003100872039794922, "step": 9275} {"info/global_step": 9276, "train_info/time_within_train_step": 2.642430067062378, "step": 9276} {"train_info/time_between_train_steps": 0.003072023391723633, "step": 9276} {"info/global_step": 9277, "train_info/time_within_train_step": 2.6520907878875732, "step": 9277} {"train_info/time_between_train_steps": 0.003136873245239258, "step": 9277} {"info/global_step": 9278, "train_info/time_within_train_step": 2.6491827964782715, "step": 9278} {"train_info/time_between_train_steps": 0.0030672550201416016, "step": 9278} {"info/global_step": 9279, "train_info/time_within_train_step": 2.6678078174591064, "step": 9279} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 9279} {"info/global_step": 9280, "train_info/time_within_train_step": 2.70823073387146, "step": 9280} {"train_info/time_between_train_steps": 0.0030765533447265625, "step": 9280} {"info/global_step": 9281, "train_info/time_within_train_step": 2.6409807205200195, "step": 9281} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 9281} {"info/global_step": 9282, "train_info/time_within_train_step": 2.6518542766571045, "step": 9282} {"train_info/time_between_train_steps": 0.003032207489013672, "step": 9282} {"info/global_step": 9283, "train_info/time_within_train_step": 2.6521949768066406, "step": 9283} {"train_info/time_between_train_steps": 0.0031044483184814453, "step": 9283} {"info/global_step": 9284, "train_info/time_within_train_step": 2.6483919620513916, "step": 9284} {"train_info/time_between_train_steps": 0.0030412673950195312, "step": 9284} {"info/global_step": 9285, "train_info/time_within_train_step": 2.651406764984131, "step": 9285} {"train_info/time_between_train_steps": 0.0030281543731689453, "step": 9285} {"info/global_step": 9286, "train_info/time_within_train_step": 2.6430580615997314, "step": 9286} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 9286} {"info/global_step": 9287, "train_info/time_within_train_step": 2.6503922939300537, "step": 9287} {"train_info/time_between_train_steps": 0.0031147003173828125, "step": 9287} {"info/global_step": 9288, "train_info/time_within_train_step": 2.669553279876709, "step": 9288} {"train_info/time_between_train_steps": 0.0030775070190429688, "step": 9288} {"info/global_step": 9289, "train_info/time_within_train_step": 2.672987461090088, "step": 9289} {"train_info/time_between_train_steps": 0.00308990478515625, "step": 9289} {"info/global_step": 9290, "train_info/time_within_train_step": 2.649500608444214, "step": 9290} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 9290} {"info/global_step": 9291, "train_info/time_within_train_step": 2.6823341846466064, "step": 9291} {"train_info/time_between_train_steps": 0.0030791759490966797, "step": 9291} {"info/global_step": 9292, "train_info/time_within_train_step": 2.6404290199279785, "step": 9292} {"train_info/time_between_train_steps": 0.003113269805908203, "step": 9292} {"info/global_step": 9293, "train_info/time_within_train_step": 2.640983819961548, "step": 9293} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 9293} {"info/global_step": 9294, "train_info/time_within_train_step": 2.6614065170288086, "step": 9294} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 9294} {"info/global_step": 9295, "train_info/time_within_train_step": 2.648155450820923, "step": 9295} {"train_info/time_between_train_steps": 0.0030727386474609375, "step": 9295} {"info/global_step": 9296, "train_info/time_within_train_step": 2.642899751663208, "step": 9296} {"train_info/time_between_train_steps": 0.003125429153442383, "step": 9296} {"info/global_step": 9297, "train_info/time_within_train_step": 2.665480375289917, "step": 9297} {"train_info/time_between_train_steps": 0.003007173538208008, "step": 9297} {"info/global_step": 9298, "train_info/time_within_train_step": 2.65666127204895, "step": 9298} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 9298} {"info/global_step": 9299, "train_info/time_within_train_step": 2.6534390449523926, "step": 9299} {"train_info/time_between_train_steps": 0.0030968189239501953, "step": 9299} {"info/global_step": 9300, "train_info/time_within_train_step": 2.7070930004119873, "step": 9300} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746923510, "_runtime": 26108}, "step": 9300} {"logs": {"train/loss": 2.9319, "train/learning_rate": 4.6666666666666665e-05, "train/epoch": 10.07, "_timestamp": 1746923510, "_runtime": 26108}, "step": 9300} {"train_info/time_between_train_steps": 0.02435135841369629, "step": 9300} {"info/global_step": 9301, "train_info/time_within_train_step": 2.7046048641204834, "step": 9301} {"train_info/time_between_train_steps": 0.0030231475830078125, "step": 9301} {"info/global_step": 9302, "train_info/time_within_train_step": 2.641047477722168, "step": 9302} {"train_info/time_between_train_steps": 0.003055572509765625, "step": 9302} {"info/global_step": 9303, "train_info/time_within_train_step": 2.644763231277466, "step": 9303} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 9303} {"info/global_step": 9304, "train_info/time_within_train_step": 2.6641504764556885, "step": 9304} {"train_info/time_between_train_steps": 0.003065824508666992, "step": 9304} {"info/global_step": 9305, "train_info/time_within_train_step": 2.6472115516662598, "step": 9305} {"train_info/time_between_train_steps": 0.0030372142791748047, "step": 9305} {"info/global_step": 9306, "train_info/time_within_train_step": 2.642082929611206, "step": 9306} {"train_info/time_between_train_steps": 0.0030820369720458984, "step": 9306} {"info/global_step": 9307, "train_info/time_within_train_step": 2.6571078300476074, "step": 9307} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 9307} {"info/global_step": 9308, "train_info/time_within_train_step": 2.650892972946167, "step": 9308} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 9308} {"info/global_step": 9309, "train_info/time_within_train_step": 2.659623622894287, "step": 9309} {"train_info/time_between_train_steps": 0.0030884742736816406, "step": 9309} {"info/global_step": 9310, "train_info/time_within_train_step": 2.710721492767334, "step": 9310} {"train_info/time_between_train_steps": 0.0030870437622070312, "step": 9310} {"info/global_step": 9311, "train_info/time_within_train_step": 2.6889474391937256, "step": 9311} {"train_info/time_between_train_steps": 0.003068685531616211, "step": 9311} {"info/global_step": 9312, "train_info/time_within_train_step": 2.639957904815674, "step": 9312} {"train_info/time_between_train_steps": 0.0030050277709960938, "step": 9312} {"info/global_step": 9313, "train_info/time_within_train_step": 2.64048433303833, "step": 9313} {"train_info/time_between_train_steps": 0.0035195350646972656, "step": 9313} {"info/global_step": 9314, "train_info/time_within_train_step": 2.640730619430542, "step": 9314} {"train_info/time_between_train_steps": 0.003061532974243164, "step": 9314} {"info/global_step": 9315, "train_info/time_within_train_step": 2.648634195327759, "step": 9315} {"train_info/time_between_train_steps": 0.003038644790649414, "step": 9315} {"info/global_step": 9316, "train_info/time_within_train_step": 2.647888422012329, "step": 9316} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 9316} {"info/global_step": 9317, "train_info/time_within_train_step": 2.644782304763794, "step": 9317} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 9317} {"info/global_step": 9318, "train_info/time_within_train_step": 2.6459801197052, "step": 9318} {"train_info/time_between_train_steps": 0.0032677650451660156, "step": 9318} {"info/global_step": 9319, "train_info/time_within_train_step": 2.6443657875061035, "step": 9319} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 9319} {"info/global_step": 9320, "train_info/time_within_train_step": 2.64326810836792, "step": 9320} {"train_info/time_between_train_steps": 0.003119945526123047, "step": 9320} {"info/global_step": 9321, "train_info/time_within_train_step": 2.643566131591797, "step": 9321} {"train_info/time_between_train_steps": 0.003226041793823242, "step": 9321} {"info/global_step": 9322, "train_info/time_within_train_step": 2.6431827545166016, "step": 9322} {"train_info/time_between_train_steps": 0.003106355667114258, "step": 9322} {"info/global_step": 9323, "train_info/time_within_train_step": 2.6473851203918457, "step": 9323} {"train_info/time_between_train_steps": 0.0030739307403564453, "step": 9323} {"info/global_step": 9324, "train_info/time_within_train_step": 2.6539194583892822, "step": 9324} {"train_info/time_between_train_steps": 0.0030050277709960938, "step": 9324} {"info/global_step": 9325, "train_info/time_within_train_step": 2.6392862796783447, "step": 9325} {"train_info/time_between_train_steps": 0.0030634403228759766, "step": 9325} {"info/global_step": 9326, "train_info/time_within_train_step": 2.6387293338775635, "step": 9326} {"train_info/time_between_train_steps": 0.0030295848846435547, "step": 9326} {"info/global_step": 9327, "train_info/time_within_train_step": 2.6446335315704346, "step": 9327} {"train_info/time_between_train_steps": 0.0030171871185302734, "step": 9327} {"info/global_step": 9328, "train_info/time_within_train_step": 2.6429240703582764, "step": 9328} {"train_info/time_between_train_steps": 0.003061056137084961, "step": 9328} {"info/global_step": 9329, "train_info/time_within_train_step": 2.6405556201934814, "step": 9329} {"train_info/time_between_train_steps": 0.003068685531616211, "step": 9329} {"info/global_step": 9330, "train_info/time_within_train_step": 2.6394474506378174, "step": 9330} {"train_info/time_between_train_steps": 0.003050565719604492, "step": 9330} {"info/global_step": 9331, "train_info/time_within_train_step": 2.639312267303467, "step": 9331} {"train_info/time_between_train_steps": 0.0030167102813720703, "step": 9331} {"info/global_step": 9332, "train_info/time_within_train_step": 2.637742042541504, "step": 9332} {"train_info/time_between_train_steps": 0.0030889511108398438, "step": 9332} {"info/global_step": 9333, "train_info/time_within_train_step": 2.6396515369415283, "step": 9333} {"train_info/time_between_train_steps": 0.00308990478515625, "step": 9333} {"info/global_step": 9334, "train_info/time_within_train_step": 2.6380741596221924, "step": 9334} {"train_info/time_between_train_steps": 0.0029964447021484375, "step": 9334} {"info/global_step": 9335, "train_info/time_within_train_step": 2.6379830837249756, "step": 9335} {"train_info/time_between_train_steps": 0.0031011104583740234, "step": 9335} {"info/global_step": 9336, "train_info/time_within_train_step": 2.6399409770965576, "step": 9336} {"train_info/time_between_train_steps": 0.0030503273010253906, "step": 9336} {"info/global_step": 9337, "train_info/time_within_train_step": 2.638561248779297, "step": 9337} {"train_info/time_between_train_steps": 0.0030591487884521484, "step": 9337} {"info/global_step": 9338, "train_info/time_within_train_step": 2.639019727706909, "step": 9338} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 9338} {"info/global_step": 9339, "train_info/time_within_train_step": 2.6387879848480225, "step": 9339} {"train_info/time_between_train_steps": 0.003068685531616211, "step": 9339} {"info/global_step": 9340, "train_info/time_within_train_step": 2.6387805938720703, "step": 9340} {"train_info/time_between_train_steps": 0.003056764602661133, "step": 9340} {"info/global_step": 9341, "train_info/time_within_train_step": 2.63796067237854, "step": 9341} {"train_info/time_between_train_steps": 0.0030248165130615234, "step": 9341} {"info/global_step": 9342, "train_info/time_within_train_step": 2.6386024951934814, "step": 9342} {"train_info/time_between_train_steps": 0.003045797348022461, "step": 9342} {"info/global_step": 9343, "train_info/time_within_train_step": 2.6396548748016357, "step": 9343} {"train_info/time_between_train_steps": 0.0030722618103027344, "step": 9343} {"info/global_step": 9344, "train_info/time_within_train_step": 2.6402268409729004, "step": 9344} {"train_info/time_between_train_steps": 0.003091096878051758, "step": 9344} {"info/global_step": 9345, "train_info/time_within_train_step": 2.6419010162353516, "step": 9345} {"train_info/time_between_train_steps": 0.003126382827758789, "step": 9345} {"info/global_step": 9346, "train_info/time_within_train_step": 2.6418721675872803, "step": 9346} {"train_info/time_between_train_steps": 0.0030646324157714844, "step": 9346} {"info/global_step": 9347, "train_info/time_within_train_step": 2.641279458999634, "step": 9347} {"train_info/time_between_train_steps": 0.0030815601348876953, "step": 9347} {"info/global_step": 9348, "train_info/time_within_train_step": 2.647625207901001, "step": 9348} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 9348} {"info/global_step": 9349, "train_info/time_within_train_step": 2.659818410873413, "step": 9349} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 9349} {"info/global_step": 9350, "train_info/time_within_train_step": 2.665013551712036, "step": 9350} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746923645, "_runtime": 26243}, "step": 9350} {"logs": {"train/loss": 2.926, "train/learning_rate": 4.333333333333333e-05, "train/epoch": 10.07, "_timestamp": 1746923645, "_runtime": 26243}, "step": 9350} {"train_info/time_between_train_steps": 0.023957490921020508, "step": 9350} {"info/global_step": 9351, "train_info/time_within_train_step": 2.649129629135132, "step": 9351} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 9351} {"info/global_step": 9352, "train_info/time_within_train_step": 2.647233724594116, "step": 9352} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 9352} {"info/global_step": 9353, "train_info/time_within_train_step": 2.6403660774230957, "step": 9353} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 9353} {"info/global_step": 9354, "train_info/time_within_train_step": 2.6395487785339355, "step": 9354} {"train_info/time_between_train_steps": 0.003081083297729492, "step": 9354} {"info/global_step": 9355, "train_info/time_within_train_step": 2.6437442302703857, "step": 9355} {"train_info/time_between_train_steps": 0.0030901432037353516, "step": 9355} {"info/global_step": 9356, "train_info/time_within_train_step": 2.637406826019287, "step": 9356} {"train_info/time_between_train_steps": 0.0030798912048339844, "step": 9356} {"info/global_step": 9357, "train_info/time_within_train_step": 2.6403236389160156, "step": 9357} {"train_info/time_between_train_steps": 0.003050565719604492, "step": 9357} {"info/global_step": 9358, "train_info/time_within_train_step": 2.642324209213257, "step": 9358} {"train_info/time_between_train_steps": 0.003034830093383789, "step": 9358} {"info/global_step": 9359, "train_info/time_within_train_step": 2.638801336288452, "step": 9359} {"train_info/time_between_train_steps": 0.003081798553466797, "step": 9359} {"info/global_step": 9360, "train_info/time_within_train_step": 2.651007652282715, "step": 9360} {"train_info/time_between_train_steps": 0.0030274391174316406, "step": 9360} {"info/global_step": 9361, "train_info/time_within_train_step": 2.6387763023376465, "step": 9361} {"train_info/time_between_train_steps": 0.0030922889709472656, "step": 9361} {"info/global_step": 9362, "train_info/time_within_train_step": 2.6366524696350098, "step": 9362} {"train_info/time_between_train_steps": 0.0030350685119628906, "step": 9362} {"info/global_step": 9363, "train_info/time_within_train_step": 2.802730083465576, "step": 9363} {"train_info/time_between_train_steps": 0.002966165542602539, "step": 9363} {"info/global_step": 9364, "train_info/time_within_train_step": 2.6373209953308105, "step": 9364} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 9364} {"info/global_step": 9365, "train_info/time_within_train_step": 2.637906551361084, "step": 9365} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 9365} {"info/global_step": 9366, "train_info/time_within_train_step": 2.637129068374634, "step": 9366} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 9366} {"info/global_step": 9367, "train_info/time_within_train_step": 2.637042999267578, "step": 9367} {"train_info/time_between_train_steps": 0.002934694290161133, "step": 9367} {"info/global_step": 9368, "train_info/time_within_train_step": 2.6498122215270996, "step": 9368} {"train_info/time_between_train_steps": 0.003086090087890625, "step": 9368} {"info/global_step": 9369, "train_info/time_within_train_step": 2.6501381397247314, "step": 9369} {"train_info/time_between_train_steps": 0.003037691116333008, "step": 9369} {"info/global_step": 9370, "train_info/time_within_train_step": 2.6402268409729004, "step": 9370} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 9370} {"info/global_step": 9371, "train_info/time_within_train_step": 2.637075901031494, "step": 9371} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 9371} {"info/global_step": 9372, "train_info/time_within_train_step": 2.637632131576538, "step": 9372} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 9372} {"info/global_step": 9373, "train_info/time_within_train_step": 2.6380906105041504, "step": 9373} {"train_info/time_between_train_steps": 0.0030243396759033203, "step": 9373} {"info/global_step": 9374, "train_info/time_within_train_step": 2.6374971866607666, "step": 9374} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 9374} {"info/global_step": 9375, "train_info/time_within_train_step": 2.638591766357422, "step": 9375} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 9375} {"info/global_step": 9376, "train_info/time_within_train_step": 2.637674570083618, "step": 9376} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 9376} {"info/global_step": 9377, "train_info/time_within_train_step": 2.6370391845703125, "step": 9377} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 9377} {"info/global_step": 9378, "train_info/time_within_train_step": 2.639859437942505, "step": 9378} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 9378} {"info/global_step": 9379, "train_info/time_within_train_step": 2.642707347869873, "step": 9379} {"train_info/time_between_train_steps": 0.003028392791748047, "step": 9379} {"info/global_step": 9380, "train_info/time_within_train_step": 2.6396448612213135, "step": 9380} {"train_info/time_between_train_steps": 0.0029859542846679688, "step": 9380} {"info/global_step": 9381, "train_info/time_within_train_step": 2.6446211338043213, "step": 9381} {"train_info/time_between_train_steps": 0.002991914749145508, "step": 9381} {"info/global_step": 9382, "train_info/time_within_train_step": 2.662501335144043, "step": 9382} {"train_info/time_between_train_steps": 0.0030241012573242188, "step": 9382} {"info/global_step": 9383, "train_info/time_within_train_step": 2.6746418476104736, "step": 9383} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 9383} {"info/global_step": 9384, "train_info/time_within_train_step": 2.6561670303344727, "step": 9384} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 9384} {"info/global_step": 9385, "train_info/time_within_train_step": 2.664034366607666, "step": 9385} {"train_info/time_between_train_steps": 0.0029501914978027344, "step": 9385} {"info/global_step": 9386, "train_info/time_within_train_step": 2.6631686687469482, "step": 9386} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 9386} {"info/global_step": 9387, "train_info/time_within_train_step": 2.653275728225708, "step": 9387} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 9387} {"info/global_step": 9388, "train_info/time_within_train_step": 2.6624014377593994, "step": 9388} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 9388} {"info/global_step": 9389, "train_info/time_within_train_step": 2.6435320377349854, "step": 9389} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 9389} {"info/global_step": 9390, "train_info/time_within_train_step": 2.667983293533325, "step": 9390} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 9390} {"info/global_step": 9391, "train_info/time_within_train_step": 2.6399316787719727, "step": 9391} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 9391} {"info/global_step": 9392, "train_info/time_within_train_step": 2.663358211517334, "step": 9392} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 9392} {"info/global_step": 9393, "train_info/time_within_train_step": 2.641861915588379, "step": 9393} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 9393} {"info/global_step": 9394, "train_info/time_within_train_step": 2.679750919342041, "step": 9394} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 9394} {"info/global_step": 9395, "train_info/time_within_train_step": 2.6407628059387207, "step": 9395} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 9395} {"info/global_step": 9396, "train_info/time_within_train_step": 2.6720378398895264, "step": 9396} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 9396} {"info/global_step": 9397, "train_info/time_within_train_step": 2.641035556793213, "step": 9397} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 9397} {"info/global_step": 9398, "train_info/time_within_train_step": 2.6662213802337646, "step": 9398} {"train_info/time_between_train_steps": 0.002895355224609375, "step": 9398} {"info/global_step": 9399, "train_info/time_within_train_step": 2.6438989639282227, "step": 9399} {"train_info/time_between_train_steps": 0.0029458999633789062, "step": 9399} {"info/global_step": 9400, "train_info/time_within_train_step": 2.68442964553833, "step": 9400} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746923779, "_runtime": 26377}, "step": 9400} {"logs": {"train/loss": 2.9171, "train/learning_rate": 3.9999999999999996e-05, "train/epoch": 10.08, "_timestamp": 1746923779, "_runtime": 26377}, "step": 9400} {"train_info/time_between_train_steps": 12.893197298049927, "step": 9400} {"info/global_step": 9401, "train_info/time_within_train_step": 2.4346578121185303, "step": 9401} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 9401} {"info/global_step": 9402, "train_info/time_within_train_step": 2.4249427318573, "step": 9402} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 9402} {"info/global_step": 9403, "train_info/time_within_train_step": 2.559068202972412, "step": 9403} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 9403} {"info/global_step": 9404, "train_info/time_within_train_step": 2.6620404720306396, "step": 9404} {"train_info/time_between_train_steps": 0.002888202667236328, "step": 9404} {"info/global_step": 9405, "train_info/time_within_train_step": 2.63714599609375, "step": 9405} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 9405} {"info/global_step": 9406, "train_info/time_within_train_step": 2.682065486907959, "step": 9406} {"train_info/time_between_train_steps": 0.0029554367065429688, "step": 9406} {"info/global_step": 9407, "train_info/time_within_train_step": 2.639981985092163, "step": 9407} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 9407} {"info/global_step": 9408, "train_info/time_within_train_step": 2.6744511127471924, "step": 9408} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 9408} {"info/global_step": 9409, "train_info/time_within_train_step": 2.6402180194854736, "step": 9409} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 9409} {"info/global_step": 9410, "train_info/time_within_train_step": 2.6669981479644775, "step": 9410} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 9410} {"info/global_step": 9411, "train_info/time_within_train_step": 2.641639471054077, "step": 9411} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 9411} {"info/global_step": 9412, "train_info/time_within_train_step": 2.6756393909454346, "step": 9412} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 9412} {"info/global_step": 9413, "train_info/time_within_train_step": 2.643246650695801, "step": 9413} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 9413} {"info/global_step": 9414, "train_info/time_within_train_step": 2.671099901199341, "step": 9414} {"train_info/time_between_train_steps": 0.00293731689453125, "step": 9414} {"info/global_step": 9415, "train_info/time_within_train_step": 2.6440484523773193, "step": 9415} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 9415} {"info/global_step": 9416, "train_info/time_within_train_step": 2.6640360355377197, "step": 9416} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 9416} {"info/global_step": 9417, "train_info/time_within_train_step": 2.6460323333740234, "step": 9417} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 9417} {"info/global_step": 9418, "train_info/time_within_train_step": 2.6455063819885254, "step": 9418} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 9418} {"info/global_step": 9419, "train_info/time_within_train_step": 2.64237117767334, "step": 9419} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 9419} {"info/global_step": 9420, "train_info/time_within_train_step": 2.6503641605377197, "step": 9420} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 9420} {"info/global_step": 9421, "train_info/time_within_train_step": 2.64734148979187, "step": 9421} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 9421} {"info/global_step": 9422, "train_info/time_within_train_step": 2.657250165939331, "step": 9422} {"train_info/time_between_train_steps": 0.0029060840606689453, "step": 9422} {"info/global_step": 9423, "train_info/time_within_train_step": 2.6535117626190186, "step": 9423} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 9423} {"info/global_step": 9424, "train_info/time_within_train_step": 2.652320384979248, "step": 9424} {"train_info/time_between_train_steps": 0.002887725830078125, "step": 9424} {"info/global_step": 9425, "train_info/time_within_train_step": 2.75174880027771, "step": 9425} {"train_info/time_between_train_steps": 0.002996206283569336, "step": 9425} {"info/global_step": 9426, "train_info/time_within_train_step": 2.6450119018554688, "step": 9426} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 9426} {"info/global_step": 9427, "train_info/time_within_train_step": 2.6410787105560303, "step": 9427} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 9427} {"info/global_step": 9428, "train_info/time_within_train_step": 2.6454389095306396, "step": 9428} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 9428} {"info/global_step": 9429, "train_info/time_within_train_step": 2.642679214477539, "step": 9429} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 9429} {"info/global_step": 9430, "train_info/time_within_train_step": 2.661480188369751, "step": 9430} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 9430} {"info/global_step": 9431, "train_info/time_within_train_step": 2.6498565673828125, "step": 9431} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 9431} {"info/global_step": 9432, "train_info/time_within_train_step": 2.67195200920105, "step": 9432} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 9432} {"info/global_step": 9433, "train_info/time_within_train_step": 2.650247097015381, "step": 9433} {"train_info/time_between_train_steps": 0.002955913543701172, "step": 9433} {"info/global_step": 9434, "train_info/time_within_train_step": 2.6725313663482666, "step": 9434} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 9434} {"info/global_step": 9435, "train_info/time_within_train_step": 2.6461217403411865, "step": 9435} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 9435} {"info/global_step": 9436, "train_info/time_within_train_step": 2.680028200149536, "step": 9436} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 9436} {"info/global_step": 9437, "train_info/time_within_train_step": 2.6443445682525635, "step": 9437} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 9437} {"info/global_step": 9438, "train_info/time_within_train_step": 2.661461114883423, "step": 9438} {"train_info/time_between_train_steps": 0.002878904342651367, "step": 9438} {"info/global_step": 9439, "train_info/time_within_train_step": 2.6443543434143066, "step": 9439} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 9439} {"info/global_step": 9440, "train_info/time_within_train_step": 2.652066469192505, "step": 9440} {"train_info/time_between_train_steps": 0.002940654754638672, "step": 9440} {"info/global_step": 9441, "train_info/time_within_train_step": 2.6468701362609863, "step": 9441} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 9441} {"info/global_step": 9442, "train_info/time_within_train_step": 2.6525943279266357, "step": 9442} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 9442} {"info/global_step": 9443, "train_info/time_within_train_step": 2.6447830200195312, "step": 9443} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 9443} {"info/global_step": 9444, "train_info/time_within_train_step": 2.6417176723480225, "step": 9444} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 9444} {"info/global_step": 9445, "train_info/time_within_train_step": 2.658766508102417, "step": 9445} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 9445} {"info/global_step": 9446, "train_info/time_within_train_step": 2.641602039337158, "step": 9446} {"train_info/time_between_train_steps": 0.0029947757720947266, "step": 9446} {"info/global_step": 9447, "train_info/time_within_train_step": 2.6551032066345215, "step": 9447} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 9447} {"info/global_step": 9448, "train_info/time_within_train_step": 2.6417946815490723, "step": 9448} {"train_info/time_between_train_steps": 0.0030226707458496094, "step": 9448} {"info/global_step": 9449, "train_info/time_within_train_step": 2.653611898422241, "step": 9449} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 9449} {"info/global_step": 9450, "train_info/time_within_train_step": 2.641606092453003, "step": 9450} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746923925, "_runtime": 26523}, "step": 9450} {"logs": {"train/loss": 2.9164, "train/learning_rate": 3.666666666666666e-05, "train/epoch": 10.08, "_timestamp": 1746923925, "_runtime": 26523}, "step": 9450} {"train_info/time_between_train_steps": 0.024065256118774414, "step": 9450} {"info/global_step": 9451, "train_info/time_within_train_step": 2.6533002853393555, "step": 9451} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 9451} {"info/global_step": 9452, "train_info/time_within_train_step": 2.6459150314331055, "step": 9452} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 9452} {"info/global_step": 9453, "train_info/time_within_train_step": 2.658412218093872, "step": 9453} {"train_info/time_between_train_steps": 0.0030143260955810547, "step": 9453} {"info/global_step": 9454, "train_info/time_within_train_step": 2.656029224395752, "step": 9454} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 9454} {"info/global_step": 9455, "train_info/time_within_train_step": 2.653444528579712, "step": 9455} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 9455} {"info/global_step": 9456, "train_info/time_within_train_step": 2.6724486351013184, "step": 9456} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 9456} {"info/global_step": 9457, "train_info/time_within_train_step": 2.6456286907196045, "step": 9457} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 9457} {"info/global_step": 9458, "train_info/time_within_train_step": 2.685547351837158, "step": 9458} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 9458} {"info/global_step": 9459, "train_info/time_within_train_step": 2.6571481227874756, "step": 9459} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 9459} {"info/global_step": 9460, "train_info/time_within_train_step": 2.668574333190918, "step": 9460} {"train_info/time_between_train_steps": 0.0030286312103271484, "step": 9460} {"info/global_step": 9461, "train_info/time_within_train_step": 2.6466331481933594, "step": 9461} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 9461} {"info/global_step": 9462, "train_info/time_within_train_step": 2.664807081222534, "step": 9462} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 9462} {"info/global_step": 9463, "train_info/time_within_train_step": 2.6483964920043945, "step": 9463} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 9463} {"info/global_step": 9464, "train_info/time_within_train_step": 2.6735451221466064, "step": 9464} {"train_info/time_between_train_steps": 0.0030121803283691406, "step": 9464} {"info/global_step": 9465, "train_info/time_within_train_step": 2.6433684825897217, "step": 9465} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 9465} {"info/global_step": 9466, "train_info/time_within_train_step": 2.668017625808716, "step": 9466} {"train_info/time_between_train_steps": 0.003050565719604492, "step": 9466} {"info/global_step": 9467, "train_info/time_within_train_step": 2.7023019790649414, "step": 9467} {"train_info/time_between_train_steps": 0.00293731689453125, "step": 9467} {"info/global_step": 9468, "train_info/time_within_train_step": 2.6735470294952393, "step": 9468} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 9468} {"info/global_step": 9469, "train_info/time_within_train_step": 2.6415812969207764, "step": 9469} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 9469} {"info/global_step": 9470, "train_info/time_within_train_step": 2.6650683879852295, "step": 9470} {"train_info/time_between_train_steps": 0.0030219554901123047, "step": 9470} {"info/global_step": 9471, "train_info/time_within_train_step": 2.651390790939331, "step": 9471} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 9471} {"info/global_step": 9472, "train_info/time_within_train_step": 2.671006917953491, "step": 9472} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 9472} {"info/global_step": 9473, "train_info/time_within_train_step": 2.646714448928833, "step": 9473} {"train_info/time_between_train_steps": 0.0029802322387695312, "step": 9473} {"info/global_step": 9474, "train_info/time_within_train_step": 2.6820530891418457, "step": 9474} {"train_info/time_between_train_steps": 0.0030667781829833984, "step": 9474} {"info/global_step": 9475, "train_info/time_within_train_step": 2.6479978561401367, "step": 9475} {"train_info/time_between_train_steps": 0.003033161163330078, "step": 9475} {"info/global_step": 9476, "train_info/time_within_train_step": 2.6786606311798096, "step": 9476} {"train_info/time_between_train_steps": 0.003042459487915039, "step": 9476} {"info/global_step": 9477, "train_info/time_within_train_step": 2.642900228500366, "step": 9477} {"train_info/time_between_train_steps": 0.003047466278076172, "step": 9477} {"info/global_step": 9478, "train_info/time_within_train_step": 2.6704883575439453, "step": 9478} {"train_info/time_between_train_steps": 0.003034830093383789, "step": 9478} {"info/global_step": 9479, "train_info/time_within_train_step": 2.6449553966522217, "step": 9479} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 9479} {"info/global_step": 9480, "train_info/time_within_train_step": 2.6692898273468018, "step": 9480} {"train_info/time_between_train_steps": 0.002966165542602539, "step": 9480} {"info/global_step": 9481, "train_info/time_within_train_step": 2.64349102973938, "step": 9481} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 9481} {"info/global_step": 9482, "train_info/time_within_train_step": 2.6708152294158936, "step": 9482} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 9482} {"info/global_step": 9483, "train_info/time_within_train_step": 2.645362377166748, "step": 9483} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 9483} {"info/global_step": 9484, "train_info/time_within_train_step": 2.668059825897217, "step": 9484} {"train_info/time_between_train_steps": 0.0031054019927978516, "step": 9484} {"info/global_step": 9485, "train_info/time_within_train_step": 2.651005744934082, "step": 9485} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 9485} {"info/global_step": 9486, "train_info/time_within_train_step": 2.64984130859375, "step": 9486} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 9486} {"info/global_step": 9487, "train_info/time_within_train_step": 2.647592782974243, "step": 9487} {"train_info/time_between_train_steps": 0.0035085678100585938, "step": 9487} {"info/global_step": 9488, "train_info/time_within_train_step": 2.647670030593872, "step": 9488} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 9488} {"info/global_step": 9489, "train_info/time_within_train_step": 2.650743246078491, "step": 9489} {"train_info/time_between_train_steps": 0.0035848617553710938, "step": 9489} {"info/global_step": 9490, "train_info/time_within_train_step": 2.653358221054077, "step": 9490} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 9490} {"info/global_step": 9491, "train_info/time_within_train_step": 2.652348279953003, "step": 9491} {"train_info/time_between_train_steps": 0.003832101821899414, "step": 9491} {"info/global_step": 9492, "train_info/time_within_train_step": 2.6477136611938477, "step": 9492} {"train_info/time_between_train_steps": 0.003940105438232422, "step": 9492} {"info/global_step": 9493, "train_info/time_within_train_step": 2.6719470024108887, "step": 9493} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 9493} {"train_info/time_between_train_steps": 2.3258402347564697, "step": 9493} {"info/global_step": 9494, "train_info/time_within_train_step": 2.614548444747925, "step": 9494} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 9494} {"info/global_step": 9495, "train_info/time_within_train_step": 2.668696403503418, "step": 9495} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 9495} {"info/global_step": 9496, "train_info/time_within_train_step": 2.6485707759857178, "step": 9496} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 9496} {"info/global_step": 9497, "train_info/time_within_train_step": 2.687861680984497, "step": 9497} {"train_info/time_between_train_steps": 0.0031239986419677734, "step": 9497} {"info/global_step": 9498, "train_info/time_within_train_step": 3.228756904602051, "step": 9498} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 9498} {"info/global_step": 9499, "train_info/time_within_train_step": 2.8878228664398193, "step": 9499} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 9499} {"info/global_step": 9500, "train_info/time_within_train_step": 2.6429505348205566, "step": 9500} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746924062, "_runtime": 26660}, "step": 9500} {"logs": {"train/loss": 2.9298, "train/learning_rate": 3.333333333333333e-05, "train/epoch": 11.0, "_timestamp": 1746924062, "_runtime": 26660}, "step": 9500} {"train_info/time_between_train_steps": 0.024507522583007812, "step": 9500} {"info/global_step": 9501, "train_info/time_within_train_step": 2.641303777694702, "step": 9501} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 9501} {"info/global_step": 9502, "train_info/time_within_train_step": 2.662928819656372, "step": 9502} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 9502} {"info/global_step": 9503, "train_info/time_within_train_step": 2.64180850982666, "step": 9503} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 9503} {"info/global_step": 9504, "train_info/time_within_train_step": 2.6618008613586426, "step": 9504} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 9504} {"info/global_step": 9505, "train_info/time_within_train_step": 2.6486289501190186, "step": 9505} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 9505} {"info/global_step": 9506, "train_info/time_within_train_step": 2.6642282009124756, "step": 9506} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 9506} {"info/global_step": 9507, "train_info/time_within_train_step": 2.646482467651367, "step": 9507} {"train_info/time_between_train_steps": 0.003111124038696289, "step": 9507} {"info/global_step": 9508, "train_info/time_within_train_step": 2.6460418701171875, "step": 9508} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 9508} {"info/global_step": 9509, "train_info/time_within_train_step": 2.656619071960449, "step": 9509} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 9509} {"info/global_step": 9510, "train_info/time_within_train_step": 2.646531820297241, "step": 9510} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 9510} {"info/global_step": 9511, "train_info/time_within_train_step": 2.6572906970977783, "step": 9511} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 9511} {"info/global_step": 9512, "train_info/time_within_train_step": 2.65226411819458, "step": 9512} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 9512} {"info/global_step": 9513, "train_info/time_within_train_step": 2.657060384750366, "step": 9513} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 9513} {"info/global_step": 9514, "train_info/time_within_train_step": 2.6490345001220703, "step": 9514} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 9514} {"info/global_step": 9515, "train_info/time_within_train_step": 2.670074462890625, "step": 9515} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 9515} {"info/global_step": 9516, "train_info/time_within_train_step": 2.6479341983795166, "step": 9516} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 9516} {"info/global_step": 9517, "train_info/time_within_train_step": 2.672171115875244, "step": 9517} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 9517} {"info/global_step": 9518, "train_info/time_within_train_step": 2.652848720550537, "step": 9518} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 9518} {"info/global_step": 9519, "train_info/time_within_train_step": 2.6716818809509277, "step": 9519} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 9519} {"info/global_step": 9520, "train_info/time_within_train_step": 2.648648262023926, "step": 9520} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 9520} {"info/global_step": 9521, "train_info/time_within_train_step": 2.6869232654571533, "step": 9521} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 9521} {"info/global_step": 9522, "train_info/time_within_train_step": 2.6422154903411865, "step": 9522} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 9522} {"info/global_step": 9523, "train_info/time_within_train_step": 2.676584005355835, "step": 9523} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 9523} {"info/global_step": 9524, "train_info/time_within_train_step": 2.642056941986084, "step": 9524} {"train_info/time_between_train_steps": 0.003118753433227539, "step": 9524} {"info/global_step": 9525, "train_info/time_within_train_step": 2.6776556968688965, "step": 9525} {"train_info/time_between_train_steps": 0.0031147003173828125, "step": 9525} {"info/global_step": 9526, "train_info/time_within_train_step": 2.6526846885681152, "step": 9526} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 9526} {"info/global_step": 9527, "train_info/time_within_train_step": 2.6710500717163086, "step": 9527} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 9527} {"info/global_step": 9528, "train_info/time_within_train_step": 2.6462392807006836, "step": 9528} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 9528} {"info/global_step": 9529, "train_info/time_within_train_step": 2.6772396564483643, "step": 9529} {"train_info/time_between_train_steps": 0.0031044483184814453, "step": 9529} {"info/global_step": 9530, "train_info/time_within_train_step": 2.6473116874694824, "step": 9530} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 9530} {"info/global_step": 9531, "train_info/time_within_train_step": 2.667616844177246, "step": 9531} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 9531} {"info/global_step": 9532, "train_info/time_within_train_step": 2.669926643371582, "step": 9532} {"train_info/time_between_train_steps": 0.0031163692474365234, "step": 9532} {"info/global_step": 9533, "train_info/time_within_train_step": 2.643498420715332, "step": 9533} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 9533} {"info/global_step": 9534, "train_info/time_within_train_step": 2.6676275730133057, "step": 9534} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 9534} {"info/global_step": 9535, "train_info/time_within_train_step": 2.644927501678467, "step": 9535} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 9535} {"info/global_step": 9536, "train_info/time_within_train_step": 2.66497802734375, "step": 9536} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 9536} {"info/global_step": 9537, "train_info/time_within_train_step": 2.644073247909546, "step": 9537} {"train_info/time_between_train_steps": 0.003087759017944336, "step": 9537} {"info/global_step": 9538, "train_info/time_within_train_step": 2.673276662826538, "step": 9538} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 9538} {"info/global_step": 9539, "train_info/time_within_train_step": 2.6448445320129395, "step": 9539} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 9539} {"info/global_step": 9540, "train_info/time_within_train_step": 2.6634764671325684, "step": 9540} {"train_info/time_between_train_steps": 0.0030951499938964844, "step": 9540} {"info/global_step": 9541, "train_info/time_within_train_step": 2.646746873855591, "step": 9541} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 9541} {"info/global_step": 9542, "train_info/time_within_train_step": 2.648383378982544, "step": 9542} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 9542} {"info/global_step": 9543, "train_info/time_within_train_step": 2.655123233795166, "step": 9543} {"train_info/time_between_train_steps": 0.0030891895294189453, "step": 9543} {"info/global_step": 9544, "train_info/time_within_train_step": 2.647282838821411, "step": 9544} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 9544} {"info/global_step": 9545, "train_info/time_within_train_step": 2.652390956878662, "step": 9545} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 9545} {"info/global_step": 9546, "train_info/time_within_train_step": 2.6466236114501953, "step": 9546} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 9546} {"info/global_step": 9547, "train_info/time_within_train_step": 2.6506128311157227, "step": 9547} {"train_info/time_between_train_steps": 0.0032668113708496094, "step": 9547} {"info/global_step": 9548, "train_info/time_within_train_step": 2.64676833152771, "step": 9548} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 9548} {"info/global_step": 9549, "train_info/time_within_train_step": 2.669149398803711, "step": 9549} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 9549} {"info/global_step": 9550, "train_info/time_within_train_step": 2.645932674407959, "step": 9550} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746924196, "_runtime": 26794}, "step": 9550} {"logs": {"train/loss": 2.9081, "train/learning_rate": 2.9999999999999997e-05, "train/epoch": 11.01, "_timestamp": 1746924196, "_runtime": 26794}, "step": 9550} {"train_info/time_between_train_steps": 0.025197267532348633, "step": 9550} {"info/global_step": 9551, "train_info/time_within_train_step": 2.677607297897339, "step": 9551} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 9551} {"info/global_step": 9552, "train_info/time_within_train_step": 2.642512798309326, "step": 9552} {"train_info/time_between_train_steps": 0.003466367721557617, "step": 9552} {"info/global_step": 9553, "train_info/time_within_train_step": 2.645733118057251, "step": 9553} {"train_info/time_between_train_steps": 0.003277301788330078, "step": 9553} {"info/global_step": 9554, "train_info/time_within_train_step": 2.6462242603302, "step": 9554} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 9554} {"info/global_step": 9555, "train_info/time_within_train_step": 2.6452693939208984, "step": 9555} {"train_info/time_between_train_steps": 0.003379344940185547, "step": 9555} {"info/global_step": 9556, "train_info/time_within_train_step": 2.7667298316955566, "step": 9556} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 9556} {"info/global_step": 9557, "train_info/time_within_train_step": 2.6547131538391113, "step": 9557} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 9557} {"info/global_step": 9558, "train_info/time_within_train_step": 2.649059772491455, "step": 9558} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 9558} {"info/global_step": 9559, "train_info/time_within_train_step": 2.9115149974823, "step": 9559} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 9559} {"info/global_step": 9560, "train_info/time_within_train_step": 2.657914400100708, "step": 9560} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 9560} {"info/global_step": 9561, "train_info/time_within_train_step": 2.6496145725250244, "step": 9561} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 9561} {"info/global_step": 9562, "train_info/time_within_train_step": 2.674271821975708, "step": 9562} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 9562} {"info/global_step": 9563, "train_info/time_within_train_step": 2.6414635181427, "step": 9563} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 9563} {"info/global_step": 9564, "train_info/time_within_train_step": 2.678290605545044, "step": 9564} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 9564} {"info/global_step": 9565, "train_info/time_within_train_step": 2.6516335010528564, "step": 9565} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 9565} {"info/global_step": 9566, "train_info/time_within_train_step": 2.6696670055389404, "step": 9566} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 9566} {"info/global_step": 9567, "train_info/time_within_train_step": 2.650663137435913, "step": 9567} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 9567} {"info/global_step": 9568, "train_info/time_within_train_step": 2.670095443725586, "step": 9568} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 9568} {"info/global_step": 9569, "train_info/time_within_train_step": 2.6523942947387695, "step": 9569} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 9569} {"info/global_step": 9570, "train_info/time_within_train_step": 2.6796112060546875, "step": 9570} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 9570} {"info/global_step": 9571, "train_info/time_within_train_step": 2.649146556854248, "step": 9571} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 9571} {"info/global_step": 9572, "train_info/time_within_train_step": 2.6882636547088623, "step": 9572} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 9572} {"info/global_step": 9573, "train_info/time_within_train_step": 2.6424152851104736, "step": 9573} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 9573} {"info/global_step": 9574, "train_info/time_within_train_step": 2.6768393516540527, "step": 9574} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 9574} {"info/global_step": 9575, "train_info/time_within_train_step": 2.6423099040985107, "step": 9575} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 9575} {"info/global_step": 9576, "train_info/time_within_train_step": 2.6487977504730225, "step": 9576} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 9576} {"info/global_step": 9577, "train_info/time_within_train_step": 2.6744256019592285, "step": 9577} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 9577} {"info/global_step": 9578, "train_info/time_within_train_step": 2.6523287296295166, "step": 9578} {"train_info/time_between_train_steps": 0.0031168460845947266, "step": 9578} {"info/global_step": 9579, "train_info/time_within_train_step": 2.670231342315674, "step": 9579} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 9579} {"info/global_step": 9580, "train_info/time_within_train_step": 2.6476449966430664, "step": 9580} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 9580} {"info/global_step": 9581, "train_info/time_within_train_step": 2.687281608581543, "step": 9581} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 9581} {"info/global_step": 9582, "train_info/time_within_train_step": 2.6426329612731934, "step": 9582} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 9582} {"info/global_step": 9583, "train_info/time_within_train_step": 2.675593852996826, "step": 9583} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 9583} {"info/global_step": 9584, "train_info/time_within_train_step": 2.643625497817993, "step": 9584} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 9584} {"info/global_step": 9585, "train_info/time_within_train_step": 2.6669602394104004, "step": 9585} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 9585} {"info/global_step": 9586, "train_info/time_within_train_step": 2.646059036254883, "step": 9586} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 9586} {"info/global_step": 9587, "train_info/time_within_train_step": 2.664515495300293, "step": 9587} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 9587} {"info/global_step": 9588, "train_info/time_within_train_step": 2.645698308944702, "step": 9588} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 9588} {"info/global_step": 9589, "train_info/time_within_train_step": 2.673581123352051, "step": 9589} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 9589} {"info/global_step": 9590, "train_info/time_within_train_step": 2.648543357849121, "step": 9590} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 9590} {"info/global_step": 9591, "train_info/time_within_train_step": 2.669801712036133, "step": 9591} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 9591} {"info/global_step": 9592, "train_info/time_within_train_step": 2.6678738594055176, "step": 9592} {"train_info/time_between_train_steps": 0.003173828125, "step": 9592} {"info/global_step": 9593, "train_info/time_within_train_step": 2.671438455581665, "step": 9593} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 9593} {"info/global_step": 9594, "train_info/time_within_train_step": 2.646019697189331, "step": 9594} {"train_info/time_between_train_steps": 0.0035161972045898438, "step": 9594} {"info/global_step": 9595, "train_info/time_within_train_step": 2.685511827468872, "step": 9595} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 9595} {"info/global_step": 9596, "train_info/time_within_train_step": 2.6424052715301514, "step": 9596} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 9596} {"info/global_step": 9597, "train_info/time_within_train_step": 2.672342300415039, "step": 9597} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 9597} {"info/global_step": 9598, "train_info/time_within_train_step": 2.644789695739746, "step": 9598} {"train_info/time_between_train_steps": 0.00312042236328125, "step": 9598} {"info/global_step": 9599, "train_info/time_within_train_step": 2.6647017002105713, "step": 9599} {"train_info/time_between_train_steps": 0.003204345703125, "step": 9599} {"info/global_step": 9600, "train_info/time_within_train_step": 2.6446011066436768, "step": 9600} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746924332, "_runtime": 26930}, "step": 9600} {"logs": {"train/loss": 2.9006, "train/learning_rate": 2.6666666666666667e-05, "train/epoch": 11.01, "_timestamp": 1746924332, "_runtime": 26930}, "step": 9600} {"train_info/time_between_train_steps": 12.677817106246948, "step": 9600} {"info/global_step": 9601, "train_info/time_within_train_step": 2.432509660720825, "step": 9601} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 9601} {"info/global_step": 9602, "train_info/time_within_train_step": 2.438736915588379, "step": 9602} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 9602} {"info/global_step": 9603, "train_info/time_within_train_step": 2.6287224292755127, "step": 9603} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 9603} {"info/global_step": 9604, "train_info/time_within_train_step": 2.6420629024505615, "step": 9604} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 9604} {"info/global_step": 9605, "train_info/time_within_train_step": 2.9071033000946045, "step": 9605} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 9605} {"info/global_step": 9606, "train_info/time_within_train_step": 2.6855599880218506, "step": 9606} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 9606} {"info/global_step": 9607, "train_info/time_within_train_step": 2.6445043087005615, "step": 9607} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 9607} {"info/global_step": 9608, "train_info/time_within_train_step": 2.677142381668091, "step": 9608} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 9608} {"info/global_step": 9609, "train_info/time_within_train_step": 2.6522035598754883, "step": 9609} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 9609} {"info/global_step": 9610, "train_info/time_within_train_step": 2.6657378673553467, "step": 9610} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 9610} {"info/global_step": 9611, "train_info/time_within_train_step": 2.645817518234253, "step": 9611} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 9611} {"info/global_step": 9612, "train_info/time_within_train_step": 2.668567419052124, "step": 9612} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 9612} {"info/global_step": 9613, "train_info/time_within_train_step": 2.6452953815460205, "step": 9613} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 9613} {"info/global_step": 9614, "train_info/time_within_train_step": 2.667325019836426, "step": 9614} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 9614} {"info/global_step": 9615, "train_info/time_within_train_step": 2.6490254402160645, "step": 9615} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 9615} {"info/global_step": 9616, "train_info/time_within_train_step": 2.6625287532806396, "step": 9616} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 9616} {"info/global_step": 9617, "train_info/time_within_train_step": 2.649515151977539, "step": 9617} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 9617} {"info/global_step": 9618, "train_info/time_within_train_step": 2.6618478298187256, "step": 9618} {"train_info/time_between_train_steps": 0.12848567962646484, "step": 9618} {"info/global_step": 9619, "train_info/time_within_train_step": 2.6473283767700195, "step": 9619} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 9619} {"info/global_step": 9620, "train_info/time_within_train_step": 2.6676690578460693, "step": 9620} {"train_info/time_between_train_steps": 0.0034089088439941406, "step": 9620} {"info/global_step": 9621, "train_info/time_within_train_step": 2.6546387672424316, "step": 9621} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 9621} {"info/global_step": 9622, "train_info/time_within_train_step": 2.6711602210998535, "step": 9622} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 9622} {"info/global_step": 9623, "train_info/time_within_train_step": 2.6495845317840576, "step": 9623} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 9623} {"info/global_step": 9624, "train_info/time_within_train_step": 2.6835129261016846, "step": 9624} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 9624} {"info/global_step": 9625, "train_info/time_within_train_step": 2.6506545543670654, "step": 9625} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 9625} {"info/global_step": 9626, "train_info/time_within_train_step": 2.6785669326782227, "step": 9626} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 9626} {"info/global_step": 9627, "train_info/time_within_train_step": 2.6438896656036377, "step": 9627} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 9627} {"info/global_step": 9628, "train_info/time_within_train_step": 2.668975591659546, "step": 9628} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 9628} {"info/global_step": 9629, "train_info/time_within_train_step": 2.6452579498291016, "step": 9629} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 9629} {"info/global_step": 9630, "train_info/time_within_train_step": 2.676558256149292, "step": 9630} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 9630} {"info/global_step": 9631, "train_info/time_within_train_step": 2.6456298828125, "step": 9631} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 9631} {"info/global_step": 9632, "train_info/time_within_train_step": 2.669431686401367, "step": 9632} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 9632} {"info/global_step": 9633, "train_info/time_within_train_step": 2.647183895111084, "step": 9633} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 9633} {"info/global_step": 9634, "train_info/time_within_train_step": 2.6690075397491455, "step": 9634} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 9634} {"info/global_step": 9635, "train_info/time_within_train_step": 2.6551082134246826, "step": 9635} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 9635} {"info/global_step": 9636, "train_info/time_within_train_step": 2.6702892780303955, "step": 9636} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 9636} {"info/global_step": 9637, "train_info/time_within_train_step": 2.6487984657287598, "step": 9637} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 9637} {"info/global_step": 9638, "train_info/time_within_train_step": 2.6792380809783936, "step": 9638} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 9638} {"info/global_step": 9639, "train_info/time_within_train_step": 2.648159980773926, "step": 9639} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 9639} {"info/global_step": 9640, "train_info/time_within_train_step": 2.6675493717193604, "step": 9640} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 9640} {"info/global_step": 9641, "train_info/time_within_train_step": 2.6466519832611084, "step": 9641} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 9641} {"info/global_step": 9642, "train_info/time_within_train_step": 2.6524577140808105, "step": 9642} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 9642} {"info/global_step": 9643, "train_info/time_within_train_step": 2.6462576389312744, "step": 9643} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 9643} {"info/global_step": 9644, "train_info/time_within_train_step": 2.646649122238159, "step": 9644} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 9644} {"info/global_step": 9645, "train_info/time_within_train_step": 2.6462275981903076, "step": 9645} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 9645} {"info/global_step": 9646, "train_info/time_within_train_step": 2.6449708938598633, "step": 9646} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 9646} {"info/global_step": 9647, "train_info/time_within_train_step": 2.653707504272461, "step": 9647} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 9647} {"info/global_step": 9648, "train_info/time_within_train_step": 2.6465888023376465, "step": 9648} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 9648} {"info/global_step": 9649, "train_info/time_within_train_step": 2.655689001083374, "step": 9649} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 9649} {"info/global_step": 9650, "train_info/time_within_train_step": 2.6464550495147705, "step": 9650} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746924478, "_runtime": 27076}, "step": 9650} {"logs": {"train/loss": 2.904, "train/learning_rate": 2.3333333333333332e-05, "train/epoch": 11.02, "_timestamp": 1746924478, "_runtime": 27076}, "step": 9650} {"train_info/time_between_train_steps": 0.02458786964416504, "step": 9650} {"info/global_step": 9651, "train_info/time_within_train_step": 2.643704891204834, "step": 9651} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 9651} {"info/global_step": 9652, "train_info/time_within_train_step": 2.6691205501556396, "step": 9652} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 9652} {"info/global_step": 9653, "train_info/time_within_train_step": 2.646554470062256, "step": 9653} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 9653} {"info/global_step": 9654, "train_info/time_within_train_step": 2.6637744903564453, "step": 9654} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 9654} {"info/global_step": 9655, "train_info/time_within_train_step": 2.647425889968872, "step": 9655} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 9655} {"info/global_step": 9656, "train_info/time_within_train_step": 2.668942928314209, "step": 9656} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 9656} {"info/global_step": 9657, "train_info/time_within_train_step": 2.648904800415039, "step": 9657} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 9657} {"info/global_step": 9658, "train_info/time_within_train_step": 2.6584360599517822, "step": 9658} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 9658} {"info/global_step": 9659, "train_info/time_within_train_step": 2.6468703746795654, "step": 9659} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 9659} {"info/global_step": 9660, "train_info/time_within_train_step": 2.650869131088257, "step": 9660} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 9660} {"info/global_step": 9661, "train_info/time_within_train_step": 2.6443724632263184, "step": 9661} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 9661} {"info/global_step": 9662, "train_info/time_within_train_step": 2.6433703899383545, "step": 9662} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 9662} {"info/global_step": 9663, "train_info/time_within_train_step": 2.644714593887329, "step": 9663} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 9663} {"info/global_step": 9664, "train_info/time_within_train_step": 2.6418285369873047, "step": 9664} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 9664} {"info/global_step": 9665, "train_info/time_within_train_step": 2.6536340713500977, "step": 9665} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 9665} {"info/global_step": 9666, "train_info/time_within_train_step": 2.89814829826355, "step": 9666} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 9666} {"info/global_step": 9667, "train_info/time_within_train_step": 2.6458535194396973, "step": 9667} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 9667} {"info/global_step": 9668, "train_info/time_within_train_step": 2.67105770111084, "step": 9668} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 9668} {"info/global_step": 9669, "train_info/time_within_train_step": 2.6472089290618896, "step": 9669} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 9669} {"info/global_step": 9670, "train_info/time_within_train_step": 2.675153970718384, "step": 9670} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 9670} {"info/global_step": 9671, "train_info/time_within_train_step": 2.6524276733398438, "step": 9671} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 9671} {"info/global_step": 9672, "train_info/time_within_train_step": 2.6717095375061035, "step": 9672} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 9672} {"info/global_step": 9673, "train_info/time_within_train_step": 2.6435608863830566, "step": 9673} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 9673} {"info/global_step": 9674, "train_info/time_within_train_step": 2.6868398189544678, "step": 9674} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 9674} {"info/global_step": 9675, "train_info/time_within_train_step": 2.6428866386413574, "step": 9675} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 9675} {"info/global_step": 9676, "train_info/time_within_train_step": 2.6714401245117188, "step": 9676} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 9676} {"info/global_step": 9677, "train_info/time_within_train_step": 2.642247200012207, "step": 9677} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 9677} {"info/global_step": 9678, "train_info/time_within_train_step": 2.6644444465637207, "step": 9678} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 9678} {"info/global_step": 9679, "train_info/time_within_train_step": 2.645565986633301, "step": 9679} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 9679} {"info/global_step": 9680, "train_info/time_within_train_step": 2.6649529933929443, "step": 9680} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 9680} {"info/global_step": 9681, "train_info/time_within_train_step": 2.823669195175171, "step": 9681} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 9681} {"info/global_step": 9682, "train_info/time_within_train_step": 2.6493916511535645, "step": 9682} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 9682} {"info/global_step": 9683, "train_info/time_within_train_step": 2.660994529724121, "step": 9683} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 9683} {"info/global_step": 9684, "train_info/time_within_train_step": 2.646930456161499, "step": 9684} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 9684} {"info/global_step": 9685, "train_info/time_within_train_step": 2.6407461166381836, "step": 9685} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 9685} {"info/global_step": 9686, "train_info/time_within_train_step": 2.6510162353515625, "step": 9686} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 9686} {"info/global_step": 9687, "train_info/time_within_train_step": 2.645935535430908, "step": 9687} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 9687} {"info/global_step": 9688, "train_info/time_within_train_step": 2.6538407802581787, "step": 9688} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 9688} {"info/global_step": 9689, "train_info/time_within_train_step": 2.6543595790863037, "step": 9689} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 9689} {"info/global_step": 9690, "train_info/time_within_train_step": 2.654237747192383, "step": 9690} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 9690} {"info/global_step": 9691, "train_info/time_within_train_step": 2.6463279724121094, "step": 9691} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 9691} {"info/global_step": 9692, "train_info/time_within_train_step": 2.6689956188201904, "step": 9692} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 9692} {"info/global_step": 9693, "train_info/time_within_train_step": 2.645012855529785, "step": 9693} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 9693} {"info/global_step": 9694, "train_info/time_within_train_step": 2.67313814163208, "step": 9694} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 9694} {"info/global_step": 9695, "train_info/time_within_train_step": 2.652998685836792, "step": 9695} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 9695} {"info/global_step": 9696, "train_info/time_within_train_step": 2.6682560443878174, "step": 9696} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 9696} {"info/global_step": 9697, "train_info/time_within_train_step": 2.647063732147217, "step": 9697} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 9697} {"info/global_step": 9698, "train_info/time_within_train_step": 2.6797192096710205, "step": 9698} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 9698} {"info/global_step": 9699, "train_info/time_within_train_step": 2.666161060333252, "step": 9699} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 9699} {"info/global_step": 9700, "train_info/time_within_train_step": 2.6455564498901367, "step": 9700} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746924613, "_runtime": 27211}, "step": 9700} {"logs": {"train/loss": 2.8844, "train/learning_rate": 1.9999999999999998e-05, "train/epoch": 11.02, "_timestamp": 1746924613, "_runtime": 27211}, "step": 9700} {"train_info/time_between_train_steps": 0.02452993392944336, "step": 9700} {"info/global_step": 9701, "train_info/time_within_train_step": 2.6515915393829346, "step": 9701} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 9701} {"info/global_step": 9702, "train_info/time_within_train_step": 2.642009973526001, "step": 9702} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 9702} {"info/global_step": 9703, "train_info/time_within_train_step": 2.6589109897613525, "step": 9703} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 9703} {"info/global_step": 9704, "train_info/time_within_train_step": 2.6415226459503174, "step": 9704} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 9704} {"info/global_step": 9705, "train_info/time_within_train_step": 2.6554079055786133, "step": 9705} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 9705} {"info/global_step": 9706, "train_info/time_within_train_step": 2.6477692127227783, "step": 9706} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 9706} {"info/global_step": 9707, "train_info/time_within_train_step": 2.6587812900543213, "step": 9707} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 9707} {"info/global_step": 9708, "train_info/time_within_train_step": 2.6712353229522705, "step": 9708} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 9708} {"info/global_step": 9709, "train_info/time_within_train_step": 2.648979425430298, "step": 9709} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 9709} {"info/global_step": 9710, "train_info/time_within_train_step": 2.945734739303589, "step": 9710} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 9710} {"info/global_step": 9711, "train_info/time_within_train_step": 2.670051097869873, "step": 9711} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 9711} {"info/global_step": 9712, "train_info/time_within_train_step": 2.647854804992676, "step": 9712} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 9712} {"info/global_step": 9713, "train_info/time_within_train_step": 2.6863110065460205, "step": 9713} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 9713} {"info/global_step": 9714, "train_info/time_within_train_step": 2.6450886726379395, "step": 9714} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 9714} {"info/global_step": 9715, "train_info/time_within_train_step": 2.6762144565582275, "step": 9715} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 9715} {"info/global_step": 9716, "train_info/time_within_train_step": 2.642456531524658, "step": 9716} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 9716} {"info/global_step": 9717, "train_info/time_within_train_step": 2.6768524646759033, "step": 9717} {"train_info/time_between_train_steps": 0.0032639503479003906, "step": 9717} {"info/global_step": 9718, "train_info/time_within_train_step": 2.649825096130371, "step": 9718} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 9718} {"info/global_step": 9719, "train_info/time_within_train_step": 2.6690616607666016, "step": 9719} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 9719} {"info/global_step": 9720, "train_info/time_within_train_step": 2.648106575012207, "step": 9720} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 9720} {"info/global_step": 9721, "train_info/time_within_train_step": 2.6902694702148438, "step": 9721} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 9721} {"info/global_step": 9722, "train_info/time_within_train_step": 2.64798641204834, "step": 9722} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 9722} {"info/global_step": 9723, "train_info/time_within_train_step": 2.6722960472106934, "step": 9723} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 9723} {"info/global_step": 9724, "train_info/time_within_train_step": 2.6492273807525635, "step": 9724} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 9724} {"info/global_step": 9725, "train_info/time_within_train_step": 2.6704587936401367, "step": 9725} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 9725} {"info/global_step": 9726, "train_info/time_within_train_step": 2.6452207565307617, "step": 9726} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 9726} {"info/global_step": 9727, "train_info/time_within_train_step": 2.6761579513549805, "step": 9727} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 9727} {"info/global_step": 9728, "train_info/time_within_train_step": 2.642634153366089, "step": 9728} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 9728} {"info/global_step": 9729, "train_info/time_within_train_step": 2.660931348800659, "step": 9729} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 9729} {"info/global_step": 9730, "train_info/time_within_train_step": 2.64521861076355, "step": 9730} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 9730} {"info/global_step": 9731, "train_info/time_within_train_step": 2.6513376235961914, "step": 9731} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 9731} {"info/global_step": 9732, "train_info/time_within_train_step": 2.6454367637634277, "step": 9732} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 9732} {"info/global_step": 9733, "train_info/time_within_train_step": 2.643277883529663, "step": 9733} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 9733} {"info/global_step": 9734, "train_info/time_within_train_step": 2.649061441421509, "step": 9734} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 9734} {"info/global_step": 9735, "train_info/time_within_train_step": 2.6437032222747803, "step": 9735} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 9735} {"info/global_step": 9736, "train_info/time_within_train_step": 2.661351442337036, "step": 9736} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 9736} {"info/global_step": 9737, "train_info/time_within_train_step": 2.6611738204956055, "step": 9737} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 9737} {"info/global_step": 9738, "train_info/time_within_train_step": 2.6444549560546875, "step": 9738} {"train_info/time_between_train_steps": 0.003204345703125, "step": 9738} {"info/global_step": 9739, "train_info/time_within_train_step": 2.6496658325195312, "step": 9739} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 9739} {"info/global_step": 9740, "train_info/time_within_train_step": 2.6429781913757324, "step": 9740} {"train_info/time_between_train_steps": 0.0033063888549804688, "step": 9740} {"info/global_step": 9741, "train_info/time_within_train_step": 2.6492674350738525, "step": 9741} {"train_info/time_between_train_steps": 0.003260374069213867, "step": 9741} {"info/global_step": 9742, "train_info/time_within_train_step": 2.651106834411621, "step": 9742} {"train_info/time_between_train_steps": 0.0033273696899414062, "step": 9742} {"info/global_step": 9743, "train_info/time_within_train_step": 2.6474077701568604, "step": 9743} {"train_info/time_between_train_steps": 0.17209529876708984, "step": 9743} {"info/global_step": 9744, "train_info/time_within_train_step": 2.647730827331543, "step": 9744} {"train_info/time_between_train_steps": 0.003361225128173828, "step": 9744} {"info/global_step": 9745, "train_info/time_within_train_step": 2.6714961528778076, "step": 9745} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 9745} {"info/global_step": 9746, "train_info/time_within_train_step": 2.6460318565368652, "step": 9746} {"train_info/time_between_train_steps": 0.0034029483795166016, "step": 9746} {"info/global_step": 9747, "train_info/time_within_train_step": 2.661940574645996, "step": 9747} {"train_info/time_between_train_steps": 0.0033066272735595703, "step": 9747} {"info/global_step": 9748, "train_info/time_within_train_step": 3.235522508621216, "step": 9748} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 9748} {"info/global_step": 9749, "train_info/time_within_train_step": 2.660149097442627, "step": 9749} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 9749} {"info/global_step": 9750, "train_info/time_within_train_step": 2.6421072483062744, "step": 9750} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746924749, "_runtime": 27347}, "step": 9750} {"logs": {"train/loss": 2.8892, "train/learning_rate": 1.6666666666666664e-05, "train/epoch": 11.03, "_timestamp": 1746924748, "_runtime": 27346}, "step": 9750} {"train_info/time_between_train_steps": 0.02471184730529785, "step": 9750} {"info/global_step": 9751, "train_info/time_within_train_step": 2.6844289302825928, "step": 9751} {"train_info/time_between_train_steps": 0.0033767223358154297, "step": 9751} {"info/global_step": 9752, "train_info/time_within_train_step": 2.6434009075164795, "step": 9752} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 9752} {"info/global_step": 9753, "train_info/time_within_train_step": 2.6649603843688965, "step": 9753} {"train_info/time_between_train_steps": 0.003313779830932617, "step": 9753} {"info/global_step": 9754, "train_info/time_within_train_step": 2.6444461345672607, "step": 9754} {"train_info/time_between_train_steps": 0.0034317970275878906, "step": 9754} {"info/global_step": 9755, "train_info/time_within_train_step": 2.6517035961151123, "step": 9755} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 9755} {"info/global_step": 9756, "train_info/time_within_train_step": 2.6456706523895264, "step": 9756} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 9756} {"info/global_step": 9757, "train_info/time_within_train_step": 2.652333974838257, "step": 9757} {"train_info/time_between_train_steps": 0.0033884048461914062, "step": 9757} {"info/global_step": 9758, "train_info/time_within_train_step": 2.646728754043579, "step": 9758} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 9758} {"info/global_step": 9759, "train_info/time_within_train_step": 2.6412715911865234, "step": 9759} {"train_info/time_between_train_steps": 0.003389596939086914, "step": 9759} {"info/global_step": 9760, "train_info/time_within_train_step": 2.6455843448638916, "step": 9760} {"train_info/time_between_train_steps": 0.003499746322631836, "step": 9760} {"info/global_step": 9761, "train_info/time_within_train_step": 2.6401143074035645, "step": 9761} {"train_info/time_between_train_steps": 0.0033910274505615234, "step": 9761} {"info/global_step": 9762, "train_info/time_within_train_step": 2.654191732406616, "step": 9762} {"train_info/time_between_train_steps": 0.0033273696899414062, "step": 9762} {"info/global_step": 9763, "train_info/time_within_train_step": 2.6403393745422363, "step": 9763} {"train_info/time_between_train_steps": 0.0034570693969726562, "step": 9763} {"info/global_step": 9764, "train_info/time_within_train_step": 2.6524879932403564, "step": 9764} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 9764} {"info/global_step": 9765, "train_info/time_within_train_step": 2.640751600265503, "step": 9765} {"train_info/time_between_train_steps": 0.0033273696899414062, "step": 9765} {"info/global_step": 9766, "train_info/time_within_train_step": 2.6824469566345215, "step": 9766} {"train_info/time_between_train_steps": 0.0032606124877929688, "step": 9766} {"info/global_step": 9767, "train_info/time_within_train_step": 2.6577582359313965, "step": 9767} {"train_info/time_between_train_steps": 0.0033249855041503906, "step": 9767} {"info/global_step": 9768, "train_info/time_within_train_step": 2.6713173389434814, "step": 9768} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 9768} {"info/global_step": 9769, "train_info/time_within_train_step": 2.6497766971588135, "step": 9769} {"train_info/time_between_train_steps": 0.003386259078979492, "step": 9769} {"info/global_step": 9770, "train_info/time_within_train_step": 2.6874501705169678, "step": 9770} {"train_info/time_between_train_steps": 0.0033538341522216797, "step": 9770} {"info/global_step": 9771, "train_info/time_within_train_step": 2.6447784900665283, "step": 9771} {"train_info/time_between_train_steps": 0.0033690929412841797, "step": 9771} {"info/global_step": 9772, "train_info/time_within_train_step": 2.6749844551086426, "step": 9772} {"train_info/time_between_train_steps": 0.0033745765686035156, "step": 9772} {"info/global_step": 9773, "train_info/time_within_train_step": 2.6431827545166016, "step": 9773} {"train_info/time_between_train_steps": 0.003501415252685547, "step": 9773} {"info/global_step": 9774, "train_info/time_within_train_step": 2.6638083457946777, "step": 9774} {"train_info/time_between_train_steps": 0.0035109519958496094, "step": 9774} {"info/global_step": 9775, "train_info/time_within_train_step": 2.6469831466674805, "step": 9775} {"train_info/time_between_train_steps": 0.003594636917114258, "step": 9775} {"info/global_step": 9776, "train_info/time_within_train_step": 2.6476306915283203, "step": 9776} {"train_info/time_between_train_steps": 0.0034983158111572266, "step": 9776} {"info/global_step": 9777, "train_info/time_within_train_step": 2.6635324954986572, "step": 9777} {"train_info/time_between_train_steps": 0.0035398006439208984, "step": 9777} {"info/global_step": 9778, "train_info/time_within_train_step": 2.644662857055664, "step": 9778} {"train_info/time_between_train_steps": 0.0034835338592529297, "step": 9778} {"info/global_step": 9779, "train_info/time_within_train_step": 2.669058084487915, "step": 9779} {"train_info/time_between_train_steps": 0.0034897327423095703, "step": 9779} {"info/global_step": 9780, "train_info/time_within_train_step": 2.6447441577911377, "step": 9780} {"train_info/time_between_train_steps": 0.003481149673461914, "step": 9780} {"info/global_step": 9781, "train_info/time_within_train_step": 2.6610331535339355, "step": 9781} {"train_info/time_between_train_steps": 0.0035254955291748047, "step": 9781} {"info/global_step": 9782, "train_info/time_within_train_step": 2.6464643478393555, "step": 9782} {"train_info/time_between_train_steps": 0.003477334976196289, "step": 9782} {"info/global_step": 9783, "train_info/time_within_train_step": 2.6527655124664307, "step": 9783} {"train_info/time_between_train_steps": 0.0034797191619873047, "step": 9783} {"info/global_step": 9784, "train_info/time_within_train_step": 2.6458241939544678, "step": 9784} {"train_info/time_between_train_steps": 0.0034432411193847656, "step": 9784} {"info/global_step": 9785, "train_info/time_within_train_step": 2.6458566188812256, "step": 9785} {"train_info/time_between_train_steps": 0.0035495758056640625, "step": 9785} {"info/global_step": 9786, "train_info/time_within_train_step": 2.6453378200531006, "step": 9786} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 9786} {"info/global_step": 9787, "train_info/time_within_train_step": 2.643996477127075, "step": 9787} {"train_info/time_between_train_steps": 0.0035164356231689453, "step": 9787} {"info/global_step": 9788, "train_info/time_within_train_step": 2.6540844440460205, "step": 9788} {"train_info/time_between_train_steps": 0.0034999847412109375, "step": 9788} {"info/global_step": 9789, "train_info/time_within_train_step": 2.6495301723480225, "step": 9789} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 9789} {"info/global_step": 9790, "train_info/time_within_train_step": 2.6555614471435547, "step": 9790} {"train_info/time_between_train_steps": 0.0034570693969726562, "step": 9790} {"info/global_step": 9791, "train_info/time_within_train_step": 2.6594529151916504, "step": 9791} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 9791} {"info/global_step": 9792, "train_info/time_within_train_step": 2.6533362865448, "step": 9792} {"train_info/time_between_train_steps": 0.003520965576171875, "step": 9792} {"info/global_step": 9793, "train_info/time_within_train_step": 2.647245407104492, "step": 9793} {"train_info/time_between_train_steps": 0.0034036636352539062, "step": 9793} {"info/global_step": 9794, "train_info/time_within_train_step": 2.6547226905822754, "step": 9794} {"train_info/time_between_train_steps": 0.0034945011138916016, "step": 9794} {"info/global_step": 9795, "train_info/time_within_train_step": 2.64766263961792, "step": 9795} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 9795} {"info/global_step": 9796, "train_info/time_within_train_step": 2.653233766555786, "step": 9796} {"train_info/time_between_train_steps": 0.003435373306274414, "step": 9796} {"info/global_step": 9797, "train_info/time_within_train_step": 2.652676820755005, "step": 9797} {"train_info/time_between_train_steps": 0.0033812522888183594, "step": 9797} {"info/global_step": 9798, "train_info/time_within_train_step": 2.6529698371887207, "step": 9798} {"train_info/time_between_train_steps": 0.003460407257080078, "step": 9798} {"info/global_step": 9799, "train_info/time_within_train_step": 2.648149251937866, "step": 9799} {"train_info/time_between_train_steps": 0.0033941268920898438, "step": 9799} {"info/global_step": 9800, "train_info/time_within_train_step": 2.669078826904297, "step": 9800} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746924882, "_runtime": 27480}, "step": 9800} {"logs": {"train/loss": 2.8853, "train/learning_rate": 1.3333333333333333e-05, "train/epoch": 11.03, "_timestamp": 1746924882, "_runtime": 27480}, "step": 9800} {"train_info/time_between_train_steps": 13.748565435409546, "step": 9800} {"info/global_step": 9801, "train_info/time_within_train_step": 2.484501600265503, "step": 9801} {"train_info/time_between_train_steps": 0.0034058094024658203, "step": 9801} {"info/global_step": 9802, "train_info/time_within_train_step": 2.4517879486083984, "step": 9802} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 9802} {"info/global_step": 9803, "train_info/time_within_train_step": 2.587961196899414, "step": 9803} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 9803} {"info/global_step": 9804, "train_info/time_within_train_step": 2.635800361633301, "step": 9804} {"train_info/time_between_train_steps": 0.0034286975860595703, "step": 9804} {"info/global_step": 9805, "train_info/time_within_train_step": 3.009786605834961, "step": 9805} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 9805} {"info/global_step": 9806, "train_info/time_within_train_step": 2.7977943420410156, "step": 9806} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 9806} {"info/global_step": 9807, "train_info/time_within_train_step": 2.668433904647827, "step": 9807} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 9807} {"info/global_step": 9808, "train_info/time_within_train_step": 2.647557258605957, "step": 9808} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 9808} {"info/global_step": 9809, "train_info/time_within_train_step": 2.6879096031188965, "step": 9809} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 9809} {"info/global_step": 9810, "train_info/time_within_train_step": 2.6444878578186035, "step": 9810} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 9810} {"info/global_step": 9811, "train_info/time_within_train_step": 2.6750738620758057, "step": 9811} {"train_info/time_between_train_steps": 0.0032203197479248047, "step": 9811} {"info/global_step": 9812, "train_info/time_within_train_step": 2.6438281536102295, "step": 9812} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 9812} {"info/global_step": 9813, "train_info/time_within_train_step": 2.664534091949463, "step": 9813} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 9813} {"info/global_step": 9814, "train_info/time_within_train_step": 2.65030837059021, "step": 9814} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 9814} {"info/global_step": 9815, "train_info/time_within_train_step": 2.665377378463745, "step": 9815} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 9815} {"info/global_step": 9816, "train_info/time_within_train_step": 2.6487159729003906, "step": 9816} {"train_info/time_between_train_steps": 0.003247976303100586, "step": 9816} {"info/global_step": 9817, "train_info/time_within_train_step": 2.677849531173706, "step": 9817} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 9817} {"info/global_step": 9818, "train_info/time_within_train_step": 2.641310214996338, "step": 9818} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 9818} {"info/global_step": 9819, "train_info/time_within_train_step": 2.669849395751953, "step": 9819} {"train_info/time_between_train_steps": 0.003264904022216797, "step": 9819} {"info/global_step": 9820, "train_info/time_within_train_step": 2.645566701889038, "step": 9820} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 9820} {"info/global_step": 9821, "train_info/time_within_train_step": 2.6641855239868164, "step": 9821} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 9821} {"info/global_step": 9822, "train_info/time_within_train_step": 2.64613938331604, "step": 9822} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 9822} {"info/global_step": 9823, "train_info/time_within_train_step": 2.6774842739105225, "step": 9823} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 9823} {"info/global_step": 9824, "train_info/time_within_train_step": 2.6477670669555664, "step": 9824} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 9824} {"info/global_step": 9825, "train_info/time_within_train_step": 2.6704180240631104, "step": 9825} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 9825} {"info/global_step": 9826, "train_info/time_within_train_step": 2.654555320739746, "step": 9826} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 9826} {"info/global_step": 9827, "train_info/time_within_train_step": 2.6693339347839355, "step": 9827} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 9827} {"info/global_step": 9828, "train_info/time_within_train_step": 2.647874593734741, "step": 9828} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 9828} {"info/global_step": 9829, "train_info/time_within_train_step": 2.6822991371154785, "step": 9829} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 9829} {"info/global_step": 9830, "train_info/time_within_train_step": 2.6497597694396973, "step": 9830} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 9830} {"info/global_step": 9831, "train_info/time_within_train_step": 2.6772191524505615, "step": 9831} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 9831} {"info/global_step": 9832, "train_info/time_within_train_step": 2.643887996673584, "step": 9832} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 9832} {"info/global_step": 9833, "train_info/time_within_train_step": 2.670053482055664, "step": 9833} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 9833} {"info/global_step": 9834, "train_info/time_within_train_step": 2.64493727684021, "step": 9834} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 9834} {"info/global_step": 9835, "train_info/time_within_train_step": 2.6662023067474365, "step": 9835} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 9835} {"info/global_step": 9836, "train_info/time_within_train_step": 2.6456363201141357, "step": 9836} {"train_info/time_between_train_steps": 0.0032706260681152344, "step": 9836} {"info/global_step": 9837, "train_info/time_within_train_step": 2.6752419471740723, "step": 9837} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 9837} {"info/global_step": 9838, "train_info/time_within_train_step": 2.6479201316833496, "step": 9838} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 9838} {"info/global_step": 9839, "train_info/time_within_train_step": 2.6712348461151123, "step": 9839} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 9839} {"info/global_step": 9840, "train_info/time_within_train_step": 2.6542608737945557, "step": 9840} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 9840} {"info/global_step": 9841, "train_info/time_within_train_step": 2.672292709350586, "step": 9841} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 9841} {"info/global_step": 9842, "train_info/time_within_train_step": 2.6514086723327637, "step": 9842} {"train_info/time_between_train_steps": 0.0032634735107421875, "step": 9842} {"info/global_step": 9843, "train_info/time_within_train_step": 2.687563896179199, "step": 9843} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 9843} {"info/global_step": 9844, "train_info/time_within_train_step": 2.646469831466675, "step": 9844} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 9844} {"info/global_step": 9845, "train_info/time_within_train_step": 2.6720986366271973, "step": 9845} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 9845} {"info/global_step": 9846, "train_info/time_within_train_step": 2.646690845489502, "step": 9846} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 9846} {"info/global_step": 9847, "train_info/time_within_train_step": 2.669543981552124, "step": 9847} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 9847} {"info/global_step": 9848, "train_info/time_within_train_step": 2.6535797119140625, "step": 9848} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 9848} {"info/global_step": 9849, "train_info/time_within_train_step": 2.669473648071289, "step": 9849} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 9849} {"info/global_step": 9850, "train_info/time_within_train_step": 2.6659789085388184, "step": 9850} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925030, "_runtime": 27628}, "step": 9850} {"logs": {"train/loss": 2.889, "train/learning_rate": 9.999999999999999e-06, "train/epoch": 11.04, "_timestamp": 1746925030, "_runtime": 27628}, "step": 9850} {"train_info/time_between_train_steps": 0.024756669998168945, "step": 9850} {"info/global_step": 9851, "train_info/time_within_train_step": 2.6457290649414062, "step": 9851} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 9851} {"info/global_step": 9852, "train_info/time_within_train_step": 2.684278726577759, "step": 9852} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 9852} {"info/global_step": 9853, "train_info/time_within_train_step": 2.643767833709717, "step": 9853} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 9853} {"info/global_step": 9854, "train_info/time_within_train_step": 2.6689038276672363, "step": 9854} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 9854} {"info/global_step": 9855, "train_info/time_within_train_step": 2.647902488708496, "step": 9855} {"train_info/time_between_train_steps": 0.0032575130462646484, "step": 9855} {"info/global_step": 9856, "train_info/time_within_train_step": 2.6699585914611816, "step": 9856} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 9856} {"info/global_step": 9857, "train_info/time_within_train_step": 2.6541380882263184, "step": 9857} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 9857} {"info/global_step": 9858, "train_info/time_within_train_step": 2.671356678009033, "step": 9858} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 9858} {"info/global_step": 9859, "train_info/time_within_train_step": 2.648681163787842, "step": 9859} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 9859} {"info/global_step": 9860, "train_info/time_within_train_step": 2.684596300125122, "step": 9860} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 9860} {"info/global_step": 9861, "train_info/time_within_train_step": 2.647994041442871, "step": 9861} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 9861} {"info/global_step": 9862, "train_info/time_within_train_step": 2.667292833328247, "step": 9862} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 9862} {"info/global_step": 9863, "train_info/time_within_train_step": 2.6479651927948, "step": 9863} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 9863} {"info/global_step": 9864, "train_info/time_within_train_step": 2.6608963012695312, "step": 9864} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 9864} {"info/global_step": 9865, "train_info/time_within_train_step": 2.645677089691162, "step": 9865} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 9865} {"info/global_step": 9866, "train_info/time_within_train_step": 2.645901918411255, "step": 9866} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 9866} {"info/global_step": 9867, "train_info/time_within_train_step": 2.643932819366455, "step": 9867} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 9867} {"info/global_step": 9868, "train_info/time_within_train_step": 2.648890733718872, "step": 9868} {"train_info/time_between_train_steps": 0.13380813598632812, "step": 9868} {"info/global_step": 9869, "train_info/time_within_train_step": 2.663949728012085, "step": 9869} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 9869} {"info/global_step": 9870, "train_info/time_within_train_step": 2.6756768226623535, "step": 9870} {"train_info/time_between_train_steps": 0.0032958984375, "step": 9870} {"info/global_step": 9871, "train_info/time_within_train_step": 2.648428440093994, "step": 9871} {"train_info/time_between_train_steps": 0.0033636093139648438, "step": 9871} {"info/global_step": 9872, "train_info/time_within_train_step": 2.6738810539245605, "step": 9872} {"train_info/time_between_train_steps": 0.0033342838287353516, "step": 9872} {"info/global_step": 9873, "train_info/time_within_train_step": 2.653850555419922, "step": 9873} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 9873} {"info/global_step": 9874, "train_info/time_within_train_step": 2.6714279651641846, "step": 9874} {"train_info/time_between_train_steps": 0.0033223628997802734, "step": 9874} {"info/global_step": 9875, "train_info/time_within_train_step": 2.645545244216919, "step": 9875} {"train_info/time_between_train_steps": 0.003449678421020508, "step": 9875} {"info/global_step": 9876, "train_info/time_within_train_step": 2.6807565689086914, "step": 9876} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 9876} {"info/global_step": 9877, "train_info/time_within_train_step": 2.6443803310394287, "step": 9877} {"train_info/time_between_train_steps": 0.0033545494079589844, "step": 9877} {"info/global_step": 9878, "train_info/time_within_train_step": 2.6683197021484375, "step": 9878} {"train_info/time_between_train_steps": 0.003457307815551758, "step": 9878} {"info/global_step": 9879, "train_info/time_within_train_step": 2.648111343383789, "step": 9879} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 9879} {"info/global_step": 9880, "train_info/time_within_train_step": 2.6694605350494385, "step": 9880} {"train_info/time_between_train_steps": 0.0033698081970214844, "step": 9880} {"info/global_step": 9881, "train_info/time_within_train_step": 2.654151439666748, "step": 9881} {"train_info/time_between_train_steps": 0.003354310989379883, "step": 9881} {"info/global_step": 9882, "train_info/time_within_train_step": 2.6783759593963623, "step": 9882} {"train_info/time_between_train_steps": 0.0034456253051757812, "step": 9882} {"info/global_step": 9883, "train_info/time_within_train_step": 2.6489181518554688, "step": 9883} {"train_info/time_between_train_steps": 0.0033979415893554688, "step": 9883} {"info/global_step": 9884, "train_info/time_within_train_step": 2.6807167530059814, "step": 9884} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 9884} {"info/global_step": 9885, "train_info/time_within_train_step": 2.6489953994750977, "step": 9885} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 9885} {"info/global_step": 9886, "train_info/time_within_train_step": 2.6770169734954834, "step": 9886} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 9886} {"info/global_step": 9887, "train_info/time_within_train_step": 2.643409013748169, "step": 9887} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 9887} {"info/global_step": 9888, "train_info/time_within_train_step": 2.667799472808838, "step": 9888} {"train_info/time_between_train_steps": 0.0034139156341552734, "step": 9888} {"info/global_step": 9889, "train_info/time_within_train_step": 2.6477205753326416, "step": 9889} {"train_info/time_between_train_steps": 0.003449678421020508, "step": 9889} {"info/global_step": 9890, "train_info/time_within_train_step": 2.662808895111084, "step": 9890} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 9890} {"info/global_step": 9891, "train_info/time_within_train_step": 2.649142265319824, "step": 9891} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 9891} {"info/global_step": 9892, "train_info/time_within_train_step": 2.676295042037964, "step": 9892} {"train_info/time_between_train_steps": 0.0033876895904541016, "step": 9892} {"info/global_step": 9893, "train_info/time_within_train_step": 2.647702217102051, "step": 9893} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 9893} {"info/global_step": 9894, "train_info/time_within_train_step": 2.6733171939849854, "step": 9894} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 9894} {"info/global_step": 9895, "train_info/time_within_train_step": 2.6489923000335693, "step": 9895} {"train_info/time_between_train_steps": 0.003405332565307617, "step": 9895} {"info/global_step": 9896, "train_info/time_within_train_step": 2.6685633659362793, "step": 9896} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 9896} {"info/global_step": 9897, "train_info/time_within_train_step": 2.6465229988098145, "step": 9897} {"train_info/time_between_train_steps": 0.003306865692138672, "step": 9897} {"info/global_step": 9898, "train_info/time_within_train_step": 2.682941198348999, "step": 9898} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 9898} {"info/global_step": 9899, "train_info/time_within_train_step": 2.644141674041748, "step": 9899} {"train_info/time_between_train_steps": 0.003323078155517578, "step": 9899} {"info/global_step": 9900, "train_info/time_within_train_step": 2.671405553817749, "step": 9900} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925165, "_runtime": 27763}, "step": 9900} {"logs": {"train/loss": 2.8788, "train/learning_rate": 6.666666666666667e-06, "train/epoch": 11.04, "_timestamp": 1746925165, "_runtime": 27763}, "step": 9900} {"train_info/time_between_train_steps": 0.024399280548095703, "step": 9900} {"info/global_step": 9901, "train_info/time_within_train_step": 2.6443822383880615, "step": 9901} {"train_info/time_between_train_steps": 0.003348112106323242, "step": 9901} {"info/global_step": 9902, "train_info/time_within_train_step": 2.656409978866577, "step": 9902} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 9902} {"info/global_step": 9903, "train_info/time_within_train_step": 2.6975162029266357, "step": 9903} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 9903} {"info/global_step": 9904, "train_info/time_within_train_step": 2.6471147537231445, "step": 9904} {"train_info/time_between_train_steps": 0.003324270248413086, "step": 9904} {"info/global_step": 9905, "train_info/time_within_train_step": 3.0024495124816895, "step": 9905} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 9905} {"info/global_step": 9906, "train_info/time_within_train_step": 2.6679635047912598, "step": 9906} {"train_info/time_between_train_steps": 0.0035982131958007812, "step": 9906} {"info/global_step": 9907, "train_info/time_within_train_step": 2.6472878456115723, "step": 9907} {"train_info/time_between_train_steps": 0.0034346580505371094, "step": 9907} {"info/global_step": 9908, "train_info/time_within_train_step": 2.643702507019043, "step": 9908} {"train_info/time_between_train_steps": 0.0034499168395996094, "step": 9908} {"info/global_step": 9909, "train_info/time_within_train_step": 2.644015312194824, "step": 9909} {"train_info/time_between_train_steps": 0.0033347606658935547, "step": 9909} {"info/global_step": 9910, "train_info/time_within_train_step": 2.644270181655884, "step": 9910} {"train_info/time_between_train_steps": 0.003485441207885742, "step": 9910} {"info/global_step": 9911, "train_info/time_within_train_step": 2.6414785385131836, "step": 9911} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 9911} {"info/global_step": 9912, "train_info/time_within_train_step": 2.6417415142059326, "step": 9912} {"train_info/time_between_train_steps": 0.0032749176025390625, "step": 9912} {"info/global_step": 9913, "train_info/time_within_train_step": 2.6542487144470215, "step": 9913} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 9913} {"info/global_step": 9914, "train_info/time_within_train_step": 2.6645009517669678, "step": 9914} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 9914} {"info/global_step": 9915, "train_info/time_within_train_step": 2.6653647422790527, "step": 9915} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 9915} {"info/global_step": 9916, "train_info/time_within_train_step": 2.641126871109009, "step": 9916} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 9916} {"info/global_step": 9917, "train_info/time_within_train_step": 2.666264772415161, "step": 9917} {"train_info/time_between_train_steps": 0.003258228302001953, "step": 9917} {"info/global_step": 9918, "train_info/time_within_train_step": 2.644371509552002, "step": 9918} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 9918} {"info/global_step": 9919, "train_info/time_within_train_step": 2.662551164627075, "step": 9919} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 9919} {"info/global_step": 9920, "train_info/time_within_train_step": 2.644392490386963, "step": 9920} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 9920} {"info/global_step": 9921, "train_info/time_within_train_step": 2.6724958419799805, "step": 9921} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 9921} {"info/global_step": 9922, "train_info/time_within_train_step": 2.64603853225708, "step": 9922} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 9922} {"info/global_step": 9923, "train_info/time_within_train_step": 2.6695749759674072, "step": 9923} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 9923} {"info/global_step": 9924, "train_info/time_within_train_step": 2.6512327194213867, "step": 9924} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 9924} {"info/global_step": 9925, "train_info/time_within_train_step": 2.6829586029052734, "step": 9925} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 9925} {"info/global_step": 9926, "train_info/time_within_train_step": 2.648123025894165, "step": 9926} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 9926} {"info/global_step": 9927, "train_info/time_within_train_step": 2.6848866939544678, "step": 9927} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 9927} {"info/global_step": 9928, "train_info/time_within_train_step": 2.6415584087371826, "step": 9928} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 9928} {"info/global_step": 9929, "train_info/time_within_train_step": 2.674741744995117, "step": 9929} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 9929} {"info/global_step": 9930, "train_info/time_within_train_step": 2.6439974308013916, "step": 9930} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 9930} {"info/global_step": 9931, "train_info/time_within_train_step": 2.8148767948150635, "step": 9931} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 9931} {"info/global_step": 9932, "train_info/time_within_train_step": 2.6447465419769287, "step": 9932} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 9932} {"info/global_step": 9933, "train_info/time_within_train_step": 2.658586263656616, "step": 9933} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 9933} {"info/global_step": 9934, "train_info/time_within_train_step": 2.6450209617614746, "step": 9934} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 9934} {"info/global_step": 9935, "train_info/time_within_train_step": 2.6643712520599365, "step": 9935} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 9935} {"info/global_step": 9936, "train_info/time_within_train_step": 2.6524722576141357, "step": 9936} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 9936} {"info/global_step": 9937, "train_info/time_within_train_step": 2.658447504043579, "step": 9937} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 9937} {"info/global_step": 9938, "train_info/time_within_train_step": 2.644662618637085, "step": 9938} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 9938} {"info/global_step": 9939, "train_info/time_within_train_step": 2.678948163986206, "step": 9939} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 9939} {"info/global_step": 9940, "train_info/time_within_train_step": 2.64570951461792, "step": 9940} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 9940} {"info/global_step": 9941, "train_info/time_within_train_step": 2.676988124847412, "step": 9941} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 9941} {"info/global_step": 9942, "train_info/time_within_train_step": 2.6537437438964844, "step": 9942} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 9942} {"info/global_step": 9943, "train_info/time_within_train_step": 2.674600601196289, "step": 9943} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 9943} {"info/global_step": 9944, "train_info/time_within_train_step": 2.642651081085205, "step": 9944} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 9944} {"info/global_step": 9945, "train_info/time_within_train_step": 2.6711223125457764, "step": 9945} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 9945} {"info/global_step": 9946, "train_info/time_within_train_step": 2.643909454345703, "step": 9946} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 9946} {"info/global_step": 9947, "train_info/time_within_train_step": 2.66705322265625, "step": 9947} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 9947} {"info/global_step": 9948, "train_info/time_within_train_step": 2.64660906791687, "step": 9948} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 9948} {"info/global_step": 9949, "train_info/time_within_train_step": 2.671017646789551, "step": 9949} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 9949} {"info/global_step": 9950, "train_info/time_within_train_step": 2.652531385421753, "step": 9950} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925300, "_runtime": 27898}, "step": 9950} {"logs": {"train/loss": 2.8821, "train/learning_rate": 3.3333333333333333e-06, "train/epoch": 11.05, "_timestamp": 1746925300, "_runtime": 27898}, "step": 9950} {"train_info/time_between_train_steps": 0.02466297149658203, "step": 9950} {"info/global_step": 9951, "train_info/time_within_train_step": 2.674166679382324, "step": 9951} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 9951} {"info/global_step": 9952, "train_info/time_within_train_step": 2.6420023441314697, "step": 9952} {"train_info/time_between_train_steps": 0.0032503604888916016, "step": 9952} {"info/global_step": 9953, "train_info/time_within_train_step": 2.6731019020080566, "step": 9953} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 9953} {"info/global_step": 9954, "train_info/time_within_train_step": 2.642979383468628, "step": 9954} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 9954} {"info/global_step": 9955, "train_info/time_within_train_step": 2.667832374572754, "step": 9955} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 9955} {"info/global_step": 9956, "train_info/time_within_train_step": 2.6438212394714355, "step": 9956} {"train_info/time_between_train_steps": 0.0032546520233154297, "step": 9956} {"info/global_step": 9957, "train_info/time_within_train_step": 2.676281213760376, "step": 9957} {"train_info/time_between_train_steps": 0.0032460689544677734, "step": 9957} {"info/global_step": 9958, "train_info/time_within_train_step": 2.669774293899536, "step": 9958} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 9958} {"info/global_step": 9959, "train_info/time_within_train_step": 2.6438968181610107, "step": 9959} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 9959} {"info/global_step": 9960, "train_info/time_within_train_step": 2.6561214923858643, "step": 9960} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 9960} {"info/global_step": 9961, "train_info/time_within_train_step": 2.6511430740356445, "step": 9961} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 9961} {"info/global_step": 9962, "train_info/time_within_train_step": 2.6710681915283203, "step": 9962} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 9962} {"info/global_step": 9963, "train_info/time_within_train_step": 2.9272947311401367, "step": 9963} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 9963} {"info/global_step": 9964, "train_info/time_within_train_step": 2.645334243774414, "step": 9964} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 9964} {"info/global_step": 9965, "train_info/time_within_train_step": 2.672252655029297, "step": 9965} {"train_info/time_between_train_steps": 0.003265380859375, "step": 9965} {"info/global_step": 9966, "train_info/time_within_train_step": 2.653291702270508, "step": 9966} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 9966} {"info/global_step": 9967, "train_info/time_within_train_step": 2.6703052520751953, "step": 9967} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 9967} {"info/global_step": 9968, "train_info/time_within_train_step": 2.6406896114349365, "step": 9968} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 9968} {"info/global_step": 9969, "train_info/time_within_train_step": 2.682880401611328, "step": 9969} {"train_info/time_between_train_steps": 0.003246784210205078, "step": 9969} {"info/global_step": 9970, "train_info/time_within_train_step": 2.6420462131500244, "step": 9970} {"train_info/time_between_train_steps": 0.0033063888549804688, "step": 9970} {"info/global_step": 9971, "train_info/time_within_train_step": 2.668851137161255, "step": 9971} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 9971} {"info/global_step": 9972, "train_info/time_within_train_step": 2.6479694843292236, "step": 9972} {"train_info/time_between_train_steps": 0.0032401084899902344, "step": 9972} {"info/global_step": 9973, "train_info/time_within_train_step": 2.6708524227142334, "step": 9973} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 9973} {"info/global_step": 9974, "train_info/time_within_train_step": 2.654029607772827, "step": 9974} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 9974} {"info/global_step": 9975, "train_info/time_within_train_step": 2.6717889308929443, "step": 9975} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 9975} {"info/global_step": 9976, "train_info/time_within_train_step": 2.649489164352417, "step": 9976} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 9976} {"info/global_step": 9977, "train_info/time_within_train_step": 2.687617540359497, "step": 9977} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 9977} {"info/global_step": 9978, "train_info/time_within_train_step": 2.6442949771881104, "step": 9978} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 9978} {"info/global_step": 9979, "train_info/time_within_train_step": 2.670933961868286, "step": 9979} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 9979} {"info/global_step": 9980, "train_info/time_within_train_step": 2.643484354019165, "step": 9980} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 9980} {"info/global_step": 9981, "train_info/time_within_train_step": 2.6657917499542236, "step": 9981} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 9981} {"info/global_step": 9982, "train_info/time_within_train_step": 2.652118682861328, "step": 9982} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 9982} {"info/global_step": 9983, "train_info/time_within_train_step": 2.6675865650177, "step": 9983} {"train_info/time_between_train_steps": 0.003258943557739258, "step": 9983} {"info/global_step": 9984, "train_info/time_within_train_step": 2.6464037895202637, "step": 9984} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 9984} {"info/global_step": 9985, "train_info/time_within_train_step": 2.6873576641082764, "step": 9985} {"train_info/time_between_train_steps": 0.0033063888549804688, "step": 9985} {"info/global_step": 9986, "train_info/time_within_train_step": 2.6488215923309326, "step": 9986} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 9986} {"info/global_step": 9987, "train_info/time_within_train_step": 2.6733808517456055, "step": 9987} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 9987} {"info/global_step": 9988, "train_info/time_within_train_step": 2.645024538040161, "step": 9988} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 9988} {"info/global_step": 9989, "train_info/time_within_train_step": 2.6730926036834717, "step": 9989} {"train_info/time_between_train_steps": 0.003347635269165039, "step": 9989} {"info/global_step": 9990, "train_info/time_within_train_step": 2.6442461013793945, "step": 9990} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 9990} {"info/global_step": 9991, "train_info/time_within_train_step": 2.666436195373535, "step": 9991} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 9991} {"info/global_step": 9992, "train_info/time_within_train_step": 2.6424899101257324, "step": 9992} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 9992} {"info/global_step": 9993, "train_info/time_within_train_step": 2.689732789993286, "step": 9993} {"train_info/time_between_train_steps": 0.1201322078704834, "step": 9993} {"info/global_step": 9994, "train_info/time_within_train_step": 2.6457908153533936, "step": 9994} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 9994} {"info/global_step": 9995, "train_info/time_within_train_step": 2.6709632873535156, "step": 9995} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 9995} {"info/global_step": 9996, "train_info/time_within_train_step": 2.645714282989502, "step": 9996} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 9996} {"info/global_step": 9997, "train_info/time_within_train_step": 2.666620969772339, "step": 9997} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 9997} {"info/global_step": 9998, "train_info/time_within_train_step": 3.2512149810791016, "step": 9998} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 9998} {"info/global_step": 9999, "train_info/time_within_train_step": 2.6670968532562256, "step": 9999} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 9999} {"info/global_step": 10000, "train_info/time_within_train_step": 2.644547939300537, "step": 10000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925435, "_runtime": 28033}, "step": 10000} {"logs": {"train/loss": 2.8754, "train/learning_rate": 0.0, "train/epoch": 11.05, "_timestamp": 1746925435, "_runtime": 28033}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925441, "_runtime": 28039}, "step": 10000} {"logs": {"eval/loss": 4.802618026733398, "eval/runtime": 5.1726, "eval/samples_per_second": 37.119, "eval/steps_per_second": 1.16, "train/epoch": 11.05, "_timestamp": 1746925441, "_runtime": 28039}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925441, "_runtime": 28039}, "step": 10000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.802618026733398, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 121.82895182391071, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1726, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.119, "train/epoch": 11.05, "_timestamp": 1746925441, "_runtime": 28039}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1645.4873046875, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925454, "_runtime": 28052}, "step": 10000} {"logs": {"train/train_runtime": 28052.704, "train/train_samples_per_second": 22.814, "train/train_steps_per_second": 0.356, "train/total_flos": 8.3630695514112e+16, "train/train_loss": 3.8252799322128297, "train/epoch": 11.05, "_timestamp": 1746925454, "_runtime": 28052}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1645.486328125, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925463, "_runtime": 28061}, "step": 10000} {"logs": {"eval/loss": 4.802618026733398, "eval/runtime": 4.7346, "eval/samples_per_second": 40.552, "eval/steps_per_second": 1.267, "train/epoch": 11.05, "_timestamp": 1746925463, "_runtime": 28061}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1645.486328125, "train_info/memory_max_allocated": 5134.96240234375, "train_info/memory_reserved": 8294.0, "train_info/memory_max_reserved": 8294.0, "_timestamp": 1746925463, "_runtime": 28061}, "step": 10000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.802618026733398, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 121.82895182391071, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.7346, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 40.552, "train/epoch": 11.05, "_timestamp": 1746925463, "_runtime": 28061}, "step": 10000}