{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0} {"train_info/time_between_train_steps": 3.821139097213745, "step": 0} {"info/global_step": 1, "train_info/time_within_train_step": 28.533889055252075, "step": 1} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1733861725, "_runtime": 37}, "step": 1} {"logs": {"train/loss": 10.8568, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1733861725, "_runtime": 37}, "step": 1} {"train_info/time_between_train_steps": 0.008469104766845703, "step": 1} {"info/global_step": 2, "train_info/time_within_train_step": 28.037352323532104, "step": 2} {"train_info/time_between_train_steps": 0.005648136138916016, "step": 2} {"info/global_step": 3, "train_info/time_within_train_step": 27.87070369720459, "step": 3} {"train_info/time_between_train_steps": 0.005811452865600586, "step": 3} {"info/global_step": 4, "train_info/time_within_train_step": 28.119908809661865, "step": 4} {"train_info/time_between_train_steps": 0.010096311569213867, "step": 4} {"info/global_step": 5, "train_info/time_within_train_step": 28.18924331665039, "step": 5} {"train_info/time_between_train_steps": 0.005335807800292969, "step": 5} {"info/global_step": 6, "train_info/time_within_train_step": 27.95185136795044, "step": 6} {"train_info/time_between_train_steps": 0.0058629512786865234, "step": 6} {"info/global_step": 7, "train_info/time_within_train_step": 28.15664267539978, "step": 7} {"train_info/time_between_train_steps": 0.013402462005615234, "step": 7} {"info/global_step": 8, "train_info/time_within_train_step": 27.89963722229004, "step": 8} {"train_info/time_between_train_steps": 0.014599084854125977, "step": 8} {"info/global_step": 9, "train_info/time_within_train_step": 28.237628936767578, "step": 9} {"train_info/time_between_train_steps": 0.00685882568359375, "step": 9} {"info/global_step": 10, "train_info/time_within_train_step": 27.834078788757324, "step": 10} {"train_info/time_between_train_steps": 0.013814210891723633, "step": 10} {"info/global_step": 11, "train_info/time_within_train_step": 28.312318325042725, "step": 11} {"train_info/time_between_train_steps": 0.006107330322265625, "step": 11} {"info/global_step": 12, "train_info/time_within_train_step": 28.011987924575806, "step": 12} {"train_info/time_between_train_steps": 0.005248308181762695, "step": 12} {"info/global_step": 13, "train_info/time_within_train_step": 27.861613273620605, "step": 13} {"train_info/time_between_train_steps": 0.005290985107421875, "step": 13} {"info/global_step": 14, "train_info/time_within_train_step": 27.869736194610596, "step": 14} {"train_info/time_between_train_steps": 0.0052640438079833984, "step": 14} {"info/global_step": 15, "train_info/time_within_train_step": 27.908385515213013, "step": 15} {"train_info/time_between_train_steps": 0.005279541015625, "step": 15} {"info/global_step": 16, "train_info/time_within_train_step": 27.986371994018555, "step": 16} {"train_info/time_between_train_steps": 0.0054624080657958984, "step": 16} {"info/global_step": 17, "train_info/time_within_train_step": 27.933210849761963, "step": 17} {"train_info/time_between_train_steps": 0.005207538604736328, "step": 17} {"info/global_step": 18, "train_info/time_within_train_step": 27.833080053329468, "step": 18} {"train_info/time_between_train_steps": 0.005620718002319336, "step": 18} {"info/global_step": 19, "train_info/time_within_train_step": 27.832363605499268, "step": 19} {"train_info/time_between_train_steps": 0.010288476943969727, "step": 19} {"info/global_step": 20, "train_info/time_within_train_step": 27.97080087661743, "step": 20} {"train_info/time_between_train_steps": 0.007299661636352539, "step": 20} {"info/global_step": 21, "train_info/time_within_train_step": 27.89056944847107, "step": 21} {"train_info/time_between_train_steps": 0.005644321441650391, "step": 21} {"info/global_step": 22, "train_info/time_within_train_step": 27.957114696502686, "step": 22} {"train_info/time_between_train_steps": 0.006374359130859375, "step": 22} {"info/global_step": 23, "train_info/time_within_train_step": 27.912258625030518, "step": 23} {"train_info/time_between_train_steps": 0.005713939666748047, "step": 23} {"info/global_step": 24, "train_info/time_within_train_step": 27.911243200302124, "step": 24} {"train_info/time_between_train_steps": 0.00562286376953125, "step": 24} {"train_info/time_between_train_steps": 5.126796722412109, "step": 24} {"info/global_step": 25, "train_info/time_within_train_step": 27.819792985916138, "step": 25} {"train_info/time_between_train_steps": 0.005560874938964844, "step": 25} {"info/global_step": 26, "train_info/time_within_train_step": 28.104661464691162, "step": 26} {"train_info/time_between_train_steps": 0.0054476261138916016, "step": 26} {"info/global_step": 27, "train_info/time_within_train_step": 27.90863800048828, "step": 27} {"train_info/time_between_train_steps": 0.0054759979248046875, "step": 27} {"info/global_step": 28, "train_info/time_within_train_step": 28.002175331115723, "step": 28} {"train_info/time_between_train_steps": 0.005541801452636719, "step": 28} {"info/global_step": 29, "train_info/time_within_train_step": 27.869744777679443, "step": 29} {"train_info/time_between_train_steps": 0.005255460739135742, "step": 29} {"info/global_step": 30, "train_info/time_within_train_step": 27.88740587234497, "step": 30} {"train_info/time_between_train_steps": 0.005084037780761719, "step": 30} {"info/global_step": 31, "train_info/time_within_train_step": 27.947638750076294, "step": 31} {"train_info/time_between_train_steps": 0.005289793014526367, "step": 31} {"info/global_step": 32, "train_info/time_within_train_step": 28.10380220413208, "step": 32} {"train_info/time_between_train_steps": 0.009924650192260742, "step": 32} {"info/global_step": 33, "train_info/time_within_train_step": 27.89262628555298, "step": 33} {"train_info/time_between_train_steps": 0.0055010318756103516, "step": 33} {"info/global_step": 34, "train_info/time_within_train_step": 27.8582661151886, "step": 34} {"train_info/time_between_train_steps": 0.0054607391357421875, "step": 34} {"info/global_step": 35, "train_info/time_within_train_step": 27.92349410057068, "step": 35} {"train_info/time_between_train_steps": 0.009967803955078125, "step": 35} {"info/global_step": 36, "train_info/time_within_train_step": 27.88943123817444, "step": 36} {"train_info/time_between_train_steps": 0.005645275115966797, "step": 36} {"info/global_step": 37, "train_info/time_within_train_step": 27.88342046737671, "step": 37} {"train_info/time_between_train_steps": 0.010091781616210938, "step": 37} {"info/global_step": 38, "train_info/time_within_train_step": 27.82862401008606, "step": 38} {"train_info/time_between_train_steps": 0.005346059799194336, "step": 38} {"info/global_step": 39, "train_info/time_within_train_step": 27.98231291770935, "step": 39} {"train_info/time_between_train_steps": 0.009741067886352539, "step": 39} {"info/global_step": 40, "train_info/time_within_train_step": 27.859386205673218, "step": 40} {"train_info/time_between_train_steps": 0.0057337284088134766, "step": 40} {"info/global_step": 41, "train_info/time_within_train_step": 27.910923957824707, "step": 41} {"train_info/time_between_train_steps": 0.005632877349853516, "step": 41} {"info/global_step": 42, "train_info/time_within_train_step": 27.88668203353882, "step": 42} {"train_info/time_between_train_steps": 0.014742851257324219, "step": 42} {"info/global_step": 43, "train_info/time_within_train_step": 27.924360990524292, "step": 43} {"train_info/time_between_train_steps": 0.005479097366333008, "step": 43} {"info/global_step": 44, "train_info/time_within_train_step": 27.88132882118225, "step": 44} {"train_info/time_between_train_steps": 0.014685869216918945, "step": 44} {"info/global_step": 45, "train_info/time_within_train_step": 27.976166009902954, "step": 45} {"train_info/time_between_train_steps": 0.01074528694152832, "step": 45} {"info/global_step": 46, "train_info/time_within_train_step": 27.91370916366577, "step": 46} {"train_info/time_between_train_steps": 0.0055637359619140625, "step": 46} {"info/global_step": 47, "train_info/time_within_train_step": 28.028409957885742, "step": 47} {"train_info/time_between_train_steps": 0.005727529525756836, "step": 47} {"info/global_step": 48, "train_info/time_within_train_step": 27.91259527206421, "step": 48} {"train_info/time_between_train_steps": 0.005834102630615234, "step": 48} {"train_info/time_between_train_steps": 5.275522232055664, "step": 48} {"info/global_step": 49, "train_info/time_within_train_step": 27.926105737686157, "step": 49} {"train_info/time_between_train_steps": 0.005899667739868164, "step": 49} {"info/global_step": 50, "train_info/time_within_train_step": 28.046265602111816, "step": 50} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733863106, "_runtime": 1418}, "step": 50} {"logs": {"train/loss": 8.4903, "train/learning_rate": 0.00025, "train/epoch": 2.0, "_timestamp": 1733863106, "_runtime": 1418}, "step": 50} {"train_info/time_between_train_steps": 0.018194198608398438, "step": 50} {"info/global_step": 51, "train_info/time_within_train_step": 27.860803365707397, "step": 51} {"train_info/time_between_train_steps": 0.005678415298461914, "step": 51} {"info/global_step": 52, "train_info/time_within_train_step": 27.95051383972168, "step": 52} {"train_info/time_between_train_steps": 0.005599498748779297, "step": 52} {"info/global_step": 53, "train_info/time_within_train_step": 27.84534239768982, "step": 53} {"train_info/time_between_train_steps": 0.005167722702026367, "step": 53} {"info/global_step": 54, "train_info/time_within_train_step": 27.898667812347412, "step": 54} {"train_info/time_between_train_steps": 0.005662202835083008, "step": 54} {"info/global_step": 55, "train_info/time_within_train_step": 27.82908058166504, "step": 55} {"train_info/time_between_train_steps": 0.005223751068115234, "step": 55} {"info/global_step": 56, "train_info/time_within_train_step": 27.924776315689087, "step": 56} {"train_info/time_between_train_steps": 0.005299091339111328, "step": 56} {"info/global_step": 57, "train_info/time_within_train_step": 27.85494303703308, "step": 57} {"train_info/time_between_train_steps": 0.012265205383300781, "step": 57} {"info/global_step": 58, "train_info/time_within_train_step": 27.89437484741211, "step": 58} {"train_info/time_between_train_steps": 0.01020669937133789, "step": 58} {"info/global_step": 59, "train_info/time_within_train_step": 27.883049726486206, "step": 59} {"train_info/time_between_train_steps": 0.005450010299682617, "step": 59} {"info/global_step": 60, "train_info/time_within_train_step": 27.914623975753784, "step": 60} {"train_info/time_between_train_steps": 0.005243062973022461, "step": 60} {"info/global_step": 61, "train_info/time_within_train_step": 27.864964485168457, "step": 61} {"train_info/time_between_train_steps": 0.005204677581787109, "step": 61} {"info/global_step": 62, "train_info/time_within_train_step": 27.89541006088257, "step": 62} {"train_info/time_between_train_steps": 0.005498170852661133, "step": 62} {"info/global_step": 63, "train_info/time_within_train_step": 28.01825761795044, "step": 63} {"train_info/time_between_train_steps": 0.005452394485473633, "step": 63} {"info/global_step": 64, "train_info/time_within_train_step": 27.840373992919922, "step": 64} {"train_info/time_between_train_steps": 0.0054509639739990234, "step": 64} {"info/global_step": 65, "train_info/time_within_train_step": 27.91447901725769, "step": 65} {"train_info/time_between_train_steps": 0.005467653274536133, "step": 65} {"info/global_step": 66, "train_info/time_within_train_step": 27.868010759353638, "step": 66} {"train_info/time_between_train_steps": 0.009564638137817383, "step": 66} {"info/global_step": 67, "train_info/time_within_train_step": 27.89435911178589, "step": 67} {"train_info/time_between_train_steps": 0.006176471710205078, "step": 67} {"info/global_step": 68, "train_info/time_within_train_step": 27.859719276428223, "step": 68} {"train_info/time_between_train_steps": 0.005562782287597656, "step": 68} {"info/global_step": 69, "train_info/time_within_train_step": 27.964381456375122, "step": 69} {"train_info/time_between_train_steps": 0.005448818206787109, "step": 69} {"info/global_step": 70, "train_info/time_within_train_step": 27.82854700088501, "step": 70} {"train_info/time_between_train_steps": 0.011949777603149414, "step": 70} {"info/global_step": 71, "train_info/time_within_train_step": 27.937572717666626, "step": 71} {"train_info/time_between_train_steps": 0.005756378173828125, "step": 71} {"info/global_step": 72, "train_info/time_within_train_step": 27.877082109451294, "step": 72} {"train_info/time_between_train_steps": 0.005797386169433594, "step": 72} {"train_info/time_between_train_steps": 5.539104461669922, "step": 72} {"info/global_step": 73, "train_info/time_within_train_step": 27.92402696609497, "step": 73} {"train_info/time_between_train_steps": 0.011109352111816406, "step": 73} {"info/global_step": 74, "train_info/time_within_train_step": 28.00415802001953, "step": 74} {"train_info/time_between_train_steps": 0.006369590759277344, "step": 74} {"info/global_step": 75, "train_info/time_within_train_step": 27.94434690475464, "step": 75} {"train_info/time_between_train_steps": 0.0053560733795166016, "step": 75} {"info/global_step": 76, "train_info/time_within_train_step": 27.982746124267578, "step": 76} {"train_info/time_between_train_steps": 0.005368471145629883, "step": 76} {"info/global_step": 77, "train_info/time_within_train_step": 27.895103693008423, "step": 77} {"train_info/time_between_train_steps": 0.006207466125488281, "step": 77} {"info/global_step": 78, "train_info/time_within_train_step": 27.97312641143799, "step": 78} {"train_info/time_between_train_steps": 0.005048990249633789, "step": 78} {"info/global_step": 79, "train_info/time_within_train_step": 27.880038022994995, "step": 79} {"train_info/time_between_train_steps": 0.005433797836303711, "step": 79} {"info/global_step": 80, "train_info/time_within_train_step": 27.864113569259644, "step": 80} {"train_info/time_between_train_steps": 0.005471229553222656, "step": 80} {"info/global_step": 81, "train_info/time_within_train_step": 27.88240623474121, "step": 81} {"train_info/time_between_train_steps": 0.005268573760986328, "step": 81} {"info/global_step": 82, "train_info/time_within_train_step": 27.937636137008667, "step": 82} {"train_info/time_between_train_steps": 0.0065059661865234375, "step": 82} {"info/global_step": 83, "train_info/time_within_train_step": 27.875128030776978, "step": 83} {"train_info/time_between_train_steps": 0.005377531051635742, "step": 83} {"info/global_step": 84, "train_info/time_within_train_step": 27.833176612854004, "step": 84} {"train_info/time_between_train_steps": 0.013754844665527344, "step": 84} {"info/global_step": 85, "train_info/time_within_train_step": 27.91662859916687, "step": 85} {"train_info/time_between_train_steps": 0.005378007888793945, "step": 85} {"info/global_step": 86, "train_info/time_within_train_step": 27.929656982421875, "step": 86} {"train_info/time_between_train_steps": 0.010367870330810547, "step": 86} {"info/global_step": 87, "train_info/time_within_train_step": 27.86956238746643, "step": 87} {"train_info/time_between_train_steps": 0.0109100341796875, "step": 87} {"info/global_step": 88, "train_info/time_within_train_step": 27.96914505958557, "step": 88} {"train_info/time_between_train_steps": 0.005514860153198242, "step": 88} {"info/global_step": 89, "train_info/time_within_train_step": 27.8777859210968, "step": 89} {"train_info/time_between_train_steps": 0.005585432052612305, "step": 89} {"info/global_step": 90, "train_info/time_within_train_step": 27.92362093925476, "step": 90} {"train_info/time_between_train_steps": 0.005262613296508789, "step": 90} {"info/global_step": 91, "train_info/time_within_train_step": 27.891221046447754, "step": 91} {"train_info/time_between_train_steps": 0.009668827056884766, "step": 91} {"info/global_step": 92, "train_info/time_within_train_step": 27.906431436538696, "step": 92} {"train_info/time_between_train_steps": 0.005475759506225586, "step": 92} {"info/global_step": 93, "train_info/time_within_train_step": 27.924067735671997, "step": 93} {"train_info/time_between_train_steps": 0.010826349258422852, "step": 93} {"info/global_step": 94, "train_info/time_within_train_step": 27.95855140686035, "step": 94} {"train_info/time_between_train_steps": 0.0054624080657958984, "step": 94} {"info/global_step": 95, "train_info/time_within_train_step": 27.871114015579224, "step": 95} {"train_info/time_between_train_steps": 0.005692958831787109, "step": 95} {"info/global_step": 96, "train_info/time_within_train_step": 27.877554178237915, "step": 96} {"train_info/time_between_train_steps": 0.0058100223541259766, "step": 96} {"train_info/time_between_train_steps": 5.1437668800354, "step": 96} {"info/global_step": 97, "train_info/time_within_train_step": 27.86967706680298, "step": 97} {"train_info/time_between_train_steps": 0.005918979644775391, "step": 97} {"info/global_step": 98, "train_info/time_within_train_step": 28.016448974609375, "step": 98} {"train_info/time_between_train_steps": 0.011922121047973633, "step": 98} {"info/global_step": 99, "train_info/time_within_train_step": 27.938883781433105, "step": 99} {"train_info/time_between_train_steps": 0.005344867706298828, "step": 99} {"info/global_step": 100, "train_info/time_within_train_step": 27.948858499526978, "step": 100} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733864512, "_runtime": 2824}, "step": 100} {"logs": {"train/loss": 7.2157, "train/learning_rate": 0.0005, "train/epoch": 4.0, "_timestamp": 1733864512, "_runtime": 2824}, "step": 100} {"train_info/time_between_train_steps": 2.5753893852233887, "step": 100} {"info/global_step": 101, "train_info/time_within_train_step": 28.01094675064087, "step": 101} {"train_info/time_between_train_steps": 0.0052280426025390625, "step": 101} {"info/global_step": 102, "train_info/time_within_train_step": 27.856173753738403, "step": 102} {"train_info/time_between_train_steps": 0.005151033401489258, "step": 102} {"info/global_step": 103, "train_info/time_within_train_step": 27.863196849822998, "step": 103} {"train_info/time_between_train_steps": 0.005470752716064453, "step": 103} {"info/global_step": 104, "train_info/time_within_train_step": 27.845460653305054, "step": 104} {"train_info/time_between_train_steps": 0.00522303581237793, "step": 104} {"info/global_step": 105, "train_info/time_within_train_step": 27.890036582946777, "step": 105} {"train_info/time_between_train_steps": 0.0053937435150146484, "step": 105} {"info/global_step": 106, "train_info/time_within_train_step": 27.85034418106079, "step": 106} {"train_info/time_between_train_steps": 0.00945901870727539, "step": 106} {"info/global_step": 107, "train_info/time_within_train_step": 27.940770864486694, "step": 107} {"train_info/time_between_train_steps": 0.0052950382232666016, "step": 107} {"info/global_step": 108, "train_info/time_within_train_step": 27.857229948043823, "step": 108} {"train_info/time_between_train_steps": 0.005430936813354492, "step": 108} {"info/global_step": 109, "train_info/time_within_train_step": 27.867021083831787, "step": 109} {"train_info/time_between_train_steps": 0.010390043258666992, "step": 109} {"info/global_step": 110, "train_info/time_within_train_step": 27.927757501602173, "step": 110} {"train_info/time_between_train_steps": 0.005270719528198242, "step": 110} {"info/global_step": 111, "train_info/time_within_train_step": 27.872534036636353, "step": 111} {"train_info/time_between_train_steps": 0.011554956436157227, "step": 111} {"info/global_step": 112, "train_info/time_within_train_step": 27.89185643196106, "step": 112} {"train_info/time_between_train_steps": 0.005768299102783203, "step": 112} {"info/global_step": 113, "train_info/time_within_train_step": 27.87519097328186, "step": 113} {"train_info/time_between_train_steps": 0.005689859390258789, "step": 113} {"info/global_step": 114, "train_info/time_within_train_step": 27.877984046936035, "step": 114} {"train_info/time_between_train_steps": 0.005509376525878906, "step": 114} {"info/global_step": 115, "train_info/time_within_train_step": 27.90910792350769, "step": 115} {"train_info/time_between_train_steps": 0.005732297897338867, "step": 115} {"info/global_step": 116, "train_info/time_within_train_step": 27.897411346435547, "step": 116} {"train_info/time_between_train_steps": 0.0055124759674072266, "step": 116} {"info/global_step": 117, "train_info/time_within_train_step": 27.810490608215332, "step": 117} {"train_info/time_between_train_steps": 0.005469083786010742, "step": 117} {"info/global_step": 118, "train_info/time_within_train_step": 27.966025590896606, "step": 118} {"train_info/time_between_train_steps": 0.005712032318115234, "step": 118} {"info/global_step": 119, "train_info/time_within_train_step": 27.87128472328186, "step": 119} {"train_info/time_between_train_steps": 0.006020545959472656, "step": 119} {"info/global_step": 120, "train_info/time_within_train_step": 27.965394735336304, "step": 120} {"train_info/time_between_train_steps": 0.015111923217773438, "step": 120} {"train_info/time_between_train_steps": 5.249781131744385, "step": 120} {"info/global_step": 121, "train_info/time_within_train_step": 27.81099033355713, "step": 121} {"train_info/time_between_train_steps": 0.005724668502807617, "step": 121} {"info/global_step": 122, "train_info/time_within_train_step": 28.07422637939453, "step": 122} {"train_info/time_between_train_steps": 0.005447864532470703, "step": 122} {"info/global_step": 123, "train_info/time_within_train_step": 27.86060333251953, "step": 123} {"train_info/time_between_train_steps": 0.009648561477661133, "step": 123} {"info/global_step": 124, "train_info/time_within_train_step": 27.96206283569336, "step": 124} {"train_info/time_between_train_steps": 0.005552053451538086, "step": 124} {"info/global_step": 125, "train_info/time_within_train_step": 28.005625009536743, "step": 125} {"train_info/time_between_train_steps": 0.005424976348876953, "step": 125} {"info/global_step": 126, "train_info/time_within_train_step": 27.919677257537842, "step": 126} {"train_info/time_between_train_steps": 0.005380153656005859, "step": 126} {"info/global_step": 127, "train_info/time_within_train_step": 27.847646951675415, "step": 127} {"train_info/time_between_train_steps": 0.009386539459228516, "step": 127} {"info/global_step": 128, "train_info/time_within_train_step": 27.91883373260498, "step": 128} {"train_info/time_between_train_steps": 0.005613803863525391, "step": 128} {"info/global_step": 129, "train_info/time_within_train_step": 27.84879422187805, "step": 129} {"train_info/time_between_train_steps": 0.005271196365356445, "step": 129} {"info/global_step": 130, "train_info/time_within_train_step": 27.823144674301147, "step": 130} {"train_info/time_between_train_steps": 0.013925552368164062, "step": 130} {"info/global_step": 131, "train_info/time_within_train_step": 27.924867391586304, "step": 131} {"train_info/time_between_train_steps": 0.005182027816772461, "step": 131} {"info/global_step": 132, "train_info/time_within_train_step": 27.839778184890747, "step": 132} {"train_info/time_between_train_steps": 0.005640983581542969, "step": 132} {"info/global_step": 133, "train_info/time_within_train_step": 27.886006832122803, "step": 133} {"train_info/time_between_train_steps": 0.0054013729095458984, "step": 133} {"info/global_step": 134, "train_info/time_within_train_step": 27.874873638153076, "step": 134} {"train_info/time_between_train_steps": 0.009658098220825195, "step": 134} {"info/global_step": 135, "train_info/time_within_train_step": 27.84233021736145, "step": 135} {"train_info/time_between_train_steps": 0.005398988723754883, "step": 135} {"info/global_step": 136, "train_info/time_within_train_step": 27.884586811065674, "step": 136} {"train_info/time_between_train_steps": 0.009964466094970703, "step": 136} {"info/global_step": 137, "train_info/time_within_train_step": 27.895139694213867, "step": 137} {"train_info/time_between_train_steps": 0.005768537521362305, "step": 137} {"info/global_step": 138, "train_info/time_within_train_step": 27.9070463180542, "step": 138} {"train_info/time_between_train_steps": 0.010411977767944336, "step": 138} {"info/global_step": 139, "train_info/time_within_train_step": 27.9529767036438, "step": 139} {"train_info/time_between_train_steps": 0.005345344543457031, "step": 139} {"info/global_step": 140, "train_info/time_within_train_step": 27.88967490196228, "step": 140} {"train_info/time_between_train_steps": 0.008183002471923828, "step": 140} {"info/global_step": 141, "train_info/time_within_train_step": 27.960476398468018, "step": 141} {"train_info/time_between_train_steps": 0.00974893569946289, "step": 141} {"info/global_step": 142, "train_info/time_within_train_step": 27.884103059768677, "step": 142} {"train_info/time_between_train_steps": 0.005866527557373047, "step": 142} {"info/global_step": 143, "train_info/time_within_train_step": 27.896954774856567, "step": 143} {"train_info/time_between_train_steps": 0.00549769401550293, "step": 143} {"info/global_step": 144, "train_info/time_within_train_step": 27.89739680290222, "step": 144} {"train_info/time_between_train_steps": 0.006129264831542969, "step": 144} {"train_info/time_between_train_steps": 5.425424098968506, "step": 144} {"info/global_step": 145, "train_info/time_within_train_step": 27.834883213043213, "step": 145} {"train_info/time_between_train_steps": 0.0051310062408447266, "step": 145} {"info/global_step": 146, "train_info/time_within_train_step": 28.02673649787903, "step": 146} {"train_info/time_between_train_steps": 0.005354881286621094, "step": 146} {"info/global_step": 147, "train_info/time_within_train_step": 27.918845176696777, "step": 147} {"train_info/time_between_train_steps": 0.00532984733581543, "step": 147} {"info/global_step": 148, "train_info/time_within_train_step": 27.948442459106445, "step": 148} {"train_info/time_between_train_steps": 0.005659580230712891, "step": 148} {"info/global_step": 149, "train_info/time_within_train_step": 27.846700191497803, "step": 149} {"train_info/time_between_train_steps": 0.006077289581298828, "step": 149} {"info/global_step": 150, "train_info/time_within_train_step": 27.854774236679077, "step": 150} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733865921, "_runtime": 4233}, "step": 150} {"logs": {"train/loss": 6.6121, "train/learning_rate": 0.0005833333333333333, "train/epoch": 6.0, "_timestamp": 1733865921, "_runtime": 4233}, "step": 150} {"train_info/time_between_train_steps": 0.00804591178894043, "step": 150} {"info/global_step": 151, "train_info/time_within_train_step": 27.857871532440186, "step": 151} {"train_info/time_between_train_steps": 0.008490324020385742, "step": 151} {"info/global_step": 152, "train_info/time_within_train_step": 27.974483489990234, "step": 152} {"train_info/time_between_train_steps": 0.005115509033203125, "step": 152} {"info/global_step": 153, "train_info/time_within_train_step": 27.92187786102295, "step": 153} {"train_info/time_between_train_steps": 0.009986162185668945, "step": 153} {"info/global_step": 154, "train_info/time_within_train_step": 27.911165714263916, "step": 154} {"train_info/time_between_train_steps": 0.005217075347900391, "step": 154} {"info/global_step": 155, "train_info/time_within_train_step": 27.820499658584595, "step": 155} {"train_info/time_between_train_steps": 0.005408048629760742, "step": 155} {"info/global_step": 156, "train_info/time_within_train_step": 27.980628490447998, "step": 156} {"train_info/time_between_train_steps": 0.006457090377807617, "step": 156} {"info/global_step": 157, "train_info/time_within_train_step": 27.837635278701782, "step": 157} {"train_info/time_between_train_steps": 0.005362749099731445, "step": 157} {"info/global_step": 158, "train_info/time_within_train_step": 27.898962259292603, "step": 158} {"train_info/time_between_train_steps": 0.005330801010131836, "step": 158} {"info/global_step": 159, "train_info/time_within_train_step": 27.890092372894287, "step": 159} {"train_info/time_between_train_steps": 0.005282163619995117, "step": 159} {"info/global_step": 160, "train_info/time_within_train_step": 27.824662685394287, "step": 160} {"train_info/time_between_train_steps": 0.005444049835205078, "step": 160} {"info/global_step": 161, "train_info/time_within_train_step": 27.962764263153076, "step": 161} {"train_info/time_between_train_steps": 0.005165576934814453, "step": 161} {"info/global_step": 162, "train_info/time_within_train_step": 27.83262276649475, "step": 162} {"train_info/time_between_train_steps": 0.0052471160888671875, "step": 162} {"info/global_step": 163, "train_info/time_within_train_step": 27.883310079574585, "step": 163} {"train_info/time_between_train_steps": 0.005480527877807617, "step": 163} {"info/global_step": 164, "train_info/time_within_train_step": 27.879080057144165, "step": 164} {"train_info/time_between_train_steps": 0.0071392059326171875, "step": 164} {"info/global_step": 165, "train_info/time_within_train_step": 27.953266143798828, "step": 165} {"train_info/time_between_train_steps": 0.005618095397949219, "step": 165} {"info/global_step": 166, "train_info/time_within_train_step": 27.933587312698364, "step": 166} {"train_info/time_between_train_steps": 0.0060193538665771484, "step": 166} {"info/global_step": 167, "train_info/time_within_train_step": 27.992498874664307, "step": 167} {"train_info/time_between_train_steps": 0.005940914154052734, "step": 167} {"info/global_step": 168, "train_info/time_within_train_step": 27.864049434661865, "step": 168} {"train_info/time_between_train_steps": 0.011033773422241211, "step": 168} {"train_info/time_between_train_steps": 5.190542936325073, "step": 168} {"info/global_step": 169, "train_info/time_within_train_step": 27.862074613571167, "step": 169} {"train_info/time_between_train_steps": 0.00539398193359375, "step": 169} {"info/global_step": 170, "train_info/time_within_train_step": 27.974599361419678, "step": 170} {"train_info/time_between_train_steps": 0.005474567413330078, "step": 170} {"info/global_step": 171, "train_info/time_within_train_step": 27.99712634086609, "step": 171} {"train_info/time_between_train_steps": 0.005408525466918945, "step": 171} {"info/global_step": 172, "train_info/time_within_train_step": 28.066603183746338, "step": 172} {"train_info/time_between_train_steps": 0.0054361820220947266, "step": 172} {"info/global_step": 173, "train_info/time_within_train_step": 27.93461775779724, "step": 173} {"train_info/time_between_train_steps": 0.0051136016845703125, "step": 173} {"info/global_step": 174, "train_info/time_within_train_step": 27.89629817008972, "step": 174} {"train_info/time_between_train_steps": 0.005347490310668945, "step": 174} {"info/global_step": 175, "train_info/time_within_train_step": 27.856720447540283, "step": 175} {"train_info/time_between_train_steps": 0.010079145431518555, "step": 175} {"info/global_step": 176, "train_info/time_within_train_step": 27.869271516799927, "step": 176} {"train_info/time_between_train_steps": 0.00527501106262207, "step": 176} {"info/global_step": 177, "train_info/time_within_train_step": 27.85781955718994, "step": 177} {"train_info/time_between_train_steps": 0.010607481002807617, "step": 177} {"info/global_step": 178, "train_info/time_within_train_step": 27.906853675842285, "step": 178} {"train_info/time_between_train_steps": 0.00543975830078125, "step": 178} {"info/global_step": 179, "train_info/time_within_train_step": 27.887194395065308, "step": 179} {"train_info/time_between_train_steps": 0.005355119705200195, "step": 179} {"info/global_step": 180, "train_info/time_within_train_step": 27.888171195983887, "step": 180} {"train_info/time_between_train_steps": 0.0054438114166259766, "step": 180} {"info/global_step": 181, "train_info/time_within_train_step": 27.87649631500244, "step": 181} {"train_info/time_between_train_steps": 0.005704641342163086, "step": 181} {"info/global_step": 182, "train_info/time_within_train_step": 27.92414164543152, "step": 182} {"train_info/time_between_train_steps": 0.006415843963623047, "step": 182} {"info/global_step": 183, "train_info/time_within_train_step": 27.848407983779907, "step": 183} {"train_info/time_between_train_steps": 0.005649566650390625, "step": 183} {"info/global_step": 184, "train_info/time_within_train_step": 27.884580373764038, "step": 184} {"train_info/time_between_train_steps": 0.01051950454711914, "step": 184} {"info/global_step": 185, "train_info/time_within_train_step": 27.90295720100403, "step": 185} {"train_info/time_between_train_steps": 0.005264759063720703, "step": 185} {"info/global_step": 186, "train_info/time_within_train_step": 27.85777759552002, "step": 186} {"train_info/time_between_train_steps": 0.005407094955444336, "step": 186} {"info/global_step": 187, "train_info/time_within_train_step": 27.923032522201538, "step": 187} {"train_info/time_between_train_steps": 0.006235599517822266, "step": 187} {"info/global_step": 188, "train_info/time_within_train_step": 27.938955068588257, "step": 188} {"train_info/time_between_train_steps": 0.01044011116027832, "step": 188} {"info/global_step": 189, "train_info/time_within_train_step": 27.91809344291687, "step": 189} {"train_info/time_between_train_steps": 0.011632204055786133, "step": 189} {"info/global_step": 190, "train_info/time_within_train_step": 27.87188482284546, "step": 190} {"train_info/time_between_train_steps": 0.006090402603149414, "step": 190} {"info/global_step": 191, "train_info/time_within_train_step": 28.00863265991211, "step": 191} {"train_info/time_between_train_steps": 0.005842447280883789, "step": 191} {"info/global_step": 192, "train_info/time_within_train_step": 27.863271713256836, "step": 192} {"train_info/time_between_train_steps": 0.0059506893157958984, "step": 192} {"train_info/time_between_train_steps": 5.24846625328064, "step": 192} {"info/global_step": 193, "train_info/time_within_train_step": 27.896165370941162, "step": 193} {"train_info/time_between_train_steps": 0.005080223083496094, "step": 193} {"info/global_step": 194, "train_info/time_within_train_step": 27.951216459274292, "step": 194} {"train_info/time_between_train_steps": 0.009551525115966797, "step": 194} {"info/global_step": 195, "train_info/time_within_train_step": 27.889395236968994, "step": 195} {"train_info/time_between_train_steps": 0.009166479110717773, "step": 195} {"info/global_step": 196, "train_info/time_within_train_step": 27.9456467628479, "step": 196} {"train_info/time_between_train_steps": 0.005602598190307617, "step": 196} {"info/global_step": 197, "train_info/time_within_train_step": 27.889535427093506, "step": 197} {"train_info/time_between_train_steps": 0.005179882049560547, "step": 197} {"info/global_step": 198, "train_info/time_within_train_step": 27.810219764709473, "step": 198} {"train_info/time_between_train_steps": 0.0057489871978759766, "step": 198} {"info/global_step": 199, "train_info/time_within_train_step": 27.873029947280884, "step": 199} {"train_info/time_between_train_steps": 0.006817817687988281, "step": 199} {"info/global_step": 200, "train_info/time_within_train_step": 27.90688467025757, "step": 200} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733867327, "_runtime": 5639}, "step": 200} {"logs": {"train/loss": 6.0811, "train/learning_rate": 0.0005555555555555556, "train/epoch": 8.01, "_timestamp": 1733867327, "_runtime": 5639}, "step": 200} {"train_info/time_between_train_steps": 2.4157602787017822, "step": 200} {"info/global_step": 201, "train_info/time_within_train_step": 27.913870573043823, "step": 201} {"train_info/time_between_train_steps": 0.008521795272827148, "step": 201} {"info/global_step": 202, "train_info/time_within_train_step": 27.8715603351593, "step": 202} {"train_info/time_between_train_steps": 0.005393028259277344, "step": 202} {"info/global_step": 203, "train_info/time_within_train_step": 28.006418228149414, "step": 203} {"train_info/time_between_train_steps": 0.006293535232543945, "step": 203} {"info/global_step": 204, "train_info/time_within_train_step": 27.85329794883728, "step": 204} {"train_info/time_between_train_steps": 0.005535125732421875, "step": 204} {"info/global_step": 205, "train_info/time_within_train_step": 27.944677352905273, "step": 205} {"train_info/time_between_train_steps": 0.005331754684448242, "step": 205} {"info/global_step": 206, "train_info/time_within_train_step": 27.834398984909058, "step": 206} {"train_info/time_between_train_steps": 0.005268096923828125, "step": 206} {"info/global_step": 207, "train_info/time_within_train_step": 27.901167154312134, "step": 207} {"train_info/time_between_train_steps": 0.0054318904876708984, "step": 207} {"info/global_step": 208, "train_info/time_within_train_step": 27.914040088653564, "step": 208} {"train_info/time_between_train_steps": 0.005574941635131836, "step": 208} {"info/global_step": 209, "train_info/time_within_train_step": 27.889857292175293, "step": 209} {"train_info/time_between_train_steps": 0.005930423736572266, "step": 209} {"info/global_step": 210, "train_info/time_within_train_step": 27.902791023254395, "step": 210} {"train_info/time_between_train_steps": 0.005293369293212891, "step": 210} {"info/global_step": 211, "train_info/time_within_train_step": 27.893150568008423, "step": 211} {"train_info/time_between_train_steps": 0.00590062141418457, "step": 211} {"info/global_step": 212, "train_info/time_within_train_step": 27.991011142730713, "step": 212} {"train_info/time_between_train_steps": 0.005436420440673828, "step": 212} {"info/global_step": 213, "train_info/time_within_train_step": 27.91648769378662, "step": 213} {"train_info/time_between_train_steps": 0.0063343048095703125, "step": 213} {"info/global_step": 214, "train_info/time_within_train_step": 27.953208208084106, "step": 214} {"train_info/time_between_train_steps": 0.005563259124755859, "step": 214} {"info/global_step": 215, "train_info/time_within_train_step": 27.94828987121582, "step": 215} {"train_info/time_between_train_steps": 0.005845069885253906, "step": 215} {"info/global_step": 216, "train_info/time_within_train_step": 27.971690893173218, "step": 216} {"train_info/time_between_train_steps": 0.011038780212402344, "step": 216} {"train_info/time_between_train_steps": 5.599370718002319, "step": 216} {"info/global_step": 217, "train_info/time_within_train_step": 27.882237911224365, "step": 217} {"train_info/time_between_train_steps": 0.0056307315826416016, "step": 217} {"info/global_step": 218, "train_info/time_within_train_step": 28.080852031707764, "step": 218} {"train_info/time_between_train_steps": 0.005543231964111328, "step": 218} {"info/global_step": 219, "train_info/time_within_train_step": 28.04484510421753, "step": 219} {"train_info/time_between_train_steps": 0.0054781436920166016, "step": 219} {"info/global_step": 220, "train_info/time_within_train_step": 27.982690811157227, "step": 220} {"train_info/time_between_train_steps": 0.0056610107421875, "step": 220} {"info/global_step": 221, "train_info/time_within_train_step": 28.064523458480835, "step": 221} {"train_info/time_between_train_steps": 0.010109663009643555, "step": 221} {"info/global_step": 222, "train_info/time_within_train_step": 27.929218769073486, "step": 222} {"train_info/time_between_train_steps": 0.005980253219604492, "step": 222} {"info/global_step": 223, "train_info/time_within_train_step": 27.86570954322815, "step": 223} {"train_info/time_between_train_steps": 0.0056438446044921875, "step": 223} {"info/global_step": 224, "train_info/time_within_train_step": 27.89176082611084, "step": 224} {"train_info/time_between_train_steps": 0.005543708801269531, "step": 224} {"info/global_step": 225, "train_info/time_within_train_step": 27.87575364112854, "step": 225} {"train_info/time_between_train_steps": 0.006125926971435547, "step": 225} {"info/global_step": 226, "train_info/time_within_train_step": 27.8488667011261, "step": 226} {"train_info/time_between_train_steps": 0.010565042495727539, "step": 226} {"info/global_step": 227, "train_info/time_within_train_step": 27.90395975112915, "step": 227} {"train_info/time_between_train_steps": 0.0054781436920166016, "step": 227} {"info/global_step": 228, "train_info/time_within_train_step": 27.926060676574707, "step": 228} {"train_info/time_between_train_steps": 0.010333061218261719, "step": 228} {"info/global_step": 229, "train_info/time_within_train_step": 27.90238070487976, "step": 229} {"train_info/time_between_train_steps": 0.00576019287109375, "step": 229} {"info/global_step": 230, "train_info/time_within_train_step": 27.89388680458069, "step": 230} {"train_info/time_between_train_steps": 0.010326862335205078, "step": 230} {"info/global_step": 231, "train_info/time_within_train_step": 27.941290855407715, "step": 231} {"train_info/time_between_train_steps": 0.00861978530883789, "step": 231} {"info/global_step": 232, "train_info/time_within_train_step": 27.88461947441101, "step": 232} {"train_info/time_between_train_steps": 0.005505561828613281, "step": 232} {"info/global_step": 233, "train_info/time_within_train_step": 27.934995651245117, "step": 233} {"train_info/time_between_train_steps": 0.005434751510620117, "step": 233} {"info/global_step": 234, "train_info/time_within_train_step": 27.97720956802368, "step": 234} {"train_info/time_between_train_steps": 0.010189294815063477, "step": 234} {"info/global_step": 235, "train_info/time_within_train_step": 27.927281141281128, "step": 235} {"train_info/time_between_train_steps": 0.005486249923706055, "step": 235} {"info/global_step": 236, "train_info/time_within_train_step": 27.921709537506104, "step": 236} {"train_info/time_between_train_steps": 0.010803699493408203, "step": 236} {"info/global_step": 237, "train_info/time_within_train_step": 27.98872399330139, "step": 237} {"train_info/time_between_train_steps": 0.00561976432800293, "step": 237} {"info/global_step": 238, "train_info/time_within_train_step": 27.91378140449524, "step": 238} {"train_info/time_between_train_steps": 0.005858182907104492, "step": 238} {"info/global_step": 239, "train_info/time_within_train_step": 27.92412781715393, "step": 239} {"train_info/time_between_train_steps": 0.0060274600982666016, "step": 239} {"info/global_step": 240, "train_info/time_within_train_step": 27.998769283294678, "step": 240} {"train_info/time_between_train_steps": 0.0061016082763671875, "step": 240} {"train_info/time_between_train_steps": 5.345746040344238, "step": 240} {"info/global_step": 241, "train_info/time_within_train_step": 27.91753911972046, "step": 241} {"train_info/time_between_train_steps": 0.010732173919677734, "step": 241} {"info/global_step": 242, "train_info/time_within_train_step": 28.116531372070312, "step": 242} {"train_info/time_between_train_steps": 0.00556635856628418, "step": 242} {"info/global_step": 243, "train_info/time_within_train_step": 27.874912977218628, "step": 243} {"train_info/time_between_train_steps": 0.005785226821899414, "step": 243} {"info/global_step": 244, "train_info/time_within_train_step": 28.001402139663696, "step": 244} {"train_info/time_between_train_steps": 0.005778074264526367, "step": 244} {"info/global_step": 245, "train_info/time_within_train_step": 27.85223364830017, "step": 245} {"train_info/time_between_train_steps": 0.0052225589752197266, "step": 245} {"info/global_step": 246, "train_info/time_within_train_step": 27.893455028533936, "step": 246} {"train_info/time_between_train_steps": 0.005319356918334961, "step": 246} {"info/global_step": 247, "train_info/time_within_train_step": 27.843024015426636, "step": 247} {"train_info/time_between_train_steps": 0.010188102722167969, "step": 247} {"info/global_step": 248, "train_info/time_within_train_step": 27.96091866493225, "step": 248} {"train_info/time_between_train_steps": 0.005468606948852539, "step": 248} {"info/global_step": 249, "train_info/time_within_train_step": 27.842076539993286, "step": 249} {"train_info/time_between_train_steps": 0.005692481994628906, "step": 249} {"info/global_step": 250, "train_info/time_within_train_step": 28.08454203605652, "step": 250} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733868737, "_runtime": 7049}, "step": 250} {"logs": {"train/loss": 5.6744, "train/learning_rate": 0.0005277777777777777, "train/epoch": 10.01, "_timestamp": 1733868737, "_runtime": 7049}, "step": 250} {"train_info/time_between_train_steps": 0.01365041732788086, "step": 250} {"info/global_step": 251, "train_info/time_within_train_step": 27.859680891036987, "step": 251} {"train_info/time_between_train_steps": 0.010239839553833008, "step": 251} {"info/global_step": 252, "train_info/time_within_train_step": 27.83976650238037, "step": 252} {"train_info/time_between_train_steps": 0.009843587875366211, "step": 252} {"info/global_step": 253, "train_info/time_within_train_step": 27.933988332748413, "step": 253} {"train_info/time_between_train_steps": 0.005249977111816406, "step": 253} {"info/global_step": 254, "train_info/time_within_train_step": 27.869959592819214, "step": 254} {"train_info/time_between_train_steps": 0.005375385284423828, "step": 254} {"info/global_step": 255, "train_info/time_within_train_step": 27.89018225669861, "step": 255} {"train_info/time_between_train_steps": 0.005431413650512695, "step": 255} {"info/global_step": 256, "train_info/time_within_train_step": 27.85981273651123, "step": 256} {"train_info/time_between_train_steps": 0.005416393280029297, "step": 256} {"info/global_step": 257, "train_info/time_within_train_step": 27.983348846435547, "step": 257} {"train_info/time_between_train_steps": 0.005534172058105469, "step": 257} {"info/global_step": 258, "train_info/time_within_train_step": 27.955776691436768, "step": 258} {"train_info/time_between_train_steps": 0.009979248046875, "step": 258} {"info/global_step": 259, "train_info/time_within_train_step": 27.934094190597534, "step": 259} {"train_info/time_between_train_steps": 0.005521535873413086, "step": 259} {"info/global_step": 260, "train_info/time_within_train_step": 27.861037731170654, "step": 260} {"train_info/time_between_train_steps": 0.005658864974975586, "step": 260} {"info/global_step": 261, "train_info/time_within_train_step": 27.95903754234314, "step": 261} {"train_info/time_between_train_steps": 0.00575709342956543, "step": 261} {"info/global_step": 262, "train_info/time_within_train_step": 27.888697147369385, "step": 262} {"train_info/time_between_train_steps": 0.010955572128295898, "step": 262} {"info/global_step": 263, "train_info/time_within_train_step": 27.937700033187866, "step": 263} {"train_info/time_between_train_steps": 0.00578761100769043, "step": 263} {"info/global_step": 264, "train_info/time_within_train_step": 27.888998985290527, "step": 264} {"train_info/time_between_train_steps": 0.006703853607177734, "step": 264} {"train_info/time_between_train_steps": 5.412487506866455, "step": 264} {"info/global_step": 265, "train_info/time_within_train_step": 33.5150728225708, "step": 265} {"train_info/time_between_train_steps": 0.005140781402587891, "step": 265} {"info/global_step": 266, "train_info/time_within_train_step": 54.9160692691803, "step": 266} {"train_info/time_between_train_steps": 0.005522012710571289, "step": 266} {"info/global_step": 267, "train_info/time_within_train_step": 54.870261669158936, "step": 267} {"train_info/time_between_train_steps": 0.00984954833984375, "step": 267} {"info/global_step": 268, "train_info/time_within_train_step": 54.62228012084961, "step": 268} {"train_info/time_between_train_steps": 0.005709648132324219, "step": 268} {"info/global_step": 269, "train_info/time_within_train_step": 54.72721862792969, "step": 269} {"train_info/time_between_train_steps": 0.012401103973388672, "step": 269} {"info/global_step": 270, "train_info/time_within_train_step": 54.54993009567261, "step": 270} {"train_info/time_between_train_steps": 0.0053937435150146484, "step": 270} {"info/global_step": 271, "train_info/time_within_train_step": 54.4993531703949, "step": 271} {"train_info/time_between_train_steps": 0.010281085968017578, "step": 271} {"info/global_step": 272, "train_info/time_within_train_step": 54.74463629722595, "step": 272} {"train_info/time_between_train_steps": 0.00545048713684082, "step": 272} {"info/global_step": 273, "train_info/time_within_train_step": 54.677117109298706, "step": 273} {"train_info/time_between_train_steps": 0.007695198059082031, "step": 273} {"info/global_step": 274, "train_info/time_within_train_step": 54.71284222602844, "step": 274} {"train_info/time_between_train_steps": 0.015003204345703125, "step": 274} {"info/global_step": 275, "train_info/time_within_train_step": 54.5838348865509, "step": 275} {"train_info/time_between_train_steps": 0.006484031677246094, "step": 275} {"info/global_step": 276, "train_info/time_within_train_step": 54.64979910850525, "step": 276} {"train_info/time_between_train_steps": 0.006408214569091797, "step": 276} {"info/global_step": 277, "train_info/time_within_train_step": 47.28894925117493, "step": 277} {"train_info/time_between_train_steps": 0.005303621292114258, "step": 277} {"info/global_step": 278, "train_info/time_within_train_step": 27.888726472854614, "step": 278} {"train_info/time_between_train_steps": 0.005271196365356445, "step": 278} {"info/global_step": 279, "train_info/time_within_train_step": 27.842493772506714, "step": 279} {"train_info/time_between_train_steps": 0.007112026214599609, "step": 279} {"info/global_step": 280, "train_info/time_within_train_step": 27.91629123687744, "step": 280} {"train_info/time_between_train_steps": 0.005514621734619141, "step": 280} {"info/global_step": 281, "train_info/time_within_train_step": 27.94734501838684, "step": 281} {"train_info/time_between_train_steps": 0.005294322967529297, "step": 281} {"info/global_step": 282, "train_info/time_within_train_step": 27.8762469291687, "step": 282} {"train_info/time_between_train_steps": 0.0058727264404296875, "step": 282} {"info/global_step": 283, "train_info/time_within_train_step": 27.92640209197998, "step": 283} {"train_info/time_between_train_steps": 0.005160808563232422, "step": 283} {"info/global_step": 284, "train_info/time_within_train_step": 27.910324096679688, "step": 284} {"train_info/time_between_train_steps": 0.006075859069824219, "step": 284} {"info/global_step": 285, "train_info/time_within_train_step": 27.867588996887207, "step": 285} {"train_info/time_between_train_steps": 0.01023721694946289, "step": 285} {"info/global_step": 286, "train_info/time_within_train_step": 27.858565092086792, "step": 286} {"train_info/time_between_train_steps": 0.010214090347290039, "step": 286} {"info/global_step": 287, "train_info/time_within_train_step": 32.92755913734436, "step": 287} {"train_info/time_between_train_steps": 0.005651950836181641, "step": 287} {"info/global_step": 288, "train_info/time_within_train_step": 54.19832730293274, "step": 288} {"train_info/time_between_train_steps": 0.010259389877319336, "step": 288} {"train_info/time_between_train_steps": 7.2443788051605225, "step": 288} {"info/global_step": 289, "train_info/time_within_train_step": 54.14817786216736, "step": 289} {"train_info/time_between_train_steps": 0.005767107009887695, "step": 289} {"info/global_step": 290, "train_info/time_within_train_step": 54.397077560424805, "step": 290} {"train_info/time_between_train_steps": 0.0055849552154541016, "step": 290} {"info/global_step": 291, "train_info/time_within_train_step": 54.23816776275635, "step": 291} {"train_info/time_between_train_steps": 0.005911350250244141, "step": 291} {"info/global_step": 292, "train_info/time_within_train_step": 54.19840908050537, "step": 292} {"train_info/time_between_train_steps": 0.010102272033691406, "step": 292} {"info/global_step": 293, "train_info/time_within_train_step": 54.2811074256897, "step": 293} {"train_info/time_between_train_steps": 0.005193233489990234, "step": 293} {"info/global_step": 294, "train_info/time_within_train_step": 54.43468976020813, "step": 294} {"train_info/time_between_train_steps": 0.010524272918701172, "step": 294} {"info/global_step": 295, "train_info/time_within_train_step": 54.253355503082275, "step": 295} {"train_info/time_between_train_steps": 0.01051020622253418, "step": 295} {"info/global_step": 296, "train_info/time_within_train_step": 55.04879403114319, "step": 296} {"train_info/time_between_train_steps": 0.00558018684387207, "step": 296} {"info/global_step": 297, "train_info/time_within_train_step": 54.34609532356262, "step": 297} {"train_info/time_between_train_steps": 0.005360603332519531, "step": 297} {"info/global_step": 298, "train_info/time_within_train_step": 54.577178716659546, "step": 298} {"train_info/time_between_train_steps": 0.010412216186523438, "step": 298} {"info/global_step": 299, "train_info/time_within_train_step": 45.98192262649536, "step": 299} {"train_info/time_between_train_steps": 0.005329608917236328, "step": 299} {"info/global_step": 300, "train_info/time_within_train_step": 27.815983295440674, "step": 300} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733870779, "_runtime": 9091}, "step": 300} {"logs": {"train/loss": 5.4147, "train/learning_rate": 0.0005, "train/epoch": 12.01, "_timestamp": 1733870779, "_runtime": 9091}, "step": 300} {"train_info/time_between_train_steps": 2.4862406253814697, "step": 300} {"info/global_step": 301, "train_info/time_within_train_step": 27.95231795310974, "step": 301} {"train_info/time_between_train_steps": 0.010192155838012695, "step": 301} {"info/global_step": 302, "train_info/time_within_train_step": 27.912920236587524, "step": 302} {"train_info/time_between_train_steps": 0.009202241897583008, "step": 302} {"info/global_step": 303, "train_info/time_within_train_step": 27.942954063415527, "step": 303} {"train_info/time_between_train_steps": 0.00543522834777832, "step": 303} {"info/global_step": 304, "train_info/time_within_train_step": 27.916218042373657, "step": 304} {"train_info/time_between_train_steps": 0.0053865909576416016, "step": 304} {"info/global_step": 305, "train_info/time_within_train_step": 27.97864031791687, "step": 305} {"train_info/time_between_train_steps": 0.005716085433959961, "step": 305} {"info/global_step": 306, "train_info/time_within_train_step": 27.850365161895752, "step": 306} {"train_info/time_between_train_steps": 0.0052754878997802734, "step": 306} {"info/global_step": 307, "train_info/time_within_train_step": 27.87501049041748, "step": 307} {"train_info/time_between_train_steps": 0.005446195602416992, "step": 307} {"info/global_step": 308, "train_info/time_within_train_step": 27.890231132507324, "step": 308} {"train_info/time_between_train_steps": 0.009997129440307617, "step": 308} {"info/global_step": 309, "train_info/time_within_train_step": 27.950765371322632, "step": 309} {"train_info/time_between_train_steps": 0.0058116912841796875, "step": 309} {"info/global_step": 310, "train_info/time_within_train_step": 27.922719478607178, "step": 310} {"train_info/time_between_train_steps": 0.011106729507446289, "step": 310} {"info/global_step": 311, "train_info/time_within_train_step": 27.96547031402588, "step": 311} {"train_info/time_between_train_steps": 0.0059015750885009766, "step": 311} {"info/global_step": 312, "train_info/time_within_train_step": 28.105748414993286, "step": 312} {"train_info/time_between_train_steps": 0.006141185760498047, "step": 312} {"train_info/time_between_train_steps": 5.200135707855225, "step": 312} {"info/global_step": 313, "train_info/time_within_train_step": 27.94357967376709, "step": 313} {"train_info/time_between_train_steps": 0.006500959396362305, "step": 313} {"info/global_step": 314, "train_info/time_within_train_step": 28.057218074798584, "step": 314} {"train_info/time_between_train_steps": 0.010511398315429688, "step": 314} {"info/global_step": 315, "train_info/time_within_train_step": 27.940613746643066, "step": 315} {"train_info/time_between_train_steps": 0.005811929702758789, "step": 315} {"info/global_step": 316, "train_info/time_within_train_step": 28.0390043258667, "step": 316} {"train_info/time_between_train_steps": 0.009774208068847656, "step": 316} {"info/global_step": 317, "train_info/time_within_train_step": 27.88076138496399, "step": 317} {"train_info/time_between_train_steps": 0.0052258968353271484, "step": 317} {"info/global_step": 318, "train_info/time_within_train_step": 28.030539751052856, "step": 318} {"train_info/time_between_train_steps": 0.014481306076049805, "step": 318} {"info/global_step": 319, "train_info/time_within_train_step": 27.872583627700806, "step": 319} {"train_info/time_between_train_steps": 0.005280971527099609, "step": 319} {"info/global_step": 320, "train_info/time_within_train_step": 27.928632259368896, "step": 320} {"train_info/time_between_train_steps": 0.007923364639282227, "step": 320} {"info/global_step": 321, "train_info/time_within_train_step": 27.86077070236206, "step": 321} {"train_info/time_between_train_steps": 0.005402565002441406, "step": 321} {"info/global_step": 322, "train_info/time_within_train_step": 27.893105030059814, "step": 322} {"train_info/time_between_train_steps": 0.00884556770324707, "step": 322} {"info/global_step": 323, "train_info/time_within_train_step": 27.911871194839478, "step": 323} {"train_info/time_between_train_steps": 0.013902902603149414, "step": 323} {"info/global_step": 324, "train_info/time_within_train_step": 28.014004230499268, "step": 324} {"train_info/time_between_train_steps": 0.014440536499023438, "step": 324} {"info/global_step": 325, "train_info/time_within_train_step": 27.917236328125, "step": 325} {"train_info/time_between_train_steps": 0.013857603073120117, "step": 325} {"info/global_step": 326, "train_info/time_within_train_step": 27.988632917404175, "step": 326} {"train_info/time_between_train_steps": 0.005274772644042969, "step": 326} {"info/global_step": 327, "train_info/time_within_train_step": 27.926281213760376, "step": 327} {"train_info/time_between_train_steps": 0.0054438114166259766, "step": 327} {"info/global_step": 328, "train_info/time_within_train_step": 28.04514455795288, "step": 328} {"train_info/time_between_train_steps": 0.009557247161865234, "step": 328} {"info/global_step": 329, "train_info/time_within_train_step": 27.916889190673828, "step": 329} {"train_info/time_between_train_steps": 0.005468606948852539, "step": 329} {"info/global_step": 330, "train_info/time_within_train_step": 27.922077894210815, "step": 330} {"train_info/time_between_train_steps": 0.005370616912841797, "step": 330} {"info/global_step": 331, "train_info/time_within_train_step": 27.923028230667114, "step": 331} {"train_info/time_between_train_steps": 0.010865926742553711, "step": 331} {"info/global_step": 332, "train_info/time_within_train_step": 27.8688805103302, "step": 332} {"train_info/time_between_train_steps": 0.0054285526275634766, "step": 332} {"info/global_step": 333, "train_info/time_within_train_step": 27.93871521949768, "step": 333} {"train_info/time_between_train_steps": 0.005581378936767578, "step": 333} {"info/global_step": 334, "train_info/time_within_train_step": 27.96034002304077, "step": 334} {"train_info/time_between_train_steps": 0.005595684051513672, "step": 334} {"info/global_step": 335, "train_info/time_within_train_step": 27.929439783096313, "step": 335} {"train_info/time_between_train_steps": 0.010567903518676758, "step": 335} {"info/global_step": 336, "train_info/time_within_train_step": 27.92082953453064, "step": 336} {"train_info/time_between_train_steps": 0.005933046340942383, "step": 336} {"train_info/time_between_train_steps": 5.33640193939209, "step": 336} {"info/global_step": 337, "train_info/time_within_train_step": 27.91355299949646, "step": 337} {"train_info/time_between_train_steps": 0.0051305294036865234, "step": 337} {"info/global_step": 338, "train_info/time_within_train_step": 28.06067657470703, "step": 338} {"train_info/time_between_train_steps": 0.005434274673461914, "step": 338} {"info/global_step": 339, "train_info/time_within_train_step": 27.965662717819214, "step": 339} {"train_info/time_between_train_steps": 0.010189056396484375, "step": 339} {"info/global_step": 340, "train_info/time_within_train_step": 27.946305751800537, "step": 340} {"train_info/time_between_train_steps": 0.0054225921630859375, "step": 340} {"info/global_step": 341, "train_info/time_within_train_step": 27.912734270095825, "step": 341} {"train_info/time_between_train_steps": 0.005174875259399414, "step": 341} {"info/global_step": 342, "train_info/time_within_train_step": 27.81847834587097, "step": 342} {"train_info/time_between_train_steps": 0.010183334350585938, "step": 342} {"info/global_step": 343, "train_info/time_within_train_step": 27.983673810958862, "step": 343} {"train_info/time_between_train_steps": 0.0051190853118896484, "step": 343} {"info/global_step": 344, "train_info/time_within_train_step": 27.842815160751343, "step": 344} {"train_info/time_between_train_steps": 0.005388736724853516, "step": 344} {"info/global_step": 345, "train_info/time_within_train_step": 27.87504506111145, "step": 345} {"train_info/time_between_train_steps": 0.00942540168762207, "step": 345} {"info/global_step": 346, "train_info/time_within_train_step": 27.853031396865845, "step": 346} {"train_info/time_between_train_steps": 0.00800943374633789, "step": 346} {"info/global_step": 347, "train_info/time_within_train_step": 27.878655910491943, "step": 347} {"train_info/time_between_train_steps": 0.005389213562011719, "step": 347} {"info/global_step": 348, "train_info/time_within_train_step": 27.876102685928345, "step": 348} {"train_info/time_between_train_steps": 0.010813713073730469, "step": 348} {"info/global_step": 349, "train_info/time_within_train_step": 27.9240505695343, "step": 349} {"train_info/time_between_train_steps": 0.005380392074584961, "step": 349} {"info/global_step": 350, "train_info/time_within_train_step": 27.859062433242798, "step": 350} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733872189, "_runtime": 10501}, "step": 350} {"logs": {"train/loss": 5.246, "train/learning_rate": 0.00047222222222222224, "train/epoch": 14.01, "_timestamp": 1733872189, "_runtime": 10501}, "step": 350} {"train_info/time_between_train_steps": 0.0072078704833984375, "step": 350} {"info/global_step": 351, "train_info/time_within_train_step": 27.838289260864258, "step": 351} {"train_info/time_between_train_steps": 0.006203889846801758, "step": 351} {"info/global_step": 352, "train_info/time_within_train_step": 27.94213056564331, "step": 352} {"train_info/time_between_train_steps": 0.00999140739440918, "step": 352} {"info/global_step": 353, "train_info/time_within_train_step": 27.85683512687683, "step": 353} {"train_info/time_between_train_steps": 0.005193948745727539, "step": 353} {"info/global_step": 354, "train_info/time_within_train_step": 27.94767117500305, "step": 354} {"train_info/time_between_train_steps": 0.00541377067565918, "step": 354} {"info/global_step": 355, "train_info/time_within_train_step": 27.84339213371277, "step": 355} {"train_info/time_between_train_steps": 0.005814790725708008, "step": 355} {"info/global_step": 356, "train_info/time_within_train_step": 27.874053716659546, "step": 356} {"train_info/time_between_train_steps": 0.0056629180908203125, "step": 356} {"info/global_step": 357, "train_info/time_within_train_step": 27.891692399978638, "step": 357} {"train_info/time_between_train_steps": 0.005610942840576172, "step": 357} {"info/global_step": 358, "train_info/time_within_train_step": 27.927151679992676, "step": 358} {"train_info/time_between_train_steps": 0.006050586700439453, "step": 358} {"info/global_step": 359, "train_info/time_within_train_step": 28.016385078430176, "step": 359} {"train_info/time_between_train_steps": 0.005617856979370117, "step": 359} {"info/global_step": 360, "train_info/time_within_train_step": 27.848596572875977, "step": 360} {"train_info/time_between_train_steps": 0.0060024261474609375, "step": 360} {"train_info/time_between_train_steps": 5.487926959991455, "step": 360} {"info/global_step": 361, "train_info/time_within_train_step": 27.910669088363647, "step": 361} {"train_info/time_between_train_steps": 0.010767936706542969, "step": 361} {"info/global_step": 362, "train_info/time_within_train_step": 28.05900502204895, "step": 362} {"train_info/time_between_train_steps": 0.005725383758544922, "step": 362} {"info/global_step": 363, "train_info/time_within_train_step": 27.927067756652832, "step": 363} {"train_info/time_between_train_steps": 0.0055768489837646484, "step": 363} {"info/global_step": 364, "train_info/time_within_train_step": 27.906662464141846, "step": 364} {"train_info/time_between_train_steps": 0.005615234375, "step": 364} {"info/global_step": 365, "train_info/time_within_train_step": 28.010314226150513, "step": 365} {"train_info/time_between_train_steps": 0.014490604400634766, "step": 365} {"info/global_step": 366, "train_info/time_within_train_step": 27.816113233566284, "step": 366} {"train_info/time_between_train_steps": 0.005274772644042969, "step": 366} {"info/global_step": 367, "train_info/time_within_train_step": 27.923080921173096, "step": 367} {"train_info/time_between_train_steps": 0.009685516357421875, "step": 367} {"info/global_step": 368, "train_info/time_within_train_step": 27.908674001693726, "step": 368} {"train_info/time_between_train_steps": 0.010564327239990234, "step": 368} {"info/global_step": 369, "train_info/time_within_train_step": 27.894200086593628, "step": 369} {"train_info/time_between_train_steps": 0.005381107330322266, "step": 369} {"info/global_step": 370, "train_info/time_within_train_step": 27.835965156555176, "step": 370} {"train_info/time_between_train_steps": 0.005221366882324219, "step": 370} {"info/global_step": 371, "train_info/time_within_train_step": 27.866164684295654, "step": 371} {"train_info/time_between_train_steps": 0.005327701568603516, "step": 371} {"info/global_step": 372, "train_info/time_within_train_step": 27.922224044799805, "step": 372} {"train_info/time_between_train_steps": 0.005484104156494141, "step": 372} {"info/global_step": 373, "train_info/time_within_train_step": 27.93669080734253, "step": 373} {"train_info/time_between_train_steps": 0.005464792251586914, "step": 373} {"info/global_step": 374, "train_info/time_within_train_step": 27.982857704162598, "step": 374} {"train_info/time_between_train_steps": 0.010157108306884766, "step": 374} {"info/global_step": 375, "train_info/time_within_train_step": 27.819478511810303, "step": 375} {"train_info/time_between_train_steps": 0.008983850479125977, "step": 375} {"info/global_step": 376, "train_info/time_within_train_step": 27.968738079071045, "step": 376} {"train_info/time_between_train_steps": 0.005590677261352539, "step": 376} {"info/global_step": 377, "train_info/time_within_train_step": 27.891096115112305, "step": 377} {"train_info/time_between_train_steps": 0.005487203598022461, "step": 377} {"info/global_step": 378, "train_info/time_within_train_step": 27.92504358291626, "step": 378} {"train_info/time_between_train_steps": 0.0057337284088134766, "step": 378} {"info/global_step": 379, "train_info/time_within_train_step": 27.873619079589844, "step": 379} {"train_info/time_between_train_steps": 0.005158662796020508, "step": 379} {"info/global_step": 380, "train_info/time_within_train_step": 27.91353416442871, "step": 380} {"train_info/time_between_train_steps": 0.00658416748046875, "step": 380} {"info/global_step": 381, "train_info/time_within_train_step": 27.88924789428711, "step": 381} {"train_info/time_between_train_steps": 0.005296468734741211, "step": 381} {"info/global_step": 382, "train_info/time_within_train_step": 27.89810347557068, "step": 382} {"train_info/time_between_train_steps": 0.005716085433959961, "step": 382} {"info/global_step": 383, "train_info/time_within_train_step": 27.965447425842285, "step": 383} {"train_info/time_between_train_steps": 0.015073299407958984, "step": 383} {"info/global_step": 384, "train_info/time_within_train_step": 27.93622589111328, "step": 384} {"train_info/time_between_train_steps": 0.010890483856201172, "step": 384} {"train_info/time_between_train_steps": 5.232351064682007, "step": 384} {"info/global_step": 385, "train_info/time_within_train_step": 27.88042116165161, "step": 385} {"train_info/time_between_train_steps": 0.005445241928100586, "step": 385} {"info/global_step": 386, "train_info/time_within_train_step": 28.035608053207397, "step": 386} {"train_info/time_between_train_steps": 0.010398387908935547, "step": 386} {"info/global_step": 387, "train_info/time_within_train_step": 27.923914670944214, "step": 387} {"train_info/time_between_train_steps": 0.00563359260559082, "step": 387} {"info/global_step": 388, "train_info/time_within_train_step": 27.99910283088684, "step": 388} {"train_info/time_between_train_steps": 0.005629777908325195, "step": 388} {"info/global_step": 389, "train_info/time_within_train_step": 27.885318994522095, "step": 389} {"train_info/time_between_train_steps": 0.005276679992675781, "step": 389} {"info/global_step": 390, "train_info/time_within_train_step": 27.94597625732422, "step": 390} {"train_info/time_between_train_steps": 0.005300760269165039, "step": 390} {"info/global_step": 391, "train_info/time_within_train_step": 27.91901183128357, "step": 391} {"train_info/time_between_train_steps": 0.0051059722900390625, "step": 391} {"info/global_step": 392, "train_info/time_within_train_step": 27.922277688980103, "step": 392} {"train_info/time_between_train_steps": 0.010256052017211914, "step": 392} {"info/global_step": 393, "train_info/time_within_train_step": 27.946816444396973, "step": 393} {"train_info/time_between_train_steps": 0.005426645278930664, "step": 393} {"info/global_step": 394, "train_info/time_within_train_step": 27.813148260116577, "step": 394} {"train_info/time_between_train_steps": 0.005214691162109375, "step": 394} {"info/global_step": 395, "train_info/time_within_train_step": 28.031450510025024, "step": 395} {"train_info/time_between_train_steps": 0.010218620300292969, "step": 395} {"info/global_step": 396, "train_info/time_within_train_step": 27.832324743270874, "step": 396} {"train_info/time_between_train_steps": 0.005281686782836914, "step": 396} {"info/global_step": 397, "train_info/time_within_train_step": 27.890445232391357, "step": 397} {"train_info/time_between_train_steps": 0.005423545837402344, "step": 397} {"info/global_step": 398, "train_info/time_within_train_step": 27.870547771453857, "step": 398} {"train_info/time_between_train_steps": 0.00529170036315918, "step": 398} {"info/global_step": 399, "train_info/time_within_train_step": 27.923609733581543, "step": 399} {"train_info/time_between_train_steps": 0.006553173065185547, "step": 399} {"info/global_step": 400, "train_info/time_within_train_step": 27.91495633125305, "step": 400} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733873596, "_runtime": 11908}, "step": 400} {"logs": {"train/loss": 5.1141, "train/learning_rate": 0.00044444444444444436, "train/epoch": 16.01, "_timestamp": 1733873596, "_runtime": 11908}, "step": 400} {"train_info/time_between_train_steps": 2.3100426197052, "step": 400} {"info/global_step": 401, "train_info/time_within_train_step": 27.960118770599365, "step": 401} {"train_info/time_between_train_steps": 0.010901212692260742, "step": 401} {"info/global_step": 402, "train_info/time_within_train_step": 27.82571816444397, "step": 402} {"train_info/time_between_train_steps": 0.005398988723754883, "step": 402} {"info/global_step": 403, "train_info/time_within_train_step": 27.9453444480896, "step": 403} {"train_info/time_between_train_steps": 0.01426243782043457, "step": 403} {"info/global_step": 404, "train_info/time_within_train_step": 27.875283002853394, "step": 404} {"train_info/time_between_train_steps": 0.005678892135620117, "step": 404} {"info/global_step": 405, "train_info/time_within_train_step": 27.934632062911987, "step": 405} {"train_info/time_between_train_steps": 0.005330562591552734, "step": 405} {"info/global_step": 406, "train_info/time_within_train_step": 27.880878925323486, "step": 406} {"train_info/time_between_train_steps": 0.005694866180419922, "step": 406} {"info/global_step": 407, "train_info/time_within_train_step": 27.85265612602234, "step": 407} {"train_info/time_between_train_steps": 0.005730152130126953, "step": 407} {"info/global_step": 408, "train_info/time_within_train_step": 27.920149087905884, "step": 408} {"train_info/time_between_train_steps": 0.006062984466552734, "step": 408} {"train_info/time_between_train_steps": 5.215541124343872, "step": 408} {"info/global_step": 409, "train_info/time_within_train_step": 27.87403392791748, "step": 409} {"train_info/time_between_train_steps": 0.010165929794311523, "step": 409} {"info/global_step": 410, "train_info/time_within_train_step": 28.105641841888428, "step": 410} {"train_info/time_between_train_steps": 0.005406618118286133, "step": 410} {"info/global_step": 411, "train_info/time_within_train_step": 27.8521511554718, "step": 411} {"train_info/time_between_train_steps": 0.00648951530456543, "step": 411} {"info/global_step": 412, "train_info/time_within_train_step": 28.015289783477783, "step": 412} {"train_info/time_between_train_steps": 0.005639076232910156, "step": 412} {"info/global_step": 413, "train_info/time_within_train_step": 27.95787477493286, "step": 413} {"train_info/time_between_train_steps": 0.014213323593139648, "step": 413} {"info/global_step": 414, "train_info/time_within_train_step": 27.87571358680725, "step": 414} {"train_info/time_between_train_steps": 0.005636930465698242, "step": 414} {"info/global_step": 415, "train_info/time_within_train_step": 27.94058871269226, "step": 415} {"train_info/time_between_train_steps": 0.005146503448486328, "step": 415} {"info/global_step": 416, "train_info/time_within_train_step": 27.896914958953857, "step": 416} {"train_info/time_between_train_steps": 0.00959634780883789, "step": 416} {"info/global_step": 417, "train_info/time_within_train_step": 27.883610725402832, "step": 417} {"train_info/time_between_train_steps": 0.005218029022216797, "step": 417} {"info/global_step": 418, "train_info/time_within_train_step": 27.903810024261475, "step": 418} {"train_info/time_between_train_steps": 0.005398750305175781, "step": 418} {"info/global_step": 419, "train_info/time_within_train_step": 27.812946796417236, "step": 419} {"train_info/time_between_train_steps": 0.01419520378112793, "step": 419} {"info/global_step": 420, "train_info/time_within_train_step": 27.90622115135193, "step": 420} {"train_info/time_between_train_steps": 0.0100860595703125, "step": 420} {"info/global_step": 421, "train_info/time_within_train_step": 28.07691717147827, "step": 421} {"train_info/time_between_train_steps": 0.013910293579101562, "step": 421} {"info/global_step": 422, "train_info/time_within_train_step": 27.86402177810669, "step": 422} {"train_info/time_between_train_steps": 0.010456085205078125, "step": 422} {"info/global_step": 423, "train_info/time_within_train_step": 27.864712238311768, "step": 423} {"train_info/time_between_train_steps": 0.005240917205810547, "step": 423} {"info/global_step": 424, "train_info/time_within_train_step": 27.85373544692993, "step": 424} {"train_info/time_between_train_steps": 0.00566411018371582, "step": 424} {"info/global_step": 425, "train_info/time_within_train_step": 27.910603523254395, "step": 425} {"train_info/time_between_train_steps": 0.010902881622314453, "step": 425} {"info/global_step": 426, "train_info/time_within_train_step": 27.866512775421143, "step": 426} {"train_info/time_between_train_steps": 0.005379438400268555, "step": 426} {"info/global_step": 427, "train_info/time_within_train_step": 27.883288621902466, "step": 427} {"train_info/time_between_train_steps": 0.005482196807861328, "step": 427} {"info/global_step": 428, "train_info/time_within_train_step": 27.89821982383728, "step": 428} {"train_info/time_between_train_steps": 0.006619930267333984, "step": 428} {"info/global_step": 429, "train_info/time_within_train_step": 27.90566897392273, "step": 429} {"train_info/time_between_train_steps": 0.009766340255737305, "step": 429} {"info/global_step": 430, "train_info/time_within_train_step": 27.890706777572632, "step": 430} {"train_info/time_between_train_steps": 0.005345821380615234, "step": 430} {"info/global_step": 431, "train_info/time_within_train_step": 27.875792503356934, "step": 431} {"train_info/time_between_train_steps": 0.016437530517578125, "step": 431} {"info/global_step": 432, "train_info/time_within_train_step": 27.900954723358154, "step": 432} {"train_info/time_between_train_steps": 0.005933523178100586, "step": 432} {"train_info/time_between_train_steps": 5.349683523178101, "step": 432} {"info/global_step": 433, "train_info/time_within_train_step": 27.885534286499023, "step": 433} {"train_info/time_between_train_steps": 0.005750894546508789, "step": 433} {"info/global_step": 434, "train_info/time_within_train_step": 27.9525887966156, "step": 434} {"train_info/time_between_train_steps": 0.009895801544189453, "step": 434} {"info/global_step": 435, "train_info/time_within_train_step": 27.83566117286682, "step": 435} {"train_info/time_between_train_steps": 0.005357265472412109, "step": 435} {"info/global_step": 436, "train_info/time_within_train_step": 27.940978288650513, "step": 436} {"train_info/time_between_train_steps": 0.010418891906738281, "step": 436} {"info/global_step": 437, "train_info/time_within_train_step": 27.980412483215332, "step": 437} {"train_info/time_between_train_steps": 0.0063152313232421875, "step": 437} {"info/global_step": 438, "train_info/time_within_train_step": 27.86991834640503, "step": 438} {"train_info/time_between_train_steps": 0.005168437957763672, "step": 438} {"info/global_step": 439, "train_info/time_within_train_step": 27.884427547454834, "step": 439} {"train_info/time_between_train_steps": 0.008323907852172852, "step": 439} {"info/global_step": 440, "train_info/time_within_train_step": 27.893783807754517, "step": 440} {"train_info/time_between_train_steps": 0.005981922149658203, "step": 440} {"info/global_step": 441, "train_info/time_within_train_step": 27.8704776763916, "step": 441} {"train_info/time_between_train_steps": 0.009710073471069336, "step": 441} {"info/global_step": 442, "train_info/time_within_train_step": 27.863332509994507, "step": 442} {"train_info/time_between_train_steps": 0.0054018497467041016, "step": 442} {"info/global_step": 443, "train_info/time_within_train_step": 27.86281991004944, "step": 443} {"train_info/time_between_train_steps": 0.010308027267456055, "step": 443} {"info/global_step": 444, "train_info/time_within_train_step": 27.92629861831665, "step": 444} {"train_info/time_between_train_steps": 0.006601095199584961, "step": 444} {"info/global_step": 445, "train_info/time_within_train_step": 27.84630036354065, "step": 445} {"train_info/time_between_train_steps": 0.008348226547241211, "step": 445} {"info/global_step": 446, "train_info/time_within_train_step": 27.856345176696777, "step": 446} {"train_info/time_between_train_steps": 0.0060961246490478516, "step": 446} {"info/global_step": 447, "train_info/time_within_train_step": 27.856279611587524, "step": 447} {"train_info/time_between_train_steps": 0.010698556900024414, "step": 447} {"info/global_step": 448, "train_info/time_within_train_step": 27.88671612739563, "step": 448} {"train_info/time_between_train_steps": 0.0057773590087890625, "step": 448} {"info/global_step": 449, "train_info/time_within_train_step": 27.800527334213257, "step": 449} {"train_info/time_between_train_steps": 0.006496906280517578, "step": 449} {"info/global_step": 450, "train_info/time_within_train_step": 27.81158995628357, "step": 450} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733875004, "_runtime": 13316}, "step": 450} {"logs": {"train/loss": 4.9877, "train/learning_rate": 0.00041666666666666664, "train/epoch": 18.02, "_timestamp": 1733875004, "_runtime": 13316}, "step": 450} {"train_info/time_between_train_steps": 0.0074841976165771484, "step": 450} {"info/global_step": 451, "train_info/time_within_train_step": 27.803152561187744, "step": 451} {"train_info/time_between_train_steps": 0.00532841682434082, "step": 451} {"info/global_step": 452, "train_info/time_within_train_step": 27.996629238128662, "step": 452} {"train_info/time_between_train_steps": 0.005557060241699219, "step": 452} {"info/global_step": 453, "train_info/time_within_train_step": 27.90078353881836, "step": 453} {"train_info/time_between_train_steps": 0.0054361820220947266, "step": 453} {"info/global_step": 454, "train_info/time_within_train_step": 27.82730531692505, "step": 454} {"train_info/time_between_train_steps": 0.005541324615478516, "step": 454} {"info/global_step": 455, "train_info/time_within_train_step": 27.92565107345581, "step": 455} {"train_info/time_between_train_steps": 0.015038013458251953, "step": 455} {"info/global_step": 456, "train_info/time_within_train_step": 27.925771236419678, "step": 456} {"train_info/time_between_train_steps": 0.0060122013092041016, "step": 456} {"train_info/time_between_train_steps": 5.15233588218689, "step": 456} {"info/global_step": 457, "train_info/time_within_train_step": 27.909586191177368, "step": 457} {"train_info/time_between_train_steps": 0.006040334701538086, "step": 457} {"info/global_step": 458, "train_info/time_within_train_step": 28.137542963027954, "step": 458} {"train_info/time_between_train_steps": 0.011893987655639648, "step": 458} {"info/global_step": 459, "train_info/time_within_train_step": 27.95271396636963, "step": 459} {"train_info/time_between_train_steps": 0.006497621536254883, "step": 459} {"info/global_step": 460, "train_info/time_within_train_step": 28.001882314682007, "step": 460} {"train_info/time_between_train_steps": 0.005715847015380859, "step": 460} {"info/global_step": 461, "train_info/time_within_train_step": 27.925892114639282, "step": 461} {"train_info/time_between_train_steps": 0.005464792251586914, "step": 461} {"info/global_step": 462, "train_info/time_within_train_step": 27.843188285827637, "step": 462} {"train_info/time_between_train_steps": 0.01022195816040039, "step": 462} {"info/global_step": 463, "train_info/time_within_train_step": 27.835870265960693, "step": 463} {"train_info/time_between_train_steps": 0.00530552864074707, "step": 463} {"info/global_step": 464, "train_info/time_within_train_step": 27.901309967041016, "step": 464} {"train_info/time_between_train_steps": 0.01144099235534668, "step": 464} {"info/global_step": 465, "train_info/time_within_train_step": 27.88672947883606, "step": 465} {"train_info/time_between_train_steps": 0.009938240051269531, "step": 465} {"info/global_step": 466, "train_info/time_within_train_step": 27.887600421905518, "step": 466} {"train_info/time_between_train_steps": 0.00989675521850586, "step": 466} {"info/global_step": 467, "train_info/time_within_train_step": 27.849918127059937, "step": 467} {"train_info/time_between_train_steps": 0.005476474761962891, "step": 467} {"info/global_step": 468, "train_info/time_within_train_step": 27.953349828720093, "step": 468} {"train_info/time_between_train_steps": 0.011000633239746094, "step": 468} {"info/global_step": 469, "train_info/time_within_train_step": 27.874753713607788, "step": 469} {"train_info/time_between_train_steps": 0.0054209232330322266, "step": 469} {"info/global_step": 470, "train_info/time_within_train_step": 27.884888172149658, "step": 470} {"train_info/time_between_train_steps": 0.005951881408691406, "step": 470} {"info/global_step": 471, "train_info/time_within_train_step": 27.82809352874756, "step": 471} {"train_info/time_between_train_steps": 0.00557255744934082, "step": 471} {"info/global_step": 472, "train_info/time_within_train_step": 27.86241579055786, "step": 472} {"train_info/time_between_train_steps": 0.010120391845703125, "step": 472} {"info/global_step": 473, "train_info/time_within_train_step": 27.844380378723145, "step": 473} {"train_info/time_between_train_steps": 0.005620718002319336, "step": 473} {"info/global_step": 474, "train_info/time_within_train_step": 27.89250683784485, "step": 474} {"train_info/time_between_train_steps": 0.005524635314941406, "step": 474} {"info/global_step": 475, "train_info/time_within_train_step": 27.882616758346558, "step": 475} {"train_info/time_between_train_steps": 0.005684852600097656, "step": 475} {"info/global_step": 476, "train_info/time_within_train_step": 27.834041118621826, "step": 476} {"train_info/time_between_train_steps": 0.005663394927978516, "step": 476} {"info/global_step": 477, "train_info/time_within_train_step": 27.90588068962097, "step": 477} {"train_info/time_between_train_steps": 0.00581669807434082, "step": 477} {"info/global_step": 478, "train_info/time_within_train_step": 27.864700078964233, "step": 478} {"train_info/time_between_train_steps": 0.006318092346191406, "step": 478} {"info/global_step": 479, "train_info/time_within_train_step": 27.850335597991943, "step": 479} {"train_info/time_between_train_steps": 0.005738019943237305, "step": 479} {"info/global_step": 480, "train_info/time_within_train_step": 27.91063904762268, "step": 480} {"train_info/time_between_train_steps": 0.007357120513916016, "step": 480} {"train_info/time_between_train_steps": 5.296358585357666, "step": 480} {"info/global_step": 481, "train_info/time_within_train_step": 27.84310793876648, "step": 481} {"train_info/time_between_train_steps": 0.005970478057861328, "step": 481} {"info/global_step": 482, "train_info/time_within_train_step": 27.996733903884888, "step": 482} {"train_info/time_between_train_steps": 0.005694389343261719, "step": 482} {"info/global_step": 483, "train_info/time_within_train_step": 27.973267555236816, "step": 483} {"train_info/time_between_train_steps": 0.01124882698059082, "step": 483} {"info/global_step": 484, "train_info/time_within_train_step": 27.917524814605713, "step": 484} {"train_info/time_between_train_steps": 0.00571441650390625, "step": 484} {"info/global_step": 485, "train_info/time_within_train_step": 27.860389947891235, "step": 485} {"train_info/time_between_train_steps": 0.00542759895324707, "step": 485} {"info/global_step": 486, "train_info/time_within_train_step": 27.826270818710327, "step": 486} {"train_info/time_between_train_steps": 0.0060253143310546875, "step": 486} {"info/global_step": 487, "train_info/time_within_train_step": 27.85361337661743, "step": 487} {"train_info/time_between_train_steps": 0.005337715148925781, "step": 487} {"info/global_step": 488, "train_info/time_within_train_step": 27.836999893188477, "step": 488} {"train_info/time_between_train_steps": 0.0056018829345703125, "step": 488} {"info/global_step": 489, "train_info/time_within_train_step": 27.85642695426941, "step": 489} {"train_info/time_between_train_steps": 0.005617856979370117, "step": 489} {"info/global_step": 490, "train_info/time_within_train_step": 27.831857681274414, "step": 490} {"train_info/time_between_train_steps": 0.011475324630737305, "step": 490} {"info/global_step": 491, "train_info/time_within_train_step": 27.851728916168213, "step": 491} {"train_info/time_between_train_steps": 0.00559544563293457, "step": 491} {"info/global_step": 492, "train_info/time_within_train_step": 27.86044979095459, "step": 492} {"train_info/time_between_train_steps": 0.014014959335327148, "step": 492} {"info/global_step": 493, "train_info/time_within_train_step": 27.872878313064575, "step": 493} {"train_info/time_between_train_steps": 0.005593299865722656, "step": 493} {"info/global_step": 494, "train_info/time_within_train_step": 27.82900619506836, "step": 494} {"train_info/time_between_train_steps": 0.010349273681640625, "step": 494} {"info/global_step": 495, "train_info/time_within_train_step": 27.82022786140442, "step": 495} {"train_info/time_between_train_steps": 0.011099100112915039, "step": 495} {"info/global_step": 496, "train_info/time_within_train_step": 27.86856961250305, "step": 496} {"train_info/time_between_train_steps": 0.0054931640625, "step": 496} {"info/global_step": 497, "train_info/time_within_train_step": 27.846609354019165, "step": 497} {"train_info/time_between_train_steps": 0.005639314651489258, "step": 497} {"info/global_step": 498, "train_info/time_within_train_step": 27.828230619430542, "step": 498} {"train_info/time_between_train_steps": 0.005542278289794922, "step": 498} {"info/global_step": 499, "train_info/time_within_train_step": 27.958035707473755, "step": 499} {"train_info/time_between_train_steps": 0.010689735412597656, "step": 499} {"info/global_step": 500, "train_info/time_within_train_step": 27.839276552200317, "step": 500} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733876409, "_runtime": 14721}, "step": 500} {"logs": {"train/loss": 4.8652, "train/learning_rate": 0.00038888888888888887, "train/epoch": 20.02, "_timestamp": 1733876409, "_runtime": 14721}, "step": 500} {"train_info/time_between_train_steps": 2.394805908203125, "step": 500} {"info/global_step": 501, "train_info/time_within_train_step": 27.87432885169983, "step": 501} {"train_info/time_between_train_steps": 0.010862588882446289, "step": 501} {"info/global_step": 502, "train_info/time_within_train_step": 27.8777072429657, "step": 502} {"train_info/time_between_train_steps": 0.005761861801147461, "step": 502} {"info/global_step": 503, "train_info/time_within_train_step": 27.890493631362915, "step": 503} {"train_info/time_between_train_steps": 0.010388374328613281, "step": 503} {"info/global_step": 504, "train_info/time_within_train_step": 27.889983892440796, "step": 504} {"train_info/time_between_train_steps": 0.0061185359954833984, "step": 504} {"train_info/time_between_train_steps": 5.4197797775268555, "step": 504} {"info/global_step": 505, "train_info/time_within_train_step": 27.843919038772583, "step": 505} {"train_info/time_between_train_steps": 0.0056915283203125, "step": 505} {"info/global_step": 506, "train_info/time_within_train_step": 28.030489921569824, "step": 506} {"train_info/time_between_train_steps": 0.005544185638427734, "step": 506} {"info/global_step": 507, "train_info/time_within_train_step": 27.894803285598755, "step": 507} {"train_info/time_between_train_steps": 0.005391597747802734, "step": 507} {"info/global_step": 508, "train_info/time_within_train_step": 27.943537950515747, "step": 508} {"train_info/time_between_train_steps": 0.005640745162963867, "step": 508} {"info/global_step": 509, "train_info/time_within_train_step": 27.828128814697266, "step": 509} {"train_info/time_between_train_steps": 0.005241870880126953, "step": 509} {"info/global_step": 510, "train_info/time_within_train_step": 27.823890924453735, "step": 510} {"train_info/time_between_train_steps": 0.005310535430908203, "step": 510} {"info/global_step": 511, "train_info/time_within_train_step": 27.840429306030273, "step": 511} {"train_info/time_between_train_steps": 0.005288362503051758, "step": 511} {"info/global_step": 512, "train_info/time_within_train_step": 27.854710817337036, "step": 512} {"train_info/time_between_train_steps": 0.005129814147949219, "step": 512} {"info/global_step": 513, "train_info/time_within_train_step": 27.868507146835327, "step": 513} {"train_info/time_between_train_steps": 0.006006002426147461, "step": 513} {"info/global_step": 514, "train_info/time_within_train_step": 27.93352437019348, "step": 514} {"train_info/time_between_train_steps": 0.005305767059326172, "step": 514} {"info/global_step": 515, "train_info/time_within_train_step": 27.83526039123535, "step": 515} {"train_info/time_between_train_steps": 0.010460376739501953, "step": 515} {"info/global_step": 516, "train_info/time_within_train_step": 27.841933250427246, "step": 516} {"train_info/time_between_train_steps": 0.005476713180541992, "step": 516} {"info/global_step": 517, "train_info/time_within_train_step": 27.84576439857483, "step": 517} {"train_info/time_between_train_steps": 0.0052182674407958984, "step": 517} {"info/global_step": 518, "train_info/time_within_train_step": 27.84359884262085, "step": 518} {"train_info/time_between_train_steps": 0.005664825439453125, "step": 518} {"info/global_step": 519, "train_info/time_within_train_step": 27.852445125579834, "step": 519} {"train_info/time_between_train_steps": 0.006258964538574219, "step": 519} {"info/global_step": 520, "train_info/time_within_train_step": 27.842531204223633, "step": 520} {"train_info/time_between_train_steps": 0.00561070442199707, "step": 520} {"info/global_step": 521, "train_info/time_within_train_step": 27.889511108398438, "step": 521} {"train_info/time_between_train_steps": 0.009637832641601562, "step": 521} {"info/global_step": 522, "train_info/time_within_train_step": 27.802544832229614, "step": 522} {"train_info/time_between_train_steps": 0.0051920413970947266, "step": 522} {"info/global_step": 523, "train_info/time_within_train_step": 27.8525447845459, "step": 523} {"train_info/time_between_train_steps": 0.0055637359619140625, "step": 523} {"info/global_step": 524, "train_info/time_within_train_step": 27.80139923095703, "step": 524} {"train_info/time_between_train_steps": 0.010105133056640625, "step": 524} {"info/global_step": 525, "train_info/time_within_train_step": 27.865301370620728, "step": 525} {"train_info/time_between_train_steps": 0.005692720413208008, "step": 525} {"info/global_step": 526, "train_info/time_within_train_step": 27.88852858543396, "step": 526} {"train_info/time_between_train_steps": 0.005749702453613281, "step": 526} {"info/global_step": 527, "train_info/time_within_train_step": 27.896571159362793, "step": 527} {"train_info/time_between_train_steps": 0.007287263870239258, "step": 527} {"info/global_step": 528, "train_info/time_within_train_step": 27.88986873626709, "step": 528} {"train_info/time_between_train_steps": 0.011726617813110352, "step": 528} {"train_info/time_between_train_steps": 5.120944023132324, "step": 528} {"info/global_step": 529, "train_info/time_within_train_step": 27.89640474319458, "step": 529} {"train_info/time_between_train_steps": 0.005939006805419922, "step": 529} {"info/global_step": 530, "train_info/time_within_train_step": 28.218708515167236, "step": 530} {"train_info/time_between_train_steps": 0.005604267120361328, "step": 530} {"info/global_step": 531, "train_info/time_within_train_step": 27.859265327453613, "step": 531} {"train_info/time_between_train_steps": 0.0059545040130615234, "step": 531} {"info/global_step": 532, "train_info/time_within_train_step": 27.967445850372314, "step": 532} {"train_info/time_between_train_steps": 0.005720376968383789, "step": 532} {"info/global_step": 533, "train_info/time_within_train_step": 27.89865231513977, "step": 533} {"train_info/time_between_train_steps": 0.0056056976318359375, "step": 533} {"info/global_step": 534, "train_info/time_within_train_step": 27.8799991607666, "step": 534} {"train_info/time_between_train_steps": 0.005559206008911133, "step": 534} {"info/global_step": 535, "train_info/time_within_train_step": 27.83234429359436, "step": 535} {"train_info/time_between_train_steps": 0.005421161651611328, "step": 535} {"info/global_step": 536, "train_info/time_within_train_step": 27.84687352180481, "step": 536} {"train_info/time_between_train_steps": 0.005324840545654297, "step": 536} {"info/global_step": 537, "train_info/time_within_train_step": 27.812856674194336, "step": 537} {"train_info/time_between_train_steps": 0.005374908447265625, "step": 537} {"info/global_step": 538, "train_info/time_within_train_step": 27.82063102722168, "step": 538} {"train_info/time_between_train_steps": 0.005239248275756836, "step": 538} {"info/global_step": 539, "train_info/time_within_train_step": 27.82723379135132, "step": 539} {"train_info/time_between_train_steps": 0.005295991897583008, "step": 539} {"info/global_step": 540, "train_info/time_within_train_step": 27.811086177825928, "step": 540} {"train_info/time_between_train_steps": 0.005580425262451172, "step": 540} {"info/global_step": 541, "train_info/time_within_train_step": 27.837977409362793, "step": 541} {"train_info/time_between_train_steps": 0.005512237548828125, "step": 541} {"info/global_step": 542, "train_info/time_within_train_step": 27.830695629119873, "step": 542} {"train_info/time_between_train_steps": 0.005494594573974609, "step": 542} {"info/global_step": 543, "train_info/time_within_train_step": 27.867006301879883, "step": 543} {"train_info/time_between_train_steps": 0.005351066589355469, "step": 543} {"info/global_step": 544, "train_info/time_within_train_step": 27.807859659194946, "step": 544} {"train_info/time_between_train_steps": 0.005249977111816406, "step": 544} {"info/global_step": 545, "train_info/time_within_train_step": 27.82230019569397, "step": 545} {"train_info/time_between_train_steps": 0.010681867599487305, "step": 545} {"info/global_step": 546, "train_info/time_within_train_step": 27.970029592514038, "step": 546} {"train_info/time_between_train_steps": 0.006182193756103516, "step": 546} {"info/global_step": 547, "train_info/time_within_train_step": 27.87220859527588, "step": 547} {"train_info/time_between_train_steps": 0.005524396896362305, "step": 547} {"info/global_step": 548, "train_info/time_within_train_step": 27.823115825653076, "step": 548} {"train_info/time_between_train_steps": 0.005835056304931641, "step": 548} {"info/global_step": 549, "train_info/time_within_train_step": 27.857767820358276, "step": 549} {"train_info/time_between_train_steps": 0.005532026290893555, "step": 549} {"info/global_step": 550, "train_info/time_within_train_step": 27.86286187171936, "step": 550} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733877816, "_runtime": 16128}, "step": 550} {"logs": {"train/loss": 4.7263, "train/learning_rate": 0.0003611111111111111, "train/epoch": 22.02, "_timestamp": 1733877816, "_runtime": 16128}, "step": 550} {"train_info/time_between_train_steps": 0.007869482040405273, "step": 550} {"info/global_step": 551, "train_info/time_within_train_step": 27.906161546707153, "step": 551} {"train_info/time_between_train_steps": 0.005956411361694336, "step": 551} {"info/global_step": 552, "train_info/time_within_train_step": 27.835118293762207, "step": 552} {"train_info/time_between_train_steps": 0.006093740463256836, "step": 552} {"train_info/time_between_train_steps": 5.284787654876709, "step": 552} {"info/global_step": 553, "train_info/time_within_train_step": 27.828003883361816, "step": 553} {"train_info/time_between_train_steps": 0.005063533782958984, "step": 553} {"info/global_step": 554, "train_info/time_within_train_step": 27.94733953475952, "step": 554} {"train_info/time_between_train_steps": 0.005703926086425781, "step": 554} {"info/global_step": 555, "train_info/time_within_train_step": 27.92203974723816, "step": 555} {"train_info/time_between_train_steps": 0.005499839782714844, "step": 555} {"info/global_step": 556, "train_info/time_within_train_step": 27.90157985687256, "step": 556} {"train_info/time_between_train_steps": 0.00991058349609375, "step": 556} {"info/global_step": 557, "train_info/time_within_train_step": 27.941086053848267, "step": 557} {"train_info/time_between_train_steps": 0.00571751594543457, "step": 557} {"info/global_step": 558, "train_info/time_within_train_step": 27.858603954315186, "step": 558} {"train_info/time_between_train_steps": 0.005327701568603516, "step": 558} {"info/global_step": 559, "train_info/time_within_train_step": 27.915207147598267, "step": 559} {"train_info/time_between_train_steps": 0.005393505096435547, "step": 559} {"info/global_step": 560, "train_info/time_within_train_step": 27.894651412963867, "step": 560} {"train_info/time_between_train_steps": 0.005367279052734375, "step": 560} {"info/global_step": 561, "train_info/time_within_train_step": 27.99834942817688, "step": 561} {"train_info/time_between_train_steps": 0.007378816604614258, "step": 561} {"info/global_step": 562, "train_info/time_within_train_step": 27.92231774330139, "step": 562} {"train_info/time_between_train_steps": 0.005354404449462891, "step": 562} {"info/global_step": 563, "train_info/time_within_train_step": 27.89910888671875, "step": 563} {"train_info/time_between_train_steps": 0.009620428085327148, "step": 563} {"info/global_step": 564, "train_info/time_within_train_step": 27.822662115097046, "step": 564} {"train_info/time_between_train_steps": 0.005409717559814453, "step": 564} {"info/global_step": 565, "train_info/time_within_train_step": 27.88777995109558, "step": 565} {"train_info/time_between_train_steps": 0.00524139404296875, "step": 565} {"info/global_step": 566, "train_info/time_within_train_step": 27.86192226409912, "step": 566} {"train_info/time_between_train_steps": 0.005444765090942383, "step": 566} {"info/global_step": 567, "train_info/time_within_train_step": 27.852421045303345, "step": 567} {"train_info/time_between_train_steps": 0.009893178939819336, "step": 567} {"info/global_step": 568, "train_info/time_within_train_step": 27.89379858970642, "step": 568} {"train_info/time_between_train_steps": 0.005529165267944336, "step": 568} {"info/global_step": 569, "train_info/time_within_train_step": 27.851369619369507, "step": 569} {"train_info/time_between_train_steps": 0.005176544189453125, "step": 569} {"info/global_step": 570, "train_info/time_within_train_step": 27.86748242378235, "step": 570} {"train_info/time_between_train_steps": 0.006411552429199219, "step": 570} {"info/global_step": 571, "train_info/time_within_train_step": 27.906250715255737, "step": 571} {"train_info/time_between_train_steps": 0.005312204360961914, "step": 571} {"info/global_step": 572, "train_info/time_within_train_step": 27.893706560134888, "step": 572} {"train_info/time_between_train_steps": 0.010753870010375977, "step": 572} {"info/global_step": 573, "train_info/time_within_train_step": 27.914600133895874, "step": 573} {"train_info/time_between_train_steps": 0.01149606704711914, "step": 573} {"info/global_step": 574, "train_info/time_within_train_step": 27.947702646255493, "step": 574} {"train_info/time_between_train_steps": 0.005384922027587891, "step": 574} {"info/global_step": 575, "train_info/time_within_train_step": 27.92045021057129, "step": 575} {"train_info/time_between_train_steps": 0.0062482357025146484, "step": 575} {"info/global_step": 576, "train_info/time_within_train_step": 27.906256437301636, "step": 576} {"train_info/time_between_train_steps": 0.010857343673706055, "step": 576} {"train_info/time_between_train_steps": 5.474336862564087, "step": 576} {"info/global_step": 577, "train_info/time_within_train_step": 27.944814205169678, "step": 577} {"train_info/time_between_train_steps": 0.0054705142974853516, "step": 577} {"info/global_step": 578, "train_info/time_within_train_step": 28.054246187210083, "step": 578} {"train_info/time_between_train_steps": 0.008492231369018555, "step": 578} {"info/global_step": 579, "train_info/time_within_train_step": 27.874080419540405, "step": 579} {"train_info/time_between_train_steps": 0.005407810211181641, "step": 579} {"info/global_step": 580, "train_info/time_within_train_step": 27.935359001159668, "step": 580} {"train_info/time_between_train_steps": 0.005383729934692383, "step": 580} {"info/global_step": 581, "train_info/time_within_train_step": 27.85428524017334, "step": 581} {"train_info/time_between_train_steps": 0.0074841976165771484, "step": 581} {"info/global_step": 582, "train_info/time_within_train_step": 27.831166982650757, "step": 582} {"train_info/time_between_train_steps": 0.009261131286621094, "step": 582} {"info/global_step": 583, "train_info/time_within_train_step": 27.855700969696045, "step": 583} {"train_info/time_between_train_steps": 0.0052700042724609375, "step": 583} {"info/global_step": 584, "train_info/time_within_train_step": 27.880573272705078, "step": 584} {"train_info/time_between_train_steps": 0.005286693572998047, "step": 584} {"info/global_step": 585, "train_info/time_within_train_step": 27.888071537017822, "step": 585} {"train_info/time_between_train_steps": 0.013593196868896484, "step": 585} {"info/global_step": 586, "train_info/time_within_train_step": 27.849879026412964, "step": 586} {"train_info/time_between_train_steps": 0.010090351104736328, "step": 586} {"info/global_step": 587, "train_info/time_within_train_step": 27.924092054367065, "step": 587} {"train_info/time_between_train_steps": 0.005278825759887695, "step": 587} {"info/global_step": 588, "train_info/time_within_train_step": 27.82734966278076, "step": 588} {"train_info/time_between_train_steps": 0.0053501129150390625, "step": 588} {"info/global_step": 589, "train_info/time_within_train_step": 27.91457724571228, "step": 589} {"train_info/time_between_train_steps": 0.0053327083587646484, "step": 589} {"info/global_step": 590, "train_info/time_within_train_step": 27.881101846694946, "step": 590} {"train_info/time_between_train_steps": 0.005130767822265625, "step": 590} {"info/global_step": 591, "train_info/time_within_train_step": 27.862570762634277, "step": 591} {"train_info/time_between_train_steps": 0.005700588226318359, "step": 591} {"info/global_step": 592, "train_info/time_within_train_step": 27.955049514770508, "step": 592} {"train_info/time_between_train_steps": 0.005343437194824219, "step": 592} {"info/global_step": 593, "train_info/time_within_train_step": 27.93032479286194, "step": 593} {"train_info/time_between_train_steps": 0.005692481994628906, "step": 593} {"info/global_step": 594, "train_info/time_within_train_step": 27.88618516921997, "step": 594} {"train_info/time_between_train_steps": 0.0054819583892822266, "step": 594} {"info/global_step": 595, "train_info/time_within_train_step": 27.854907989501953, "step": 595} {"train_info/time_between_train_steps": 0.005196809768676758, "step": 595} {"info/global_step": 596, "train_info/time_within_train_step": 27.84715962409973, "step": 596} {"train_info/time_between_train_steps": 0.0058362483978271484, "step": 596} {"info/global_step": 597, "train_info/time_within_train_step": 27.838088750839233, "step": 597} {"train_info/time_between_train_steps": 0.010184526443481445, "step": 597} {"info/global_step": 598, "train_info/time_within_train_step": 27.921239614486694, "step": 598} {"train_info/time_between_train_steps": 0.009755611419677734, "step": 598} {"info/global_step": 599, "train_info/time_within_train_step": 27.896024227142334, "step": 599} {"train_info/time_between_train_steps": 0.011821508407592773, "step": 599} {"info/global_step": 600, "train_info/time_within_train_step": 27.94292402267456, "step": 600} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733879222, "_runtime": 17534}, "step": 600} {"logs": {"train/loss": 4.5808, "train/learning_rate": 0.0003333333333333333, "train/epoch": 24.02, "_timestamp": 1733879222, "_runtime": 17534}, "step": 600} {"train_info/time_between_train_steps": 2.839597225189209, "step": 600} {"train_info/time_between_train_steps": 7.952690839767456, "step": 600} {"info/global_step": 601, "train_info/time_within_train_step": 27.817885637283325, "step": 601} {"train_info/time_between_train_steps": 0.009822845458984375, "step": 601} {"info/global_step": 602, "train_info/time_within_train_step": 28.11079692840576, "step": 602} {"train_info/time_between_train_steps": 0.005141258239746094, "step": 602} {"info/global_step": 603, "train_info/time_within_train_step": 27.870774745941162, "step": 603} {"train_info/time_between_train_steps": 0.010284900665283203, "step": 603} {"info/global_step": 604, "train_info/time_within_train_step": 27.955245971679688, "step": 604} {"train_info/time_between_train_steps": 0.005579233169555664, "step": 604} {"info/global_step": 605, "train_info/time_within_train_step": 27.851816654205322, "step": 605} {"train_info/time_between_train_steps": 0.005100727081298828, "step": 605} {"info/global_step": 606, "train_info/time_within_train_step": 27.849857807159424, "step": 606} {"train_info/time_between_train_steps": 0.005554676055908203, "step": 606} {"info/global_step": 607, "train_info/time_within_train_step": 27.838050603866577, "step": 607} {"train_info/time_between_train_steps": 0.009172201156616211, "step": 607} {"info/global_step": 608, "train_info/time_within_train_step": 27.986337423324585, "step": 608} {"train_info/time_between_train_steps": 0.009524345397949219, "step": 608} {"info/global_step": 609, "train_info/time_within_train_step": 27.850003957748413, "step": 609} {"train_info/time_between_train_steps": 0.005481719970703125, "step": 609} {"info/global_step": 610, "train_info/time_within_train_step": 27.860655307769775, "step": 610} {"train_info/time_between_train_steps": 0.005255699157714844, "step": 610} {"info/global_step": 611, "train_info/time_within_train_step": 27.891159772872925, "step": 611} {"train_info/time_between_train_steps": 0.005232095718383789, "step": 611} {"info/global_step": 612, "train_info/time_within_train_step": 27.85856342315674, "step": 612} {"train_info/time_between_train_steps": 0.0054302215576171875, "step": 612} {"info/global_step": 613, "train_info/time_within_train_step": 27.862857818603516, "step": 613} {"train_info/time_between_train_steps": 0.005461215972900391, "step": 613} {"info/global_step": 614, "train_info/time_within_train_step": 27.912312984466553, "step": 614} {"train_info/time_between_train_steps": 0.005301952362060547, "step": 614} {"info/global_step": 615, "train_info/time_within_train_step": 27.930366277694702, "step": 615} {"train_info/time_between_train_steps": 0.005224943161010742, "step": 615} {"info/global_step": 616, "train_info/time_within_train_step": 27.820459842681885, "step": 616} {"train_info/time_between_train_steps": 0.010549068450927734, "step": 616} {"info/global_step": 617, "train_info/time_within_train_step": 27.95806336402893, "step": 617} {"train_info/time_between_train_steps": 0.010022401809692383, "step": 617} {"info/global_step": 618, "train_info/time_within_train_step": 27.853299140930176, "step": 618} {"train_info/time_between_train_steps": 0.00542449951171875, "step": 618} {"info/global_step": 619, "train_info/time_within_train_step": 27.879270315170288, "step": 619} {"train_info/time_between_train_steps": 0.010322809219360352, "step": 619} {"info/global_step": 620, "train_info/time_within_train_step": 27.898733615875244, "step": 620} {"train_info/time_between_train_steps": 0.0053937435150146484, "step": 620} {"info/global_step": 621, "train_info/time_within_train_step": 27.862004041671753, "step": 621} {"train_info/time_between_train_steps": 0.005614519119262695, "step": 621} {"info/global_step": 622, "train_info/time_within_train_step": 27.875123262405396, "step": 622} {"train_info/time_between_train_steps": 0.005391120910644531, "step": 622} {"info/global_step": 623, "train_info/time_within_train_step": 27.894152641296387, "step": 623} {"train_info/time_between_train_steps": 0.009673118591308594, "step": 623} {"info/global_step": 624, "train_info/time_within_train_step": 28.011129140853882, "step": 624} {"train_info/time_between_train_steps": 0.006047964096069336, "step": 624} {"train_info/time_between_train_steps": 5.369655609130859, "step": 624} {"info/global_step": 625, "train_info/time_within_train_step": 27.895280122756958, "step": 625} {"train_info/time_between_train_steps": 0.004972696304321289, "step": 625} {"info/global_step": 626, "train_info/time_within_train_step": 28.024032592773438, "step": 626} {"train_info/time_between_train_steps": 0.011165380477905273, "step": 626} {"info/global_step": 627, "train_info/time_within_train_step": 27.93697762489319, "step": 627} {"train_info/time_between_train_steps": 0.0054209232330322266, "step": 627} {"info/global_step": 628, "train_info/time_within_train_step": 27.882732391357422, "step": 628} {"train_info/time_between_train_steps": 0.005675792694091797, "step": 628} {"info/global_step": 629, "train_info/time_within_train_step": 27.885122537612915, "step": 629} {"train_info/time_between_train_steps": 0.005019664764404297, "step": 629} {"info/global_step": 630, "train_info/time_within_train_step": 27.8977108001709, "step": 630} {"train_info/time_between_train_steps": 0.005239725112915039, "step": 630} {"info/global_step": 631, "train_info/time_within_train_step": 27.897190809249878, "step": 631} {"train_info/time_between_train_steps": 0.005419015884399414, "step": 631} {"info/global_step": 632, "train_info/time_within_train_step": 27.897838354110718, "step": 632} {"train_info/time_between_train_steps": 0.005216121673583984, "step": 632} {"info/global_step": 633, "train_info/time_within_train_step": 27.852357625961304, "step": 633} {"train_info/time_between_train_steps": 0.005405902862548828, "step": 633} {"info/global_step": 634, "train_info/time_within_train_step": 27.894083261489868, "step": 634} {"train_info/time_between_train_steps": 0.005175352096557617, "step": 634} {"info/global_step": 635, "train_info/time_within_train_step": 27.8632071018219, "step": 635} {"train_info/time_between_train_steps": 0.00528407096862793, "step": 635} {"info/global_step": 636, "train_info/time_within_train_step": 27.94785165786743, "step": 636} {"train_info/time_between_train_steps": 0.005322694778442383, "step": 636} {"info/global_step": 637, "train_info/time_within_train_step": 27.882810354232788, "step": 637} {"train_info/time_between_train_steps": 0.0061762332916259766, "step": 637} {"info/global_step": 638, "train_info/time_within_train_step": 27.906910181045532, "step": 638} {"train_info/time_between_train_steps": 0.005358457565307617, "step": 638} {"info/global_step": 639, "train_info/time_within_train_step": 27.94679284095764, "step": 639} {"train_info/time_between_train_steps": 0.005338907241821289, "step": 639} {"info/global_step": 640, "train_info/time_within_train_step": 27.862999200820923, "step": 640} {"train_info/time_between_train_steps": 0.005895137786865234, "step": 640} {"info/global_step": 641, "train_info/time_within_train_step": 27.89948844909668, "step": 641} {"train_info/time_between_train_steps": 0.005259037017822266, "step": 641} {"info/global_step": 642, "train_info/time_within_train_step": 27.919026613235474, "step": 642} {"train_info/time_between_train_steps": 0.011430978775024414, "step": 642} {"info/global_step": 643, "train_info/time_within_train_step": 27.872007369995117, "step": 643} {"train_info/time_between_train_steps": 0.005465984344482422, "step": 643} {"info/global_step": 644, "train_info/time_within_train_step": 27.87464165687561, "step": 644} {"train_info/time_between_train_steps": 0.0067577362060546875, "step": 644} {"info/global_step": 645, "train_info/time_within_train_step": 27.858885288238525, "step": 645} {"train_info/time_between_train_steps": 0.005514383316040039, "step": 645} {"info/global_step": 646, "train_info/time_within_train_step": 27.875934839248657, "step": 646} {"train_info/time_between_train_steps": 0.0064830780029296875, "step": 646} {"info/global_step": 647, "train_info/time_within_train_step": 27.907817363739014, "step": 647} {"train_info/time_between_train_steps": 0.010320425033569336, "step": 647} {"info/global_step": 648, "train_info/time_within_train_step": 27.879340410232544, "step": 648} {"train_info/time_between_train_steps": 0.006078958511352539, "step": 648} {"train_info/time_between_train_steps": 5.4237892627716064, "step": 648} {"info/global_step": 649, "train_info/time_within_train_step": 27.847715854644775, "step": 649} {"train_info/time_between_train_steps": 0.01444387435913086, "step": 649} {"info/global_step": 650, "train_info/time_within_train_step": 28.1419575214386, "step": 650} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733880636, "_runtime": 18948}, "step": 650} {"logs": {"train/loss": 4.4631, "train/learning_rate": 0.00030555555555555555, "train/epoch": 27.0, "_timestamp": 1733880636, "_runtime": 18948}, "step": 650} {"train_info/time_between_train_steps": 0.0076024532318115234, "step": 650} {"info/global_step": 651, "train_info/time_within_train_step": 27.962664365768433, "step": 651} {"train_info/time_between_train_steps": 0.005708456039428711, "step": 651} {"info/global_step": 652, "train_info/time_within_train_step": 27.97283625602722, "step": 652} {"train_info/time_between_train_steps": 0.009986162185668945, "step": 652} {"info/global_step": 653, "train_info/time_within_train_step": 27.915614128112793, "step": 653} {"train_info/time_between_train_steps": 0.0052263736724853516, "step": 653} {"info/global_step": 654, "train_info/time_within_train_step": 27.86668062210083, "step": 654} {"train_info/time_between_train_steps": 0.0053522586822509766, "step": 654} {"info/global_step": 655, "train_info/time_within_train_step": 28.000743865966797, "step": 655} {"train_info/time_between_train_steps": 0.0051631927490234375, "step": 655} {"info/global_step": 656, "train_info/time_within_train_step": 27.86671257019043, "step": 656} {"train_info/time_between_train_steps": 0.005816221237182617, "step": 656} {"info/global_step": 657, "train_info/time_within_train_step": 27.914462566375732, "step": 657} {"train_info/time_between_train_steps": 0.0054242610931396484, "step": 657} {"info/global_step": 658, "train_info/time_within_train_step": 27.83583378791809, "step": 658} {"train_info/time_between_train_steps": 0.00928640365600586, "step": 658} {"info/global_step": 659, "train_info/time_within_train_step": 27.83978533744812, "step": 659} {"train_info/time_between_train_steps": 0.0054318904876708984, "step": 659} {"info/global_step": 660, "train_info/time_within_train_step": 27.826948881149292, "step": 660} {"train_info/time_between_train_steps": 0.005329608917236328, "step": 660} {"info/global_step": 661, "train_info/time_within_train_step": 27.876357793807983, "step": 661} {"train_info/time_between_train_steps": 0.010441780090332031, "step": 661} {"info/global_step": 662, "train_info/time_within_train_step": 27.91276979446411, "step": 662} {"train_info/time_between_train_steps": 0.005395650863647461, "step": 662} {"info/global_step": 663, "train_info/time_within_train_step": 27.84207057952881, "step": 663} {"train_info/time_between_train_steps": 0.005218505859375, "step": 663} {"info/global_step": 664, "train_info/time_within_train_step": 27.85801887512207, "step": 664} {"train_info/time_between_train_steps": 0.0065572261810302734, "step": 664} {"info/global_step": 665, "train_info/time_within_train_step": 27.826082229614258, "step": 665} {"train_info/time_between_train_steps": 0.005336284637451172, "step": 665} {"info/global_step": 666, "train_info/time_within_train_step": 27.97257161140442, "step": 666} {"train_info/time_between_train_steps": 0.0053369998931884766, "step": 666} {"info/global_step": 667, "train_info/time_within_train_step": 27.884641885757446, "step": 667} {"train_info/time_between_train_steps": 0.005444526672363281, "step": 667} {"info/global_step": 668, "train_info/time_within_train_step": 27.861114740371704, "step": 668} {"train_info/time_between_train_steps": 0.0056304931640625, "step": 668} {"info/global_step": 669, "train_info/time_within_train_step": 27.85574221611023, "step": 669} {"train_info/time_between_train_steps": 0.005450725555419922, "step": 669} {"info/global_step": 670, "train_info/time_within_train_step": 28.04161500930786, "step": 670} {"train_info/time_between_train_steps": 0.005568265914916992, "step": 670} {"info/global_step": 671, "train_info/time_within_train_step": 27.907753944396973, "step": 671} {"train_info/time_between_train_steps": 0.005795478820800781, "step": 671} {"info/global_step": 672, "train_info/time_within_train_step": 27.87393593788147, "step": 672} {"train_info/time_between_train_steps": 0.0058290958404541016, "step": 672} {"train_info/time_between_train_steps": 5.279158115386963, "step": 672} {"info/global_step": 673, "train_info/time_within_train_step": 27.869053840637207, "step": 673} {"train_info/time_between_train_steps": 0.00553131103515625, "step": 673} {"info/global_step": 674, "train_info/time_within_train_step": 28.01433825492859, "step": 674} {"train_info/time_between_train_steps": 0.005415916442871094, "step": 674} {"info/global_step": 675, "train_info/time_within_train_step": 27.84256911277771, "step": 675} {"train_info/time_between_train_steps": 0.005495786666870117, "step": 675} {"info/global_step": 676, "train_info/time_within_train_step": 28.041896104812622, "step": 676} {"train_info/time_between_train_steps": 0.009836196899414062, "step": 676} {"info/global_step": 677, "train_info/time_within_train_step": 27.912744283676147, "step": 677} {"train_info/time_between_train_steps": 0.005164146423339844, "step": 677} {"info/global_step": 678, "train_info/time_within_train_step": 27.817155361175537, "step": 678} {"train_info/time_between_train_steps": 0.0056400299072265625, "step": 678} {"info/global_step": 679, "train_info/time_within_train_step": 27.905116081237793, "step": 679} {"train_info/time_between_train_steps": 0.008977174758911133, "step": 679} {"info/global_step": 680, "train_info/time_within_train_step": 27.985504388809204, "step": 680} {"train_info/time_between_train_steps": 0.005307435989379883, "step": 680} {"info/global_step": 681, "train_info/time_within_train_step": 27.85242533683777, "step": 681} {"train_info/time_between_train_steps": 0.005267143249511719, "step": 681} {"info/global_step": 682, "train_info/time_within_train_step": 27.85489511489868, "step": 682} {"train_info/time_between_train_steps": 0.005684375762939453, "step": 682} {"info/global_step": 683, "train_info/time_within_train_step": 27.880486726760864, "step": 683} {"train_info/time_between_train_steps": 0.005312681198120117, "step": 683} {"info/global_step": 684, "train_info/time_within_train_step": 27.866594791412354, "step": 684} {"train_info/time_between_train_steps": 0.009598493576049805, "step": 684} {"info/global_step": 685, "train_info/time_within_train_step": 27.86707615852356, "step": 685} {"train_info/time_between_train_steps": 0.005392789840698242, "step": 685} {"info/global_step": 686, "train_info/time_within_train_step": 27.948904275894165, "step": 686} {"train_info/time_between_train_steps": 0.010075807571411133, "step": 686} {"info/global_step": 687, "train_info/time_within_train_step": 27.854478120803833, "step": 687} {"train_info/time_between_train_steps": 0.005673408508300781, "step": 687} {"info/global_step": 688, "train_info/time_within_train_step": 27.850605964660645, "step": 688} {"train_info/time_between_train_steps": 0.009410381317138672, "step": 688} {"info/global_step": 689, "train_info/time_within_train_step": 27.879457473754883, "step": 689} {"train_info/time_between_train_steps": 0.005396366119384766, "step": 689} {"info/global_step": 690, "train_info/time_within_train_step": 27.856611251831055, "step": 690} {"train_info/time_between_train_steps": 0.010206937789916992, "step": 690} {"info/global_step": 691, "train_info/time_within_train_step": 27.816641092300415, "step": 691} {"train_info/time_between_train_steps": 0.0052869319915771484, "step": 691} {"info/global_step": 692, "train_info/time_within_train_step": 27.89573836326599, "step": 692} {"train_info/time_between_train_steps": 0.01099085807800293, "step": 692} {"info/global_step": 693, "train_info/time_within_train_step": 27.881745100021362, "step": 693} {"train_info/time_between_train_steps": 0.005259513854980469, "step": 693} {"info/global_step": 694, "train_info/time_within_train_step": 27.905223846435547, "step": 694} {"train_info/time_between_train_steps": 0.005930423736572266, "step": 694} {"info/global_step": 695, "train_info/time_within_train_step": 27.936837434768677, "step": 695} {"train_info/time_between_train_steps": 0.005639076232910156, "step": 695} {"info/global_step": 696, "train_info/time_within_train_step": 27.969319343566895, "step": 696} {"train_info/time_between_train_steps": 0.005949974060058594, "step": 696} {"train_info/time_between_train_steps": 5.299138069152832, "step": 696} {"info/global_step": 697, "train_info/time_within_train_step": 27.832470655441284, "step": 697} {"train_info/time_between_train_steps": 0.005220651626586914, "step": 697} {"info/global_step": 698, "train_info/time_within_train_step": 28.041288375854492, "step": 698} {"train_info/time_between_train_steps": 0.0051691532135009766, "step": 698} {"info/global_step": 699, "train_info/time_within_train_step": 27.842570304870605, "step": 699} {"train_info/time_between_train_steps": 0.009353160858154297, "step": 699} {"info/global_step": 700, "train_info/time_within_train_step": 27.95538091659546, "step": 700} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733882042, "_runtime": 20354}, "step": 700} {"logs": {"train/loss": 4.3476, "train/learning_rate": 0.0002777777777777778, "train/epoch": 29.0, "_timestamp": 1733882042, "_runtime": 20354}, "step": 700} {"train_info/time_between_train_steps": 2.894319772720337, "step": 700} {"info/global_step": 701, "train_info/time_within_train_step": 27.97170376777649, "step": 701} {"train_info/time_between_train_steps": 0.005122661590576172, "step": 701} {"info/global_step": 702, "train_info/time_within_train_step": 27.963645458221436, "step": 702} {"train_info/time_between_train_steps": 0.013430356979370117, "step": 702} {"info/global_step": 703, "train_info/time_within_train_step": 27.84221625328064, "step": 703} {"train_info/time_between_train_steps": 0.005458354949951172, "step": 703} {"info/global_step": 704, "train_info/time_within_train_step": 27.867116928100586, "step": 704} {"train_info/time_between_train_steps": 0.014849662780761719, "step": 704} {"info/global_step": 705, "train_info/time_within_train_step": 27.890214681625366, "step": 705} {"train_info/time_between_train_steps": 0.005322456359863281, "step": 705} {"info/global_step": 706, "train_info/time_within_train_step": 27.86959671974182, "step": 706} {"train_info/time_between_train_steps": 0.0053558349609375, "step": 706} {"info/global_step": 707, "train_info/time_within_train_step": 27.83532190322876, "step": 707} {"train_info/time_between_train_steps": 0.005261421203613281, "step": 707} {"info/global_step": 708, "train_info/time_within_train_step": 27.85789155960083, "step": 708} {"train_info/time_between_train_steps": 0.0054051876068115234, "step": 708} {"info/global_step": 709, "train_info/time_within_train_step": 27.859711408615112, "step": 709} {"train_info/time_between_train_steps": 0.005505084991455078, "step": 709} {"info/global_step": 710, "train_info/time_within_train_step": 27.83241868019104, "step": 710} {"train_info/time_between_train_steps": 0.0053615570068359375, "step": 710} {"info/global_step": 711, "train_info/time_within_train_step": 27.8771390914917, "step": 711} {"train_info/time_between_train_steps": 0.00545191764831543, "step": 711} {"info/global_step": 712, "train_info/time_within_train_step": 27.899548292160034, "step": 712} {"train_info/time_between_train_steps": 0.0054662227630615234, "step": 712} {"info/global_step": 713, "train_info/time_within_train_step": 27.864492654800415, "step": 713} {"train_info/time_between_train_steps": 0.005400896072387695, "step": 713} {"info/global_step": 714, "train_info/time_within_train_step": 27.828548192977905, "step": 714} {"train_info/time_between_train_steps": 0.005742549896240234, "step": 714} {"info/global_step": 715, "train_info/time_within_train_step": 27.863619565963745, "step": 715} {"train_info/time_between_train_steps": 0.009663581848144531, "step": 715} {"info/global_step": 716, "train_info/time_within_train_step": 27.942336082458496, "step": 716} {"train_info/time_between_train_steps": 0.005761384963989258, "step": 716} {"info/global_step": 717, "train_info/time_within_train_step": 28.023338794708252, "step": 717} {"train_info/time_between_train_steps": 0.005545377731323242, "step": 717} {"info/global_step": 718, "train_info/time_within_train_step": 27.887366771697998, "step": 718} {"train_info/time_between_train_steps": 0.005745410919189453, "step": 718} {"info/global_step": 719, "train_info/time_within_train_step": 27.91116499900818, "step": 719} {"train_info/time_between_train_steps": 0.005788326263427734, "step": 719} {"info/global_step": 720, "train_info/time_within_train_step": 27.967403411865234, "step": 720} {"train_info/time_between_train_steps": 0.005941629409790039, "step": 720} {"train_info/time_between_train_steps": 5.477025270462036, "step": 720} {"info/global_step": 721, "train_info/time_within_train_step": 27.928735971450806, "step": 721} {"train_info/time_between_train_steps": 0.005128383636474609, "step": 721} {"info/global_step": 722, "train_info/time_within_train_step": 28.049934148788452, "step": 722} {"train_info/time_between_train_steps": 0.005548238754272461, "step": 722} {"info/global_step": 723, "train_info/time_within_train_step": 27.867759943008423, "step": 723} {"train_info/time_between_train_steps": 0.005232095718383789, "step": 723} {"info/global_step": 724, "train_info/time_within_train_step": 27.958215713500977, "step": 724} {"train_info/time_between_train_steps": 0.010283708572387695, "step": 724} {"info/global_step": 725, "train_info/time_within_train_step": 27.838098526000977, "step": 725} {"train_info/time_between_train_steps": 0.008843421936035156, "step": 725} {"info/global_step": 726, "train_info/time_within_train_step": 28.03019952774048, "step": 726} {"train_info/time_between_train_steps": 0.005263090133666992, "step": 726} {"info/global_step": 727, "train_info/time_within_train_step": 27.922576904296875, "step": 727} {"train_info/time_between_train_steps": 0.00530242919921875, "step": 727} {"info/global_step": 728, "train_info/time_within_train_step": 27.81952452659607, "step": 728} {"train_info/time_between_train_steps": 0.005249500274658203, "step": 728} {"info/global_step": 729, "train_info/time_within_train_step": 27.86084794998169, "step": 729} {"train_info/time_between_train_steps": 0.00553584098815918, "step": 729} {"info/global_step": 730, "train_info/time_within_train_step": 27.873020887374878, "step": 730} {"train_info/time_between_train_steps": 0.010323286056518555, "step": 730} {"info/global_step": 731, "train_info/time_within_train_step": 27.86635661125183, "step": 731} {"train_info/time_between_train_steps": 0.009994983673095703, "step": 731} {"info/global_step": 732, "train_info/time_within_train_step": 27.869921445846558, "step": 732} {"train_info/time_between_train_steps": 0.005424022674560547, "step": 732} {"info/global_step": 733, "train_info/time_within_train_step": 27.96374249458313, "step": 733} {"train_info/time_between_train_steps": 0.00825810432434082, "step": 733} {"info/global_step": 734, "train_info/time_within_train_step": 27.971956729888916, "step": 734} {"train_info/time_between_train_steps": 0.009534835815429688, "step": 734} {"info/global_step": 735, "train_info/time_within_train_step": 27.848340272903442, "step": 735} {"train_info/time_between_train_steps": 0.011820554733276367, "step": 735} {"info/global_step": 736, "train_info/time_within_train_step": 27.863386631011963, "step": 736} {"train_info/time_between_train_steps": 0.005312919616699219, "step": 736} {"info/global_step": 737, "train_info/time_within_train_step": 27.89184880256653, "step": 737} {"train_info/time_between_train_steps": 0.008439779281616211, "step": 737} {"info/global_step": 738, "train_info/time_within_train_step": 27.89066457748413, "step": 738} {"train_info/time_between_train_steps": 0.0051767826080322266, "step": 738} {"info/global_step": 739, "train_info/time_within_train_step": 27.878474712371826, "step": 739} {"train_info/time_between_train_steps": 0.00537419319152832, "step": 739} {"info/global_step": 740, "train_info/time_within_train_step": 27.918630123138428, "step": 740} {"train_info/time_between_train_steps": 0.014837503433227539, "step": 740} {"info/global_step": 741, "train_info/time_within_train_step": 27.868849992752075, "step": 741} {"train_info/time_between_train_steps": 0.0053942203521728516, "step": 741} {"info/global_step": 742, "train_info/time_within_train_step": 27.92979669570923, "step": 742} {"train_info/time_between_train_steps": 0.006720304489135742, "step": 742} {"info/global_step": 743, "train_info/time_within_train_step": 27.953426361083984, "step": 743} {"train_info/time_between_train_steps": 0.00989675521850586, "step": 743} {"info/global_step": 744, "train_info/time_within_train_step": 27.905426502227783, "step": 744} {"train_info/time_between_train_steps": 0.006106853485107422, "step": 744} {"train_info/time_between_train_steps": 5.212895631790161, "step": 744} {"info/global_step": 745, "train_info/time_within_train_step": 27.943410396575928, "step": 745} {"train_info/time_between_train_steps": 0.005742073059082031, "step": 745} {"info/global_step": 746, "train_info/time_within_train_step": 28.070550680160522, "step": 746} {"train_info/time_between_train_steps": 0.0053234100341796875, "step": 746} {"info/global_step": 747, "train_info/time_within_train_step": 27.933279752731323, "step": 747} {"train_info/time_between_train_steps": 0.005614280700683594, "step": 747} {"info/global_step": 748, "train_info/time_within_train_step": 28.059388399124146, "step": 748} {"train_info/time_between_train_steps": 0.0075206756591796875, "step": 748} {"info/global_step": 749, "train_info/time_within_train_step": 27.876919746398926, "step": 749} {"train_info/time_between_train_steps": 0.01029348373413086, "step": 749} {"info/global_step": 750, "train_info/time_within_train_step": 27.832568407058716, "step": 750} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733883451, "_runtime": 21763}, "step": 750} {"logs": {"train/loss": 4.2499, "train/learning_rate": 0.00025, "train/epoch": 31.0, "_timestamp": 1733883451, "_runtime": 21763}, "step": 750} {"train_info/time_between_train_steps": 0.0072934627532958984, "step": 750} {"info/global_step": 751, "train_info/time_within_train_step": 27.857545137405396, "step": 751} {"train_info/time_between_train_steps": 0.005162477493286133, "step": 751} {"info/global_step": 752, "train_info/time_within_train_step": 27.834912538528442, "step": 752} {"train_info/time_between_train_steps": 0.0052471160888671875, "step": 752} {"info/global_step": 753, "train_info/time_within_train_step": 27.934590101242065, "step": 753} {"train_info/time_between_train_steps": 0.006592273712158203, "step": 753} {"info/global_step": 754, "train_info/time_within_train_step": 27.857612371444702, "step": 754} {"train_info/time_between_train_steps": 0.005227565765380859, "step": 754} {"info/global_step": 755, "train_info/time_within_train_step": 27.91248846054077, "step": 755} {"train_info/time_between_train_steps": 0.005403041839599609, "step": 755} {"info/global_step": 756, "train_info/time_within_train_step": 27.85490083694458, "step": 756} {"train_info/time_between_train_steps": 0.010051250457763672, "step": 756} {"info/global_step": 757, "train_info/time_within_train_step": 27.881808042526245, "step": 757} {"train_info/time_between_train_steps": 0.010099172592163086, "step": 757} {"info/global_step": 758, "train_info/time_within_train_step": 27.91795063018799, "step": 758} {"train_info/time_between_train_steps": 0.005520820617675781, "step": 758} {"info/global_step": 759, "train_info/time_within_train_step": 27.9602370262146, "step": 759} {"train_info/time_between_train_steps": 0.009317636489868164, "step": 759} {"info/global_step": 760, "train_info/time_within_train_step": 27.932271718978882, "step": 760} {"train_info/time_between_train_steps": 0.010860443115234375, "step": 760} {"info/global_step": 761, "train_info/time_within_train_step": 27.96569061279297, "step": 761} {"train_info/time_between_train_steps": 0.01341104507446289, "step": 761} {"info/global_step": 762, "train_info/time_within_train_step": 27.93411898612976, "step": 762} {"train_info/time_between_train_steps": 0.010379552841186523, "step": 762} {"info/global_step": 763, "train_info/time_within_train_step": 27.84468364715576, "step": 763} {"train_info/time_between_train_steps": 0.010996103286743164, "step": 763} {"info/global_step": 764, "train_info/time_within_train_step": 27.969399213790894, "step": 764} {"train_info/time_between_train_steps": 0.0055010318756103516, "step": 764} {"info/global_step": 765, "train_info/time_within_train_step": 27.884066581726074, "step": 765} {"train_info/time_between_train_steps": 0.0054187774658203125, "step": 765} {"info/global_step": 766, "train_info/time_within_train_step": 27.933112859725952, "step": 766} {"train_info/time_between_train_steps": 0.010654449462890625, "step": 766} {"info/global_step": 767, "train_info/time_within_train_step": 27.856878995895386, "step": 767} {"train_info/time_between_train_steps": 0.006348371505737305, "step": 767} {"info/global_step": 768, "train_info/time_within_train_step": 27.92731261253357, "step": 768} {"train_info/time_between_train_steps": 0.006208896636962891, "step": 768} {"train_info/time_between_train_steps": 5.409374713897705, "step": 768} {"info/global_step": 769, "train_info/time_within_train_step": 27.88438105583191, "step": 769} {"train_info/time_between_train_steps": 0.0056574344635009766, "step": 769} {"info/global_step": 770, "train_info/time_within_train_step": 28.048359870910645, "step": 770} {"train_info/time_between_train_steps": 0.008373022079467773, "step": 770} {"info/global_step": 771, "train_info/time_within_train_step": 27.89099645614624, "step": 771} {"train_info/time_between_train_steps": 0.005343437194824219, "step": 771} {"info/global_step": 772, "train_info/time_within_train_step": 27.918737411499023, "step": 772} {"train_info/time_between_train_steps": 0.005456447601318359, "step": 772} {"info/global_step": 773, "train_info/time_within_train_step": 27.975944757461548, "step": 773} {"train_info/time_between_train_steps": 0.0052411556243896484, "step": 773} {"info/global_step": 774, "train_info/time_within_train_step": 27.828519582748413, "step": 774} {"train_info/time_between_train_steps": 0.009424448013305664, "step": 774} {"info/global_step": 775, "train_info/time_within_train_step": 27.888432264328003, "step": 775} {"train_info/time_between_train_steps": 0.005304813385009766, "step": 775} {"info/global_step": 776, "train_info/time_within_train_step": 27.863325357437134, "step": 776} {"train_info/time_between_train_steps": 0.019701242446899414, "step": 776} {"info/global_step": 777, "train_info/time_within_train_step": 27.86982536315918, "step": 777} {"train_info/time_between_train_steps": 0.005448341369628906, "step": 777} {"info/global_step": 778, "train_info/time_within_train_step": 27.82927107810974, "step": 778} {"train_info/time_between_train_steps": 0.0052759647369384766, "step": 778} {"info/global_step": 779, "train_info/time_within_train_step": 28.01047158241272, "step": 779} {"train_info/time_between_train_steps": 0.006181240081787109, "step": 779} {"info/global_step": 780, "train_info/time_within_train_step": 27.81373620033264, "step": 780} {"train_info/time_between_train_steps": 0.010245084762573242, "step": 780} {"info/global_step": 781, "train_info/time_within_train_step": 27.889512062072754, "step": 781} {"train_info/time_between_train_steps": 0.005410671234130859, "step": 781} {"info/global_step": 782, "train_info/time_within_train_step": 27.905481815338135, "step": 782} {"train_info/time_between_train_steps": 0.009799003601074219, "step": 782} {"info/global_step": 783, "train_info/time_within_train_step": 27.887949466705322, "step": 783} {"train_info/time_between_train_steps": 0.010118246078491211, "step": 783} {"info/global_step": 784, "train_info/time_within_train_step": 27.87034273147583, "step": 784} {"train_info/time_between_train_steps": 0.005460500717163086, "step": 784} {"info/global_step": 785, "train_info/time_within_train_step": 27.845494747161865, "step": 785} {"train_info/time_between_train_steps": 0.005574941635131836, "step": 785} {"info/global_step": 786, "train_info/time_within_train_step": 27.85550856590271, "step": 786} {"train_info/time_between_train_steps": 0.005370616912841797, "step": 786} {"info/global_step": 787, "train_info/time_within_train_step": 27.862098932266235, "step": 787} {"train_info/time_between_train_steps": 0.00519871711730957, "step": 787} {"info/global_step": 788, "train_info/time_within_train_step": 27.86797547340393, "step": 788} {"train_info/time_between_train_steps": 0.005776643753051758, "step": 788} {"info/global_step": 789, "train_info/time_within_train_step": 27.84992265701294, "step": 789} {"train_info/time_between_train_steps": 0.005273103713989258, "step": 789} {"info/global_step": 790, "train_info/time_within_train_step": 27.901424407958984, "step": 790} {"train_info/time_between_train_steps": 0.005642414093017578, "step": 790} {"info/global_step": 791, "train_info/time_within_train_step": 27.887646198272705, "step": 791} {"train_info/time_between_train_steps": 0.005697488784790039, "step": 791} {"info/global_step": 792, "train_info/time_within_train_step": 27.908438444137573, "step": 792} {"train_info/time_between_train_steps": 0.006121158599853516, "step": 792} {"train_info/time_between_train_steps": 5.583119630813599, "step": 792} {"info/global_step": 793, "train_info/time_within_train_step": 27.9321129322052, "step": 793} {"train_info/time_between_train_steps": 0.005574226379394531, "step": 793} {"info/global_step": 794, "train_info/time_within_train_step": 28.02779269218445, "step": 794} {"train_info/time_between_train_steps": 0.010422468185424805, "step": 794} {"info/global_step": 795, "train_info/time_within_train_step": 28.07706332206726, "step": 795} {"train_info/time_between_train_steps": 0.005431652069091797, "step": 795} {"info/global_step": 796, "train_info/time_within_train_step": 27.99479055404663, "step": 796} {"train_info/time_between_train_steps": 0.010009527206420898, "step": 796} {"info/global_step": 797, "train_info/time_within_train_step": 27.875941514968872, "step": 797} {"train_info/time_between_train_steps": 0.009826421737670898, "step": 797} {"info/global_step": 798, "train_info/time_within_train_step": 27.81486940383911, "step": 798} {"train_info/time_between_train_steps": 0.005196809768676758, "step": 798} {"info/global_step": 799, "train_info/time_within_train_step": 27.92206048965454, "step": 799} {"train_info/time_between_train_steps": 0.0056955814361572266, "step": 799} {"info/global_step": 800, "train_info/time_within_train_step": 27.945321798324585, "step": 800} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733884858, "_runtime": 23170}, "step": 800} {"logs": {"train/loss": 4.1602, "train/learning_rate": 0.00022222222222222218, "train/epoch": 33.01, "_timestamp": 1733884858, "_runtime": 23170}, "step": 800} {"train_info/time_between_train_steps": 2.856712818145752, "step": 800} {"info/global_step": 801, "train_info/time_within_train_step": 27.883622407913208, "step": 801} {"train_info/time_between_train_steps": 0.010210514068603516, "step": 801} {"info/global_step": 802, "train_info/time_within_train_step": 27.86180806159973, "step": 802} {"train_info/time_between_train_steps": 0.005268096923828125, "step": 802} {"info/global_step": 803, "train_info/time_within_train_step": 27.82466983795166, "step": 803} {"train_info/time_between_train_steps": 0.005328655242919922, "step": 803} {"info/global_step": 804, "train_info/time_within_train_step": 27.841315269470215, "step": 804} {"train_info/time_between_train_steps": 0.0055658817291259766, "step": 804} {"info/global_step": 805, "train_info/time_within_train_step": 27.815061330795288, "step": 805} {"train_info/time_between_train_steps": 0.005221128463745117, "step": 805} {"info/global_step": 806, "train_info/time_within_train_step": 27.87323260307312, "step": 806} {"train_info/time_between_train_steps": 0.005598306655883789, "step": 806} {"info/global_step": 807, "train_info/time_within_train_step": 27.858259201049805, "step": 807} {"train_info/time_between_train_steps": 0.005509376525878906, "step": 807} {"info/global_step": 808, "train_info/time_within_train_step": 27.866678714752197, "step": 808} {"train_info/time_between_train_steps": 0.011636972427368164, "step": 808} {"info/global_step": 809, "train_info/time_within_train_step": 27.925782918930054, "step": 809} {"train_info/time_between_train_steps": 0.0053369998931884766, "step": 809} {"info/global_step": 810, "train_info/time_within_train_step": 28.003788471221924, "step": 810} {"train_info/time_between_train_steps": 0.005316734313964844, "step": 810} {"info/global_step": 811, "train_info/time_within_train_step": 27.91982889175415, "step": 811} {"train_info/time_between_train_steps": 0.009908676147460938, "step": 811} {"info/global_step": 812, "train_info/time_within_train_step": 27.854879140853882, "step": 812} {"train_info/time_between_train_steps": 0.009664535522460938, "step": 812} {"info/global_step": 813, "train_info/time_within_train_step": 27.91584825515747, "step": 813} {"train_info/time_between_train_steps": 0.006469249725341797, "step": 813} {"info/global_step": 814, "train_info/time_within_train_step": 27.832855701446533, "step": 814} {"train_info/time_between_train_steps": 0.0059909820556640625, "step": 814} {"info/global_step": 815, "train_info/time_within_train_step": 27.992600202560425, "step": 815} {"train_info/time_between_train_steps": 0.0058078765869140625, "step": 815} {"info/global_step": 816, "train_info/time_within_train_step": 27.886504411697388, "step": 816} {"train_info/time_between_train_steps": 0.006314992904663086, "step": 816} {"train_info/time_between_train_steps": 5.055109739303589, "step": 816} {"info/global_step": 817, "train_info/time_within_train_step": 27.866954565048218, "step": 817} {"train_info/time_between_train_steps": 0.005156517028808594, "step": 817} {"info/global_step": 818, "train_info/time_within_train_step": 28.01647639274597, "step": 818} {"train_info/time_between_train_steps": 0.005446195602416992, "step": 818} {"info/global_step": 819, "train_info/time_within_train_step": 27.96556568145752, "step": 819} {"train_info/time_between_train_steps": 0.005622148513793945, "step": 819} {"info/global_step": 820, "train_info/time_within_train_step": 27.945469617843628, "step": 820} {"train_info/time_between_train_steps": 0.0056915283203125, "step": 820} {"info/global_step": 821, "train_info/time_within_train_step": 27.88659358024597, "step": 821} {"train_info/time_between_train_steps": 0.005565643310546875, "step": 821} {"info/global_step": 822, "train_info/time_within_train_step": 27.867566108703613, "step": 822} {"train_info/time_between_train_steps": 0.01445913314819336, "step": 822} {"info/global_step": 823, "train_info/time_within_train_step": 27.87318253517151, "step": 823} {"train_info/time_between_train_steps": 0.00535273551940918, "step": 823} {"info/global_step": 824, "train_info/time_within_train_step": 27.916833639144897, "step": 824} {"train_info/time_between_train_steps": 0.01334524154663086, "step": 824} {"info/global_step": 825, "train_info/time_within_train_step": 27.860329627990723, "step": 825} {"train_info/time_between_train_steps": 0.005523204803466797, "step": 825} {"info/global_step": 826, "train_info/time_within_train_step": 27.956284046173096, "step": 826} {"train_info/time_between_train_steps": 0.010099649429321289, "step": 826} {"info/global_step": 827, "train_info/time_within_train_step": 27.849488735198975, "step": 827} {"train_info/time_between_train_steps": 0.0053904056549072266, "step": 827} {"info/global_step": 828, "train_info/time_within_train_step": 27.854365587234497, "step": 828} {"train_info/time_between_train_steps": 0.011330604553222656, "step": 828} {"info/global_step": 829, "train_info/time_within_train_step": 27.8541579246521, "step": 829} {"train_info/time_between_train_steps": 0.0071141719818115234, "step": 829} {"info/global_step": 830, "train_info/time_within_train_step": 27.892338037490845, "step": 830} {"train_info/time_between_train_steps": 0.0055408477783203125, "step": 830} {"info/global_step": 831, "train_info/time_within_train_step": 27.898076057434082, "step": 831} {"train_info/time_between_train_steps": 0.005829811096191406, "step": 831} {"info/global_step": 832, "train_info/time_within_train_step": 27.874744415283203, "step": 832} {"train_info/time_between_train_steps": 0.005541801452636719, "step": 832} {"info/global_step": 833, "train_info/time_within_train_step": 27.888389110565186, "step": 833} {"train_info/time_between_train_steps": 0.01053619384765625, "step": 833} {"info/global_step": 834, "train_info/time_within_train_step": 27.89982581138611, "step": 834} {"train_info/time_between_train_steps": 0.010380983352661133, "step": 834} {"info/global_step": 835, "train_info/time_within_train_step": 27.894134044647217, "step": 835} {"train_info/time_between_train_steps": 0.005674839019775391, "step": 835} {"info/global_step": 836, "train_info/time_within_train_step": 27.866823434829712, "step": 836} {"train_info/time_between_train_steps": 0.0060307979583740234, "step": 836} {"info/global_step": 837, "train_info/time_within_train_step": 27.890435695648193, "step": 837} {"train_info/time_between_train_steps": 0.00531768798828125, "step": 837} {"info/global_step": 838, "train_info/time_within_train_step": 27.914138317108154, "step": 838} {"train_info/time_between_train_steps": 0.006368160247802734, "step": 838} {"info/global_step": 839, "train_info/time_within_train_step": 27.904123544692993, "step": 839} {"train_info/time_between_train_steps": 0.006043910980224609, "step": 839} {"info/global_step": 840, "train_info/time_within_train_step": 27.89624571800232, "step": 840} {"train_info/time_between_train_steps": 0.005858659744262695, "step": 840} {"train_info/time_between_train_steps": 5.2123870849609375, "step": 840} {"info/global_step": 841, "train_info/time_within_train_step": 27.913843393325806, "step": 841} {"train_info/time_between_train_steps": 0.0059795379638671875, "step": 841} {"info/global_step": 842, "train_info/time_within_train_step": 28.356560945510864, "step": 842} {"train_info/time_between_train_steps": 0.011049747467041016, "step": 842} {"info/global_step": 843, "train_info/time_within_train_step": 27.864521265029907, "step": 843} {"train_info/time_between_train_steps": 0.00561833381652832, "step": 843} {"info/global_step": 844, "train_info/time_within_train_step": 27.929980516433716, "step": 844} {"train_info/time_between_train_steps": 0.0063550472259521484, "step": 844} {"info/global_step": 845, "train_info/time_within_train_step": 27.919150590896606, "step": 845} {"train_info/time_between_train_steps": 0.00543665885925293, "step": 845} {"info/global_step": 846, "train_info/time_within_train_step": 27.896425247192383, "step": 846} {"train_info/time_between_train_steps": 0.009620428085327148, "step": 846} {"info/global_step": 847, "train_info/time_within_train_step": 27.87555956840515, "step": 847} {"train_info/time_between_train_steps": 0.005321502685546875, "step": 847} {"info/global_step": 848, "train_info/time_within_train_step": 27.80702829360962, "step": 848} {"train_info/time_between_train_steps": 0.0053670406341552734, "step": 848} {"info/global_step": 849, "train_info/time_within_train_step": 27.804544925689697, "step": 849} {"train_info/time_between_train_steps": 0.005560874938964844, "step": 849} {"info/global_step": 850, "train_info/time_within_train_step": 27.844847202301025, "step": 850} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733886266, "_runtime": 24578}, "step": 850} {"logs": {"train/loss": 4.0822, "train/learning_rate": 0.00019444444444444443, "train/epoch": 35.01, "_timestamp": 1733886266, "_runtime": 24578}, "step": 850} {"train_info/time_between_train_steps": 0.008715391159057617, "step": 850} {"info/global_step": 851, "train_info/time_within_train_step": 27.872763872146606, "step": 851} {"train_info/time_between_train_steps": 0.0057337284088134766, "step": 851} {"info/global_step": 852, "train_info/time_within_train_step": 27.913955450057983, "step": 852} {"train_info/time_between_train_steps": 0.005682468414306641, "step": 852} {"info/global_step": 853, "train_info/time_within_train_step": 27.885173797607422, "step": 853} {"train_info/time_between_train_steps": 0.005443096160888672, "step": 853} {"info/global_step": 854, "train_info/time_within_train_step": 27.87550449371338, "step": 854} {"train_info/time_between_train_steps": 0.005412578582763672, "step": 854} {"info/global_step": 855, "train_info/time_within_train_step": 27.89293122291565, "step": 855} {"train_info/time_between_train_steps": 0.0056154727935791016, "step": 855} {"info/global_step": 856, "train_info/time_within_train_step": 28.025326251983643, "step": 856} {"train_info/time_between_train_steps": 0.005723237991333008, "step": 856} {"info/global_step": 857, "train_info/time_within_train_step": 27.968424797058105, "step": 857} {"train_info/time_between_train_steps": 0.005353450775146484, "step": 857} {"info/global_step": 858, "train_info/time_within_train_step": 27.907056093215942, "step": 858} {"train_info/time_between_train_steps": 0.005520343780517578, "step": 858} {"info/global_step": 859, "train_info/time_within_train_step": 27.83943009376526, "step": 859} {"train_info/time_between_train_steps": 0.005416393280029297, "step": 859} {"info/global_step": 860, "train_info/time_within_train_step": 27.956836700439453, "step": 860} {"train_info/time_between_train_steps": 0.005898475646972656, "step": 860} {"info/global_step": 861, "train_info/time_within_train_step": 27.90471315383911, "step": 861} {"train_info/time_between_train_steps": 0.00586390495300293, "step": 861} {"info/global_step": 862, "train_info/time_within_train_step": 27.879387855529785, "step": 862} {"train_info/time_between_train_steps": 0.005524158477783203, "step": 862} {"info/global_step": 863, "train_info/time_within_train_step": 27.867449522018433, "step": 863} {"train_info/time_between_train_steps": 0.0068089962005615234, "step": 863} {"info/global_step": 864, "train_info/time_within_train_step": 27.886305570602417, "step": 864} {"train_info/time_between_train_steps": 0.01122283935546875, "step": 864} {"train_info/time_between_train_steps": 5.387828826904297, "step": 864} {"info/global_step": 865, "train_info/time_within_train_step": 27.889748096466064, "step": 865} {"train_info/time_between_train_steps": 0.0058650970458984375, "step": 865} {"info/global_step": 866, "train_info/time_within_train_step": 28.057335138320923, "step": 866} {"train_info/time_between_train_steps": 0.005793333053588867, "step": 866} {"info/global_step": 867, "train_info/time_within_train_step": 27.950927734375, "step": 867} {"train_info/time_between_train_steps": 0.006034374237060547, "step": 867} {"info/global_step": 868, "train_info/time_within_train_step": 27.952280282974243, "step": 868} {"train_info/time_between_train_steps": 0.0062236785888671875, "step": 868} {"info/global_step": 869, "train_info/time_within_train_step": 27.96891140937805, "step": 869} {"train_info/time_between_train_steps": 0.005426645278930664, "step": 869} {"info/global_step": 870, "train_info/time_within_train_step": 27.82170271873474, "step": 870} {"train_info/time_between_train_steps": 0.005269765853881836, "step": 870} {"info/global_step": 871, "train_info/time_within_train_step": 27.86750102043152, "step": 871} {"train_info/time_between_train_steps": 0.0055255889892578125, "step": 871} {"info/global_step": 872, "train_info/time_within_train_step": 27.925307512283325, "step": 872} {"train_info/time_between_train_steps": 0.0057430267333984375, "step": 872} {"info/global_step": 873, "train_info/time_within_train_step": 28.0738263130188, "step": 873} {"train_info/time_between_train_steps": 0.005604982376098633, "step": 873} {"info/global_step": 874, "train_info/time_within_train_step": 28.023247718811035, "step": 874} {"train_info/time_between_train_steps": 0.011282205581665039, "step": 874} {"info/global_step": 875, "train_info/time_within_train_step": 27.98322868347168, "step": 875} {"train_info/time_between_train_steps": 0.005761384963989258, "step": 875} {"info/global_step": 876, "train_info/time_within_train_step": 27.981420278549194, "step": 876} {"train_info/time_between_train_steps": 0.006268024444580078, "step": 876} {"info/global_step": 877, "train_info/time_within_train_step": 27.93537163734436, "step": 877} {"train_info/time_between_train_steps": 0.00609588623046875, "step": 877} {"info/global_step": 878, "train_info/time_within_train_step": 27.94768261909485, "step": 878} {"train_info/time_between_train_steps": 0.005653858184814453, "step": 878} {"info/global_step": 879, "train_info/time_within_train_step": 27.90947914123535, "step": 879} {"train_info/time_between_train_steps": 0.00923013687133789, "step": 879} {"info/global_step": 880, "train_info/time_within_train_step": 27.938187837600708, "step": 880} {"train_info/time_between_train_steps": 0.010868310928344727, "step": 880} {"info/global_step": 881, "train_info/time_within_train_step": 27.99759531021118, "step": 881} {"train_info/time_between_train_steps": 0.0061130523681640625, "step": 881} {"info/global_step": 882, "train_info/time_within_train_step": 28.007490634918213, "step": 882} {"train_info/time_between_train_steps": 0.006865978240966797, "step": 882} {"info/global_step": 883, "train_info/time_within_train_step": 28.12627387046814, "step": 883} {"train_info/time_between_train_steps": 0.012643098831176758, "step": 883} {"info/global_step": 884, "train_info/time_within_train_step": 27.981439352035522, "step": 884} {"train_info/time_between_train_steps": 0.007307767868041992, "step": 884} {"info/global_step": 885, "train_info/time_within_train_step": 27.90947699546814, "step": 885} {"train_info/time_between_train_steps": 0.006138801574707031, "step": 885} {"info/global_step": 886, "train_info/time_within_train_step": 27.922860622406006, "step": 886} {"train_info/time_between_train_steps": 0.005804538726806641, "step": 886} {"info/global_step": 887, "train_info/time_within_train_step": 27.87931752204895, "step": 887} {"train_info/time_between_train_steps": 0.00600123405456543, "step": 887} {"info/global_step": 888, "train_info/time_within_train_step": 28.044672966003418, "step": 888} {"train_info/time_between_train_steps": 0.015778064727783203, "step": 888} {"train_info/time_between_train_steps": 5.344126462936401, "step": 888} {"info/global_step": 889, "train_info/time_within_train_step": 27.876063108444214, "step": 889} {"train_info/time_between_train_steps": 0.005171298980712891, "step": 889} {"info/global_step": 890, "train_info/time_within_train_step": 28.000138521194458, "step": 890} {"train_info/time_between_train_steps": 0.005452394485473633, "step": 890} {"info/global_step": 891, "train_info/time_within_train_step": 27.84483766555786, "step": 891} {"train_info/time_between_train_steps": 0.005944728851318359, "step": 891} {"info/global_step": 892, "train_info/time_within_train_step": 27.940255880355835, "step": 892} {"train_info/time_between_train_steps": 0.005712270736694336, "step": 892} {"info/global_step": 893, "train_info/time_within_train_step": 27.899933338165283, "step": 893} {"train_info/time_between_train_steps": 0.005553007125854492, "step": 893} {"info/global_step": 894, "train_info/time_within_train_step": 27.820339679718018, "step": 894} {"train_info/time_between_train_steps": 0.005334138870239258, "step": 894} {"info/global_step": 895, "train_info/time_within_train_step": 27.865430116653442, "step": 895} {"train_info/time_between_train_steps": 0.005246400833129883, "step": 895} {"info/global_step": 896, "train_info/time_within_train_step": 27.80813217163086, "step": 896} {"train_info/time_between_train_steps": 0.005289554595947266, "step": 896} {"info/global_step": 897, "train_info/time_within_train_step": 27.915367364883423, "step": 897} {"train_info/time_between_train_steps": 0.005543947219848633, "step": 897} {"info/global_step": 898, "train_info/time_within_train_step": 27.848084211349487, "step": 898} {"train_info/time_between_train_steps": 0.00555872917175293, "step": 898} {"info/global_step": 899, "train_info/time_within_train_step": 27.826393842697144, "step": 899} {"train_info/time_between_train_steps": 0.005648374557495117, "step": 899} {"info/global_step": 900, "train_info/time_within_train_step": 27.91648840904236, "step": 900} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733887674, "_runtime": 25986}, "step": 900} {"logs": {"train/loss": 4.0101, "train/learning_rate": 0.00016666666666666666, "train/epoch": 37.01, "_timestamp": 1733887674, "_runtime": 25986}, "step": 900} {"train_info/time_between_train_steps": 2.9591546058654785, "step": 900} {"info/global_step": 901, "train_info/time_within_train_step": 27.884081840515137, "step": 901} {"train_info/time_between_train_steps": 0.010945320129394531, "step": 901} {"info/global_step": 902, "train_info/time_within_train_step": 27.86406373977661, "step": 902} {"train_info/time_between_train_steps": 0.00526118278503418, "step": 902} {"info/global_step": 903, "train_info/time_within_train_step": 27.87629222869873, "step": 903} {"train_info/time_between_train_steps": 0.011861562728881836, "step": 903} {"info/global_step": 904, "train_info/time_within_train_step": 27.986878633499146, "step": 904} {"train_info/time_between_train_steps": 0.010555267333984375, "step": 904} {"info/global_step": 905, "train_info/time_within_train_step": 27.838485717773438, "step": 905} {"train_info/time_between_train_steps": 0.005414724349975586, "step": 905} {"info/global_step": 906, "train_info/time_within_train_step": 27.875592708587646, "step": 906} {"train_info/time_between_train_steps": 0.005292415618896484, "step": 906} {"info/global_step": 907, "train_info/time_within_train_step": 27.804466724395752, "step": 907} {"train_info/time_between_train_steps": 0.005299568176269531, "step": 907} {"info/global_step": 908, "train_info/time_within_train_step": 27.801083087921143, "step": 908} {"train_info/time_between_train_steps": 0.00581812858581543, "step": 908} {"info/global_step": 909, "train_info/time_within_train_step": 27.924331188201904, "step": 909} {"train_info/time_between_train_steps": 0.0052814483642578125, "step": 909} {"info/global_step": 910, "train_info/time_within_train_step": 27.825196743011475, "step": 910} {"train_info/time_between_train_steps": 0.006045341491699219, "step": 910} {"info/global_step": 911, "train_info/time_within_train_step": 27.840593099594116, "step": 911} {"train_info/time_between_train_steps": 0.006079435348510742, "step": 911} {"info/global_step": 912, "train_info/time_within_train_step": 27.888762950897217, "step": 912} {"train_info/time_between_train_steps": 0.006135702133178711, "step": 912} {"train_info/time_between_train_steps": 5.085971117019653, "step": 912} {"info/global_step": 913, "train_info/time_within_train_step": 27.817318201065063, "step": 913} {"train_info/time_between_train_steps": 0.005024433135986328, "step": 913} {"info/global_step": 914, "train_info/time_within_train_step": 27.97433114051819, "step": 914} {"train_info/time_between_train_steps": 0.006505727767944336, "step": 914} {"info/global_step": 915, "train_info/time_within_train_step": 27.94943904876709, "step": 915} {"train_info/time_between_train_steps": 0.005566120147705078, "step": 915} {"info/global_step": 916, "train_info/time_within_train_step": 28.04191303253174, "step": 916} {"train_info/time_between_train_steps": 0.005540370941162109, "step": 916} {"info/global_step": 917, "train_info/time_within_train_step": 27.926685333251953, "step": 917} {"train_info/time_between_train_steps": 0.0052187442779541016, "step": 917} {"info/global_step": 918, "train_info/time_within_train_step": 27.85184645652771, "step": 918} {"train_info/time_between_train_steps": 0.00523686408996582, "step": 918} {"info/global_step": 919, "train_info/time_within_train_step": 27.94430136680603, "step": 919} {"train_info/time_between_train_steps": 0.005269765853881836, "step": 919} {"info/global_step": 920, "train_info/time_within_train_step": 27.838752031326294, "step": 920} {"train_info/time_between_train_steps": 0.005185365676879883, "step": 920} {"info/global_step": 921, "train_info/time_within_train_step": 27.80368733406067, "step": 921} {"train_info/time_between_train_steps": 0.0056989192962646484, "step": 921} {"info/global_step": 922, "train_info/time_within_train_step": 27.8658230304718, "step": 922} {"train_info/time_between_train_steps": 0.005913972854614258, "step": 922} {"info/global_step": 923, "train_info/time_within_train_step": 27.876071453094482, "step": 923} {"train_info/time_between_train_steps": 0.005391359329223633, "step": 923} {"info/global_step": 924, "train_info/time_within_train_step": 27.842966318130493, "step": 924} {"train_info/time_between_train_steps": 0.005644083023071289, "step": 924} {"info/global_step": 925, "train_info/time_within_train_step": 27.826216220855713, "step": 925} {"train_info/time_between_train_steps": 0.009181022644042969, "step": 925} {"info/global_step": 926, "train_info/time_within_train_step": 27.84077477455139, "step": 926} {"train_info/time_between_train_steps": 0.005381107330322266, "step": 926} {"info/global_step": 927, "train_info/time_within_train_step": 27.917213916778564, "step": 927} {"train_info/time_between_train_steps": 0.005394697189331055, "step": 927} {"info/global_step": 928, "train_info/time_within_train_step": 27.82552146911621, "step": 928} {"train_info/time_between_train_steps": 0.009613513946533203, "step": 928} {"info/global_step": 929, "train_info/time_within_train_step": 27.828991889953613, "step": 929} {"train_info/time_between_train_steps": 0.005264997482299805, "step": 929} {"info/global_step": 930, "train_info/time_within_train_step": 27.84946894645691, "step": 930} {"train_info/time_between_train_steps": 0.005398750305175781, "step": 930} {"info/global_step": 931, "train_info/time_within_train_step": 27.903262615203857, "step": 931} {"train_info/time_between_train_steps": 0.0055963993072509766, "step": 931} {"info/global_step": 932, "train_info/time_within_train_step": 28.01182794570923, "step": 932} {"train_info/time_between_train_steps": 0.005692481994628906, "step": 932} {"info/global_step": 933, "train_info/time_within_train_step": 27.81058621406555, "step": 933} {"train_info/time_between_train_steps": 0.005754232406616211, "step": 933} {"info/global_step": 934, "train_info/time_within_train_step": 27.965450048446655, "step": 934} {"train_info/time_between_train_steps": 0.0070648193359375, "step": 934} {"info/global_step": 935, "train_info/time_within_train_step": 28.131367444992065, "step": 935} {"train_info/time_between_train_steps": 0.005963563919067383, "step": 935} {"info/global_step": 936, "train_info/time_within_train_step": 27.927685976028442, "step": 936} {"train_info/time_between_train_steps": 0.006070375442504883, "step": 936} {"train_info/time_between_train_steps": 5.437132835388184, "step": 936} {"info/global_step": 937, "train_info/time_within_train_step": 27.84115982055664, "step": 937} {"train_info/time_between_train_steps": 0.0055806636810302734, "step": 937} {"info/global_step": 938, "train_info/time_within_train_step": 28.006691694259644, "step": 938} {"train_info/time_between_train_steps": 0.0065898895263671875, "step": 938} {"info/global_step": 939, "train_info/time_within_train_step": 27.80047607421875, "step": 939} {"train_info/time_between_train_steps": 0.005469560623168945, "step": 939} {"info/global_step": 940, "train_info/time_within_train_step": 27.92683696746826, "step": 940} {"train_info/time_between_train_steps": 0.005613088607788086, "step": 940} {"info/global_step": 941, "train_info/time_within_train_step": 27.842132806777954, "step": 941} {"train_info/time_between_train_steps": 0.005785226821899414, "step": 941} {"info/global_step": 942, "train_info/time_within_train_step": 27.827579021453857, "step": 942} {"train_info/time_between_train_steps": 0.010230064392089844, "step": 942} {"info/global_step": 943, "train_info/time_within_train_step": 27.84981632232666, "step": 943} {"train_info/time_between_train_steps": 0.00640559196472168, "step": 943} {"info/global_step": 944, "train_info/time_within_train_step": 27.93044900894165, "step": 944} {"train_info/time_between_train_steps": 0.005368947982788086, "step": 944} {"info/global_step": 945, "train_info/time_within_train_step": 27.81655263900757, "step": 945} {"train_info/time_between_train_steps": 0.005617380142211914, "step": 945} {"info/global_step": 946, "train_info/time_within_train_step": 27.825392484664917, "step": 946} {"train_info/time_between_train_steps": 0.0053827762603759766, "step": 946} {"info/global_step": 947, "train_info/time_within_train_step": 27.829052686691284, "step": 947} {"train_info/time_between_train_steps": 0.0055119991302490234, "step": 947} {"info/global_step": 948, "train_info/time_within_train_step": 27.929964065551758, "step": 948} {"train_info/time_between_train_steps": 0.010542869567871094, "step": 948} {"info/global_step": 949, "train_info/time_within_train_step": 27.88458013534546, "step": 949} {"train_info/time_between_train_steps": 0.005186557769775391, "step": 949} {"info/global_step": 950, "train_info/time_within_train_step": 27.85302209854126, "step": 950} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733889082, "_runtime": 27394}, "step": 950} {"logs": {"train/loss": 3.9461, "train/learning_rate": 0.0001388888888888889, "train/epoch": 39.01, "_timestamp": 1733889082, "_runtime": 27394}, "step": 950} {"train_info/time_between_train_steps": 0.007400035858154297, "step": 950} {"info/global_step": 951, "train_info/time_within_train_step": 27.93006181716919, "step": 951} {"train_info/time_between_train_steps": 0.005506992340087891, "step": 951} {"info/global_step": 952, "train_info/time_within_train_step": 27.88629961013794, "step": 952} {"train_info/time_between_train_steps": 0.009310483932495117, "step": 952} {"info/global_step": 953, "train_info/time_within_train_step": 27.82680892944336, "step": 953} {"train_info/time_between_train_steps": 0.005295991897583008, "step": 953} {"info/global_step": 954, "train_info/time_within_train_step": 27.94121766090393, "step": 954} {"train_info/time_between_train_steps": 0.018523216247558594, "step": 954} {"info/global_step": 955, "train_info/time_within_train_step": 27.943815231323242, "step": 955} {"train_info/time_between_train_steps": 0.005396842956542969, "step": 955} {"info/global_step": 956, "train_info/time_within_train_step": 27.859354496002197, "step": 956} {"train_info/time_between_train_steps": 0.005617618560791016, "step": 956} {"info/global_step": 957, "train_info/time_within_train_step": 27.888511180877686, "step": 957} {"train_info/time_between_train_steps": 0.00799703598022461, "step": 957} {"info/global_step": 958, "train_info/time_within_train_step": 27.889397382736206, "step": 958} {"train_info/time_between_train_steps": 0.009823799133300781, "step": 958} {"info/global_step": 959, "train_info/time_within_train_step": 27.882930755615234, "step": 959} {"train_info/time_between_train_steps": 0.006162405014038086, "step": 959} {"info/global_step": 960, "train_info/time_within_train_step": 27.8966166973114, "step": 960} {"train_info/time_between_train_steps": 0.005913734436035156, "step": 960} {"train_info/time_between_train_steps": 5.191656589508057, "step": 960} {"info/global_step": 961, "train_info/time_within_train_step": 27.789000511169434, "step": 961} {"train_info/time_between_train_steps": 0.005738973617553711, "step": 961} {"info/global_step": 962, "train_info/time_within_train_step": 28.052489519119263, "step": 962} {"train_info/time_between_train_steps": 0.005551815032958984, "step": 962} {"info/global_step": 963, "train_info/time_within_train_step": 27.9151771068573, "step": 963} {"train_info/time_between_train_steps": 0.005597114562988281, "step": 963} {"info/global_step": 964, "train_info/time_within_train_step": 28.411425828933716, "step": 964} {"train_info/time_between_train_steps": 0.0050678253173828125, "step": 964} {"info/global_step": 965, "train_info/time_within_train_step": 27.83763360977173, "step": 965} {"train_info/time_between_train_steps": 0.0058650970458984375, "step": 965} {"info/global_step": 966, "train_info/time_within_train_step": 27.977898597717285, "step": 966} {"train_info/time_between_train_steps": 0.005273580551147461, "step": 966} {"info/global_step": 967, "train_info/time_within_train_step": 27.887017965316772, "step": 967} {"train_info/time_between_train_steps": 0.0051593780517578125, "step": 967} {"info/global_step": 968, "train_info/time_within_train_step": 27.821566343307495, "step": 968} {"train_info/time_between_train_steps": 0.005392551422119141, "step": 968} {"info/global_step": 969, "train_info/time_within_train_step": 27.810842275619507, "step": 969} {"train_info/time_between_train_steps": 0.005220651626586914, "step": 969} {"info/global_step": 970, "train_info/time_within_train_step": 27.844110012054443, "step": 970} {"train_info/time_between_train_steps": 0.0054836273193359375, "step": 970} {"info/global_step": 971, "train_info/time_within_train_step": 27.80595374107361, "step": 971} {"train_info/time_between_train_steps": 0.005359649658203125, "step": 971} {"info/global_step": 972, "train_info/time_within_train_step": 27.851890802383423, "step": 972} {"train_info/time_between_train_steps": 0.011244535446166992, "step": 972} {"info/global_step": 973, "train_info/time_within_train_step": 27.857337474822998, "step": 973} {"train_info/time_between_train_steps": 0.0053637027740478516, "step": 973} {"info/global_step": 974, "train_info/time_within_train_step": 27.86637592315674, "step": 974} {"train_info/time_between_train_steps": 0.005276203155517578, "step": 974} {"info/global_step": 975, "train_info/time_within_train_step": 27.866991758346558, "step": 975} {"train_info/time_between_train_steps": 0.010159492492675781, "step": 975} {"info/global_step": 976, "train_info/time_within_train_step": 27.831337451934814, "step": 976} {"train_info/time_between_train_steps": 0.00559544563293457, "step": 976} {"info/global_step": 977, "train_info/time_within_train_step": 27.88849663734436, "step": 977} {"train_info/time_between_train_steps": 0.0051991939544677734, "step": 977} {"info/global_step": 978, "train_info/time_within_train_step": 27.87962317466736, "step": 978} {"train_info/time_between_train_steps": 0.005331993103027344, "step": 978} {"info/global_step": 979, "train_info/time_within_train_step": 27.851089477539062, "step": 979} {"train_info/time_between_train_steps": 0.011881589889526367, "step": 979} {"info/global_step": 980, "train_info/time_within_train_step": 27.930831909179688, "step": 980} {"train_info/time_between_train_steps": 0.01476740837097168, "step": 980} {"info/global_step": 981, "train_info/time_within_train_step": 27.913533449172974, "step": 981} {"train_info/time_between_train_steps": 0.007160663604736328, "step": 981} {"info/global_step": 982, "train_info/time_within_train_step": 28.11786651611328, "step": 982} {"train_info/time_between_train_steps": 0.013040781021118164, "step": 982} {"info/global_step": 983, "train_info/time_within_train_step": 27.899564027786255, "step": 983} {"train_info/time_between_train_steps": 0.011513471603393555, "step": 983} {"info/global_step": 984, "train_info/time_within_train_step": 27.90519404411316, "step": 984} {"train_info/time_between_train_steps": 0.006306886672973633, "step": 984} {"train_info/time_between_train_steps": 5.3222222328186035, "step": 984} {"info/global_step": 985, "train_info/time_within_train_step": 27.84534525871277, "step": 985} {"train_info/time_between_train_steps": 0.005148172378540039, "step": 985} {"info/global_step": 986, "train_info/time_within_train_step": 28.026160717010498, "step": 986} {"train_info/time_between_train_steps": 0.0057599544525146484, "step": 986} {"info/global_step": 987, "train_info/time_within_train_step": 27.87250852584839, "step": 987} {"train_info/time_between_train_steps": 0.01073312759399414, "step": 987} {"info/global_step": 988, "train_info/time_within_train_step": 27.89476466178894, "step": 988} {"train_info/time_between_train_steps": 0.010852575302124023, "step": 988} {"info/global_step": 989, "train_info/time_within_train_step": 27.911609411239624, "step": 989} {"train_info/time_between_train_steps": 0.009978532791137695, "step": 989} {"info/global_step": 990, "train_info/time_within_train_step": 27.848854780197144, "step": 990} {"train_info/time_between_train_steps": 0.005465507507324219, "step": 990} {"info/global_step": 991, "train_info/time_within_train_step": 27.806310892105103, "step": 991} {"train_info/time_between_train_steps": 0.00540924072265625, "step": 991} {"info/global_step": 992, "train_info/time_within_train_step": 27.85192632675171, "step": 992} {"train_info/time_between_train_steps": 0.005357503890991211, "step": 992} {"info/global_step": 993, "train_info/time_within_train_step": 27.83337712287903, "step": 993} {"train_info/time_between_train_steps": 0.005525350570678711, "step": 993} {"info/global_step": 994, "train_info/time_within_train_step": 27.934894323349, "step": 994} {"train_info/time_between_train_steps": 0.009718179702758789, "step": 994} {"info/global_step": 995, "train_info/time_within_train_step": 27.91450810432434, "step": 995} {"train_info/time_between_train_steps": 0.005321025848388672, "step": 995} {"info/global_step": 996, "train_info/time_within_train_step": 27.864219427108765, "step": 996} {"train_info/time_between_train_steps": 0.005610942840576172, "step": 996} {"info/global_step": 997, "train_info/time_within_train_step": 28.008266925811768, "step": 997} {"train_info/time_between_train_steps": 0.010438680648803711, "step": 997} {"info/global_step": 998, "train_info/time_within_train_step": 27.83282995223999, "step": 998} {"train_info/time_between_train_steps": 0.010363101959228516, "step": 998} {"info/global_step": 999, "train_info/time_within_train_step": 27.869904041290283, "step": 999} {"train_info/time_between_train_steps": 0.005359649658203125, "step": 999} {"info/global_step": 1000, "train_info/time_within_train_step": 27.885088682174683, "step": 1000} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22648.0, "train_info/memory_max_reserved": 22648.0, "_timestamp": 1733890487, "_runtime": 28799}, "step": 1000} {"logs": {"train/loss": 3.8885, "train/learning_rate": 0.00011111111111111109, "train/epoch": 41.01, "_timestamp": 1733890487, "_runtime": 28799}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733890489, "_runtime": 28801}, "step": 1000} {"logs": {"eval/loss": 5.021076202392578, "eval/runtime": 1.8249, "eval/samples_per_second": 50.963, "eval/steps_per_second": 3.288, "train/epoch": 41.01, "_timestamp": 1733890489, "_runtime": 28801}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733890489, "_runtime": 28801}, "step": 1000} {"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 5.021076202392578, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 151.57434071608614, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 1.8249, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 50.963, "train/epoch": 41.01, "_timestamp": 1733890489, "_runtime": 28801}, "step": 1000} {"train_info/time_between_train_steps": 4.208867788314819, "step": 1000} {"info/global_step": 1001, "train_info/time_within_train_step": 27.871687650680542, "step": 1001} {"train_info/time_between_train_steps": 0.010308265686035156, "step": 1001} {"info/global_step": 1002, "train_info/time_within_train_step": 27.84255075454712, "step": 1002} {"train_info/time_between_train_steps": 0.005226612091064453, "step": 1002} {"info/global_step": 1003, "train_info/time_within_train_step": 27.873998403549194, "step": 1003} {"train_info/time_between_train_steps": 0.005320310592651367, "step": 1003} {"info/global_step": 1004, "train_info/time_within_train_step": 27.84050679206848, "step": 1004} {"train_info/time_between_train_steps": 0.010746002197265625, "step": 1004} {"info/global_step": 1005, "train_info/time_within_train_step": 27.91942071914673, "step": 1005} {"train_info/time_between_train_steps": 0.005536317825317383, "step": 1005} {"info/global_step": 1006, "train_info/time_within_train_step": 27.880692720413208, "step": 1006} {"train_info/time_between_train_steps": 0.0062940120697021484, "step": 1006} {"info/global_step": 1007, "train_info/time_within_train_step": 27.865641355514526, "step": 1007} {"train_info/time_between_train_steps": 0.010835886001586914, "step": 1007} {"info/global_step": 1008, "train_info/time_within_train_step": 27.99689292907715, "step": 1008} {"train_info/time_between_train_steps": 0.010865449905395508, "step": 1008} {"train_info/time_between_train_steps": 5.426269054412842, "step": 1008} {"info/global_step": 1009, "train_info/time_within_train_step": 27.834061861038208, "step": 1009} {"train_info/time_between_train_steps": 0.01191091537475586, "step": 1009} {"info/global_step": 1010, "train_info/time_within_train_step": 27.97603130340576, "step": 1010} {"train_info/time_between_train_steps": 0.005285024642944336, "step": 1010} {"info/global_step": 1011, "train_info/time_within_train_step": 27.933807134628296, "step": 1011} {"train_info/time_between_train_steps": 0.00547337532043457, "step": 1011} {"info/global_step": 1012, "train_info/time_within_train_step": 27.945985794067383, "step": 1012} {"train_info/time_between_train_steps": 0.005488157272338867, "step": 1012} {"info/global_step": 1013, "train_info/time_within_train_step": 27.975032806396484, "step": 1013} {"train_info/time_between_train_steps": 0.0052869319915771484, "step": 1013} {"info/global_step": 1014, "train_info/time_within_train_step": 27.847171306610107, "step": 1014} {"train_info/time_between_train_steps": 0.014146566390991211, "step": 1014} {"info/global_step": 1015, "train_info/time_within_train_step": 27.91959023475647, "step": 1015} {"train_info/time_between_train_steps": 0.009741067886352539, "step": 1015} {"info/global_step": 1016, "train_info/time_within_train_step": 27.85541081428528, "step": 1016} {"train_info/time_between_train_steps": 0.010186433792114258, "step": 1016} {"info/global_step": 1017, "train_info/time_within_train_step": 27.88287615776062, "step": 1017} {"train_info/time_between_train_steps": 0.005461692810058594, "step": 1017} {"info/global_step": 1018, "train_info/time_within_train_step": 27.824490308761597, "step": 1018} {"train_info/time_between_train_steps": 0.005400180816650391, "step": 1018} {"info/global_step": 1019, "train_info/time_within_train_step": 27.83704400062561, "step": 1019} {"train_info/time_between_train_steps": 0.005383491516113281, "step": 1019} {"info/global_step": 1020, "train_info/time_within_train_step": 27.93085741996765, "step": 1020} {"train_info/time_between_train_steps": 0.0072023868560791016, "step": 1020} {"info/global_step": 1021, "train_info/time_within_train_step": 27.890251636505127, "step": 1021} {"train_info/time_between_train_steps": 0.005392789840698242, "step": 1021} {"info/global_step": 1022, "train_info/time_within_train_step": 27.814088106155396, "step": 1022} {"train_info/time_between_train_steps": 0.005352973937988281, "step": 1022} {"info/global_step": 1023, "train_info/time_within_train_step": 27.812724351882935, "step": 1023} {"train_info/time_between_train_steps": 0.0053558349609375, "step": 1023} {"info/global_step": 1024, "train_info/time_within_train_step": 27.879349946975708, "step": 1024} {"train_info/time_between_train_steps": 0.005811214447021484, "step": 1024} {"info/global_step": 1025, "train_info/time_within_train_step": 27.849042415618896, "step": 1025} {"train_info/time_between_train_steps": 0.005323886871337891, "step": 1025} {"info/global_step": 1026, "train_info/time_within_train_step": 27.816988945007324, "step": 1026} {"train_info/time_between_train_steps": 0.00547480583190918, "step": 1026} {"info/global_step": 1027, "train_info/time_within_train_step": 27.818432331085205, "step": 1027} {"train_info/time_between_train_steps": 0.005283355712890625, "step": 1027} {"info/global_step": 1028, "train_info/time_within_train_step": 28.04896569252014, "step": 1028} {"train_info/time_between_train_steps": 0.00604248046875, "step": 1028} {"info/global_step": 1029, "train_info/time_within_train_step": 27.856252193450928, "step": 1029} {"train_info/time_between_train_steps": 0.005608081817626953, "step": 1029} {"info/global_step": 1030, "train_info/time_within_train_step": 27.89925503730774, "step": 1030} {"train_info/time_between_train_steps": 0.00982809066772461, "step": 1030} {"info/global_step": 1031, "train_info/time_within_train_step": 27.8701491355896, "step": 1031} {"train_info/time_between_train_steps": 0.011253118515014648, "step": 1031} {"info/global_step": 1032, "train_info/time_within_train_step": 27.858869075775146, "step": 1032} {"train_info/time_between_train_steps": 0.0070421695709228516, "step": 1032} {"train_info/time_between_train_steps": 5.631202697753906, "step": 1032} {"info/global_step": 1033, "train_info/time_within_train_step": 27.875207901000977, "step": 1033} {"train_info/time_between_train_steps": 0.010218620300292969, "step": 1033} {"info/global_step": 1034, "train_info/time_within_train_step": 28.023854732513428, "step": 1034} {"train_info/time_between_train_steps": 0.005663156509399414, "step": 1034} {"info/global_step": 1035, "train_info/time_within_train_step": 27.858847856521606, "step": 1035} {"train_info/time_between_train_steps": 0.010233640670776367, "step": 1035} {"info/global_step": 1036, "train_info/time_within_train_step": 27.96044635772705, "step": 1036} {"train_info/time_between_train_steps": 0.005649089813232422, "step": 1036} {"info/global_step": 1037, "train_info/time_within_train_step": 27.82658886909485, "step": 1037} {"train_info/time_between_train_steps": 0.0054895877838134766, "step": 1037} {"info/global_step": 1038, "train_info/time_within_train_step": 27.847219467163086, "step": 1038} {"train_info/time_between_train_steps": 0.0050258636474609375, "step": 1038} {"info/global_step": 1039, "train_info/time_within_train_step": 27.800825357437134, "step": 1039} {"train_info/time_between_train_steps": 0.005166530609130859, "step": 1039} {"info/global_step": 1040, "train_info/time_within_train_step": 27.850704193115234, "step": 1040} {"train_info/time_between_train_steps": 0.005276918411254883, "step": 1040} {"info/global_step": 1041, "train_info/time_within_train_step": 27.860581874847412, "step": 1041} {"train_info/time_between_train_steps": 0.005258321762084961, "step": 1041} {"info/global_step": 1042, "train_info/time_within_train_step": 27.894838094711304, "step": 1042} {"train_info/time_between_train_steps": 0.009755373001098633, "step": 1042} {"info/global_step": 1043, "train_info/time_within_train_step": 27.88935685157776, "step": 1043} {"train_info/time_between_train_steps": 0.005264997482299805, "step": 1043} {"info/global_step": 1044, "train_info/time_within_train_step": 27.943812370300293, "step": 1044} {"train_info/time_between_train_steps": 0.005316495895385742, "step": 1044} {"info/global_step": 1045, "train_info/time_within_train_step": 27.898627996444702, "step": 1045} {"train_info/time_between_train_steps": 0.005282163619995117, "step": 1045} {"info/global_step": 1046, "train_info/time_within_train_step": 27.890408039093018, "step": 1046} {"train_info/time_between_train_steps": 0.005305767059326172, "step": 1046} {"info/global_step": 1047, "train_info/time_within_train_step": 27.83865213394165, "step": 1047} {"train_info/time_between_train_steps": 0.010326147079467773, "step": 1047} {"info/global_step": 1048, "train_info/time_within_train_step": 27.825844526290894, "step": 1048} {"train_info/time_between_train_steps": 0.005569934844970703, "step": 1048} {"info/global_step": 1049, "train_info/time_within_train_step": 27.864558696746826, "step": 1049} {"train_info/time_between_train_steps": 0.009278297424316406, "step": 1049} {"info/global_step": 1050, "train_info/time_within_train_step": 27.882912635803223, "step": 1050} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733891897, "_runtime": 30209}, "step": 1050} {"logs": {"train/loss": 3.8378, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 43.02, "_timestamp": 1733891897, "_runtime": 30209}, "step": 1050} {"train_info/time_between_train_steps": 0.010396003723144531, "step": 1050} {"info/global_step": 1051, "train_info/time_within_train_step": 27.870380401611328, "step": 1051} {"train_info/time_between_train_steps": 0.009507894515991211, "step": 1051} {"info/global_step": 1052, "train_info/time_within_train_step": 27.832257747650146, "step": 1052} {"train_info/time_between_train_steps": 0.009567975997924805, "step": 1052} {"info/global_step": 1053, "train_info/time_within_train_step": 27.935939073562622, "step": 1053} {"train_info/time_between_train_steps": 0.0055081844329833984, "step": 1053} {"info/global_step": 1054, "train_info/time_within_train_step": 27.880056619644165, "step": 1054} {"train_info/time_between_train_steps": 0.010406494140625, "step": 1054} {"info/global_step": 1055, "train_info/time_within_train_step": 27.860008001327515, "step": 1055} {"train_info/time_between_train_steps": 0.00567317008972168, "step": 1055} {"info/global_step": 1056, "train_info/time_within_train_step": 27.90692710876465, "step": 1056} {"train_info/time_between_train_steps": 0.00601959228515625, "step": 1056} {"train_info/time_between_train_steps": 5.076283693313599, "step": 1056} {"info/global_step": 1057, "train_info/time_within_train_step": 27.840405225753784, "step": 1057} {"train_info/time_between_train_steps": 0.005169391632080078, "step": 1057} {"info/global_step": 1058, "train_info/time_within_train_step": 28.035789966583252, "step": 1058} {"train_info/time_between_train_steps": 0.005443096160888672, "step": 1058} {"info/global_step": 1059, "train_info/time_within_train_step": 27.889871835708618, "step": 1059} {"train_info/time_between_train_steps": 0.005475044250488281, "step": 1059} {"info/global_step": 1060, "train_info/time_within_train_step": 28.028029918670654, "step": 1060} {"train_info/time_between_train_steps": 0.005610942840576172, "step": 1060} {"info/global_step": 1061, "train_info/time_within_train_step": 27.823429107666016, "step": 1061} {"train_info/time_between_train_steps": 0.005183219909667969, "step": 1061} {"info/global_step": 1062, "train_info/time_within_train_step": 27.829499006271362, "step": 1062} {"train_info/time_between_train_steps": 0.005187034606933594, "step": 1062} {"info/global_step": 1063, "train_info/time_within_train_step": 27.781425952911377, "step": 1063} {"train_info/time_between_train_steps": 0.005378246307373047, "step": 1063} {"info/global_step": 1064, "train_info/time_within_train_step": 27.827489137649536, "step": 1064} {"train_info/time_between_train_steps": 0.005195140838623047, "step": 1064} {"info/global_step": 1065, "train_info/time_within_train_step": 27.831575632095337, "step": 1065} {"train_info/time_between_train_steps": 0.005433797836303711, "step": 1065} {"info/global_step": 1066, "train_info/time_within_train_step": 27.86000967025757, "step": 1066} {"train_info/time_between_train_steps": 0.005422830581665039, "step": 1066} {"info/global_step": 1067, "train_info/time_within_train_step": 27.841500282287598, "step": 1067} {"train_info/time_between_train_steps": 0.005216360092163086, "step": 1067} {"info/global_step": 1068, "train_info/time_within_train_step": 27.848201990127563, "step": 1068} {"train_info/time_between_train_steps": 0.005240917205810547, "step": 1068} {"info/global_step": 1069, "train_info/time_within_train_step": 27.81586480140686, "step": 1069} {"train_info/time_between_train_steps": 0.00553584098815918, "step": 1069} {"info/global_step": 1070, "train_info/time_within_train_step": 27.87034583091736, "step": 1070} {"train_info/time_between_train_steps": 0.010185480117797852, "step": 1070} {"info/global_step": 1071, "train_info/time_within_train_step": 27.8208429813385, "step": 1071} {"train_info/time_between_train_steps": 0.005502939224243164, "step": 1071} {"info/global_step": 1072, "train_info/time_within_train_step": 27.8571138381958, "step": 1072} {"train_info/time_between_train_steps": 0.005479574203491211, "step": 1072} {"info/global_step": 1073, "train_info/time_within_train_step": 27.901679754257202, "step": 1073} {"train_info/time_between_train_steps": 0.0064699649810791016, "step": 1073} {"info/global_step": 1074, "train_info/time_within_train_step": 27.861160039901733, "step": 1074} {"train_info/time_between_train_steps": 0.005468606948852539, "step": 1074} {"info/global_step": 1075, "train_info/time_within_train_step": 28.04956865310669, "step": 1075} {"train_info/time_between_train_steps": 0.0055484771728515625, "step": 1075} {"info/global_step": 1076, "train_info/time_within_train_step": 27.876789331436157, "step": 1076} {"train_info/time_between_train_steps": 0.0059244632720947266, "step": 1076} {"info/global_step": 1077, "train_info/time_within_train_step": 27.894335746765137, "step": 1077} {"train_info/time_between_train_steps": 0.005440235137939453, "step": 1077} {"info/global_step": 1078, "train_info/time_within_train_step": 27.837372541427612, "step": 1078} {"train_info/time_between_train_steps": 0.00574803352355957, "step": 1078} {"info/global_step": 1079, "train_info/time_within_train_step": 27.862847328186035, "step": 1079} {"train_info/time_between_train_steps": 0.0058135986328125, "step": 1079} {"info/global_step": 1080, "train_info/time_within_train_step": 27.939833164215088, "step": 1080} {"train_info/time_between_train_steps": 0.006144285202026367, "step": 1080} {"train_info/time_between_train_steps": 5.433382272720337, "step": 1080} {"info/global_step": 1081, "train_info/time_within_train_step": 27.86947202682495, "step": 1081} {"train_info/time_between_train_steps": 0.01010751724243164, "step": 1081} {"info/global_step": 1082, "train_info/time_within_train_step": 28.01881718635559, "step": 1082} {"train_info/time_between_train_steps": 0.005396604537963867, "step": 1082} {"info/global_step": 1083, "train_info/time_within_train_step": 27.928024291992188, "step": 1083} {"train_info/time_between_train_steps": 0.005327701568603516, "step": 1083} {"info/global_step": 1084, "train_info/time_within_train_step": 27.879897832870483, "step": 1084} {"train_info/time_between_train_steps": 0.005597829818725586, "step": 1084} {"info/global_step": 1085, "train_info/time_within_train_step": 27.84545636177063, "step": 1085} {"train_info/time_between_train_steps": 0.00518035888671875, "step": 1085} {"info/global_step": 1086, "train_info/time_within_train_step": 27.820013761520386, "step": 1086} {"train_info/time_between_train_steps": 0.005136013031005859, "step": 1086} {"info/global_step": 1087, "train_info/time_within_train_step": 27.82221007347107, "step": 1087} {"train_info/time_between_train_steps": 0.00972437858581543, "step": 1087} {"info/global_step": 1088, "train_info/time_within_train_step": 27.811971187591553, "step": 1088} {"train_info/time_between_train_steps": 0.005386829376220703, "step": 1088} {"info/global_step": 1089, "train_info/time_within_train_step": 27.79498600959778, "step": 1089} {"train_info/time_between_train_steps": 0.005358219146728516, "step": 1089} {"info/global_step": 1090, "train_info/time_within_train_step": 27.800930976867676, "step": 1090} {"train_info/time_between_train_steps": 0.005383491516113281, "step": 1090} {"info/global_step": 1091, "train_info/time_within_train_step": 27.90198254585266, "step": 1091} {"train_info/time_between_train_steps": 0.009496688842773438, "step": 1091} {"info/global_step": 1092, "train_info/time_within_train_step": 27.837273836135864, "step": 1092} {"train_info/time_between_train_steps": 0.006284952163696289, "step": 1092} {"info/global_step": 1093, "train_info/time_within_train_step": 27.8120756149292, "step": 1093} {"train_info/time_between_train_steps": 0.0055468082427978516, "step": 1093} {"info/global_step": 1094, "train_info/time_within_train_step": 27.841538190841675, "step": 1094} {"train_info/time_between_train_steps": 0.005209922790527344, "step": 1094} {"info/global_step": 1095, "train_info/time_within_train_step": 27.830973625183105, "step": 1095} {"train_info/time_between_train_steps": 0.0053424835205078125, "step": 1095} {"info/global_step": 1096, "train_info/time_within_train_step": 27.84394598007202, "step": 1096} {"train_info/time_between_train_steps": 0.0053327083587646484, "step": 1096} {"info/global_step": 1097, "train_info/time_within_train_step": 27.92316508293152, "step": 1097} {"train_info/time_between_train_steps": 0.0055446624755859375, "step": 1097} {"info/global_step": 1098, "train_info/time_within_train_step": 27.883422374725342, "step": 1098} {"train_info/time_between_train_steps": 0.005305290222167969, "step": 1098} {"info/global_step": 1099, "train_info/time_within_train_step": 27.865355730056763, "step": 1099} {"train_info/time_between_train_steps": 0.005285024642944336, "step": 1099} {"info/global_step": 1100, "train_info/time_within_train_step": 27.873096704483032, "step": 1100} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733893302, "_runtime": 31614}, "step": 1100} {"logs": {"train/loss": 3.795, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 45.02, "_timestamp": 1733893302, "_runtime": 31614}, "step": 1100} {"train_info/time_between_train_steps": 2.3480334281921387, "step": 1100} {"info/global_step": 1101, "train_info/time_within_train_step": 27.819809436798096, "step": 1101} {"train_info/time_between_train_steps": 0.005479574203491211, "step": 1101} {"info/global_step": 1102, "train_info/time_within_train_step": 27.82911515235901, "step": 1102} {"train_info/time_between_train_steps": 0.005760908126831055, "step": 1102} {"info/global_step": 1103, "train_info/time_within_train_step": 27.89913821220398, "step": 1103} {"train_info/time_between_train_steps": 0.006544589996337891, "step": 1103} {"info/global_step": 1104, "train_info/time_within_train_step": 27.878231287002563, "step": 1104} {"train_info/time_between_train_steps": 0.00638127326965332, "step": 1104} {"train_info/time_between_train_steps": 5.429275035858154, "step": 1104} {"info/global_step": 1105, "train_info/time_within_train_step": 27.801952600479126, "step": 1105} {"train_info/time_between_train_steps": 0.00572657585144043, "step": 1105} {"info/global_step": 1106, "train_info/time_within_train_step": 28.12136435508728, "step": 1106} {"train_info/time_between_train_steps": 0.005679607391357422, "step": 1106} {"info/global_step": 1107, "train_info/time_within_train_step": 27.84022045135498, "step": 1107} {"train_info/time_between_train_steps": 0.005803108215332031, "step": 1107} {"info/global_step": 1108, "train_info/time_within_train_step": 27.927231311798096, "step": 1108} {"train_info/time_between_train_steps": 0.00576329231262207, "step": 1108} {"info/global_step": 1109, "train_info/time_within_train_step": 27.82115125656128, "step": 1109} {"train_info/time_between_train_steps": 0.009726524353027344, "step": 1109} {"info/global_step": 1110, "train_info/time_within_train_step": 27.84475016593933, "step": 1110} {"train_info/time_between_train_steps": 0.005287647247314453, "step": 1110} {"info/global_step": 1111, "train_info/time_within_train_step": 27.821574926376343, "step": 1111} {"train_info/time_between_train_steps": 0.005259513854980469, "step": 1111} {"info/global_step": 1112, "train_info/time_within_train_step": 27.83818030357361, "step": 1112} {"train_info/time_between_train_steps": 0.0053670406341552734, "step": 1112} {"info/global_step": 1113, "train_info/time_within_train_step": 27.871209621429443, "step": 1113} {"train_info/time_between_train_steps": 0.005872011184692383, "step": 1113} {"info/global_step": 1114, "train_info/time_within_train_step": 27.851113319396973, "step": 1114} {"train_info/time_between_train_steps": 0.005345582962036133, "step": 1114} {"info/global_step": 1115, "train_info/time_within_train_step": 27.8630211353302, "step": 1115} {"train_info/time_between_train_steps": 0.009368658065795898, "step": 1115} {"info/global_step": 1116, "train_info/time_within_train_step": 27.82919931411743, "step": 1116} {"train_info/time_between_train_steps": 0.005470991134643555, "step": 1116} {"info/global_step": 1117, "train_info/time_within_train_step": 27.795893669128418, "step": 1117} {"train_info/time_between_train_steps": 0.005371570587158203, "step": 1117} {"info/global_step": 1118, "train_info/time_within_train_step": 27.81351399421692, "step": 1118} {"train_info/time_between_train_steps": 0.005371809005737305, "step": 1118} {"info/global_step": 1119, "train_info/time_within_train_step": 27.87670087814331, "step": 1119} {"train_info/time_between_train_steps": 0.005535602569580078, "step": 1119} {"info/global_step": 1120, "train_info/time_within_train_step": 27.8546245098114, "step": 1120} {"train_info/time_between_train_steps": 0.005479335784912109, "step": 1120} {"info/global_step": 1121, "train_info/time_within_train_step": 27.780725955963135, "step": 1121} {"train_info/time_between_train_steps": 0.005257606506347656, "step": 1121} {"info/global_step": 1122, "train_info/time_within_train_step": 27.91702675819397, "step": 1122} {"train_info/time_between_train_steps": 0.005615711212158203, "step": 1122} {"info/global_step": 1123, "train_info/time_within_train_step": 27.83725619316101, "step": 1123} {"train_info/time_between_train_steps": 0.005323886871337891, "step": 1123} {"info/global_step": 1124, "train_info/time_within_train_step": 27.790276288986206, "step": 1124} {"train_info/time_between_train_steps": 0.005994558334350586, "step": 1124} {"info/global_step": 1125, "train_info/time_within_train_step": 27.972107410430908, "step": 1125} {"train_info/time_between_train_steps": 0.005520820617675781, "step": 1125} {"info/global_step": 1126, "train_info/time_within_train_step": 27.920991897583008, "step": 1126} {"train_info/time_between_train_steps": 0.0057659149169921875, "step": 1126} {"info/global_step": 1127, "train_info/time_within_train_step": 27.863704442977905, "step": 1127} {"train_info/time_between_train_steps": 0.005798816680908203, "step": 1127} {"info/global_step": 1128, "train_info/time_within_train_step": 27.84405493736267, "step": 1128} {"train_info/time_between_train_steps": 0.010540008544921875, "step": 1128} {"train_info/time_between_train_steps": 5.095949172973633, "step": 1128} {"info/global_step": 1129, "train_info/time_within_train_step": 27.899057149887085, "step": 1129} {"train_info/time_between_train_steps": 0.005826473236083984, "step": 1129} {"info/global_step": 1130, "train_info/time_within_train_step": 28.023507356643677, "step": 1130} {"train_info/time_between_train_steps": 0.005648374557495117, "step": 1130} {"info/global_step": 1131, "train_info/time_within_train_step": 27.80763292312622, "step": 1131} {"train_info/time_between_train_steps": 0.006804943084716797, "step": 1131} {"info/global_step": 1132, "train_info/time_within_train_step": 27.906848192214966, "step": 1132} {"train_info/time_between_train_steps": 0.0055999755859375, "step": 1132} {"info/global_step": 1133, "train_info/time_within_train_step": 27.797048568725586, "step": 1133} {"train_info/time_between_train_steps": 0.005110025405883789, "step": 1133} {"info/global_step": 1134, "train_info/time_within_train_step": 27.830748319625854, "step": 1134} {"train_info/time_between_train_steps": 0.010213136672973633, "step": 1134} {"info/global_step": 1135, "train_info/time_within_train_step": 27.767333269119263, "step": 1135} {"train_info/time_between_train_steps": 0.010088443756103516, "step": 1135} {"info/global_step": 1136, "train_info/time_within_train_step": 27.76253867149353, "step": 1136} {"train_info/time_between_train_steps": 0.00527644157409668, "step": 1136} {"info/global_step": 1137, "train_info/time_within_train_step": 27.88440203666687, "step": 1137} {"train_info/time_between_train_steps": 0.005332469940185547, "step": 1137} {"info/global_step": 1138, "train_info/time_within_train_step": 27.78595805168152, "step": 1138} {"train_info/time_between_train_steps": 0.0051119327545166016, "step": 1138} {"info/global_step": 1139, "train_info/time_within_train_step": 27.79640483856201, "step": 1139} {"train_info/time_between_train_steps": 0.005146503448486328, "step": 1139} {"info/global_step": 1140, "train_info/time_within_train_step": 27.97141933441162, "step": 1140} {"train_info/time_between_train_steps": 0.009627103805541992, "step": 1140} {"info/global_step": 1141, "train_info/time_within_train_step": 27.777838230133057, "step": 1141} {"train_info/time_between_train_steps": 0.006667375564575195, "step": 1141} {"info/global_step": 1142, "train_info/time_within_train_step": 27.77028489112854, "step": 1142} {"train_info/time_between_train_steps": 0.005158662796020508, "step": 1142} {"info/global_step": 1143, "train_info/time_within_train_step": 27.782121658325195, "step": 1143} {"train_info/time_between_train_steps": 0.005317211151123047, "step": 1143} {"info/global_step": 1144, "train_info/time_within_train_step": 27.75640892982483, "step": 1144} {"train_info/time_between_train_steps": 0.005335092544555664, "step": 1144} {"info/global_step": 1145, "train_info/time_within_train_step": 27.747837781906128, "step": 1145} {"train_info/time_between_train_steps": 0.00524592399597168, "step": 1145} {"info/global_step": 1146, "train_info/time_within_train_step": 27.794943809509277, "step": 1146} {"train_info/time_between_train_steps": 0.00536656379699707, "step": 1146} {"info/global_step": 1147, "train_info/time_within_train_step": 27.789411783218384, "step": 1147} {"train_info/time_between_train_steps": 0.005321979522705078, "step": 1147} {"info/global_step": 1148, "train_info/time_within_train_step": 27.785889863967896, "step": 1148} {"train_info/time_between_train_steps": 0.005522012710571289, "step": 1148} {"info/global_step": 1149, "train_info/time_within_train_step": 27.779873847961426, "step": 1149} {"train_info/time_between_train_steps": 0.01063680648803711, "step": 1149} {"info/global_step": 1150, "train_info/time_within_train_step": 27.966851949691772, "step": 1150} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733894707, "_runtime": 33019}, "step": 1150} {"logs": {"train/loss": 3.759, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 47.02, "_timestamp": 1733894707, "_runtime": 33019}, "step": 1150} {"train_info/time_between_train_steps": 0.007906436920166016, "step": 1150} {"info/global_step": 1151, "train_info/time_within_train_step": 27.835726022720337, "step": 1151} {"train_info/time_between_train_steps": 0.011323690414428711, "step": 1151} {"info/global_step": 1152, "train_info/time_within_train_step": 27.824504137039185, "step": 1152} {"train_info/time_between_train_steps": 0.005723237991333008, "step": 1152} {"train_info/time_between_train_steps": 5.2894017696380615, "step": 1152} {"info/global_step": 1153, "train_info/time_within_train_step": 27.985440492630005, "step": 1153} {"train_info/time_between_train_steps": 0.005067110061645508, "step": 1153} {"info/global_step": 1154, "train_info/time_within_train_step": 27.958593368530273, "step": 1154} {"train_info/time_between_train_steps": 0.005697965621948242, "step": 1154} {"info/global_step": 1155, "train_info/time_within_train_step": 27.82355284690857, "step": 1155} {"train_info/time_between_train_steps": 0.005614042282104492, "step": 1155} {"info/global_step": 1156, "train_info/time_within_train_step": 27.937049865722656, "step": 1156} {"train_info/time_between_train_steps": 0.0055696964263916016, "step": 1156} {"info/global_step": 1157, "train_info/time_within_train_step": 27.911148071289062, "step": 1157} {"train_info/time_between_train_steps": 0.010195493698120117, "step": 1157} {"info/global_step": 1158, "train_info/time_within_train_step": 27.859436988830566, "step": 1158} {"train_info/time_between_train_steps": 0.00612187385559082, "step": 1158} {"info/global_step": 1159, "train_info/time_within_train_step": 27.848834991455078, "step": 1159} {"train_info/time_between_train_steps": 0.0053653717041015625, "step": 1159} {"info/global_step": 1160, "train_info/time_within_train_step": 27.8270845413208, "step": 1160} {"train_info/time_between_train_steps": 0.005553483963012695, "step": 1160} {"info/global_step": 1161, "train_info/time_within_train_step": 27.937666654586792, "step": 1161} {"train_info/time_between_train_steps": 0.009557247161865234, "step": 1161} {"info/global_step": 1162, "train_info/time_within_train_step": 27.889426469802856, "step": 1162} {"train_info/time_between_train_steps": 0.005408048629760742, "step": 1162} {"info/global_step": 1163, "train_info/time_within_train_step": 27.807403087615967, "step": 1163} {"train_info/time_between_train_steps": 0.0055408477783203125, "step": 1163} {"info/global_step": 1164, "train_info/time_within_train_step": 27.82313847541809, "step": 1164} {"train_info/time_between_train_steps": 0.005788564682006836, "step": 1164} {"info/global_step": 1165, "train_info/time_within_train_step": 27.812424182891846, "step": 1165} {"train_info/time_between_train_steps": 0.005278825759887695, "step": 1165} {"info/global_step": 1166, "train_info/time_within_train_step": 27.809709787368774, "step": 1166} {"train_info/time_between_train_steps": 0.009994983673095703, "step": 1166} {"info/global_step": 1167, "train_info/time_within_train_step": 27.82848834991455, "step": 1167} {"train_info/time_between_train_steps": 0.005500316619873047, "step": 1167} {"info/global_step": 1168, "train_info/time_within_train_step": 27.817094564437866, "step": 1168} {"train_info/time_between_train_steps": 0.010876178741455078, "step": 1168} {"info/global_step": 1169, "train_info/time_within_train_step": 28.011725902557373, "step": 1169} {"train_info/time_between_train_steps": 0.005517721176147461, "step": 1169} {"info/global_step": 1170, "train_info/time_within_train_step": 27.841821432113647, "step": 1170} {"train_info/time_between_train_steps": 0.00686335563659668, "step": 1170} {"info/global_step": 1171, "train_info/time_within_train_step": 27.825981616973877, "step": 1171} {"train_info/time_between_train_steps": 0.005440235137939453, "step": 1171} {"info/global_step": 1172, "train_info/time_within_train_step": 27.810929775238037, "step": 1172} {"train_info/time_between_train_steps": 0.005632638931274414, "step": 1172} {"info/global_step": 1173, "train_info/time_within_train_step": 27.806205987930298, "step": 1173} {"train_info/time_between_train_steps": 0.005555629730224609, "step": 1173} {"info/global_step": 1174, "train_info/time_within_train_step": 27.86811661720276, "step": 1174} {"train_info/time_between_train_steps": 0.005770683288574219, "step": 1174} {"info/global_step": 1175, "train_info/time_within_train_step": 27.852508068084717, "step": 1175} {"train_info/time_between_train_steps": 0.005838632583618164, "step": 1175} {"info/global_step": 1176, "train_info/time_within_train_step": 27.874561309814453, "step": 1176} {"train_info/time_between_train_steps": 0.006274700164794922, "step": 1176} {"train_info/time_between_train_steps": 5.651469469070435, "step": 1176} {"info/global_step": 1177, "train_info/time_within_train_step": 27.818220615386963, "step": 1177} {"train_info/time_between_train_steps": 0.0054509639739990234, "step": 1177} {"info/global_step": 1178, "train_info/time_within_train_step": 27.972622394561768, "step": 1178} {"train_info/time_between_train_steps": 0.010340690612792969, "step": 1178} {"info/global_step": 1179, "train_info/time_within_train_step": 27.805202960968018, "step": 1179} {"train_info/time_between_train_steps": 0.0056116580963134766, "step": 1179} {"info/global_step": 1180, "train_info/time_within_train_step": 27.895092010498047, "step": 1180} {"train_info/time_between_train_steps": 0.005451679229736328, "step": 1180} {"info/global_step": 1181, "train_info/time_within_train_step": 27.863542079925537, "step": 1181} {"train_info/time_between_train_steps": 0.005273342132568359, "step": 1181} {"info/global_step": 1182, "train_info/time_within_train_step": 27.808309316635132, "step": 1182} {"train_info/time_between_train_steps": 0.0073893070220947266, "step": 1182} {"info/global_step": 1183, "train_info/time_within_train_step": 27.802002906799316, "step": 1183} {"train_info/time_between_train_steps": 0.005164623260498047, "step": 1183} {"info/global_step": 1184, "train_info/time_within_train_step": 27.897860527038574, "step": 1184} {"train_info/time_between_train_steps": 0.005354166030883789, "step": 1184} {"info/global_step": 1185, "train_info/time_within_train_step": 27.824500799179077, "step": 1185} {"train_info/time_between_train_steps": 0.0053369998931884766, "step": 1185} {"info/global_step": 1186, "train_info/time_within_train_step": 27.798107385635376, "step": 1186} {"train_info/time_between_train_steps": 0.005399942398071289, "step": 1186} {"info/global_step": 1187, "train_info/time_within_train_step": 27.82336711883545, "step": 1187} {"train_info/time_between_train_steps": 0.0055332183837890625, "step": 1187} {"info/global_step": 1188, "train_info/time_within_train_step": 27.878303050994873, "step": 1188} {"train_info/time_between_train_steps": 0.005467414855957031, "step": 1188} {"info/global_step": 1189, "train_info/time_within_train_step": 27.82072401046753, "step": 1189} {"train_info/time_between_train_steps": 0.0052378177642822266, "step": 1189} {"info/global_step": 1190, "train_info/time_within_train_step": 27.812041521072388, "step": 1190} {"train_info/time_between_train_steps": 0.005345582962036133, "step": 1190} {"info/global_step": 1191, "train_info/time_within_train_step": 27.769029140472412, "step": 1191} {"train_info/time_between_train_steps": 0.005259990692138672, "step": 1191} {"info/global_step": 1192, "train_info/time_within_train_step": 27.788742542266846, "step": 1192} {"train_info/time_between_train_steps": 0.006676197052001953, "step": 1192} {"info/global_step": 1193, "train_info/time_within_train_step": 27.83833622932434, "step": 1193} {"train_info/time_between_train_steps": 0.005631208419799805, "step": 1193} {"info/global_step": 1194, "train_info/time_within_train_step": 27.80966806411743, "step": 1194} {"train_info/time_between_train_steps": 0.005423784255981445, "step": 1194} {"info/global_step": 1195, "train_info/time_within_train_step": 27.84249782562256, "step": 1195} {"train_info/time_between_train_steps": 0.011593818664550781, "step": 1195} {"info/global_step": 1196, "train_info/time_within_train_step": 27.849767208099365, "step": 1196} {"train_info/time_between_train_steps": 0.010730266571044922, "step": 1196} {"info/global_step": 1197, "train_info/time_within_train_step": 27.838176727294922, "step": 1197} {"train_info/time_between_train_steps": 0.008304357528686523, "step": 1197} {"info/global_step": 1198, "train_info/time_within_train_step": 27.835001945495605, "step": 1198} {"train_info/time_between_train_steps": 0.011017560958862305, "step": 1198} {"info/global_step": 1199, "train_info/time_within_train_step": 27.881232976913452, "step": 1199} {"train_info/time_between_train_steps": 0.011040687561035156, "step": 1199} {"info/global_step": 1200, "train_info/time_within_train_step": 27.97308039665222, "step": 1200} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733896111, "_runtime": 34423}, "step": 1200} {"logs": {"train/loss": 3.7334, "train/learning_rate": 0.0, "train/epoch": 49.02, "_timestamp": 1733896111, "_runtime": 34423}, "step": 1200} {"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733896114, "_runtime": 34426}, "step": 1200} {"logs": {"train/train_runtime": 34426.6186, "train/train_samples_per_second": 17.847, "train/train_steps_per_second": 0.035, "train/total_flos": 3.21920667353088e+17, "train/train_loss": 4.8886952106157935, "train/epoch": 49.02, "_timestamp": 1733896114, "_runtime": 34426}, "step": 1200} {"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733896116, "_runtime": 34428}, "step": 1200} {"logs": {"eval/loss": 5.034140110015869, "eval/runtime": 1.8285, "eval/samples_per_second": 50.861, "eval/steps_per_second": 3.281, "train/epoch": 49.02, "_timestamp": 1733896116, "_runtime": 34428}, "step": 1200} {"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27358.0, "train_info/memory_max_reserved": 27358.0, "_timestamp": 1733896116, "_runtime": 34428}, "step": 1200} {"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 5.034140110015869, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 153.567484678875, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 1.8285, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 50.861, "train/epoch": 49.02, "_timestamp": 1733896116, "_runtime": 34428}, "step": 1200}